Move function format specification to function_tool.py

This commit is contained in:
Don Mahurin 2024-09-28 14:10:55 -07:00
parent af0a9faf7f
commit 8550b76f4e
2 changed files with 58 additions and 38 deletions

View file

@ -3,6 +3,8 @@
import inspect import inspect
import re import re
import json
# Extract OpenAI function calling style definitions from functions # Extract OpenAI function calling style definitions from functions
# #
# Generated with: Create a python function to generate the OpenAI function calling definition from a given function, getting the description, parameter type and parameter description from the function documentation, assuming the function documentation contains Sphinx style parameter descriptions, marked with :param. # Generated with: Create a python function to generate the OpenAI function calling definition from a given function, getting the description, parameter type and parameter description from the function documentation, assuming the function documentation contains Sphinx style parameter descriptions, marked with :param.
@ -36,7 +38,7 @@ def get_function_tool_json(func):
# Generate function definition schema from function definitions # Generate function definition schema from function definitions
# #
# This is from llama-cpp-python, llama_chat_format.py # This is from llama-cpp-python, llama_chat_format.py
def generate_schema_from_functions(functions, namespace="functions") -> str: def generate_functionary_schema_from_functions(functions, namespace="functions") -> str:
schema = ( schema = (
"// Supported function definitions that should be called when necessary.\n" "// Supported function definitions that should be called when necessary.\n"
) )
@ -61,3 +63,31 @@ def generate_schema_from_functions(functions, namespace="functions") -> str:
schema += "}} // namespace {}".format(namespace) schema += "}} // namespace {}".format(namespace)
return schema return schema
# Opening of the system prompt for the Functionary-style chat template
# (Llama-3 special tokens). Instructs the model to call functions covertly
# using the ">>>${recipient}\n${content}" convention; the generated function
# schema is appended after this string by get_chat_tool_format().
functionary_prompt_start = """<|start_header_id|>system<|end_header_id|>
You are capable of executing available function(s) if required.
Execute function(s) as needed.
The function calls are not shown in the conversation and should be called covertly to answer questions.
Ask for the required input to:recipient==all
Use JSON for function arguments.
Respond in this format:
>>>${recipient}
${content}
Available functions:
"""
# Closing of the system prompt: describes the stateful "python" execution
# environment, then opens the first user turn. Appended after the schema.
functionary_prompt_end = """<|eot_id|><|start_header_id|>system<|end_header_id|>
When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 60.0 seconds. The drive at '/mnt/data' can be used to save and persist user files.<|eot_id|><|start_header_id|>user<|end_header_id|>
"""
def get_chat_tool_format(args, tools):
    """Return the chat-format descriptors for the Functionary template.

    :param args: parsed command-line arguments (currently unused here,
        kept so alternative formats can consult them)
    :param tools: list of OpenAI-style function definitions to embed in
        the system prompt
    :return: dict with the full prompt plus the markers/regexes used by
        the chat loop to detect function calls and delimit turns
    """
    # Full system prompt: preamble + generated schema + closing section.
    full_prompt = (
        functionary_prompt_start
        + generate_functionary_schema_from_functions(tools)
        + functionary_prompt_end
    )
    return dict(
        prompt=full_prompt,
        function_marker='>>>',
        function_re=r'>>>([^\n]*)\n(.*)<\|eot_id\|>',
        user_start='<|start_header_id|>user<|end_header_id|>\n',
        user_end='<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n',
        tool_start='',
        tool_end='<|eot_id|><|start_header_id|>assistant<|end_header_id|>',
    )

View file

@ -10,28 +10,11 @@ import re
import json import json
import functions import functions
from function_tool import get_function_tool_json, generate_schema_from_functions from function_tool import get_function_tool_json, get_chat_tool_format
function_name_list = [ name for name in dir(functions) if not name.startswith('_') ] function_name_list = [ name for name in dir(functions) if not name.startswith('_') ]
function_lookup = { name: getattr(functions, name) for name in function_name_list } function_lookup = { name: getattr(functions, name) for name in function_name_list }
tools = [ get_function_tool_json(f) for (n, f) in function_lookup.items() ] tools = [ get_function_tool_json(f) for (n, f) in function_lookup.items() ]
function_schema = generate_schema_from_functions(tools)
prompt = """<|start_header_id|>system<|end_header_id|>
You are capable of executing available function(s) if required.
Execute function(s) as needed.
The function calls are not shown in the conversation and should be called covertly to answer questions.
Ask for the required input to:recipient==all
Use JSON for function arguments.
Respond in this format:
>>>${recipient}
${content}
Available functions:
""" + function_schema + """<|eot_id|><|start_header_id|>system<|end_header_id|>
When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 60.0 seconds. The drive at '/mnt/data' can be used to save and persist user files.<|eot_id|><|start_header_id|>user<|end_header_id|>
"""
def main(): def main():
import argparse import argparse
@ -39,13 +22,17 @@ def main():
parser = argparse.ArgumentParser(epilog='For more options: llama-cli --help') parser = argparse.ArgumentParser(epilog='For more options: llama-cli --help')
parser.add_argument('--display-prompt', action=argparse.BooleanOptionalAction, default=False) parser.add_argument('--display-prompt', action=argparse.BooleanOptionalAction, default=False)
parser.add_argument('--special', action=argparse.BooleanOptionalAction, default=False) parser.add_argument('--special', action=argparse.BooleanOptionalAction, default=False)
parser.add_argument('--reverse-prompt', type=str, default='<|start_header_id|>user<|end_header_id|>\n') parser.add_argument('--reverse-prompt', type=str)
parser.add_argument('--ctx-size', type=int, default=1024) parser.add_argument('--ctx-size', type=int, default=1024)
args, other_args = parser.parse_known_args() args, other_args = parser.parse_known_args()
if args.display_prompt: print(prompt) tool_format = get_chat_tool_format(args, tools)
if args.reverse_prompt is None: args.reverse_prompt = tool_format['user_start']
command = [ './llama-cli', '-i', '-p', prompt, '--reverse-prompt', args.reverse_prompt, '--escape', '--special', '--no-display-prompt', '--log-disable', '--simple-io', '--ctx-size', str(args.ctx_size), *other_args] if args.display_prompt: print(tool_format['prompt'])
command = [ './llama-cli', '-i', '-p', tool_format['prompt'], '--reverse-prompt', args.reverse_prompt, '--escape', '--special', '--no-display-prompt', '--log-disable', '--simple-io', '--ctx-size', str(args.ctx_size), *other_args]
print("'" + "' '".join(command) + "'")
process = subprocess.Popen( process = subprocess.Popen(
command, command,
@ -57,14 +44,14 @@ def main():
if process.stdout is not None: os.set_blocking(process.stdout.fileno(), False) if process.stdout is not None: os.set_blocking(process.stdout.fileno(), False)
try: try:
run_loop(process, args) run_loop(process, args, tool_format)
except KeyboardInterrupt: except KeyboardInterrupt:
print("\nInterrupted by user.") print("\nInterrupted by user.")
finally: finally:
process.terminate() process.terminate()
process.wait() process.wait()
def run_loop(process, args): def run_loop(process, args, tool_format):
pbuffer = '' pbuffer = ''
skip_output_until_result = False skip_output_until_result = False
while True: while True:
@ -76,29 +63,32 @@ def run_loop(process, args):
if not pdata: continue if not pdata: continue
pbuffer += pdata pbuffer += pdata
if(match := re.search(r'>>>([^\n]*)\n(.*)<\|eot_id\|>', pbuffer, re.S)): if(match := re.search(tool_format['function_re'], pbuffer, re.S)):
if not args.special: if not args.special:
pdata = pdata[:match.pos] pdata = pdata[:match.pos]
pbuffer = '' pbuffer = ''
skip_output_until_result = False skip_output_until_result = False
try:
if 1 < len(match.groups()):
tool_name = match.group(1) tool_name = match.group(1)
tool_args = match.group(2) tool_args = json.loads(match.group(2))
else:
tool = json.loads(match.group(1))
tool_name = tool['name']
tool_args = tool['arguments']
if tool_name == 'python': if tool_name == 'python':
result = functions._run_python(tool_args); result = functions._run_python(tool_args);
else: else:
try:
tool_args = json.loads(tool_args)
result = function_lookup[tool_name](**tool_args) result = function_lookup[tool_name](**tool_args)
except ValueError as e: except ValueError as e:
result = {'error': 'unknown'} result = {'error': 'unknown'}
result = json.dumps(result) + '<|eot_id|><|start_header_id|>assistant<|end_header_id|>' result = tool_format['tool_start'] + json.dumps(result) + tool_format['tool_end']
process.stdin.write(result + '\n') process.stdin.write(result + '\n')
process.stdin.flush() process.stdin.flush()
if(args.special): pdata += '\n' + result if(args.special): pdata += '\n' + result
elif (n := pdata.find('>>>')) >= 0: elif (n := pdata.find(tool_format['function_marker'])) >= 0:
if not args.special: if not args.special:
pdata = pdata[:n] pdata = pdata[:n]
skip_output_until_result = True skip_output_until_result = True
@ -114,7 +104,7 @@ def run_loop(process, args):
user_input = sys.stdin.readline() user_input = sys.stdin.readline()
if user_input: if user_input:
user_input = user_input.rstrip() user_input = user_input.rstrip()
process.stdin.write(user_input + '<|eot_id|><|start_header_id|>assistant<|end_header_id|>' + '\n') process.stdin.write(user_input + tool_format['user_end'] + '\n')
process.stdin.flush() process.stdin.flush()
if __name__ == '__main__': if __name__ == '__main__':