agent: nits

2024-04-09 23:50:08 +01:00 · 2024-04-09 23:50:08 +01:00 · 0532680f40
commit 0532680f40
parent 6880f1d4c0
11 changed files with 10 additions and 88 deletions
--- a/examples/agent/fastify-requirements.txt
+++ b/examples/agent/fastify-requirements.txt
@ -2,4 +2,4 @@ fastapi[all]
 pydantic
 sse-starlette
 uvicorn[all]
-typer[all]
+typer[all]
--- a/examples/agent/requirements.txt
+++ b/examples/agent/requirements.txt
@ -5,4 +5,4 @@ pydantic
 requests
 sse-starlette
 uvicorn[all]
-typer[all]
+typer[all]
--- a/examples/agent/run_sandboxed_tools.sh
+++ b/examples/agent/run_sandboxed_tools.sh
@ -71,4 +71,4 @@ docker run \
    --mount "type=bind,source=$( realpath "$script_folder" ),target=/src,readonly" \
    --mount "type=bind,source=$( realpath "$DATA_DIR" ),target=/data" \
    -p "$PORT:$PORT" \
-    -it "$LLAMA_IMAGE_NAME"
+    -it "$LLAMA_IMAGE_NAME"
--- a/examples/openai/api.py
+++ b/examples/openai/api.py
@ -87,4 +87,4 @@ class ChatCompletionResponse(BaseModel):
    choices: list[Choice]
    usage: Usage
    system_fingerprint: str
-    error: Optional[CompletionError] = None
+    error: Optional[CompletionError] = None
--- a/examples/openai/llama_cpp_server_api.py
+++ b/examples/openai/llama_cpp_server_api.py
@ -9,4 +9,4 @@ class LlamaCppServerCompletionRequest(LlamaCppParams):
    cache_prompt: Optional[bool] = None

    grammar: Optional[str] = None
-    json_schema: Optional[Json] = None
+    json_schema: Optional[Json] = None
--- a/examples/openai/prompt1.txt
+++ b/examples/openai/prompt1.txt
@ -1,43 +0,0 @@
-<|im_start|>system
-Role:
-  You are a function calling AI agent with self-recursion.
-  You can call only one function at a time and analyse data you get from function response.
-  You are provided with function signatures within <tools></tools> XML tags.
-  The current date is: March 25, 2024.
-
-Objective:
-  You may use agentic frameworks for reasoning and planning to help with user query.
-  Please call a function and wait for function results to be provided to you in the next iteration.
-  Don't make assumptions about what values to plug into function arguments.
-  Once you have called a function, results will be fed back to you within <tool_response></tool_response> XML tags.
-  Don't make assumptions about tool results if <tool_response> XML tags are not present since function hasn't been executed yet.
-  Analyze the data once you get the results and call another function.
-  At each iteration please continue adding the your analysis to previous summary.
-  Your final response should directly answer the user query with an anlysis or summary of the results of function calls.
-
-Tools:
-  Here are the available tools:
-  <tools> 
-  {"type":"function","function":{"name":"get_current_weather","description":"Get the current weather","parameters":{"type":"object","properties":{"location":{"type":"string","description":"The city and state, e.g. San Francisco, CA"},"format":{"type":"string","enum":["celsius","fahrenheit"],"description":"The temperature unit to use. Infer this from the users location."}},"required":["location","format"]}}}
-  {"type":"function","function":{"name":"get_n_day_weather_forecast","description":"Get an N-day weather forecast","parameters":{"type":"object","properties":{"location":{"type":"string","description":"The city and state, e.g. San Francisco, CA"},"format":{"type":"string","enum":["celsius","fahrenheit"],"description":"The temperature unit to use. Infer this from the users location."},"num_days":{"type":"integer","description":"The number of days to forecast"}},"required":["location","format","num_days"]}}} 
-  </tools>
-  If the provided function signatures doesn't have the function you must call, you may write executable python code in markdown syntax and call code_interpreter() function as follows:
-  <tool_call>
-  {"arguments": {"code_markdown": <python-code>, "name": "code_interpreter"}}
-  </tool_call>
-  Make sure that the json object above with code markdown block is parseable with json.loads() and the XML block with XML ElementTree.
-
-Instructions:
-  At the very first turn you don't have <tool_results> so you shouldn't not make up the results.
-  Please keep a running summary with analysis of previous function results and summaries from previous iterations.
-  Do not stop calling functions until the task has been accomplished or you've reached max iteration of 10.
-  Calling multiple functions at once can overload the system and increase cost so call one function at a time please.
-  If you plan to continue with analysis, always call another function.
-  For each function call return a valid json object (using doulbe quotes) with function name and arguments within <tool_call></tool_call> XML tags as follows:
-  <tool_call>
-  {"arguments": <args-dict>, "name": <function-name>}
-  </tool_call>
-<|im_end|>
-<|im_start|>user
-what is the weather going to be like in San Francisco and Glasgow over the next 4 days (temperature in celsius for both)<|im_end|>
-<|im_start|>assistant
--- a/examples/openai/requirements.txt
+++ b/examples/openai/requirements.txt
@ -4,4 +4,4 @@ jinja2
 pydantic
 sse-starlette
 uvicorn[all]
-typer[all]
+typer[all]
--- a/examples/openai/server.py
+++ b/examples/openai/server.py
@ -139,7 +139,7 @@ def main(
        messages = chat_request.messages

        prompt = chat_handler.render_prompt(messages)
-        
+
        if verbose:
            sys.stderr.write(f'\n# REQUEST:\n\n{chat_request.model_dump_json(indent=2)}\n\n')
            # sys.stderr.write(f'\n# MESSAGES:\n\n{TypeAdapter(list[Message]).dump_json(messages)}\n\n')
--- a/examples/openai/test_chat_handlers.py
+++ b/examples/openai/test_chat_handlers.py
@ -202,14 +202,14 @@ if __name__ == "__main__":
                ch = get_chat_handler(args, parallel_calls=True, tool_style=style)

                print(f'\n### {model_name} / {style.name} / {tool_situation}\n')
-                
+
                print(f'\nPrompt:\n\n```js\n{ch.render_prompt(TEST_MESSAGES_THOUGHT)}\n```\n')

                print(f'\nOutput format prompt:\n\n```json\n{ch.output_format_prompt.content}\n```\n')

                print(f'\nGrammar:\n\n```js\n{ch.grammar}\n```\n')

-                        
+
                # if model_name == 'hermes_2_pro_mistral':
                #     print("Skipping hermes_2_pro_mistral")
                #     continue
@ -233,38 +233,3 @@ if __name__ == "__main__":
            print(f'{f}\n\n')

        assert not failures
-    # test_templates([
-    #     Message(**{
-    #         "role": "user",
-    #         "name": None,
-    #         "tool_call_id": None,
-    #         "content": "What is the sum of 2535 squared and 32222000403 then multiplied by one and a half. What's a third of the result?",
-    #         "tool_calls": None
-    #     }),
-    #     Message(**{
-    #         "role": "assistant",
-    #         # "name": None,
-    #         "tool_call_id": None,
-    #         "content": "?",
-    #         "tool_calls": [
-    #             {
-    #                 # "id": "call_531873",
-    #                 "type": "function",
-    #                 "function": {
-    #                     "name": TOOL_NAME,
-    #                     "arguments": {
-    #                         "a": 2535,
-    #                         "b": 32222000403
-    #                     }
-    #                 }
-    #             }
-    #         ]
-    #     }),
-    #     Message(**{
-    #         "role": "tool",
-    #         "name": TOOL_NAME,
-    #         "tool_call_id": "call_531873",
-    #         "content": "32222002938",
-    #         "tool_calls": None
-    #     })
-    # ])
--- a/gguf-py/examples/reader.py
+++ b/gguf-py/examples/reader.py
@ -3,7 +3,6 @@ import sys
 from pathlib import Path
 from gguf.gguf_reader import GGUFReader

-
 sys.path.insert(0, str(Path(__file__).parent.parent))


--- a/gguf-py/gguf/gguf_reader.py
+++ b/gguf-py/gguf/gguf_reader.py
@ -50,6 +50,7 @@ class ReaderField(NamedTuple):
    types: list[GGUFValueType] = []


+
 class ReaderTensor(NamedTuple):
    name: str
    tensor_type: GGMLQuantizationType