Improved tool use

5 months ago · 238a5146f8
parent d2319209e1
commit 238a5146f8
6 changed files with 252 additions and 223 deletions
--- a/init.py
+++ b/init.py
@ -3,6 +3,6 @@ llm_client: A Python package for interacting with LLM models through Ollama.
 """
 from _llm._llm.llm import LLM
-from _llm._llm.tool_registy import register_tool, get_tools
+from _llm._llm.tool_registry import register_tool, get_tools
 __all__ = ["LLM", "register_tool", "get_tools"]
--- a/_llm/init.py
+++ b/_llm/init.py
@ -1,6 +1,6 @@
 from .llm import LLM  # re-export the class from the module
-from .tool_registy import register_tool, get_tools
+from .tool_registry import register_tool, get_tools
 # Define public API
 __all__ = ["LLM", "register_tool", "get_tools"]
--- a/_llm/llm.py
+++ b/_llm/llm.py
@ -9,19 +9,19 @@ from openai.types.chat import ChatCompletion, ChatCompletionChunk
 from openai.types.chat.chat_completion import Choice
 from openai.types.chat.chat_completion_message import ChatCompletionMessage
 from openai.types.responses import ParsedResponse
 import backoff
 import env_manager
 import json
 try:
-    from .tool_registy import get_tools, register_tool
+    from .tool_registry import get_tools, parse_function_call_arguments, execute_tool
 except ImportError:
-    from tool_registy import get_tools, register_tool
+
    from _llm._llm.tool_registry import get_tools, parse_function_call_arguments, execute_tool
 try:
    from colorprinter.print_color import *
 except ImportError:
-    from colorprinter.print_color import *
+    from colorprinter.colorprinter.print_color import *
@ -487,6 +487,7 @@ class LLM:
        # Call the OpenAI API
        else:
            response: ChatCompletion = self.client.chat.completions.create(**kwargs)
        # Try to extract backend information if available
        try:
            response_headers = getattr(response, "_headers", {})
@ -720,10 +721,64 @@ class LLM:
                else:
                    choice = response.choices[0]
                    message: ChatCompletionMessage = choice.message
                    print(message)
                    if hasattr(message, 'tool_calls') and message.tool_calls:
                        # Hantera flera verktygsanrop sequensielt
                        for tool_call in message.tool_calls:
                            try:
                                fn = getattr(tool_call, "function", None) or (tool_call.get("function") if isinstance(tool_call, dict) else None)
                                if not fn:
                                    continue
                                func_name = getattr(fn, "name", None) or (fn.get("name") if isinstance(fn, dict) else None)
                                raw_args = getattr(fn, "arguments", None) or (fn.get("arguments") if isinstance(fn, dict) else None)
                                # Automatisk JSON-parsing av argument om de kommer som sträng (för vLLM-kompatibilitet)
                                if isinstance(raw_args, str):
                                    try:
                                        parsed_args = json.loads(raw_args)
                                        # Uppdatera function.arguments med den parsade versionen för enklare användning
                                        if hasattr(fn, "arguments"):
                                            fn.arguments = parsed_args  # Uppdatera objektet direkt
                                        elif isinstance(fn, dict):
                                            fn["arguments"] = parsed_args
                                    except json.JSONDecodeError as e:
                                        print_red(f"Warning: Could not parse tool arguments as JSON: {e}")
                                        # Fallback till parse_function_call_arguments för robusthet
                                        parsed_args = parse_function_call_arguments(raw_args)
                                else:
                                    parsed_args = raw_args if isinstance(raw_args, dict) else {}
                                # Kör verktyget via tool_registry.execute_tool (validering och typ-coercion görs där)
                                tool_result = execute_tool(func_name, parsed_args)
                                # Sätt in tool-result i messages så modellen kan läsa det vidare
                                tool_content = tool_result if isinstance(tool_result, str) else json.dumps(tool_result, ensure_ascii=False)
                                self.messages.append({"role": "tool", "name": func_name, "content": tool_content})
                            except Exception as e:
                                print_red(f"Error executing tool {func_name}: {e}")
                                # append error to messages so model sees it (and you can debug)
                                self.messages.append({"role": "tool", "name": func_name or "unknown", "content": json.dumps({"error": str(e)})})
                    # fallback: older SDKs / shapes:
                    if hasattr(message, 'function_call') and message.function_call:
                        fc = message.function_call
                        func_name = getattr(fc, "name", None) or (fc.get("name") if isinstance(fc, dict) else None)
                        args_raw = getattr(fc, "arguments", None) or (fc.get("arguments") if isinstance(fc, dict) else None)
                        parsed_args = parse_function_call_arguments(args_raw)
                        try:
                            tool_result = execute_tool(func_name, parsed_args)
                            tool_content = tool_result if isinstance(tool_result, str) else json.dumps(tool_result, ensure_ascii=False)
                            self.messages.append({"role": "tool", "name": func_name, "content": tool_content})
                        except Exception as e:
                            self.messages.append({"role": "tool", "name": func_name or "unknown", "content": json.dumps({"error": str(e)})})
                    # Hämta textsvar från meddelandet
                    result: str = message.content
                    if hasattr(message, 'content_text'):
                        result: str = message.content_text
-                    # Store in message history (without tool calls for clean history)
+                        
                    # Spara i meddelandehistorik (utan verktygsanrop för ren historik)
                    self.messages.append({"role": "assistant", "content": result})
                    if not self.chat:
                        self.messages = [self.messages[0]]
@ -1120,7 +1175,6 @@ if __name__ == "__main__":
    print(response.__dict__)
    response = llm.generate("What's the weather like in San Francisco? Also calculate 15 * 7 for me.", model='vllm')
    print(response.__dict__)
    exit()
    # Define a tool for calculations
    @register_tool
@ -1198,7 +1252,7 @@ if __name__ == "__main__":
        except Exception as e:
            print(f"❌ Tools test failed: {e}")
-        # Test 3: Thinking mode (use vllm model since reasoning model doesn't exist)
+        # Test 3: Thinking mode (use vLLM model since reasoning model doesn't exist)
        print("\n3️⃣ Thinking Mode Test (using vllm)")
        print("-" * 30)
        try:
--- a/_llm/ollama-cloud-test.py
+++ b/_llm/ollama-cloud-test.py
@ -0,0 +1,13 @@
 from ollama import Client
 client = Client()
 messages = [
  {
    'role': 'user',
    'content': 'Why is the sky blue?',
  },
 ]
 for part in client.chat('gpt-oss:120b-cloud', messages=messages, stream=True):
  print(part['message']['content'], end='', flush=True)
--- a/_llm/tool_registry.py
+++ b/_llm/tool_registry.py
@ -0,0 +1,176 @@
 import inspect, json, re, ast
 from typing import Callable, Dict, Any, List, get_origin, get_args
 from pydantic import BaseModel
 TOOL_REGISTRY: Dict[str, Dict[str, Any]] = {}
 # --- type mapping ---
 def _pytype_to_jsonschema(t):
    origin = get_origin(t)
    if origin is list or origin is List:
        args = get_args(t)
        item_type = args[0] if args else str
        return {"type": "array", "items": _pytype_to_jsonschema(item_type)}
    if inspect.isclass(t) and issubclass(t, BaseModel):
        sch = t.schema()
        return {"type": "object", **sch}
    mapping = {
        str: {"type": "string"},
        int: {"type": "integer"},
        float: {"type": "number"},
        bool: {"type": "boolean"},
        dict: {"type": "object"},
        list: {"type": "array", "items": {"type": "string"}},
    }
    return mapping.get(t, {"type": "string"})
 # --- docstring parser (Google style) ---
 def _parse_google_docstring(docstring: str):
    if not docstring:
        return {"description": "", "params": {}}
    lines = [ln.rstrip() for ln in docstring.splitlines()]
    desc_lines = []
    i = 0
    while i < len(lines) and not lines[i].lower().startswith(("args:", "arguments:")):
        if lines[i].strip():
            desc_lines.append(lines[i].strip())
        i += 1
    description = " ".join(desc_lines).strip()
    params = {}
    if i < len(lines):
        i += 1
        while i < len(lines):
            line = lines[i].strip()
            if not line:
                i += 1
                continue
            m = re.match(r'^(\w+)\s*(?:\(([^)]+)\))?\s*:\s*(.*)$', line)
            if m:
                name = m.group(1)
                desc = m.group(3)
                j = i + 1
                while j < len(lines) and not re.match(r'^\w+\s*(?:\([^)]+\))?\s*:', lines[j].strip()):
                    if lines[j].strip():
                        desc += " " + lines[j].strip()
                    j += 1
                params[name] = {"description": desc.strip(), "type": m.group(2)}
                i = j
                continue
            i += 1
    return {"description": description, "params": params}
 # --- helper: make OpenAI-style function spec ---
 def _wrap_openai_function_schema(name: str, description: str, parameters: dict):
    """Create OpenAI function calling format with 'function' wrapper"""
    params = parameters.copy()
    if params.get("type") != "object":
        params = {"type": "object", "properties": params.get("properties", params), "required": params.get("required", [])}
    params.setdefault("additionalProperties", False)
    # Return in OpenAI function calling format with 'function' wrapper
    return {
        "type": "function",
        "function": {
            "name": name,
            "description": description,
            "parameters": params
        }
    }
 # --- decorator to register tools ---
 def register_tool(func: Callable = None, *, name: str = None, description: str = None, schema: dict = None):
    def _register(f):
        fname = name or f.__name__
        doc = _parse_google_docstring(f.__doc__)
        func_description = description or doc["description"] or ""
        if schema is not None:
            func_schema = schema
        else:
            sig = inspect.signature(f)
            props = {}
            required = []
            for param_name, param in sig.parameters.items():
                ann = param.annotation if param.annotation is not inspect._empty else str
                prop_schema = _pytype_to_jsonschema(ann)
                if param_name in doc["params"]:
                    prop_schema["description"] = doc["params"][param_name]["description"]
                props[param_name] = prop_schema
                if param.default is inspect._empty:
                    required.append(param_name)
            func_schema = {"type": "object", "properties": props, "required": required, "additionalProperties": False}
        TOOL_REGISTRY[fname] = {
            "callable": f,
            "schema": _wrap_openai_function_schema(fname, func_description, func_schema)
        }
        return f
    if func is None:
        return _register
    else:
        return _register(func)
 # --- what to send to model ---
 def get_tools() -> List[dict]:
    """Return OpenAI-compatible functions list with proper 'function' wrapper."""
    return [entry["schema"] for entry in TOOL_REGISTRY.values()]
 # --- robust parser for arguments ---
 def parse_function_call_arguments(raw) -> dict:
    if isinstance(raw, dict):
        return raw
    if not isinstance(raw, str):
        return {"_raw_unexpected": str(type(raw)), "value": raw}
    try:
        return json.loads(raw)
    except json.JSONDecodeError:
        pass
    try:
        return ast.literal_eval(raw)
    except Exception:
        pass
    stripped = raw.strip()
    if re.match(r'^(SELECT|WITH)\b', stripped, flags=re.IGNORECASE):
        return {"sql_query": stripped}
    m = re.search(r'\{.*\}', raw, flags=re.DOTALL)
    if m:
        candidate = m.group(0)
        try:
            return json.loads(candidate)
        except Exception:
            try:
                return ast.literal_eval(candidate)
            except Exception:
                pass
    return {"_raw": raw}
 # --- safe executor ---
 def execute_tool(name: str, args: dict):
    """
    Execute registered callable with args (basic validation).
    Returns Python object (dict/list/str).
    """
    entry = TOOL_REGISTRY.get(name)
    if not entry:
        raise RuntimeError(f"Function {name} not registered")
    fn = entry["callable"]
    # simple SQL safety example: if function expects sql_query ensure SELECT
    if "sql_query" in args:
        q = args["sql_query"].strip()
        if not re.match(r'^(SELECT|WITH)\b', q, flags=re.IGNORECASE):
            raise ValueError("Only SELECT/ WITH queries allowed in sql_query")
        if q.endswith(";"):
            args["sql_query"] = q[:-1]
    # Prepare kwargs with minimal type coercion
    sig = inspect.signature(fn)
    kwargs = {}
    for pname, param in sig.parameters.items():
        if pname not in args:
            continue
        val = args[pname]
        ann = param.annotation if param.annotation is not inspect._empty else None
        origin = get_origin(ann)
        if origin in (list, List) and isinstance(val, str):
            kwargs[pname] = [x.strip() for x in val.split(",") if x.strip() != ""]
        else:
            kwargs[pname] = val
    result = fn(**kwargs)
    return result
--- a/_llm/tool_registy.py
+++ b/_llm/tool_registy.py
@ -1,214 +0,0 @@
 # assume your client already has: import inspect, json
 from typing import Callable, Dict, Any
 import inspect, json
 import re
 from pydantic import BaseModel
 TOOL_REGISTRY: Dict[str, Dict[str, Any]] = {}
 def _parse_google_docstring(docstring: str) -> Dict[str, Any]:
    """Parse Google-style docstring to extract description and parameter info."""
    if not docstring:
        return {"description": "", "params": {}}
    # Split into lines and clean up
    lines = [line.strip() for line in docstring.strip().split('\n')]
    # Find the main description (everything before Args:)
    description_lines = []
    i = 0
    while i < len(lines):
        if lines[i].lower().startswith('args:') or lines[i].lower().startswith('arguments:'):
            break
        description_lines.append(lines[i])
        i += 1
    description = ' '.join(description_lines).strip()
    # Parse parameters section
    params = {}
    if i < len(lines):
        i += 1  # Skip the "Args:" line
        while i < len(lines):
            line = lines[i]
            if line.lower().startswith(('returns:', 'yields:', 'raises:', 'note:', 'example:')):
                break
            # Match parameter format: param_name (type): description
            match = re.match(r'^\s*(\w+)\s*(?:\(([^)]+)\))?\s*:\s*(.*)$', line)
            if match:
                param_name = match.group(1)
                param_type = match.group(2)
                param_desc = match.group(3)
                # Collect multi-line descriptions
                j = i + 1
                while j < len(lines) and lines[j] and not re.match(r'^\s*\w+\s*(?:\([^)]+\))?\s*:', lines[j]):
                    param_desc += ' ' + lines[j].strip()
                    j += 1
                params[param_name] = {
                    "description": param_desc.strip(),
                    "type": param_type.strip() if param_type else None
                }
                i = j - 1
            i += 1
    return {"description": description, "params": params}
 def _pytype_to_jsonschema(t):
    # Very-small helper; extend as needed or use pydantic models for complex types
    mapping = {str: {"type": "string"}, int: {"type": "integer"},
               float: {"type": "number"}, bool: {"type": "boolean"},
               dict: {"type": "object"}, list: {"type": "array"}}
    return mapping.get(t, {"type": "string"})  # fallback to string
 def register_tool(func: Callable = None, *, name: str = None, description: str = None, schema: dict = None):
    """
    Use as decorator or call directly:
      @register_tool
      def foo(x: int): ...
    or
      register_tool(func=myfunc, name="myfunc", schema=...)
    """
    def _register(f):
        fname = name or f.__name__
        # Parse docstring for description and parameter info
        docstring_info = _parse_google_docstring(f.__doc__)
        func_description = description or docstring_info["description"] or ""
        # If explicit schema provided, use it
        if schema is not None:
            func_schema = schema
        else:
            sig = inspect.signature(f)
            props = {}
            required = []
            for param_name, param in sig.parameters.items():
                ann = param.annotation
                # If user used a Pydantic BaseModel as a single arg, use its schema
                if inspect.isclass(ann) and issubclass(ann, BaseModel):
                    func_schema = ann.schema()
                    # wrap into a single-arg object if necessary
                    props = func_schema.get("properties", {})
                    required = func_schema.get("required", [])
                    # done early - for single-model param
                    break
                # Create property schema from type annotation
                prop_schema = _pytype_to_jsonschema(ann)
                # Add description from docstring if available
                if param_name in docstring_info["params"]:
                    prop_schema["description"] = docstring_info["params"][param_name]["description"]
                props[param_name] = prop_schema
                if param.default is inspect._empty:
                    required.append(param_name)
            if 'func_schema' not in locals():
                func_schema = {
                    "type": "object",
                    "properties": props,
                    "required": required
                }
        TOOL_REGISTRY[fname] = {
            "callable": f,
            "schema": {
                "type": "function",
                "function": {
                    "name": fname,
                    "description": func_description,
                    "parameters": func_schema
                }
            }
        }
        return f
    if func is None:
        return _register
    else:
        return _register(func)
 def get_tools() -> list:
    """Return list of function schemas (JSON) to send to the model"""
    return [v["schema"] for v in TOOL_REGISTRY.values()]
 def handle_function_call_and_inject_result(response_choice, messages):
    """
    Given the model choice (response.choices[0]) and your messages list:
      - extracts function/tool call
      - executes the registered python callable
      - appends the tool result as a tool message and returns it
    """
    # Support different shapes: some SDKs use .message.tool_calls, others .message.function_call
    msg = getattr(response_choice, "message", None) or (response_choice.get("message") if isinstance(response_choice, dict) else None)
    func_name = None
    func_args = None
    # try tool_calls style
    if msg:
        tool_calls = getattr(msg, "tool_calls", None) or (msg.get("tool_calls") if isinstance(msg, dict) else None)
        if tool_calls:
            tc = tool_calls[0]
            fn = getattr(tc, "function", None) or (tc.get("function") if isinstance(tc, dict) else None)
            func_name = getattr(fn, "name", None) or (fn.get("name") if isinstance(fn, dict) else None)
            func_args = getattr(fn, "arguments", None) or (fn.get("arguments") if isinstance(fn, dict) else None)
    # fallback to function_call
    if func_name is None:
        fc = getattr(msg, "function_call", None) or (msg.get("function_call") if isinstance(msg, dict) else None)
        if fc:
            func_name = getattr(fc, "name", None) or fc.get("name")
            args_raw = getattr(fc, "arguments", None) or fc.get("arguments")
            # arguments are often a JSON string depending on SDK shape
            if isinstance(args_raw, str):
                try:
                    func_args = json.loads(args_raw)
                except Exception:
                    func_args = None
            else:
                func_args = args_raw
    if not func_name:
        return None  # no function call found
    entry = TOOL_REGISTRY.get(func_name)
    if not entry:
        raise RuntimeError(f"Function {func_name} not registered")
    result = entry["callable"](**(func_args or {}))
    # convert result to string/JSON for tool message
    tool_content = result if isinstance(result, str) else json.dumps(result)
    # append tool message so model can see the result
    messages.append({"role": "tool", "name": func_name, "content": tool_content})
    return tool_content
 if __name__ == "__main__":
    # Example usage and test
    @register_tool
    def add(x: int, y: int) -> int:
        """Add two integers
        Args:
            x (int): First integer
            y (int): Second integer
        Returns:
            int: Sum of x and y
        """
        return x + y
    @register_tool(name="echo", description="Echoes the input string")
    def echo_message(message: str) -> str:
        """Echo the input message
        Args:
            message (str): The message to echo
        Returns:
            str: The echoed message
        """
        return message
    print("Registered tools:")
    import pprint
    for info in get_tools():
        pprint.pprint(info)