Spaces:

dexhunter
/

aideml

Running

App Files Files Community

Dixing (Dex) Xu committed on Jan 14

Commit

f92d1a2

unverified ·

1 Parent(s): 9c55a42

:sparkles: Add anthropic tool use (#39)

Browse files

* :sparkles: Add anthropic tool use

* fix: ruff format

Files changed (2) hide show

aide/backend/backend_anthropic.py +43 -8
aide/backend/utils.py +18 -0

aide/backend/backend_anthropic.py CHANGED Viewed

@@ -1,11 +1,14 @@
 """Backend for Anthropic API."""
 import time
 from .utils import FunctionSpec, OutputType, opt_messages_to_list, backoff_create
 from funcy import notnone, once, select_values
 import anthropic
 _client: anthropic.Anthropic = None  # type: ignore
 ANTHROPIC_TIMEOUT_EXCEPTIONS = (
@@ -15,6 +18,10 @@ ANTHROPIC_TIMEOUT_EXCEPTIONS = (
     anthropic.InternalServerError,
 )
 @once
 def _setup_anthropic_client():
@@ -28,23 +35,32 @@ def query(
     func_spec: FunctionSpec | None = None,
     **model_kwargs,
 ) -> tuple[OutputType, float, int, int, dict]:
     _setup_anthropic_client()
     filtered_kwargs: dict = select_values(notnone, model_kwargs)  # type: ignore
     if "max_tokens" not in filtered_kwargs:
         filtered_kwargs["max_tokens"] = 4096  # default for Claude models
-    if func_spec is not None:
-        raise NotImplementedError(
-            "Anthropic does not support function calling for now."
-        )
-    # Anthropic doesn't allow not having a user messages
     # if we only have system msg -> use it as user msg
     if system_message is not None and user_message is None:
         system_message, user_message = user_message, system_message
-    # Anthropic passes the system messages as a separate argument
     if system_message is not None:
         filtered_kwargs["system"] = system_message
@@ -59,14 +75,33 @@ def query(
     )
     req_time = time.time() - t0
-    assert len(message.content) == 1 and message.content[0].type == "text"
-    output: str = message.content[0].text
     in_tokens = message.usage.input_tokens
     out_tokens = message.usage.output_tokens
     info = {
         "stop_reason": message.stop_reason,
     }
     return output, req_time, in_tokens, out_tokens, info

 """Backend for Anthropic API."""
+import logging
 import time
 from .utils import FunctionSpec, OutputType, opt_messages_to_list, backoff_create
 from funcy import notnone, once, select_values
 import anthropic
+logger = logging.getLogger("aide")
 _client: anthropic.Anthropic = None  # type: ignore
 ANTHROPIC_TIMEOUT_EXCEPTIONS = (
     anthropic.InternalServerError,
 )
+ANTHROPIC_MODEL_ALIASES = {
+    "claude-3.5-sonnet": "claude-3-sonnet-20241022",
+}
 @once
 def _setup_anthropic_client():
     func_spec: FunctionSpec | None = None,
     **model_kwargs,
 ) -> tuple[OutputType, float, int, int, dict]:
+    """
+    Query Anthropic's API, optionally with tool use (Anthropic's equivalent to function calling).
+    """
     _setup_anthropic_client()
     filtered_kwargs: dict = select_values(notnone, model_kwargs)  # type: ignore
     if "max_tokens" not in filtered_kwargs:
         filtered_kwargs["max_tokens"] = 4096  # default for Claude models
+    model_name = filtered_kwargs.get("model", "")
+    logger.debug(f"Anthropic query called with model='{model_name}'")
+    if model_name in ANTHROPIC_MODEL_ALIASES:
+        model_name = ANTHROPIC_MODEL_ALIASES[model_name]
+    if func_spec is not None and func_spec.name == "submit_review":
+        filtered_kwargs["tools"] = [func_spec.as_anthropic_tool_dict]
+        # Force tool use
+        filtered_kwargs["tool_choice"] = func_spec.anthropic_tool_choice_dict
+    # Anthropic requires at least one user message:
     # if we only have system msg -> use it as user msg
     if system_message is not None and user_message is None:
         system_message, user_message = user_message, system_message
+    # Anthropic passes system messages as a separate argument
     if system_message is not None:
         filtered_kwargs["system"] = system_message
     )
     req_time = time.time() - t0
+    # Handle tool calls if present
+    if (
+        func_spec is not None
+        and "tools" in filtered_kwargs
+        and len(message.content) > 0
+        and message.content[0].type == "tool_use"
+    ):
+        block = message.content[0]  # This is a "ToolUseBlock"
+        # block has attributes: type, id, name, input
+        assert (
+            block.name == func_spec.name
+        ), f"Function name mismatch: expected {func_spec.name}, got {block.name}"
+        output = block.input  # Anthropic calls the parameters "input"
+    else:
+        # For non-tool responses, ensure we have text content
+        assert len(message.content) == 1, "Expected single content item"
+        assert (
+            message.content[0].type == "text"
+        ), f"Expected text response, got {message.content[0].type}"
+        output = message.content[0].text
     in_tokens = message.usage.input_tokens
     out_tokens = message.usage.output_tokens
     info = {
         "stop_reason": message.stop_reason,
+        "model": message.model,
     }
     return output, req_time, in_tokens, out_tokens, info

aide/backend/utils.py CHANGED Viewed

@@ -66,6 +66,7 @@ class FunctionSpec(DataClassJsonMixin):
     @property
     def as_openai_tool_dict(self):
         return {
             "type": "function",
             "function": {
@@ -81,3 +82,20 @@ class FunctionSpec(DataClassJsonMixin):
             "type": "function",
             "function": {"name": self.name},
         }

     @property
     def as_openai_tool_dict(self):
+        """Convert to OpenAI's function format."""
         return {
             "type": "function",
             "function": {
             "type": "function",
             "function": {"name": self.name},
         }
+    @property  # read as an attribute (no call parentheses) by the Anthropic backend
+    def as_anthropic_tool_dict(self):
+        """Return this spec as an Anthropic tool definition with name, description and input_schema keys."""
+        return {
+            "name": self.name,
+            "description": self.description,
+            "input_schema": self.json_schema,  # Anthropic uses input_schema instead of parameters
+        }
+    @property  # read as an attribute (no call parentheses) by the Anthropic backend
+    def anthropic_tool_choice_dict(self):
+        """Return the Anthropic tool_choice dict that names this tool."""
+        return {
+            "type": "tool",  # Anthropic uses "tool" instead of "function"
+            "name": self.name,
+        }