Add multiple modalities: tools, functions, json_mode #218

Merged 6 commits on Nov 25, 2023

Changes from 1 commit
49 changes: 43 additions & 6 deletions instructor/function_calls.py
@@ -1,9 +1,20 @@
import json
from docstring_parser import parse
from functools import wraps
from typing import Any, Callable
from pydantic import BaseModel, create_model, validate_arguments

import enum


class PatchMode(enum.Enum):
    """The mode to use for patching the client"""

    FUNCTION_CALL: str = "function_call"
    TOOL_CALL: str = "tool_call"
    JSON_MODE: str = "json_mode"


class openai_function:
    """

@@ -176,9 +187,9 @@ def openai_schema(cls):
    def from_response(
        cls,
        completion,
-        throw_error: bool = True,
        validation_context=None,
        strict: bool = None,
+        mode: PatchMode = PatchMode.FUNCTION_CALL,
    ):
"""Execute the function from the response of an openai chat completion

Expand All @@ -193,11 +204,37 @@ def from_response(
"""
        message = completion.choices[0].message

-        return cls.model_validate_json(
-            message.function_call.arguments,
-            context=validation_context,
-            strict=strict,
-        )
+        match mode:
+            case PatchMode.FUNCTION_CALL:
+                assert (
+                    message.function_call.name == cls.openai_schema["name"]
+                ), "Function name does not match"
+                return cls.model_validate_json(
+                    message.function_call.arguments,
+                    context=validation_context,
+                    strict=strict,
+                )
+            case PatchMode.TOOL_CALL:
+                assert (
+                    len(message.tool_calls) == 1
+                ), "Instructor does not support multiple tool calls, use List[Model] instead."
+                tool_call = message.tool_calls[0]
+                assert (
+                    tool_call.function.name == cls.openai_schema["name"]
+                ), "Tool name does not match"
+                return cls.model_validate_json(
+                    tool_call.function.arguments,
+                    context=validation_context,
+                    strict=strict,
+                )
+            case PatchMode.JSON_MODE:
+                return cls.model_validate_json(
+                    message.content,
+                    context=validation_context,
+                    strict=strict,
+                )
+            case _:
+                raise ValueError(f"Invalid patch mode: {mode}")


def openai_schema(cls) -> OpenAISchema:
119 changes: 74 additions & 45 deletions instructor/patch.py
@@ -7,7 +7,12 @@
from openai.types.chat import ChatCompletion, ChatCompletionMessage
from pydantic import BaseModel, ValidationError

-from .function_calls import OpenAISchema, openai_schema
+from .function_calls import OpenAISchema, openai_schema, PatchMode
+
+import logging
+
+logger = logging.getLogger(__name__)
Contributor comment:

The import of PatchMode and the logging module are correctly added as per the change summary. However, ensure that the logging module is used consistently throughout the file instead of print statements for logging purposes.
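For instance, the three print calls added to handle_response_model below could go through the module-level logger instead; a minimal sketch (the debug level is an assumption, not part of this diff):

```python
# Sketch: route the mode announcements through the module logger
# instead of print; the choice of debug level is an assumption.
logger.debug("Patching function call")
logger.debug("Patching tool call")
logger.debug("Patching json mode")
```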



OVERRIDE_DOCS = """
Creates a new chat completion for the provided messages and parameters.
@@ -29,13 +34,55 @@
"""


-def handle_response_model(response_model: Type[BaseModel], kwargs):
+def handle_response_model(
+    *, response_model: Type[BaseModel], kwargs, mode: PatchMode = PatchMode.FUNCTION_CALL
+):
    new_kwargs = kwargs.copy()
    if response_model is not None:
        if not issubclass(response_model, OpenAISchema):
            response_model = openai_schema(response_model)  # type: ignore
-        new_kwargs["functions"] = [response_model.openai_schema]  # type: ignore
-        new_kwargs["function_call"] = {"name": response_model.openai_schema["name"]}  # type: ignore

+        match mode:
+            case PatchMode.FUNCTION_CALL:
+                print("Patching function call")
+                new_kwargs["functions"] = [response_model.openai_schema]  # type: ignore
+                new_kwargs["function_call"] = {
+                    "name": response_model.openai_schema["name"]
+                }  # type: ignore
+            case PatchMode.TOOL_CALL:
+                print("Patching tool call")
+                new_kwargs["tools"] = [
+                    {
+                        "type": "function",
+                        "function": response_model.openai_schema,
+                    }
+                ]
+                new_kwargs["tool_choice"] = {
+                    "type": "function",
+                    "function": {"name": response_model.openai_schema["name"]},
+                }
+            case PatchMode.JSON_MODE:
+                print("Patching json mode")
+                new_kwargs["response_format"] = {"type": "json_object"}
+
+                # If the first message is not a system message, prepend a system
+                # message carrying the schema; otherwise append the schema to the
+                # existing system message.
+                message = f"Make sure that your response to any message matches the json_schema below, do not deviate at all: \n{response_model.model_json_schema()['properties']}"
+
+                if new_kwargs["messages"][0]["role"] != "system":
+                    new_kwargs["messages"].insert(
+                        0,
+                        {
+                            "role": "system",
+                            "content": message,
+                        },
+                    )
+                else:
+                    new_kwargs["messages"][0]["content"] += f"\n\n{message}"
+            case _:
+                raise ValueError(f"Invalid patch mode: {mode}")

if new_kwargs.get("stream", False) and response_model is not None:
import warnings
jxnl marked this conversation as resolved.
Show resolved Hide resolved
@@ -48,7 +95,7 @@ def handle_response_model(response_model: Type[BaseModel], kwargs):


def process_response(
-    response, response_model, validation_context: dict = None, strict=None
+    response, *, response_model: Type[BaseModel], validation_context: dict = None, strict=None, mode: PatchMode = PatchMode.FUNCTION_CALL
):  # type: ignore
"""Processes a OpenAI response with the response model, if available
It can use `validation_context` and `strict` to validate the response
@@ -62,25 +109,13 @@
"""
if response_model is not None:
model = response_model.from_response(
response, validation_context=validation_context, strict=strict
response, validation_context=validation_context, strict=strict, mode=mode
)
model._raw_response = response
return model
return response


-def dump_message(message: ChatCompletionMessage) -> dict:
-    """Dumps a message to a dict, to be returned to the OpenAI API.
-
-    Workaround for an issue with the OpenAI API, where the `tool_calls` field isn't allowed to be present in requests
-    if it isn't used.
-    """
-    dumped_message = message.model_dump()
-    if not dumped_message.get("tool_calls"):
-        del dumped_message["tool_calls"]
-    return dumped_message


async def retry_async(
    func,
    response_model,
@@ -89,20 +124,18 @@ async def retry_async(
    kwargs,
    max_retries,
    strict: Optional[bool] = None,
+    mode: PatchMode = PatchMode.FUNCTION_CALL,
):
    retries = 0
    while retries <= max_retries:
        try:
            response: ChatCompletion = await func(*args, **kwargs)
-            return (
-                process_response(
-                    response,
-                    response_model,
-                    validation_context,
-                    strict=strict,
-                ),
-                None,
-            )
+            return process_response(
+                response,
+                response_model=response_model,
+                validation_context=validation_context,
+                strict=strict,
+                mode=mode)
        except (ValidationError, JSONDecodeError) as e:
            kwargs["messages"].append(response.choices[0].message)  # type: ignore
Contributor comment:

The retry_async function attempts to append a message to kwargs["messages"] after catching an exception. However, this assumes that kwargs will always contain a messages key with a list value, which may not be the case. This could raise a KeyError or TypeError if messages is not present or not a list. The code should check for the existence and type of messages before appending.
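A minimal sketch of such a guard, slotted into the except branch (the names and the choice to raise are illustrative, not part of this diff):

```python
# Validate kwargs["messages"] before appending retry feedback.
# Raising ValueError here is an assumption; the diff appends unconditionally.
messages = kwargs.get("messages")
if not isinstance(messages, list):
    raise ValueError("retry requires kwargs['messages'] to be a list")
messages.append(response.choices[0].message)
```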

kwargs["messages"].append(
Expand All @@ -124,20 +157,18 @@ def retry_sync(
kwargs,
max_retries,
strict: Optional[bool] = None,
mode: PatchMode = PatchMode.FUNCTION_CALL,
):
    retries = 0
    while retries <= max_retries:
        # Catches ValidationError and JSONDecodeError
        try:
            response = func(*args, **kwargs)
-            return (
-                process_response(
-                    response, response_model, validation_context, strict=strict
-                ),
-                None,
-            )
+            return process_response(
+                response, response_model=response_model, validation_context=validation_context, strict=strict, mode=mode
+            )
        except (ValidationError, JSONDecodeError) as e:
-            kwargs["messages"].append(dump_message(response.choices[0].message))
+            kwargs["messages"].append(response.choices[0].message)
kwargs["messages"].append(
{
"role": "user",
Contributor comment (on lines +188 to 191):

The same issue as in retry_async applies to retry_sync. There should be a check for the existence and type of kwargs["messages"] before appending to it.

@@ -156,7 +187,7 @@ def is_async(func: Callable) -> bool:
    )


-def wrap_chatcompletion(func: Callable) -> Callable:
+def wrap_chatcompletion(func: Callable, mode: PatchMode = PatchMode.FUNCTION_CALL) -> Callable:
    func_is_async = is_async(func)

    @wraps(func)
@@ -167,17 +198,16 @@ async def new_chatcompletion_async(
        *args,
        **kwargs,
    ):
-        response_model, new_kwargs = handle_response_model(response_model, kwargs)  # type: ignore
-        response, error = await retry_async(
+        response_model, new_kwargs = handle_response_model(response_model=response_model, kwargs=kwargs, mode=mode)  # type: ignore
+        response = await retry_async(
            func=func,
            response_model=response_model,
            validation_context=validation_context,
            max_retries=max_retries,
            args=args,
            kwargs=new_kwargs,
+            mode=mode,
        )  # type: ignore
-        if error:
-            raise ValueError(error)
        return response

    @wraps(func)
@@ -188,17 +218,16 @@ def new_chatcompletion_sync(
        *args,
        **kwargs,
    ):
-        response_model, new_kwargs = handle_response_model(response_model, kwargs)  # type: ignore
-        response, error = retry_sync(
+        response_model, new_kwargs = handle_response_model(response_model=response_model, kwargs=kwargs, mode=mode)  # type: ignore
+        response = retry_sync(
            func=func,
            response_model=response_model,
            validation_context=validation_context,
            max_retries=max_retries,
            args=args,
            kwargs=new_kwargs,
+            mode=mode,
        )  # type: ignore
-        if error:
-            raise ValueError(error)
        return response

    wrapper_function = (
@@ -208,7 +237,7 @@ def new_chatcompletion_sync(
    return wrapper_function
Contributor comment:

The wrap_chatcompletion function is missing a docstring. It's important to maintain consistency and provide documentation for all public functions, especially when they are part of a significant update to the codebase.
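A possible docstring, sketched here for illustration (the wording is an assumption, not part of this diff):

```python
def wrap_chatcompletion(func: Callable, mode: PatchMode = PatchMode.FUNCTION_CALL) -> Callable:
    """Wrap `chat.completions.create` so it accepts `response_model`,
    `validation_context`, and `max_retries`, and parses the completion
    into the given pydantic model using the selected `PatchMode`.
    """
```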



-def patch(client: Union[OpenAI, AsyncOpenAI]):
+def patch(client: Union[OpenAI, AsyncOpenAI], mode: PatchMode = PatchMode.FUNCTION_CALL):
"""
Patch the `client.chat.completions.create` method

Expand All @@ -220,11 +249,11 @@ def patch(client: Union[OpenAI, AsyncOpenAI]):
    - `strict` parameter to use strict json parsing
    """

-    client.chat.completions.create = wrap_chatcompletion(client.chat.completions.create)
+    client.chat.completions.create = wrap_chatcompletion(client.chat.completions.create, mode=mode)
    return client


-def apatch(client: AsyncOpenAI):
+def apatch(client: AsyncOpenAI, mode: PatchMode = PatchMode.FUNCTION_CALL):
"""
No longer necessary, use `patch` instead.

Expand All @@ -237,4 +266,4 @@ def apatch(client: AsyncOpenAI):
    - `validation_context` parameter to validate the response using the pydantic model
    - `strict` parameter to use strict json parsing
    """
-    return patch(client)
+    return patch(client, mode=mode)
60 changes: 60 additions & 0 deletions tests/openai/test_modes.py
@@ -0,0 +1,60 @@
from instructor.function_calls import OpenAISchema, PatchMode
from openai import OpenAI


client = OpenAI()


class UserExtract(OpenAISchema):
    name: str
    age: int


def test_tool_call():
    response = client.chat.completions.create(
        model="gpt-3.5-turbo-1106",
        messages=[
            {
                "role": "user",
                "content": "Extract jason is 25 years old, mary is 30 years old",
            },
        ],
        tools=[
            {
                "type": "function",
                "function": UserExtract.openai_schema,
            }
        ],
        tool_choice={
            "type": "function",
            "function": {"name": UserExtract.openai_schema["name"]},
        },
    )
    response_message = response.choices[0].message
    tool_calls = response_message.tool_calls
    assert len(tool_calls) == 1
    assert tool_calls[0].function.name == "UserExtract"
    assert tool_calls[0].function
    user = UserExtract.from_response(response, mode=PatchMode.TOOL_CALL)
    assert user.name.lower() == "jason"
    assert user.age == 25


def test_json_mode():
    response = client.chat.completions.create(
        model="gpt-3.5-turbo-1106",
        response_format={"type": "json_object"},
        messages=[
            {
                "role": "system",
                "content": f"Make sure that your response to any message matches the json_schema below, do not deviate at all: \n{UserExtract.model_json_schema()['properties']}",
            },
            {
                "role": "user",
                "content": "Extract jason is 25 years old",
            },
        ],
    )
    print(response.choices[0].message.content)
    user = UserExtract.from_response(response, mode=PatchMode.JSON_MODE)
    assert user.name.lower() == "jason"
    assert user.age == 25
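For symmetry, a FUNCTION_CALL-mode test could look like the sketch below (hypothetical, not part of this diff; it exercises the legacy functions/function_call request parameters that this mode preserves):

```python
def test_function_call():
    # Hypothetical companion test; mirrors test_tool_call using the
    # legacy functions/function_call request parameters.
    response = client.chat.completions.create(
        model="gpt-3.5-turbo-1106",
        functions=[UserExtract.openai_schema],
        function_call={"name": UserExtract.openai_schema["name"]},
        messages=[
            {"role": "user", "content": "Extract jason is 25 years old"},
        ],
    )
    user = UserExtract.from_response(response, mode=PatchMode.FUNCTION_CALL)
    assert user.name.lower() == "jason"
    assert user.age == 25
```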