mirror of
https://github.com/kennethreitz/instructor.git
synced 2026-06-05 22:50:18 +00:00
1ec9114d61
Co-authored-by: Jason Liu <jxnl@users.noreply.github.com>
216 lines
7.4 KiB
Python
216 lines
7.4 KiB
Python
import inspect
|
|
|
|
from functools import wraps
|
|
from json import JSONDecodeError
|
|
from pydantic import ValidationError, BaseModel
|
|
from typing import Callable, Type, Optional
|
|
from .function_calls import OpenAISchema, openai_schema
|
|
|
|
OVERRIDE_DOCS = """
|
|
Creates a new chat completion for the provided messages and parameters.
|
|
|
|
See: https://platform.openai.com/docs/api-reference/chat-completions/create
|
|
|
|
Additional Notes:
|
|
|
|
Using the `response_model` parameter, you can specify a response model to use for parsing the response from OpenAI's API. If its present, the response will be parsed using the response model, otherwise it will be returned as is.
|
|
|
|
If `stream=True` is specified, the response will be parsed using the `from_stream_response` method of the response model, if available, otherwise it will be parsed using the `from_response` method.
|
|
|
|
If need to obtain the raw response from OpenAI's API, you can access it using the `_raw_response` attribute of the response model.
|
|
|
|
Parameters:
|
|
response_model (Union[Type[BaseModel], Type[OpenAISchema]]): The response model to use for parsing the response from OpenAI's API, if available (default: None)
|
|
max_retries (int): The maximum number of retries to attempt if the response is not valid (default: 0)
|
|
validation_context (dict): The validation context to use for validating the response (default: None)
|
|
"""
|
|
|
|
|
|
def handle_response_model(response_model: Type[BaseModel], kwargs):
|
|
new_kwargs = kwargs.copy()
|
|
if response_model is not None:
|
|
if not issubclass(response_model, OpenAISchema):
|
|
response_model = openai_schema(response_model) # type: ignore
|
|
new_kwargs["functions"] = [response_model.openai_schema] # type: ignore
|
|
new_kwargs["function_call"] = {"name": response_model.openai_schema["name"]} # type: ignore
|
|
|
|
if new_kwargs.get("stream", False) and response_model is not None:
|
|
import warnings
|
|
|
|
warnings.warn(
|
|
"stream=True is not supported when using response_model parameter"
|
|
)
|
|
|
|
return response_model, new_kwargs
|
|
|
|
|
|
def process_response(
|
|
response, response_model, validation_context: dict = None, strict=None
|
|
): # type: ignore
|
|
"""Processes a OpenAI response with the response model, if available
|
|
It can use `validation_context` and `strict` to validate the response
|
|
via the pydantic model
|
|
|
|
Args:
|
|
response (ChatCompletion): The response from OpenAI's API
|
|
response_model (BaseModel): The response model to use for parsing the response
|
|
validation_context (dict, optional): The validation context to use for validating the response. Defaults to None.
|
|
strict (bool, optional): Whether to use strict json parsing. Defaults to None.
|
|
"""
|
|
if response_model is not None:
|
|
model = response_model.from_response(
|
|
response, validation_context=validation_context, strict=strict
|
|
)
|
|
model._raw_response = response
|
|
return model
|
|
return response
|
|
|
|
|
|
async def retry_async(
|
|
func,
|
|
response_model,
|
|
validation_context,
|
|
args,
|
|
kwargs,
|
|
max_retries,
|
|
strict: Optional[bool] = None,
|
|
):
|
|
retries = 0
|
|
while retries <= max_retries:
|
|
try:
|
|
response = await func(*args, **kwargs)
|
|
return (
|
|
process_response(
|
|
response,
|
|
response_model,
|
|
validation_context,
|
|
strict=strict,
|
|
),
|
|
None,
|
|
)
|
|
except (ValidationError, JSONDecodeError) as e:
|
|
kwargs["messages"].append(dict(**response.choices[0].message)) # type: ignore
|
|
kwargs["messages"].append(
|
|
{
|
|
"role": "user",
|
|
"content": f"Recall the function correctly, exceptions found\n{e}",
|
|
}
|
|
)
|
|
retries += 1
|
|
if retries > max_retries:
|
|
raise e
|
|
|
|
|
|
def retry_sync(
|
|
func,
|
|
response_model,
|
|
validation_context,
|
|
args,
|
|
kwargs,
|
|
max_retries,
|
|
strict: Optional[bool] = None,
|
|
):
|
|
retries = 0
|
|
while retries <= max_retries:
|
|
# Excepts ValidationError, and JSONDecodeError
|
|
try:
|
|
response = func(*args, **kwargs)
|
|
return (
|
|
process_response(
|
|
response, response_model, validation_context, strict=strict
|
|
),
|
|
None,
|
|
)
|
|
except (ValidationError, JSONDecodeError) as e:
|
|
kwargs["messages"].append(response.choices[0].message) # type: ignore
|
|
kwargs["messages"].append(
|
|
{
|
|
"role": "user",
|
|
"content": f"Recall the function correctly, exceptions found\n{e}",
|
|
}
|
|
)
|
|
retries += 1
|
|
if retries > max_retries:
|
|
raise e
|
|
|
|
|
|
def wrap_chatcompletion(func: Callable, is_async: bool = None) -> Callable:
|
|
@wraps(func)
|
|
async def new_chatcompletion_async(
|
|
response_model=None,
|
|
validation_context=None,
|
|
max_retries=1,
|
|
*args,
|
|
**kwargs,
|
|
):
|
|
response_model, new_kwargs = handle_response_model(response_model, kwargs) # type: ignore
|
|
response, error = await retry_async(
|
|
func=func,
|
|
response_model=response_model,
|
|
validation_context=validation_context,
|
|
max_retries=max_retries,
|
|
args=args,
|
|
kwargs=new_kwargs,
|
|
) # type: ignore
|
|
if error:
|
|
raise ValueError(error)
|
|
return response
|
|
|
|
@wraps(func)
|
|
def new_chatcompletion_sync(
|
|
response_model=None,
|
|
validation_context=None,
|
|
max_retries=1,
|
|
*args,
|
|
**kwargs,
|
|
):
|
|
response_model, new_kwargs = handle_response_model(response_model, kwargs) # type: ignore
|
|
response, error = retry_sync(
|
|
func=func,
|
|
response_model=response_model,
|
|
validation_context=validation_context,
|
|
max_retries=max_retries,
|
|
args=args,
|
|
kwargs=new_kwargs,
|
|
) # type: ignore
|
|
if error:
|
|
raise ValueError(error)
|
|
return response
|
|
|
|
wrapper_function = new_chatcompletion_async if is_async else new_chatcompletion_sync
|
|
wrapper_function.__doc__ = OVERRIDE_DOCS
|
|
return wrapper_function
|
|
|
|
|
|
def patch(client):
|
|
"""
|
|
Patch the `client.chat.completions.create` method
|
|
|
|
Enables the following features:
|
|
|
|
- `response_model` parameter to parse the response from OpenAI's API
|
|
- `max_retries` parameter to retry the function if the response is not valid
|
|
- `validation_context` parameter to validate the response using the pydantic model
|
|
- `strict` parameter to use strict json parsing
|
|
"""
|
|
|
|
client.chat.completions.create = wrap_chatcompletion(client.chat.completions.create)
|
|
return client
|
|
|
|
|
|
def apatch(client):
|
|
"""
|
|
Patch the `client.chat.completions.acreate` and `client.chat.completions.acreate` methods
|
|
|
|
Enables the following features:
|
|
|
|
- `response_model` parameter to parse the response from OpenAI's API
|
|
- `max_retries` parameter to retry the function if the response is not valid
|
|
- `validation_context` parameter to validate the response using the pydantic model
|
|
- `strict` parameter to use strict json parsing
|
|
"""
|
|
client.chat.completions.create = wrap_chatcompletion(
|
|
client.chat.completions.create, is_async=True
|
|
)
|
|
return client
|