mirror of
https://github.com/kennethreitz/instructor.git
synced 2026-06-05 22:50:18 +00:00
57 lines
1.7 KiB
Python
57 lines
1.7 KiB
Python
import openai
|
|
import instructor
|
|
from typing import Iterable
|
|
from pydantic import BaseModel, ConfigDict
|
|
|
|
client = instructor.patch(openai.OpenAI())
|
|
|
|
|
|
class SyntheticQA(BaseModel):
|
|
question: str
|
|
answer: str
|
|
|
|
model_config = ConfigDict(
|
|
json_schema_extra={
|
|
"examples": [
|
|
{"question": "What is the capital of France?", "answer": "Paris"},
|
|
{
|
|
"question": "What is the largest planet in our solar system?",
|
|
"answer": "Jupiter",
|
|
},
|
|
{
|
|
"question": "Who wrote 'To Kill a Mockingbird'?",
|
|
"answer": "Harper Lee",
|
|
},
|
|
{
|
|
"question": "What element does 'O' represent on the periodic table?",
|
|
"answer": "Oxygen",
|
|
},
|
|
]
|
|
}
|
|
)
|
|
|
|
|
|
def get_synthetic_data() -> Iterable[SyntheticQA]:
|
|
return client.chat.completions.create(
|
|
model="gpt-3.5-turbo",
|
|
messages=[
|
|
{"role": "system", "content": "Generate synthetic examples"},
|
|
{
|
|
"role": "user",
|
|
"content": "Generate the exact examples you see in the examples of this prompt. ",
|
|
},
|
|
],
|
|
response_model=Iterable[SyntheticQA],
|
|
) # type: ignore
|
|
|
|
|
|
if __name__ == "__main__":
|
|
for example in get_synthetic_data():
|
|
print(example)
|
|
"""
|
|
question='What is the capital of France?' answer='Paris'
|
|
question='What is the largest planet in our solar system?' answer='Jupiter'
|
|
question="Who wrote 'To Kill a Mockingbird'?" answer='Harper Lee'
|
|
question="What element does 'O' represent on the periodic table?" answer='Oxygen'
|
|
"""
|