from langsmith import wrappers, Client
from openai import AsyncOpenAI
# 可选:包装 OpenAI 客户端以跟踪所有模型调用。
oai_client = wrappers.wrap_openai(AsyncOpenAI())
# 可选:添加 'traceable' 装饰器以跟踪此函数的输入/输出。
@traceable
async def researcher_app(inputs: dict) -> str:
instructions = """You are an excellent researcher. Given a high-level research idea, \
list 5 concrete questions that should be investigated to determine if the idea is worth pursuing."""
response = await oai_client.chat.completions.create(
model="gpt-5.4-mini",
messages=[
{"role": "system", "content": instructions},
{"role": "user", "content": inputs["idea"]},
],
)
return response.choices[0].message.content
# 评估器函数可以是同步或异步的
def concise(inputs: dict, outputs: dict) -> bool:
return len(outputs["output"]) < 3 * len(inputs["idea"])
ls_client = Client()
ideas = [
"universal basic income",
"nuclear fusion",
"hyperloop",
"nuclear powered rockets",
]
dataset = ls_client.create_dataset("research ideas")
ls_client.create_examples(
dataset_name=dataset.name,
examples=[{"inputs": {"idea": i}} for i in ideas],
)
# 也可以直接使用 'aevaluate' 函数:
# from langsmith import aevaluate
# await aevaluate(...)
results = await ls_client.aevaluate(
researcher_app,
data=dataset,
evaluators=[concise],
# 可选,添加并发。
max_concurrency=2, # 可选,添加并发。
experiment_prefix="gpt-5.4-mini-baseline" # 可选,默认随机。
)