import asyncio

from synth_ai.sdk.eval import EvalJob
async def main() -> None:
    """Create an evaluation job for the ``banking77`` app and report its mean reward.

    The job is created against the task app at ``http://localhost:8103`` with
    seeds 0 through 4 and an OpenAI ``gpt-4o`` policy. Once ``job.wait()``
    returns, the ``mean_reward`` field of the result summary is printed.

    The awaits live inside a coroutine because ``await`` at module top level
    is a ``SyntaxError`` in a regular Python file.
    """
    job = await EvalJob.create(
        task_app_url="http://localhost:8103",
        app_id="banking77",
        seeds=[0, 1, 2, 3, 4],
        policy={"model": "gpt-4o", "provider": "openai"},
    )
    # Poll until complete
    result = await job.wait()
    print(f"Mean reward: {result.summary.mean_reward}")


if __name__ == "__main__":
    # asyncio.run() starts an event loop, runs main() to completion, then closes the loop.
    asyncio.run(main())