|
72 | 72 | "\n", |
73 | 73 | "load_dotenv()\n", |
74 | 74 | "# Patch the existing notebook loop so we can await coroutines safely\n", |
75 | | - "nest_asyncio.apply()\n" |
| 75 | + "nest_asyncio.apply()" |
76 | 76 | ] |
77 | 77 | }, |
78 | 78 | { |
|
115 | 115 | " ]\n", |
116 | 116 | ")\n", |
117 | 117 | "\n", |
118 | | - "scientist_questions\n" |
| 118 | + "scientist_questions" |
119 | 119 | ] |
120 | 120 | }, |
121 | 121 | { |
|
156 | 156 | " ]\n", |
157 | 157 | ")\n", |
158 | 158 | "\n", |
159 | | - "weather_queries\n" |
| 159 | + "weather_queries" |
160 | 160 | ] |
161 | 161 | }, |
162 | 162 | { |
|
187 | 187 | "evaluator_llm = LangchainLLMWrapper(ChatOpenAI(model=\"gpt-4o-mini\"))\n", |
188 | 188 | "\n", |
189 | 189 | "qa_metrics = [FactualCorrectness(llm=evaluator_llm)]\n", |
190 | | - "tool_metrics = [ToolCallF1()] # rule-based, no LLM required\n" |
| 190 | + "tool_metrics = [ToolCallF1()] # rule-based, no LLM required" |
191 | 191 | ] |
192 | 192 | }, |
193 | 193 | { |
|
210 | 210 | "AG_UI_ENDPOINT = \"http://localhost:8000/agentic_chat\" # Update to match your agent\n", |
211 | 211 | "\n", |
212 | 212 | "RUN_FACTUAL_EVAL = False\n", |
213 | | - "RUN_TOOL_EVAL = False\n" |
| 213 | + "RUN_TOOL_EVAL = False" |
214 | 214 | ] |
215 | 215 | }, |
216 | 216 | { |
|
328 | 328 | " metadata=True,\n", |
329 | 329 | " )\n", |
330 | 330 | "\n", |
| 331 | + "\n", |
331 | 332 | "if RUN_FACTUAL_EVAL:\n", |
332 | 333 | " factual_result = await evaluate_factual()\n", |
333 | 334 | " factual_df = factual_result.to_pandas()\n", |
334 | | - " display(factual_df)\n" |
| 335 | + " display(factual_df)" |
335 | 336 | ] |
336 | 337 | }, |
337 | 338 | { |
|
426 | 427 | " evaluator_llm=evaluator_llm,\n", |
427 | 428 | " )\n", |
428 | 429 | "\n", |
| 430 | + "\n", |
429 | 431 | "if RUN_TOOL_EVAL:\n", |
430 | 432 | " tool_result = await evaluate_tool_usage()\n", |
431 | 433 | " tool_df = tool_result.to_pandas()\n", |
432 | | - " display(tool_df)\n" |
| 434 | + " display(tool_df)" |
433 | 435 | ] |
434 | 436 | }, |
435 | 437 | { |
|
480 | 482 | "\n", |
481 | 483 | "messages_from_snapshot = convert_messages_snapshot(snapshot)\n", |
482 | 484 | "\n", |
483 | | - "messages_from_stream, messages_from_snapshot\n" |
| 485 | + "messages_from_stream, messages_from_snapshot" |
484 | 486 | ] |
485 | 487 | }, |
486 | 488 | { |
|
0 commit comments