@@ -37,8 +37,8 @@ def test_evaluate_call():
3737 dspy .settings .configure (
3838 lm = DummyLM (
3939 {
40- "What is 1+1?" : "[[ ## answer ## ]] \n 2" ,
41- "What is 2+2?" : "[[ ## answer ## ]] \n 4" ,
40+ "What is 1+1?" : { "answer" : "2" } ,
41+ "What is 2+2?" : { "answer" : "4" } ,
4242 }
4343 )
4444 )
@@ -55,9 +55,7 @@ def test_evaluate_call():
5555
5656
5757def test_multithread_evaluate_call ():
58- dspy .settings .configure (
59- lm = DummyLM ({"What is 1+1?" : "[[ ## answer ## ]]\n 2" , "What is 2+2?" : "[[ ## answer ## ]]\n 4" })
60- )
58+ dspy .settings .configure (lm = DummyLM ({"What is 1+1?" : {"answer" : "2" }, "What is 2+2?" : {"answer" : "4" }}))
6159 devset = [new_example ("What is 1+1?" , "2" ), new_example ("What is 2+2?" , "4" )]
6260 program = Predict ("question -> answer" )
6361 assert program (question = "What is 1+1?" ).answer == "2"
@@ -80,9 +78,7 @@ def __call__(self, *args, **kwargs):
8078 time .sleep (1 )
8179 return super ().__call__ (* args , ** kwargs )
8280
83- dspy .settings .configure (
84- lm = SlowLM ({"What is 1+1?" : "[[ ## answer ## ]]\n 2" , "What is 2+2?" : "[[ ## answer ## ]]\n 4" })
85- )
81+ dspy .settings .configure (lm = SlowLM ({"What is 1+1?" : {"answer" : "2" }, "What is 2+2?" : {"answer" : "4" }}))
8682
8783 devset = [new_example ("What is 1+1?" , "2" ), new_example ("What is 2+2?" , "4" )]
8884 program = Predict ("question -> answer" )
@@ -112,9 +108,7 @@ def sleep_then_interrupt():
112108
113109
114110def test_evaluate_call_bad ():
115- dspy .settings .configure (
116- lm = DummyLM ({"What is 1+1?" : "[[ ## answer ## ]]\n 0" , "What is 2+2?" : "[[ ## answer ## ]]\n 0" })
117- )
111+ dspy .settings .configure (lm = DummyLM ({"What is 1+1?" : {"answer" : "0" }, "What is 2+2?" : {"answer" : "0" }}))
118112 devset = [new_example ("What is 1+1?" , "2" ), new_example ("What is 2+2?" , "4" )]
119113 program = Predict ("question -> answer" )
120114 ev = Evaluate (
0 commit comments