Skip to content

Commit 8b7d00d

Browse files
committed
perplexity samples + results
1 parent 9372c1f commit 8b7d00d

File tree

5 files changed

+647
-4
lines changed

5 files changed

+647
-4
lines changed
Lines changed: 50 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,50 @@
1+
{"question_id": "arena_hard_0", "grade": "base"}
2+
{"question_id": "arena_hard_1", "grade": "base"}
3+
{"question_id": "arena_hard_3", "grade": "base"}
4+
{"question_id": "arena_hard_2", "grade": "base"}
5+
{"question_id": "arena_hard_4", "grade": "base"}
6+
{"question_id": "arena_hard_5", "grade": "base"}
7+
{"question_id": "arena_hard_6", "grade": "base"}
8+
{"question_id": "arena_hard_7", "grade": "base"}
9+
{"question_id": "arena_hard_9", "grade": "base"}
10+
{"question_id": "arena_hard_8", "grade": "base"}
11+
{"question_id": "arena_hard_10", "grade": "base"}
12+
{"question_id": "arena_hard_11", "grade": "base"}
13+
{"question_id": "arena_hard_12", "grade": "base"}
14+
{"question_id": "arena_hard_13", "grade": "base"}
15+
{"question_id": "arena_hard_14", "grade": "base"}
16+
{"question_id": "arena_hard_15", "grade": "base"}
17+
{"question_id": "arena_hard_16", "grade": "base"}
18+
{"question_id": "arena_hard_17", "grade": "base"}
19+
{"question_id": "arena_hard_18", "grade": "base"}
20+
{"question_id": "arena_hard_20", "grade": "base"}
21+
{"question_id": "arena_hard_19", "grade": "base"}
22+
{"question_id": "arena_hard_22", "grade": "base"}
23+
{"question_id": "arena_hard_21", "grade": "base"}
24+
{"question_id": "arena_hard_23", "grade": "base"}
25+
{"question_id": "arena_hard_24", "grade": "base"}
26+
{"question_id": "arena_hard_25", "grade": "base"}
27+
{"question_id": "arena_hard_26", "grade": "base"}
28+
{"question_id": "arena_hard_27", "grade": "base"}
29+
{"question_id": "arena_hard_28", "grade": "base"}
30+
{"question_id": "arena_hard_29", "grade": "base"}
31+
{"question_id": "arena_hard_31", "grade": "base"}
32+
{"question_id": "arena_hard_30", "grade": "base"}
33+
{"question_id": "arena_hard_33", "grade": "base"}
34+
{"question_id": "arena_hard_32", "grade": "base"}
35+
{"question_id": "arena_hard_35", "grade": "base"}
36+
{"question_id": "arena_hard_34", "grade": "base"}
37+
{"question_id": "arena_hard_37", "grade": "base"}
38+
{"question_id": "arena_hard_36", "grade": "base"}
39+
{"question_id": "arena_hard_39", "grade": "base"}
40+
{"question_id": "arena_hard_38", "grade": "base"}
41+
{"question_id": "arena_hard_40", "grade": "base"}
42+
{"question_id": "arena_hard_41", "grade": "base"}
43+
{"question_id": "arena_hard_42", "grade": "base"}
44+
{"question_id": "arena_hard_43", "grade": "base"}
45+
{"question_id": "arena_hard_44", "grade": "base"}
46+
{"question_id": "arena_hard_45", "grade": "base"}
47+
{"question_id": "arena_hard_46", "grade": "base"}
48+
{"question_id": "arena_hard_47", "grade": "base"}
49+
{"question_id": "arena_hard_48", "grade": "base"}
50+
{"question_id": "arena_hard_49", "grade": "base"}
Lines changed: 250 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,250 @@
1+
{"question_id": "simple_qa_1", "grade": "B"}
2+
{"question_id": "simple_qa_2", "grade": "C"}
3+
{"question_id": "simple_qa_0", "grade": "C"}
4+
{"question_id": "simple_qa_3", "grade": "C"}
5+
{"question_id": "simple_qa_5", "grade": "C"}
6+
{"question_id": "simple_qa_4", "grade": "C"}
7+
{"question_id": "simple_qa_6", "grade": "B"}
8+
{"question_id": "simple_qa_7", "grade": "A"}
9+
{"question_id": "simple_qa_8", "grade": "C"}
10+
{"question_id": "simple_qa_9", "grade": "C"}
11+
{"question_id": "simple_qa_10", "grade": "C"}
12+
{"question_id": "simple_qa_11", "grade": "B"}
13+
{"question_id": "simple_qa_12", "grade": "C"}
14+
{"question_id": "simple_qa_13", "grade": "A"}
15+
{"question_id": "simple_qa_14", "grade": "C"}
16+
{"question_id": "simple_qa_15", "grade": "C"}
17+
{"question_id": "simple_qa_16", "grade": "A"}
18+
{"question_id": "simple_qa_18", "grade": "B"}
19+
{"question_id": "simple_qa_17", "grade": "A"}
20+
{"question_id": "simple_qa_19", "grade": "C"}
21+
{"question_id": "simple_qa_20", "grade": "C"}
22+
{"question_id": "simple_qa_22", "grade": "B"}
23+
{"question_id": "simple_qa_23", "grade": "C"}
24+
{"question_id": "simple_qa_21", "grade": "B"}
25+
{"question_id": "simple_qa_24", "grade": "C"}
26+
{"question_id": "simple_qa_25", "grade": "C"}
27+
{"question_id": "simple_qa_27", "grade": "C"}
28+
{"question_id": "simple_qa_26", "grade": "A"}
29+
{"question_id": "simple_qa_28", "grade": "A"}
30+
{"question_id": "simple_qa_29", "grade": "C"}
31+
{"question_id": "simple_qa_30", "grade": "B"}
32+
{"question_id": "simple_qa_32", "grade": "A"}
33+
{"question_id": "simple_qa_31", "grade": "C"}
34+
{"question_id": "simple_qa_33", "grade": "C"}
35+
{"question_id": "simple_qa_36", "grade": "B"}
36+
{"question_id": "simple_qa_34", "grade": "C"}
37+
{"question_id": "simple_qa_37", "grade": "B"}
38+
{"question_id": "simple_qa_35", "grade": "C"}
39+
{"question_id": "simple_qa_38", "grade": "B"}
40+
{"question_id": "simple_qa_40", "grade": "C"}
41+
{"question_id": "simple_qa_39", "grade": "C"}
42+
{"question_id": "simple_qa_41", "grade": "C"}
43+
{"question_id": "simple_qa_42", "grade": "C"}
44+
{"question_id": "simple_qa_43", "grade": "B"}
45+
{"question_id": "simple_qa_44", "grade": "B"}
46+
{"question_id": "simple_qa_45", "grade": "C"}
47+
{"question_id": "simple_qa_47", "grade": "C"}
48+
{"question_id": "simple_qa_46", "grade": "B"}
49+
{"question_id": "simple_qa_49", "grade": "A"}
50+
{"question_id": "simple_qa_48", "grade": "C"}
51+
{"question_id": "simple_qa_51", "grade": "A"}
52+
{"question_id": "simple_qa_50", "grade": "C"}
53+
{"question_id": "simple_qa_53", "grade": "C"}
54+
{"question_id": "simple_qa_52", "grade": "A"}
55+
{"question_id": "simple_qa_54", "grade": "A"}
56+
{"question_id": "simple_qa_56", "grade": "A"}
57+
{"question_id": "simple_qa_57", "grade": "C"}
58+
{"question_id": "simple_qa_55", "grade": "B"}
59+
{"question_id": "simple_qa_58", "grade": "B"}
60+
{"question_id": "simple_qa_59", "grade": "C"}
61+
{"question_id": "simple_qa_60", "grade": "C"}
62+
{"question_id": "simple_qa_62", "grade": "C"}
63+
{"question_id": "simple_qa_61", "grade": "C"}
64+
{"question_id": "simple_qa_63", "grade": "C"}
65+
{"question_id": "simple_qa_64", "grade": "C"}
66+
{"question_id": "simple_qa_65", "grade": "C"}
67+
{"question_id": "simple_qa_67", "grade": "C"}
68+
{"question_id": "simple_qa_66", "grade": "C"}
69+
{"question_id": "simple_qa_68", "grade": "C"}
70+
{"question_id": "simple_qa_70", "grade": "B"}
71+
{"question_id": "simple_qa_71", "grade": "C"}
72+
{"question_id": "simple_qa_69", "grade": "A"}
73+
{"question_id": "simple_qa_72", "grade": "C"}
74+
{"question_id": "simple_qa_75", "grade": "C"}
75+
{"question_id": "simple_qa_73", "grade": "B"}
76+
{"question_id": "simple_qa_74", "grade": "C"}
77+
{"question_id": "simple_qa_77", "grade": "C"}
78+
{"question_id": "simple_qa_76", "grade": "B"}
79+
{"question_id": "simple_qa_78", "grade": "C"}
80+
{"question_id": "simple_qa_79", "grade": "C"}
81+
{"question_id": "simple_qa_81", "grade": "A"}
82+
{"question_id": "simple_qa_82", "grade": "C"}
83+
{"question_id": "simple_qa_83", "grade": "C"}
84+
{"question_id": "simple_qa_84", "grade": "A"}
85+
{"question_id": "simple_qa_85", "grade": "A"}
86+
{"question_id": "simple_qa_86", "grade": "A"}
87+
{"question_id": "simple_qa_87", "grade": "C"}
88+
{"question_id": "simple_qa_88", "grade": "C"}
89+
{"question_id": "simple_qa_89", "grade": "C"}
90+
{"question_id": "simple_qa_90", "grade": "C"}
91+
{"question_id": "simple_qa_91", "grade": "A"}
92+
{"question_id": "simple_qa_92", "grade": "C"}
93+
{"question_id": "simple_qa_93", "grade": "A"}
94+
{"question_id": "simple_qa_94", "grade": "A"}
95+
{"question_id": "simple_qa_96", "grade": "C"}
96+
{"question_id": "simple_qa_95", "grade": "C"}
97+
{"question_id": "simple_qa_97", "grade": "A"}
98+
{"question_id": "simple_qa_80", "grade": "C"}
99+
{"question_id": "simple_qa_98", "grade": "C"}
100+
{"question_id": "simple_qa_100", "grade": "C"}
101+
{"question_id": "simple_qa_99", "grade": "B"}
102+
{"question_id": "simple_qa_101", "grade": "C"}
103+
{"question_id": "simple_qa_102", "grade": "C"}
104+
{"question_id": "simple_qa_103", "grade": "B"}
105+
{"question_id": "simple_qa_104", "grade": "C"}
106+
{"question_id": "simple_qa_105", "grade": "B"}
107+
{"question_id": "simple_qa_107", "grade": "C"}
108+
{"question_id": "simple_qa_106", "grade": "C"}
109+
{"question_id": "simple_qa_108", "grade": "C"}
110+
{"question_id": "simple_qa_109", "grade": "B"}
111+
{"question_id": "simple_qa_110", "grade": "B"}
112+
{"question_id": "simple_qa_111", "grade": "C"}
113+
{"question_id": "simple_qa_112", "grade": "B"}
114+
{"question_id": "simple_qa_113", "grade": "C"}
115+
{"question_id": "simple_qa_114", "grade": "B"}
116+
{"question_id": "simple_qa_115", "grade": "C"}
117+
{"question_id": "simple_qa_116", "grade": "B"}
118+
{"question_id": "simple_qa_117", "grade": "A"}
119+
{"question_id": "simple_qa_119", "grade": "B"}
120+
{"question_id": "simple_qa_118", "grade": "C"}
121+
{"question_id": "simple_qa_120", "grade": "C"}
122+
{"question_id": "simple_qa_121", "grade": "B"}
123+
{"question_id": "simple_qa_122", "grade": "C"}
124+
{"question_id": "simple_qa_123", "grade": "C"}
125+
{"question_id": "simple_qa_124", "grade": "C"}
126+
{"question_id": "simple_qa_126", "grade": "C"}
127+
{"question_id": "simple_qa_127", "grade": "C"}
128+
{"question_id": "simple_qa_125", "grade": "B"}
129+
{"question_id": "simple_qa_128", "grade": "C"}
130+
{"question_id": "simple_qa_131", "grade": "C"}
131+
{"question_id": "simple_qa_130", "grade": "A"}
132+
{"question_id": "simple_qa_129", "grade": "A"}
133+
{"question_id": "simple_qa_132", "grade": "C"}
134+
{"question_id": "simple_qa_134", "grade": "A"}
135+
{"question_id": "simple_qa_135", "grade": "A"}
136+
{"question_id": "simple_qa_133", "grade": "B"}
137+
{"question_id": "simple_qa_138", "grade": "C"}
138+
{"question_id": "simple_qa_136", "grade": "C"}
139+
{"question_id": "simple_qa_139", "grade": "C"}
140+
{"question_id": "simple_qa_137", "grade": "C"}
141+
{"question_id": "simple_qa_142", "grade": "C"}
142+
{"question_id": "simple_qa_141", "grade": "C"}
143+
{"question_id": "simple_qa_140", "grade": "C"}
144+
{"question_id": "simple_qa_143", "grade": "C"}
145+
{"question_id": "simple_qa_144", "grade": "C"}
146+
{"question_id": "simple_qa_145", "grade": "C"}
147+
{"question_id": "simple_qa_146", "grade": "C"}
148+
{"question_id": "simple_qa_147", "grade": "B"}
149+
{"question_id": "simple_qa_148", "grade": "C"}
150+
{"question_id": "simple_qa_150", "grade": "C"}
151+
{"question_id": "simple_qa_149", "grade": "A"}
152+
{"question_id": "simple_qa_151", "grade": "B"}
153+
{"question_id": "simple_qa_152", "grade": "C"}
154+
{"question_id": "simple_qa_153", "grade": "C"}
155+
{"question_id": "simple_qa_154", "grade": "C"}
156+
{"question_id": "simple_qa_155", "grade": "C"}
157+
{"question_id": "simple_qa_156", "grade": "B"}
158+
{"question_id": "simple_qa_157", "grade": "A"}
159+
{"question_id": "simple_qa_158", "grade": "B"}
160+
{"question_id": "simple_qa_159", "grade": "B"}
161+
{"question_id": "simple_qa_160", "grade": "C"}
162+
{"question_id": "simple_qa_162", "grade": "C"}
163+
{"question_id": "simple_qa_163", "grade": "A"}
164+
{"question_id": "simple_qa_161", "grade": "B"}
165+
{"question_id": "simple_qa_165", "grade": "C"}
166+
{"question_id": "simple_qa_164", "grade": "C"}
167+
{"question_id": "simple_qa_166", "grade": "C"}
168+
{"question_id": "simple_qa_168", "grade": "A"}
169+
{"question_id": "simple_qa_169", "grade": "C"}
170+
{"question_id": "simple_qa_167", "grade": "C"}
171+
{"question_id": "simple_qa_170", "grade": "C"}
172+
{"question_id": "simple_qa_172", "grade": "B"}
173+
{"question_id": "simple_qa_173", "grade": "B"}
174+
{"question_id": "simple_qa_171", "grade": "C"}
175+
{"question_id": "simple_qa_175", "grade": "C"}
176+
{"question_id": "simple_qa_174", "grade": "C"}
177+
{"question_id": "simple_qa_177", "grade": "C"}
178+
{"question_id": "simple_qa_176", "grade": "C"}
179+
{"question_id": "simple_qa_179", "grade": "C"}
180+
{"question_id": "simple_qa_178", "grade": "A"}
181+
{"question_id": "simple_qa_181", "grade": "B"}
182+
{"question_id": "simple_qa_180", "grade": "C"}
183+
{"question_id": "simple_qa_182", "grade": "C"}
184+
{"question_id": "simple_qa_183", "grade": "C"}
185+
{"question_id": "simple_qa_184", "grade": "C"}
186+
{"question_id": "simple_qa_187", "grade": "C"}
187+
{"question_id": "simple_qa_185", "grade": "A"}
188+
{"question_id": "simple_qa_186", "grade": "C"}
189+
{"question_id": "simple_qa_189", "grade": "C"}
190+
{"question_id": "simple_qa_188", "grade": "C"}
191+
{"question_id": "simple_qa_190", "grade": "C"}
192+
{"question_id": "simple_qa_191", "grade": "C"}
193+
{"question_id": "simple_qa_192", "grade": "B"}
194+
{"question_id": "simple_qa_193", "grade": "B"}
195+
{"question_id": "simple_qa_194", "grade": "C"}
196+
{"question_id": "simple_qa_195", "grade": "C"}
197+
{"question_id": "simple_qa_197", "grade": "B"}
198+
{"question_id": "simple_qa_196", "grade": "B"}
199+
{"question_id": "simple_qa_198", "grade": "A"}
200+
{"question_id": "simple_qa_199", "grade": "C"}
201+
{"question_id": "simple_qa_200", "grade": "C"}
202+
{"question_id": "simple_qa_201", "grade": "B"}
203+
{"question_id": "simple_qa_202", "grade": "C"}
204+
{"question_id": "simple_qa_204", "grade": "C"}
205+
{"question_id": "simple_qa_205", "grade": "B"}
206+
{"question_id": "simple_qa_203", "grade": "C"}
207+
{"question_id": "simple_qa_206", "grade": "A"}
208+
{"question_id": "simple_qa_207", "grade": "B"}
209+
{"question_id": "simple_qa_208", "grade": "C"}
210+
{"question_id": "simple_qa_209", "grade": "B"}
211+
{"question_id": "simple_qa_211", "grade": "A"}
212+
{"question_id": "simple_qa_210", "grade": "B"}
213+
{"question_id": "simple_qa_212", "grade": "A"}
214+
{"question_id": "simple_qa_213", "grade": "A"}
215+
{"question_id": "simple_qa_215", "grade": "C"}
216+
{"question_id": "simple_qa_217", "grade": "A"}
217+
{"question_id": "simple_qa_218", "grade": "C"}
218+
{"question_id": "simple_qa_216", "grade": "C"}
219+
{"question_id": "simple_qa_219", "grade": "C"}
220+
{"question_id": "simple_qa_214", "grade": "B"}
221+
{"question_id": "simple_qa_220", "grade": "C"}
222+
{"question_id": "simple_qa_221", "grade": "C"}
223+
{"question_id": "simple_qa_222", "grade": "B"}
224+
{"question_id": "simple_qa_223", "grade": "A"}
225+
{"question_id": "simple_qa_226", "grade": "C"}
226+
{"question_id": "simple_qa_225", "grade": "C"}
227+
{"question_id": "simple_qa_224", "grade": "B"}
228+
{"question_id": "simple_qa_227", "grade": "B"}
229+
{"question_id": "simple_qa_228", "grade": "B"}
230+
{"question_id": "simple_qa_230", "grade": "B"}
231+
{"question_id": "simple_qa_231", "grade": "C"}
232+
{"question_id": "simple_qa_229", "grade": "C"}
233+
{"question_id": "simple_qa_233", "grade": "C"}
234+
{"question_id": "simple_qa_232", "grade": "A"}
235+
{"question_id": "simple_qa_234", "grade": "B"}
236+
{"question_id": "simple_qa_235", "grade": "C"}
237+
{"question_id": "simple_qa_236", "grade": "A"}
238+
{"question_id": "simple_qa_237", "grade": "C"}
239+
{"question_id": "simple_qa_238", "grade": "B"}
240+
{"question_id": "simple_qa_239", "grade": "C"}
241+
{"question_id": "simple_qa_240", "grade": "B"}
242+
{"question_id": "simple_qa_241", "grade": "B"}
243+
{"question_id": "simple_qa_242", "grade": "C"}
244+
{"question_id": "simple_qa_244", "grade": "C"}
245+
{"question_id": "simple_qa_243", "grade": "C"}
246+
{"question_id": "simple_qa_246", "grade": "B"}
247+
{"question_id": "simple_qa_247", "grade": "A"}
248+
{"question_id": "simple_qa_245", "grade": "A"}
249+
{"question_id": "simple_qa_248", "grade": "C"}
250+
{"question_id": "simple_qa_249", "grade": "C"}

0 commit comments

Comments
 (0)