Skip to content

Commit eaf6ef2

Browse files
authored
[Fix] fix sample num and peer evaluator in SciReasoner (#2378)
1 parent: c512d07 · commit: eaf6ef2

File tree

4 files changed

+47
-27
lines changed

4 files changed

+47
-27
lines changed

opencompass/configs/datasets/SciReasoner/peer_gen.py

Lines changed: 44 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -111,28 +111,48 @@
111111
dataset_postprocessor=dict(type=PEER_postprocess_default),
112112
)
113113

114-
115-
116-
117-
PEER_datasets.append(
118-
dict(
119-
abbr=f'SciReasoner-PEER_{task}',
120-
type=PEER_Dataset,
121-
path='opencompass/SciReasoner-PEER',
122-
task=task,
123-
reader_cfg=reader_cfg,
124-
infer_cfg=infer_cfg,
125-
eval_cfg=cascade_eval_llm_cfg),
126-
)
127-
mini_PEER_datasets.append(
128-
dict(
129-
abbr=f'SciReasoner-PEER_{task}-mini',
130-
type=PEER_Dataset,
131-
path='opencompass/SciReasoner-PEER',
132-
task=task,
133-
mini_set=True,
134-
reader_cfg=reader_cfg,
135-
infer_cfg=infer_cfg,
136-
eval_cfg=cascade_eval_llm_cfg),
137-
)
114+
if task != 'stability':
115+
PEER_datasets.append(
116+
dict(
117+
abbr=f'SciReasoner-PEER_{task}',
118+
type=PEER_Dataset,
119+
path='opencompass/SciReasoner-PEER',
120+
task=task,
121+
reader_cfg=reader_cfg,
122+
infer_cfg=infer_cfg,
123+
eval_cfg=cascade_eval_llm_cfg),
124+
)
125+
mini_PEER_datasets.append(
126+
dict(
127+
abbr=f'SciReasoner-PEER_{task}-mini',
128+
type=PEER_Dataset,
129+
path='opencompass/SciReasoner-PEER',
130+
task=task,
131+
mini_set=True,
132+
reader_cfg=reader_cfg,
133+
infer_cfg=infer_cfg,
134+
eval_cfg=cascade_eval_llm_cfg),
135+
)
136+
else:
137+
PEER_datasets.append(
138+
dict(
139+
abbr=f'SciReasoner-PEER_{task}',
140+
type=PEER_Dataset,
141+
path='opencompass/SciReasoner-PEER',
142+
task=task,
143+
reader_cfg=reader_cfg,
144+
infer_cfg=infer_cfg,
145+
eval_cfg=eval_stability_cfg),
146+
)
147+
mini_PEER_datasets.append(
148+
dict(
149+
abbr=f'SciReasoner-PEER_{task}-mini',
150+
type=PEER_Dataset,
151+
path='opencompass/SciReasoner-PEER',
152+
task=task,
153+
mini_set=True,
154+
reader_cfg=reader_cfg,
155+
infer_cfg=infer_cfg,
156+
eval_cfg=eval_stability_cfg),
157+
)
138158

opencompass/datasets/SciReasoner/LLM4Chem/evaluator.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -58,7 +58,7 @@ def load(path, task, max_cut=-1, mini_set=False, hf_hub=False):
5858
if mini_set:
5959
import random
6060
random.seed(1024)
61-
test_data = random.sample(test_data, 50)
61+
test_data = random.sample(test_data, min(len(test_data), 150))
6262
random.seed()
6363

6464
dataset = DatasetDict({

opencompass/datasets/SciReasoner/Mol_Instructions/biotext.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -218,7 +218,7 @@ def load(path, task, max_cut=-1, mini_set=False, hf_hub=False):
218218
if mini_set:
219219
import random
220220
random.seed(1024)
221-
test_data = random.sample(test_data, 50)
221+
test_data = random.sample(test_data, min(len(test_data), 150))
222222
random.seed()
223223

224224
dataset = DatasetDict({

opencompass/datasets/SciReasoner/opi/evaluator.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,7 @@ def load(path, task, max_cut=-1, mini_set=False, hf_hub=False):
5151
if mini_set:
5252
import random
5353
random.seed(1024)
54-
test_data = random.sample(test_data, 50)
54+
test_data = random.sample(test_data, min(len(test_data), 150))
5555
random.seed()
5656

5757
dataset = DatasetDict({

0 commit comments

Comments
 (0)