Skip to content

Commit 45d1d63

Browse files
authored
update viz subset (#295)
1 parent f84275b commit 45d1d63

File tree

1 file changed

+11
-8
lines changed

1 file changed

+11
-8
lines changed

evalscope/report/app.py

Lines changed: 11 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -250,7 +250,10 @@ def normalize_score(score):
250250
def get_model_prediction(work_dir: str, model_name: str, dataset_name: str, subset_name: str):
251251
data_path = os.path.join(work_dir, OutputsStructure.REVIEWS_DIR, model_name)
252252
subset_name = subset_name.replace('/', '_') # for collection report
253-
origin_df = pd.read_json(os.path.join(data_path, f'{dataset_name}_{subset_name}.jsonl'), lines=True)
253+
review_path = os.path.join(data_path, f'{dataset_name}_{subset_name}.jsonl')
254+
logger.debug(f'review_path: {review_path}')
255+
origin_df = pd.read_json(review_path, lines=True)
256+
254257
ds = []
255258
for i, item in origin_df.iterrows():
256259
raw_input = item['raw_input']
@@ -274,7 +277,7 @@ def get_model_prediction(work_dir: str, model_name: str, dataset_name: str, subs
274277

275278
def get_table_data(data_review_df: pd.DataFrame, page: int = 1, rows_per_page: int = 1) -> pd.DataFrame:
276279
if data_review_df is None:
277-
return None
280+
return pd.DataFrame(), None
278281

279282
logger.debug(f'page: {page}, rows_per_page: {rows_per_page}')
280283
start = (page - 1) * rows_per_page
@@ -515,19 +518,19 @@ def update_single_report_score(report_list):
515518
@gr.on(
516519
triggers=[dataset_radio.change, report_list.change],
517520
inputs=[dataset_radio, report_list],
518-
outputs=[dataset_plot, dataset_table, subset_select])
521+
outputs=[dataset_plot, dataset_table, subset_select, data_review_df])
519522
def update_single_report_dataset(dataset_name, report_list):
520523
logger.debug(f'Updating single report dataset: {dataset_name}')
521524
report_df = get_data_frame(report_list)
522525
data_score_df, styler = get_single_dataset_df(report_df, dataset_name)
523526
data_score_plot = plot_single_dataset_scores(data_score_df)
524527
subsets = data_score_df[ReportKey.subset_name].unique().tolist()
525528
logger.debug(f'subsets: {subsets}')
526-
return data_score_plot, styler, gr.update(choices=subsets, value=subsets[0])
529+
return data_score_plot, styler, gr.update(choices=subsets, value=None), None
527530

528531
@gr.on(
529-
triggers=[report_list.change, dataset_radio.change, subset_radio.change],
530-
inputs=[work_dir, model_name, dataset_radio, subset_radio],
532+
triggers=[subset_select.change],
533+
inputs=[work_dir, model_name, dataset_radio, subset_select],
531534
outputs=[data_review_df, page_number])
532535
def update_single_report_subset(work_dir, model_name, dataset_name, subset_name):
533536
if not subset_name:
@@ -566,9 +569,9 @@ def filter_data(data_review_df, answer_mode):
566569
inputs=[filtered_review_df, page_number],
567570
outputs=[data_review_table])
568571
def update_table(filtered_df, page_number):
572+
if filtered_df is None:
573+
return gr.update(value=None)
569574
subset_df, styler = get_table_data(filtered_df, page_number)
570-
if subset_df is None:
571-
return gr.skip()
572575
return styler
573576

574577
return SingleModelComponents(report_name=report_name)

0 commit comments

Comments
 (0)