Fix hypothesis_rank when an evaluation score is a string (#750)

peteryang1 · web-flow · commit 3265fe7d3da4 · 2025-04-03T23:48:38.000+08:00
diff --git a/rdagent/scenarios/data_science/proposal/exp_gen/prompts_v2.yaml b/rdagent/scenarios/data_science/proposal/exp_gen/prompts_v2.yaml
@@ -200,7 +200,7 @@ output_format:
   hypothesis: |-
     For each of the identified problem, you should propose a hypothesis strictly following to the JSON schema. Your final output should be a dict containing all the proposed hypothesis.
     {
-      "problem name 1": {
+      "problem name 1 (Should be exactly same as the problem name provided)": {
         "reason": "Provide a clear, logical progression from problem identification to hypothesis formulation, grounded in evidence (e.g., trace history, domain principles, or competition constraints). Refer to the Hypothesis Guidelines for better understanding. Reason should be short with no more than two sentences.",
         {% if not pipeline %}"component": "The component name that the hypothesis focus on. Must be one of ('DataLoadSpec', 'FeatureEng', 'Model', 'Ensemble', 'Workflow').",
         {% else %}"component": "The component name that the hypothesis focus on. Must be 'Pipeline'.",
diff --git a/rdagent/scenarios/data_science/proposal/exp_gen/proposal.py b/rdagent/scenarios/data_science/proposal/exp_gen/proposal.py
@@ -326,15 +326,20 @@ def hypothesis_rank(self, hypothesis_dict: dict, problem_dict: dict, pipeline: b
             "feasibility_score": 0.1,
             "risk_reward_balance_score": 0.1,
         }
-        scores = pd.DataFrame(
-            {
-                problem_name: {
-                    score_key: hypothesis_dict[problem_name]["evaluation"].get(score_key, 0) * weight
-                    for score_key, weight in weights.items()
-                }
-                for problem_name in hypothesis_dict
-            }
-        )
+        scores_dict = {}
+        for problem_name in hypothesis_dict:
+            scores_dict[problem_name] = {}
+            for score_key in weights:
+                if score_key not in hypothesis_dict[problem_name]["evaluation"]:
+                    scores_dict[problem_name][score_key] = 0
+                else:
+                    try:
+                        scores_dict[problem_name][score_key] = (
+                            float(hypothesis_dict[problem_name]["evaluation"][score_key]) * weights[score_key]
+                        )
+                    except (ValueError, TypeError):
+                        scores_dict[problem_name][score_key] = 0
+        scores = pd.DataFrame(scores_dict)
         scores_sorted = scores.sum().sort_values(ascending=False)
         if len(scores_sorted) > 5:
             scores_sorted = scores_sorted[: len(scores_sorted) // 2]

Original file line number	Diff line number	Diff line change
`@@ -200,7 +200,7 @@ output_format:`
`200`	`200`	`hypothesis: \|-`
`201`	`201`	`For each of the identified problem, you should propose a hypothesis strictly following to the JSON schema. Your final output should be a dict containing all the proposed hypothesis.`
`202`	`202`	`{`
`203`		`- "problem name 1": {`
	`203`	`+ "problem name 1 (Should be exactly same as the problem name provided)": {`
`204`	`204`	`"reason": "Provide a clear, logical progression from problem identification to hypothesis formulation, grounded in evidence (e.g., trace history, domain principles, or competition constraints). Refer to the Hypothesis Guidelines for better understanding. Reason should be short with no more than two sentences.",`
`205`	`205`	`{% if not pipeline %}"component": "The component name that the hypothesis focus on. Must be one of ('DataLoadSpec', 'FeatureEng', 'Model', 'Ensemble', 'Workflow').",`
`206`	`206`	`{% else %}"component": "The component name that the hypothesis focus on. Must be 'Pipeline'.",`