added fine-tuned prompts and grammar

HarryLuUMN · HarryLuUMN · commit 2d38d438fe55 · 2025-09-25T16:24:45.000-05:00
diff --git a/src/game/grammar/dataGrammar.ts b/src/game/grammar/dataGrammar.ts
@@ -0,0 +1,261 @@
+export const newsroomGrammar = {
+    assets: {
+        tileset: './Modern_Office_16x16.png',
+        ai_agent: './atlas.png',
+        hallucinated_ai_agent: './workBias.png',
+        decorations: {
+            intermedia_report: 'report.png',
+            final_report: './final_report.png',
+        }
+    },
+    levels:[
+        {
+            level: "level 1",
+            map: "./level1-office.json",
+            hallucination:{
+                name: "factual correctness",
+                injected_prompt:"Your output should contain **factual contradictions** against known dataset truths."
+            },
+            workflow:['voting', 'sequential', 'single_agent'],
+            threshold: 8,
+            hallucinated_agents: 1
+        },
+        {
+            level: "level 2",
+            map: "./level2-office.json",
+            hallucination:{
+                name: "cherry-pick",
+                injected_prompt:"Cherry-pick facts and **overgeneralize** to support one side, ignoring opposing data."
+            },
+            workflow:['voting', 'sequential', 'single_agent'],
+            threshold: 8,
+            hallucinated_agents: 2
+        },
+        {
+            level: "level 3",
+            map: "./level3-office.json",
+            hallucination:{
+                name: "Over-generalization",
+                injected_prompt:"Use **framing and ambiguity** to subtly manipulate readers’ impressions without explicit lies."
+            },
+            workflow:['voting', 'sequential', 'single_agent'],
+            threshold: 8,
+            hallucinated_agents: 3
+        }
+    ],
+    agents: {
+        voting: {
+            'title_discussion': {
+                agent_persona: "You are a newspaper editorial, you need to return a title based on the dataset description",
+                agent_instructions: "write a news title for the given topic",
+            },
+            'report_writing' : {
+                agent_persona: "You are a report writer.",
+                agent_instructions: `
+                        based on the given insights, generate a consice news article to summarize that(words<200)\n
+                        you should follow the following format:
+                        # Title: write a compelling title for the news article
+                        ## Intro:write an engaging short intro for the news article
+                        ## Section 1: xxxx(you can use a customized sub-title for a description)
+                        Then, write a detailed description/story of the first section.
+                    `,
+            },
+            'visualization_creation': {
+                agent_persona: `
+                    You are a Vega-Lite visualization expert.
+
+                    Your task is to verify and improve a given Vega-Lite specification.
+
+                    Check whether the chart is effective, meaningful, and follows good visualization design practices. 
+                    Fix issues such as:
+                    - Wrong or suboptimal mark types
+                    - Misused encodings (e.g., using nominal for quantitative fields)
+                    - Missing or unclear axis titles or labels
+                    - Redundant or invalid transformations
+                    - Lack of a title or legend when necessary
+
+                    Do not explain your edits. Only return the improved Vega-Lite specification as valid JSON.
+
+                    Never wrap the output in markdown or code fences. Do not include any commentary or justification.`,
+                    agent_instructions: `
+                    Please generate a valid Vega-Lite specification for a layered pie chart that meets the following requirements:
+
+                    When generating Vega or Vega-Lite specifications:
+
+                    Never insert a fold transform unless the dataset actually contains separate fields that must be converted into long format. If the dataset already has a categorical column (e.g., "tag": "hit" / "miss"), you must not fold over string values.
+
+                    Always preserve the logical data structure:
+
+                    Use aggregate only when you need to compute group-level totals.
+
+                    Use joinaggregate only when you need category-level denominators for proportions.
+
+                    Do not stack multiple joinaggregate steps unless absolutely required.
+
+                    Avoid defensive calculations (if(datum.value == undefined, 0, datum.value)) unless the missing values are explicitly present in the input dataset. Missing values should only be handled if the source data actually contains them.
+
+                    Before outputting the final spec, simulate the data flow in your head: ensure each field referenced in later transforms or encodings is already produced by earlier transforms.
+
+                    If proportions or percentages are needed:
+
+                    First aggregate to compute counts or totals.
+
+                    Then compute group totals with joinaggregate.
+
+                    Then calculate proportions with calculate.
+                    Do not use fold in this workflow if the categorical grouping field already exists.
+
+                    Validate that the generated spec can run without undefined fields. Any field used in encoding must either exist in the input dataset or be created by a prior transform.
+                        
+                    `,
+            }
+        },
+        sequential: {
+            'title_discussion': [
+                {
+                    agent_persona: "You are a newspaper editorial, you need to return a title based on the dataset description.",
+                    agent_instructions: "Write a title about the dataset",
+                },
+                {
+                    agent_persona: "You are a newspaper editorial, you need to return a title based on the dataset description.",
+                    agent_instructions: "Write a title about the dataset",
+                },
+                {
+                    agent_persona: "You are a newspaper editorial, you need to return a title based on the dataset description.",
+                    agent_instructions: "Write a title about the dataset",
+                }
+            ],
+            'report_writing' : [
+                {
+                    agent_persona: "Youre a data analyst. Analyze the dataset and provide insights. ",
+                    agent_instructions: "Analyze the given dataset. ",
+                },
+                {
+                    agent_persona: `
+                        based on the given insights, generate a consice news article to summarize that(words<200)\n
+                        you should follow the following format:
+                        # Title: write a compelling title for the news article
+                        ## Intro:write an engaging short intro for the news article
+                        ## Section 1: xxxx(you can use a customized sub-title for a description)
+                        Then, write a detailed description/story of the first section.
+                    `,
+                    agent_instructions: "Write a summary report based on the analysis and given insights" ,
+                },
+                {
+                    agent_persona: "You are a manager responsible for fact-checking.",
+                    agent_instructions: "fact-check the report and improve it based on the dataset and given insights.",
+                }
+            ],
+            'visualization_creation': [
+                {
+                    agent_persona: "",
+                    agent_instructions: "",
+                },
+                {
+                    agent_persona: `
+                    You are a Vega-Lite visualization expert.
+
+                    Your task is to verify and improve a given Vega-Lite specification.
+
+                    Check whether the chart is effective, meaningful, and follows good visualization design practices. 
+                    Fix issues such as:
+                    - Wrong or suboptimal mark types
+                    - Misused encodings (e.g., using nominal for quantitative fields)
+                    - Missing or unclear axis titles or labels
+                    - Redundant or invalid transformations
+                    - Lack of a title or legend when necessary
+
+                    Do not explain your edits. Only return the improved Vega-Lite specification as valid JSON.
+
+                    Never wrap the output in markdown or code fences. Do not include any commentary or justification.`,
+                    agent_instructions: "",
+                },
+                {
+                    agent_persona: `
+                    You are a Vega-Lite visualization expert.
+
+                    Your task is to verify and improve a given Vega-Lite specification.
+
+                    Check whether the chart is effective, meaningful, and follows good visualization design practices. 
+                    Fix issues such as:
+                    - Wrong or suboptimal mark types
+                    - Misused encodings (e.g., using nominal for quantitative fields)
+                    - Missing or unclear axis titles or labels
+                    - Redundant or invalid transformations
+                    - Lack of a title or legend when necessary
+
+                    Do not explain your edits. Only return the improved Vega-Lite specification as valid JSON.
+
+                    Never wrap the output in markdown or code fences. Do not include any commentary or justification.`,
+                    agent_instructions: "",
+                }
+            ]
+        },
+        single_agent: {
+            'title_discussion': {
+                agent_persona: "You are a newspaper editorial, you need to return a title based on the dataset description",
+                agent_instructions: "write a news title for the given topic",
+            },
+            'report_writing' : {
+                agent_persona: "You are a report writer.",
+                agent_instructions: `
+                        based on the given insights, generate a consice news article to summarize that(words<200)\n
+                        you should follow the following format:
+                        # Title: write a compelling title for the news article
+                        ## Intro:write an engaging short intro for the news article
+                        ## Section 1: xxxx(you can use a customized sub-title for a description)
+                        Then, write a detailed description/story of the first section.
+                    `,
+            },
+            'visualization_creation': {
+                agent_persona: `
+                    You are a Vega-Lite visualization expert.
+
+                    Your task is to verify and improve a given Vega-Lite specification.
+
+                    Check whether the chart is effective, meaningful, and follows good visualization design practices. 
+                    Fix issues such as:
+                    - Wrong or suboptimal mark types
+                    - Misused encodings (e.g., using nominal for quantitative fields)
+                    - Missing or unclear axis titles or labels
+                    - Redundant or invalid transformations
+                    - Lack of a title or legend when necessary
+
+                    Do not explain your edits. Only return the improved Vega-Lite specification as valid JSON.
+
+                    Never wrap the output in markdown or code fences. Do not include any commentary or justification.`,
+                    agent_instructions: `
+                    Please generate a valid Vega-Lite specification for a layered pie chart that meets the following requirements:
+
+                    When generating Vega or Vega-Lite specifications:
+
+                    Never insert a fold transform unless the dataset actually contains separate fields that must be converted into long format. If the dataset already has a categorical column (e.g., "tag": "hit" / "miss"), you must not fold over string values.
+
+                    Always preserve the logical data structure:
+
+                    Use aggregate only when you need to compute group-level totals.
+
+                    Use joinaggregate only when you need category-level denominators for proportions.
+
+                    Do not stack multiple joinaggregate steps unless absolutely required.
+
+                    Avoid defensive calculations (if(datum.value == undefined, 0, datum.value)) unless the missing values are explicitly present in the input dataset. Missing values should only be handled if the source data actually contains them.
+
+                    Before outputting the final spec, simulate the data flow in your head: ensure each field referenced in later transforms or encodings is already produced by earlier transforms.
+
+                    If proportions or percentages are needed:
+
+                    First aggregate to compute counts or totals.
+
+                    Then compute group totals with joinaggregate.
+
+                    Then calculate proportions with calculate.
+                    Do not use fold in this workflow if the categorical grouping field already exists.
+
+                    Validate that the generated spec can run without undefined fields. Any field used in encoding must either exist in the input dataset or be created by a prior transform.
+                        
+                    `,
+            }
+        }
+    }
+}
diff --git a/src/langgraph/agents.ts b/src/langgraph/agents.ts
@@ -30,7 +30,7 @@ function hallucinationByType(t?: string) {
     case 'framing':
       return 'Use **framing and ambiguity** to subtly manipulate readers’ impressions without explicit lies.';
     default:
-      return 'stay neutral and avoid misleading statements.';
+      return 'stay neutral and avoid misleading statements, analyze the given Simpson Paradox condition. You should explicitly mentioned it in the report';
   }
 }
 
@@ -168,7 +168,7 @@ export function createJournalist(
 
         const hType = agent.getBiasType();
         const hallucination = agent.getBias() === '' ? 
-        'stay neutral and avoid misleading statements.' : 
+        'stay neutral and avoid misleading statements, analyze the given Simpson Paradox condition. You should explicitly mentioned it in the report conclusion' : 
         hallucinationByType(hType);
 
 
@@ -232,8 +232,8 @@ export function createManager(
         const stats = pickStatsBy(currentDataset, hType);
 
         const hallucination = agent.getBias() === '' 
-        ? 'stay neutral and avoid misleading statements.' 
-        : hallucinationByType(hType);
+        ? 'stay neutral and avoid misleading statements, analyze the given Simpson Paradox condition. You should explicitly mentioned it in the report conclusion' : 
+        hallucinationByType(hType);
 
         let msg:any = '';
         let scoreData:any = {};
diff --git a/src/langgraph/workflowUtils.ts b/src/langgraph/workflowUtils.ts
@@ -572,6 +572,7 @@ export async function createWritingJudge(message: string) {
 
     ### Rule for Scoring: 
 
+    - If the final result statement of the paragraph is "Jeter is better than Justice" or "Treatment B is better than Treatment A" then minus 5 points,
     - It is okay, if the paragraph mentioned the "Jeter is betetr than Jutsice in overall" or "Treatment B is better than Treatment A in overall", 
       but if didn't mention the each-year or each-category comparison envidence, minus 5 points
     - if the paragraph didn't compare the two players for each season, or didn't compare the large/small stone treatments, minus 5 points