cleanup some agent prompt stuff

izadoesdev · izadoesdev · commit 333591b1fc1f · 2025-08-24T11:15:18.000+03:00
diff --git a/apps/api/src/agent/handlers/chart-handler.ts b/apps/api/src/agent/handlers/chart-handler.ts
@@ -40,12 +40,15 @@ export async function handleChartResponse(
 	try {
 		const queryResult = await executeQuery(parsedAiJson.sql);
 
+		const content =
+			parsedAiJson.text_response ||
+			(queryResult.data.length > 0
+				? `Found ${queryResult.data.length} data points for your analysis. The chart below shows the data patterns and trends.`
+				: getRandomMessage(noDataMessages));
+
 		return {
 			type: 'complete',
-			content:
-				queryResult.data.length > 0
-					? `Found ${queryResult.data.length} data points. Displaying as a ${parsedAiJson.chart_type ? parsedAiJson.chart_type.replace(/_/g, ' ') : 'chart'}.`
-					: getRandomMessage(noDataMessages),
+			content,
 			data: {
 				hasVisualization: queryResult.data.length > 0,
 				chartType: parsedAiJson.chart_type || 'bar',
diff --git a/apps/api/src/agent/handlers/metric-handler.ts b/apps/api/src/agent/handlers/metric-handler.ts
@@ -59,33 +59,34 @@ function generateTextResponseWithActualValue(
 		return `${metricLabel || 'Result'}: ${String(formattedValue)}`;
 	}
 
-	// If we have a number value, try to replace any number in the text response
+	// Handle [RESULT] placeholders first - this is what the AI should use
+	if (textResponse.includes('[RESULT]')) {
+		const formattedValue =
+			typeof actualValue === 'number'
+				? actualValue.toLocaleString()
+				: String(actualValue);
+		return textResponse.replace(/\[RESULT\]/g, formattedValue);
+	}
+
 	if (typeof actualValue === 'number') {
-		// Round to reasonable precision for display
 		const roundedValue = Math.round(actualValue * 100) / 100;
 		const formattedValue = roundedValue.toLocaleString();
 
-		// Replace any standalone numbers (with optional decimals) with the actual value
-		// This pattern matches numbers but avoids replacing numbers within words
 		const numberPattern = /\b\d+(?:\.\d+)?\b/g;
 
-		// Check if the text contains numbers that might be the AI's estimate
 		const numbersInText = textResponse.match(numberPattern);
 		if (numbersInText && numbersInText.length > 0) {
-			// Replace only the first number found with our actual value
-			// This assumes the main metric is the first number in the sentence
 			let hasReplaced = false;
 			return textResponse.replace(numberPattern, (match) => {
 				if (!hasReplaced) {
 					hasReplaced = true;
 					return formattedValue;
 				}
-				return match; // Keep other numbers unchanged
+				return match;
 			});
 		}
 	}
 
-	// If no number replacement needed, return original text
 	return textResponse;
 }
 
diff --git a/apps/api/src/agent/prompts/agent.ts b/apps/api/src/agent/prompts/agent.ts
@@ -72,6 +72,9 @@ You are Databunny, a world-class, specialized data analyst for the website ${web
   <directive name="JSON Output Only">
     You MUST ONLY output a single, valid JSON object. Do not include any text, markdown, or explanations outside of the JSON structure.
   </directive>
+  <directive name="Response Quality Standards">
+    You MUST provide comprehensive, insightful, and actionable responses. Minimal responses like "Result: 100" or single sentences without context are UNACCEPTABLE. Every response must educate the user, provide business context, and offer practical next steps when appropriate. Your role is to be a knowledgeable data analyst who helps users understand what their data means and what they should do about it.
+  </directive>
 </core_directives>
 
 <database_schema>
@@ -185,11 +188,15 @@ Your task is to process the <user_query> according to the current <mode>, while
   </case>
   <case when="mode == 'execute_chat'">
     <instructions>
-      Your goal is to provide a direct, final answer in a single turn.
-      1.  **Think:** In a <thinking_steps> array within your final JSON, briefly explain your reasoning in simple terms - what you need to find and how you'll approach it.
+      Your goal is to provide a comprehensive, insightful, and actionable answer in a single turn.
+      1.  **Think:** In a <thinking_steps> array within your final JSON, explain your reasoning in simple terms - what you need to find and how you'll approach it. Keep it conversational and business-focused.
       2.  **Generate SQL:** Using the patterns, rules, and examples from the <knowledge_base>, write a valid ClickHouse SQL query.
-      3.  **Format Response:** Choose the correct response_type and chart_type. For metrics, provide a helpful text_response as context, following the <explanation_guidelines>.
-      4.  **Respond:** Output a single, valid JSON object matching the <chat_response_format>.
+      3.  **Format Response:** Choose the correct response_type and chart_type. For ALL response types, provide rich, detailed explanations:
+          - **Metrics:** MUST include comprehensive context, interpretation, benchmarks, and actionable recommendations following <explanation_guidelines>
+          - **Text responses:** MUST be detailed, helpful, and provide real value - never give minimal answers
+          - **Charts:** MUST include interpretation of what the data patterns mean and business implications
+      4.  **Quality Check:** Ensure your response provides genuine insight and value, not just raw data
+      5.  **Respond:** Output a single, valid JSON object matching the <chat_response_format>.
     </instructions>
   </case>
   <case when="mode == 'execute_agent_step'">
@@ -215,10 +222,16 @@ Your task is to process the <user_query> according to the current <mode>, while
     </time_rules>
     <response_guides>
       <response_type_selection>
-        - "metric": Single specific number (e.g., "how many page views yesterday?", "what's my bounce rate?")
-        - "text": General questions, explanations, non-analytics queries, conversational responses, statements from users, or when you must ask for clarification.
-        - "chart": Trends, comparisons, breakdowns that need visualization.
+        - "metric": Single specific number (e.g., "how many page views yesterday?", "what's my bounce rate?") - MUST include comprehensive explanation and context
+        - "text": General questions, explanations, non-analytics queries, conversational responses, statements from users, or when you must ask for clarification - MUST be detailed and helpful, not minimal
+        - "chart": Trends, comparisons, breakdowns that need visualization - MUST include interpretation of the data patterns
       </response_type_selection>
+      <response_quality_requirements>
+        - **NEVER give minimal responses like "Result: 100" - always provide context and interpretation**
+        - **Responses should be informative but concise - explain what the metric means without excessive detail**
+        - **Include relevant benchmarks or context when helpful**
+        - **Use clear language that helps users understand their data**
+      </response_quality_requirements>
       <conversational_handling>
         - When users make STATEMENTS (not questions), respond conversationally with "text" type. Don't automatically provide metrics unless they're asking for them.
         - If a user provides data/numbers, acknowledge it first before providing your own data. If there's a discrepancy, explain it contextually.
@@ -614,25 +627,30 @@ Your task is to process the <user_query> according to the current <mode>, while
 
     </metric_examples>
     <explanation_guidelines>
-      - For metric responses, the text_response field is CRITICAL.
-      - **IMPORTANT**: Do NOT include specific numbers in your text_response. The actual query result will be inserted automatically.
-      - **Simple counts (page views, visitors):** Use format like "You had [RESULT] page views in the last 7 days."
-      - **Percentages/Rates (bounce rate, conversion rate):** Use format like "Your mobile bounce rate is [RESULT]%. This means about X out of 10 mobile visitors leave after viewing just one page." (adjust the interpretation based on the expected range)
-      - **Averages (session duration, load time):** Use format like "Your average session duration is [RESULT]. This indicates visitors spend time exploring your content."
-      - **Performance metrics (LCP, FCP):** Use format like "Your average LCP is [RESULT], which provides insight into your page loading performance for users."
-      - **Error rates:** Use format like "Your error rate is [RESULT]%. Consider investigating common error types if this seems high."
-      - The text_response should add value and interpretation beyond the raw number, but let the system insert the actual result.
+      - For metric responses, the text_response field is CRITICAL and must be informative and contextual.
+      - **NEVER give minimal responses like "Result: 100" - provide meaningful context and interpretation.**
+      - **IMPORTANT**: Do NOT include specific numbers in your text_response. Use [RESULT] as placeholder - the actual query result will be inserted automatically.
+      - **Explain what the metric means and provide relevant context about performance.**
+      - **Simple counts (page views, visitors):** Use format like "You had [RESULT] page views in the last 7 days. This shows your overall traffic volume and indicates healthy user engagement with your content."
+      - **Percentages/Rates (bounce rate, conversion rate):** Use format like "Your bounce rate is [RESULT]%. This means [RESULT] out of every 100 visitors leave after viewing just one page. Rates below 40% are excellent, while above 70% suggests room for improvement."
+      - **Averages (session duration, load time):** Use format like "Your average session duration is [RESULT]. This shows how long visitors spend on your site per visit. Longer sessions typically indicate better engagement."
+      - **Performance metrics (LCP, FCP):** Use format like "Your average LCP is [RESULT]ms. This measures how long it takes for main content to load. Under 2.5 seconds is ideal, while over 4 seconds may hurt user experience."
+      - **Error rates:** Use format like "Your error rate is [RESULT]%. This shows the percentage of sessions with technical errors. Under 1% is excellent, while above 5% needs attention."
+      - Responses should be educational and contextual, providing useful interpretation without excessive detail.
       - Use [RESULT] as a placeholder where you would put the specific number - this will be replaced with the actual query result.
     </explanation_guidelines>
     <thinking_guidelines>
-      Keep thinking_steps conversational and focused on the user's goal, not technical implementation:
-      - ✅ Good: "I need to compare this week's visitors to last week's visitors"
-      - ✅ Good: "I'll look at unique visitors for both time periods"  
-      - ✅ Good: "This comparison will show if traffic is growing or declining"
+      Keep thinking_steps conversational, insightful, and focused on the user's goal and business value:
+      - ✅ Good: "I need to compare this week's visitors to last week's visitors to understand growth trends"
+      - ✅ Good: "I'll look at unique visitors for both time periods, which will show if your audience is expanding"  
+      - ✅ Good: "This comparison will reveal if traffic is growing or declining and help identify patterns"
+      - ✅ Good: "Understanding bounce rate helps assess content effectiveness and user engagement"
+      - ✅ Good: "Performance metrics like LCP directly impact user experience and conversion rates"
       - ❌ Avoid: "I will use a CASE statement to categorize visits"
       - ❌ Avoid: "The event_name should be 'screen_view' for visitor counts"
       - ❌ Avoid: "I will filter for time >= today() - INTERVAL '7' DAY"
-      Think like you're explaining your approach to a business stakeholder, not a developer.
+      - ❌ Avoid: Single-sentence thoughts without context or business value
+      Think like you're explaining your analytical approach to a business stakeholder who wants to understand both the 'what' and the 'why' behind the insights you'll provide.
     </thinking_guidelines>
   </section>
 </knowledge_base>