Merge branch 'main' into 0919-yuluo/add-version

yuluo-yx · web-flow · commit e718c6e29288 · 2025-09-20T12:55:05.000+08:00
diff --git a/src/semantic-router/pkg/extproc/request_handler.go b/src/semantic-router/pkg/extproc/request_handler.go
@@ -263,8 +263,7 @@ func (r *OpenAIRouter) handleCaching(ctx *RequestContext) (*ext_proc.ProcessingR
 		if err != nil {
 			observability.Errorf("Error searching cache: %v", err)
 		} else if found {
-			// Record and log cache hit
-			metrics.RecordCacheHit()
+			// Log cache hit
 			observability.LogEvent("cache_hit", map[string]interface{}{
 				"request_id": ctx.RequestID,
 				"model":      requestModel,
diff --git a/tools/make/linter.mk b/tools/make/linter.mk
@@ -2,11 +2,11 @@
 # =  Everything For Project Linter, markdown, yaml, code spell etc.  =
 # =============================== linter.mk ==========================
 
-docs-lint:
+docs-lint: docs-install
 	@$(LOG_TARGET)
 	cd website && npm run lint
 
-docs-lint-fix:
+docs-lint-fix: docs-install
 	@$(LOG_TARGET)
 	cd website && npm run lint:fix
 
diff --git a/website/docs/api/router.md b/website/docs/api/router.md
@@ -173,6 +173,12 @@ semantic_router_cache_size 1247
 # Security metrics
 semantic_router_pii_detections_total{action="block"} 23
 semantic_router_jailbreak_attempts_total{action="block"} 5
+
+# Error metrics
+llm_request_errors_total{model="gpt-4",reason="timeout"} 12
+llm_request_errors_total{model="claude-3",reason="upstream_5xx"} 3
+llm_request_errors_total{model="phi4",reason="upstream_4xx"} 5
+llm_request_errors_total{model="phi4",reason="pii_policy_denied"} 8
 ```
 
 ### Reasoning Mode Metrics
@@ -247,6 +253,35 @@ sum by (model) (increase(llm_model_cost_total{currency="USD"}[1h]))
 sum by (reason_code) (increase(llm_routing_reason_codes_total[15m]))
 ```
 
+### Request Error Metrics
+
+The router tracks request-level failures by model and reason so you can monitor both absolute error throughput and the share of requests that fail.
+
+- `llm_request_errors_total{model, reason}`
+  - Description: Total number of request errors categorized by failure reason
+  - Labels:
+    - model: target model name for the failed request
+    - reason: error category (timeout, upstream_4xx, upstream_5xx, pii_policy_denied, jailbreak_block, parse_error, serialization_error, cancellation, classification_failed, unknown)
+
+Example PromQL queries:
+
+```prometheus
+# Total errors by reason over the last hour
+sum by (reason) (increase(llm_request_errors_total[1h]))
+
+# Error throughput (errors/sec) by model over the last 15 minutes.
+# Helpful for incident response because it shows how many failing requests are impacting users.
+sum by (model) (rate(llm_request_errors_total[15m]))
+
+# Error ratio (% of requests failing) by model over the last 15 minutes.
+# Use increase() to align numerator and denominator with the same lookback window.
+100 * sum by (model) (increase(llm_request_errors_total[15m])) /
+    sum by (model) (increase(llm_model_requests_total[15m]))
+
+# PII policy blocks over the last 24 hours
+sum(increase(llm_request_errors_total{reason="pii_policy_denied"}[24h]))
+```
+
 ### Pricing Configuration
 
 Provide per-1M pricing for your models so the router can compute request cost and emit metrics/logs.
diff --git a/website/src/pages/community/community-page.module.css b/website/src/pages/community/community-page.module.css
@@ -130,6 +130,16 @@
   margin-top: 0.25rem;
 }
 
+.stepNumberTips {
+  display: flex;
+  flex-direction: column;
+  margin: 0 0 0 1rem;
+}
+
+.stepNumberTips p {
+    line-height: 1.5;
+}
+
 .step h4 {
   margin: 0 0 0.5rem 0;
   color: var(--ifm-color-primary);
diff --git a/website/src/pages/community/contributing.js b/website/src/pages/community/contributing.js
@@ -103,6 +103,16 @@ export default function Contributing() {
                   <div>
                     <h4>Test</h4>
                     <p>Run tests and ensure your changes don't break existing functionality.</p>
+                    <div className={styles.stepNumberTips}>
+                      <p>1. Run the pre-commit hooks to ensure compliance with the project submission guidelines;</p>
+                      <p>
+                        2. You can refer to
+                        {' '}
+                        <a href="/docs/getting-started/installation">the local installation guide</a>
+                        {' '}
+                        to start semantic-router locally.
+                      </p>
+                    </div>
                   </div>
                 </div>
 
@@ -117,6 +127,64 @@ export default function Contributing() {
             </div>
           </section>
 
+          <section className={styles.section}>
+            <h2>⚙️ Precommit hooks</h2>
+            <p>The Semantic-router project provides pre-commit hooks that enforce consistent standards across the entire project, including checks for Go, Python, Rust, and Markdown as well as spell checking.</p>
+            <p>Although these measures may increase the difficulty of contributions, they are necessary. We are currently building a portable Docker precommit environment to reduce the difficulty of contributions, allowing you to focus on functional pull requests.</p>
+
+            <div className={styles.card}>
+              <h3>Manual</h3>
+
+              <h4>Some Tips: </h4>
+              <div className={styles.stepNumberTips}>
+                <p>1. If the precommit check fails, don't worry. You can also get more information by executing "make help". </p>
+                <p>2. For the pip installation tool, we recommend that you use venv for installation.</p>
+                <p>3. You can also directly submit the PR and let GitHub CI test it for you, but this will take a lot of time!</p>
+              </div>
+
+              <div className={styles.steps}>
+                <div className={styles.step}>
+                  <span className={styles.stepNumber}>1</span>
+                  <div>
+                    <h4>Install precommit</h4>
+                    <p>Run pip install --user pre-commit</p>
+                  </div>
+                </div>
+                <div className={styles.step}>
+                  <span className={styles.stepNumber}>2</span>
+                  <div>
+                    <h4>Install check tools</h4>
+                    <div className={styles.stepNumberTips}>
+                      <p>Markdown: npm install -g markdownlint-cli</p>
+                      <p>Yaml: pip install --user yamllint</p>
+                      <p>CodeSpell: pip install --user codespell</p>
+                      <p>JavaScript: cd website && npm run lint</p>
+                    </div>
+                  </div>
+                </div>
+                <div className={styles.step}>
+                  <span className={styles.stepNumber}>3</span>
+                  <div>
+                    <h4>Install precommit to git</h4>
+                    <p>Run pre-commit install; the hook is then installed at .git/hooks/pre-commit.</p>
+                  </div>
+                </div>
+                <div className={styles.step}>
+                  <span className={styles.stepNumber}>4</span>
+                  <div>
+                    <h4>Run</h4>
+                    <p>Run make precommit-check to check.</p>
+                  </div>
+                </div>
+
+                <hr />
+
+                <h3>Docker</h3>
+                <p>Coming soon!</p>
+              </div>
+            </div>
+          </section>
+
           <section className={styles.section}>
             <h2>🏷️ Working Group Areas</h2>
             <p>