Merge branch 'feat/multi-process'

LuckyYC · LuckyYC · commit 1a632edfbd0d · 2025-09-28T22:02:19.000+08:00
diff --git a/README.md b/README.md
@@ -120,7 +120,7 @@ VITE_API_BASE_URL=/api  # Base API URL for frontend requests (supports reverse p
 MULTIPROCESS_THRESHOLD=1000
 
 # Minimum number of concurrent users each child process should handle (prevents excessive processes and resource waste)
-MIN_USERS_PER_PROCESS=600
+MIN_USERS_PER_PROCESS=500
 
 # ⚠️ IMPORTANT NOTES:
 #   - When concurrency ≥ 1000, enabling multi-process mode is strongly recommended for performance.
diff --git a/README_CN.md b/README_CN.md
@@ -119,7 +119,7 @@ VITE_API_BASE_URL=/api
 # 当并发用户数超过此阈值，系统将自动启用多进程模式（需多核 CPU 支持）
 MULTIPROCESS_THRESHOLD: 1000
 # 每个子进程至少承载的并发用户数（避免进程过多导致资源浪费）
-MIN_USERS_PER_PROCESS: 600
+MIN_USERS_PER_PROCESS: 500
 # ⚠️ 重要提示：
 #   - 当并发量 ≥ 1000 时，强烈建议启用多进程以提升性能。
 #   - 多进程模式依赖多核 CPU 资源，请确保部署环境满足资源要求
diff --git a/backend/service/upload_service.py b/backend/service/upload_service.py
@@ -206,7 +206,7 @@ async def process_cert_files(
         raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Error processing certificate files: {e}")
-        raise HTTPException(status_code=500, detail="Internal server error")
+        raise HTTPException(status_code=500, detail="Upload failed")
 
 
 async def process_dataset_files(task_id: str, files: List[UploadFile]):
@@ -275,7 +275,7 @@ async def process_dataset_files(task_id: str, files: List[UploadFile]):
         raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Error processing dataset files: {e}")
-        raise HTTPException(status_code=500, detail="Internal server error")
+        raise HTTPException(status_code=500, detail="Upload failed")
 
 
 async def upload_file_svc(
diff --git a/docker-compose.dev.yml b/docker-compose.dev.yml
@@ -64,7 +64,7 @@ services:
       ENABLE_MULTIPROCESS: auto
       LOCUST_CPU_CORES: 4.0
       MULTIPROCESS_THRESHOLD: 1000           # Enable multiprocess only for 1000+ users
-      MIN_USERS_PER_PROCESS: 600             # Each process handles at least 600 users
+      MIN_USERS_PER_PROCESS: 500             # Each process handles at least 500 users
       # Process management and stability
       PYTHONUNBUFFERED: 1                    # Ensure immediate log output
       LOCUST_WORKER_HEARTBEAT_INTERVAL: 3    # Worker heartbeat interval (seconds)
diff --git a/docker-compose.yml b/docker-compose.yml
@@ -58,7 +58,7 @@ services:
       ENABLE_MULTIPROCESS: auto
       LOCUST_CPU_CORES: 2.0
       MULTIPROCESS_THRESHOLD: 1000           # Enable multiprocess only for 1000+ users
-      MIN_USERS_PER_PROCESS: 600             # Each process handles at least 600 users
+      MIN_USERS_PER_PROCESS: 500             # Each process handles at least 500 users
       # Process management and stability
       PYTHONUNBUFFERED: 1                    # Ensure immediate log output
       LOCUST_WORKER_HEARTBEAT_INTERVAL: 3    # Worker heartbeat interval (seconds)
diff --git a/frontend/public/locales/en/translation.json b/frontend/public/locales/en/translation.json
@@ -409,14 +409,22 @@
       "promptFieldPathTooltip": "The key in your request payload that contains the user prompt (needed for performance metrics calculation)",
       "streamingResponseConfiguration": "Streaming Response Configuration",
       "streamLinePrefix": "Stream Line Prefix",
-      "streamLinePrefixTooltip": "Text that appears at the beginning of each streaming data line (e.g., \"data:\", \"event:\")",
+      "streamLinePrefixTooltip": "Text that appears at the beginning of each data line (e.g., \"data:\", \"event:\")",
       "dataFormatTooltip": "Format of the streaming data after removing the prefix",
       "jsonFormat": "JSON Format",
       "plainText": "Plain Text",
       "contentFieldPath": "Content Field Path",
       "contentFieldPathTooltip": "Dot-notation path to the main content in each JSON chunk (e.g., choices.0.delta.content)",
       "reasoningFieldPath": "Reasoning Field Path",
       "reasoningFieldPathTooltip": "Dot-notation path to reasoning content in JSON (optional, for models that support reasoning)",
+      "usageFieldPath": "Token Usage Field",
+      "usageFieldPathTooltip": "Field path for token usage statistics (used for token throughput calculation; if left empty or set incorrectly, the built-in tokenizer is used to estimate token counts)",
+      "promptTokensFieldPath": "Prompt Tokens Field Path",
+      "promptTokensFieldPathTooltip": "Dot-notation path to prompt tokens count field (e.g., usage.prompt_tokens)",
+      "completionTokensFieldPath": "Completion Tokens Field Path",
+      "completionTokensFieldPathTooltip": "Dot-notation path to completion tokens count field (e.g., usage.completion_tokens)",
+      "totalTokensFieldPath": "Total Tokens Field Path",
+      "totalTokensFieldPathTooltip": "Dot-notation path to total tokens count field (e.g., usage.total_tokens)",
       "streamTerminationConfiguration": "Stream Termination Configuration",
       "endLinePrefix": "End Line Prefix",
       "endLinePrefixTooltip": "Prefix for lines that contain stream termination signals (usually same as stream prefix)",
@@ -427,7 +435,7 @@
       "nonStreamingResponseConfiguration": "Non-Streaming Response Configuration",
       "nonStreamingContentFieldPathTooltip": "Dot-notation path to the main content in the response JSON (e.g., choices.0.message.content)",
       "nonStreamingReasoningFieldPathTooltip": "Dot-notation path to reasoning content (optional, for models with reasoning capabilities)",
-      "fieldMappingDescription": "Configure field mappings for both prompt field and response data extraction. This mapping is essential for updating request payloads with test data and parsing streaming/non-streaming responses correctly.",
+      "fieldMappingDescription": "⚠️ Please accurately configure the mappings for the prompt field and the response data fields. These mappings directly affect the accuracy of dataset replacement, load test execution, and performance metrics (such as response latency and token throughput). If the response does not contain the usage field, the built-in tokenizer will be used to estimate the token count.",
       "testIt": "Test It",
       "nextStep": "Next Step",
       "previousStep": "Previous",
diff --git a/frontend/public/locales/zh/translation.json b/frontend/public/locales/zh/translation.json
@@ -174,9 +174,9 @@
       "apiKeyDescription": "用于身份验证的API密钥",
       "aiConfigDescription": "配置AI服务请求信息，用于对性能结果进行AI分析。",
       "pleaseEnterHostUrl": "请输入AI服务主机URL",
-      "enterBaseUrlDescription": "输入AI服务的基础URL（例如，https://api.openai.com）",
+      "enterBaseUrlDescription": "输入AI服务的基础URL，如：https://api.openai.com",
       "pleaseEnterModelName": "请输入AI模型名称",
-      "enterModelDescription": "输入用于分析的模型名称（例如，gpt-3.5-turbo，gpt-4）",
+      "enterModelDescription": "输入用于分析的模型名称，如：gpt-4o",
       "pleaseEnterApiKey": "请输入API密钥",
       "enterApiKeyDescription": "输入用于身份验证的API密钥",
       "enterApiKeyWithoutBearer": "输入API密钥（不包含Bearer前缀）"
@@ -408,26 +408,34 @@
       "promptFieldPath": "提示词字段路径",
       "promptFieldPathTooltip": "请求参数中包含用户提示词的键（性能指标计算需要）",
       "streamingResponseConfiguration": "流式响应配置",
-      "streamLinePrefix": "流前缀",
-      "streamLinePrefixTooltip": "出现在每个流数据行开头的文本（例如，data:、event:）",
-      "dataFormatTooltip": "移除前缀后流数据的格式",
+      "streamLinePrefix": "数据行流前缀",
+      "streamLinePrefixTooltip": "出现在每个数据行开头的文本，如：data:、event:",
+      "dataFormatTooltip": "移除前缀后的数据格式",
       "jsonFormat": "JSON格式",
       "plainText": "纯文本",
       "contentFieldPath": "content字段路径",
-      "contentFieldPathTooltip": "content字段路径,使用点分割（例如，choices.0.delta.content）",
+      "contentFieldPathTooltip": "content字段路径,使用点分割，如：choices.0.delta.content",
       "reasoningFieldPath": "reasoning_content字段路径",
-      "reasoningFieldPathTooltip": "reasoning_content字段路径,使用点分割（可选，适用于深度思考模型）",
+      "reasoningFieldPathTooltip": "reasoning_content字段路径,使用点分割，如：choices.0.delta.reasoning_content",
+      "usageFieldPath": "Token使用统计字段",
+      "usageFieldPathTooltip": "Token使用统计信息的字段路径（用于token吞吐计算，若未填写或者填写错误则按照内置tokenizer估算）",
+      "promptTokensFieldPath": "prompt_tokens字段路径",
+      "promptTokensFieldPathTooltip": "prompt_tokens字段路径，使用点分割，如：usage.prompt_tokens",
+      "completionTokensFieldPath": "completion_tokens字段路径",
+      "completionTokensFieldPathTooltip": "completion_tokens字段路径，使用点分割，如：usage.completion_tokens",
+      "totalTokensFieldPath": "total_tokens字段路径",
+      "totalTokensFieldPathTooltip": "total_tokens字段路径，使用点分割，如：usage.total_tokens",
       "streamTerminationConfiguration": "流终止配置",
       "endLinePrefix": "结束行前缀",
       "endLinePrefixTooltip": "包含流终止信号的行前缀（通常与流前缀相同）",
       "stopSignal": "停止信号",
-      "stopSignalTooltip": "流式输出结束的标志（例如，[DONE]、STOP、finished）",
+      "stopSignalTooltip": "流式输出结束的标志，如：[DONE]、STOP、finished",
       "endFieldPath": "结束字段路径",
-      "endFieldPathTooltip": "指示完成的字段的JSON路径（可选，例如choices.0.finish_reason）",
+      "endFieldPathTooltip": "指示完成的字段的JSON路径，如：choices.0.finish_reason",
       "nonStreamingResponseConfiguration": "非流式响应配置",
-      "nonStreamingContentFieldPathTooltip": "content字段路径,使用点分割（例如，choices.0.delta.content）",
-      "nonStreamingReasoningFieldPathTooltip": "reasoning_content字段路径,使用点分割（可选，适用于深度思考模型）",
-      "fieldMappingDescription": "配置提示词字段和响应数据提取的字段映射。此映射对于使用数据集更新请求参数和正确解析流式/非流式响应至关重要。",
+      "nonStreamingContentFieldPathTooltip": "content字段路径,使用点分割，如：choices.0.message.content",
+      "nonStreamingReasoningFieldPathTooltip": "reasoning_content字段路径,使用点分割，如：choices.0.message.reasoning_content",
+      "fieldMappingDescription": "⚠️ 请准确配置提示词（prompt）与响应数据字段的映射关系。该映射直接影响数据集替换、压测执行及性能指标（如 响应时延、token吞吐量）的统计准确性。若响应中未包含 usage 字段，系统将回退至内置 tokenizer 估算 token 数量。",
       "testIt": "测试",
       "nextStep": "下一步",
       "previousStep": "上一步",
@@ -479,7 +487,7 @@
       "systemHeader": "系统请求头",
       "headerNamePlaceholder": "请求头名称",
       "headerValuePlaceholder": "请求头值",
-      "cookieNamePlaceholder": "Cookie名称（例如session_token）",
+      "cookieNamePlaceholder": "Cookie名称，如：session_token",
       "cookieValuePlaceholder": "Cookie值",
       "close": "关闭"
     },
diff --git a/frontend/src/components/CreateJobForm.tsx b/frontend/src/components/CreateJobForm.tsx
@@ -89,7 +89,6 @@ const CreateJobFormContent: React.FC<CreateJobFormProps> = ({
     if (apiPath === '/chat/completions') {
       const isStreamMode = streamMode !== false; // Default to streaming if not specified
       return {
-        prompt: 'messages.0.content',
         ...(isStreamMode
           ? CHAT_COMPLETIONS_FIELD_MAPPING.STREAMING
           : CHAT_COMPLETIONS_FIELD_MAPPING.NON_STREAMING),
@@ -98,11 +97,13 @@ const CreateJobFormContent: React.FC<CreateJobFormProps> = ({
     // For non-chat/completions APIs, return empty values (only show placeholders)
     return {
       prompt: '',
-      stream_prefix: '',
+      stream_prefix: 'data:',
       data_format: 'json',
       content: '',
       reasoning_content: '',
-      usage: '',
+      prompt_tokens: 'usage.prompt_tokens',
+      completion_tokens: 'usage.completion_tokens',
+      total_tokens: 'usage.total_tokens',
       end_prefix: '',
       stop_flag: '',
       end_field: '',
@@ -2159,8 +2160,79 @@ const CreateJobFormContent: React.FC<CreateJobFormProps> = ({
                         </Col>
                       </Row>
 
-                      <Row gutter={24} style={{ marginTop: 16 }}>
-                        <Col span={12}>
+                      <Row gutter={16} style={{ marginTop: 16 }}>
+                        <Col span={8}>
+                          <Form.Item
+                            name={['field_mapping', 'prompt_tokens']}
+                            label={
+                              <span>
+                                {t(
+                                  'components.createJobForm.promptTokensFieldPath'
+                                )}
+                                <Tooltip
+                                  title={t(
+                                    'components.createJobForm.promptTokensFieldPathTooltip'
+                                  )}
+                                >
+                                  <InfoCircleOutlined
+                                    style={{ marginLeft: 5 }}
+                                  />
+                                </Tooltip>
+                              </span>
+                            }
+                          >
+                            <Input placeholder='usage.prompt_tokens' />
+                          </Form.Item>
+                        </Col>
+
+                        <Col span={8}>
+                          <Form.Item
+                            name={['field_mapping', 'completion_tokens']}
+                            label={
+                              <span>
+                                {t(
+                                  'components.createJobForm.completionTokensFieldPath'
+                                )}
+                                <Tooltip
+                                  title={t(
+                                    'components.createJobForm.completionTokensFieldPathTooltip'
+                                  )}
+                                >
+                                  <InfoCircleOutlined
+                                    style={{ marginLeft: 5 }}
+                                  />
+                                </Tooltip>
+                              </span>
+                            }
+                          >
+                            <Input placeholder='usage.completion_tokens' />
+                          </Form.Item>
+                        </Col>
+                        <Col span={8}>
+                          <Form.Item
+                            name={['field_mapping', 'total_tokens']}
+                            label={
+                              <span>
+                                {t(
+                                  'components.createJobForm.totalTokensFieldPath'
+                                )}
+                                <Tooltip
+                                  title={t(
+                                    'components.createJobForm.totalTokensFieldPathTooltip'
+                                  )}
+                                >
+                                  <InfoCircleOutlined
+                                    style={{ marginLeft: 5 }}
+                                  />
+                                </Tooltip>
+                              </span>
+                            }
+                          >
+                            <Input placeholder='usage.total_tokens' />
+                          </Form.Item>
+                        </Col>
+                      </Row>
+                      {/* <Col span={12}>
                           <Form.Item
                             name={['field_mapping', 'usage']}
                             label={
@@ -2180,8 +2252,7 @@ const CreateJobFormContent: React.FC<CreateJobFormProps> = ({
                           >
                             <Input placeholder='usage' />
                           </Form.Item>
-                        </Col>
-                      </Row>
+                        </Col> */}
                     </>
                   )
                 );
@@ -2271,7 +2342,7 @@ const CreateJobFormContent: React.FC<CreateJobFormProps> = ({
                     },
                   ]}
                 >
-                  <Input placeholder='[DONE]' />
+                  <Input placeholder='stop' />
                 </Form.Item>
               </Col>
             </Row>
diff --git a/frontend/src/utils/constants.ts b/frontend/src/utils/constants.ts
@@ -27,21 +27,27 @@ export const DEFAULT_FORM_VALUES = {
 // Chat completions field mapping defaults
 export const CHAT_COMPLETIONS_FIELD_MAPPING = {
   STREAMING: {
+    prompt: 'messages.0.content',
     stream_prefix: 'data:',
     data_format: 'json',
     content: 'choices.0.delta.content',
     reasoning_content: 'choices.0.delta.reasoning_content',
-    usage: 'usage',
+    prompt_tokens: 'usage.prompt_tokens',
+    completion_tokens: 'usage.completion_tokens',
+    total_tokens: 'usage.total_tokens',
     end_prefix: 'data:',
     stop_flag: '[DONE]',
     end_field: '',
   },
   NON_STREAMING: {
+    prompt: 'messages.0.content',
     stream_prefix: '',
     data_format: 'json',
     content: 'choices.0.message.content',
     reasoning_content: 'choices.0.message.reasoning_content',
-    usage: 'usage',
+    prompt_tokens: 'usage.prompt_tokens',
+    completion_tokens: 'usage.completion_tokens',
+    total_tokens: 'usage.total_tokens',
     end_prefix: '',
     stop_flag: '',
     end_field: '',
diff --git a/st_engine/config/multiprocess.py b/st_engine/config/multiprocess.py
@@ -24,7 +24,7 @@ def __init__(self) -> None:
                 os.environ.get("MULTIPROCESS_THRESHOLD", "1000")
             )
             self.min_users_per_process = int(
-                os.environ.get("MIN_USERS_PER_PROCESS", "600")
+                os.environ.get("MIN_USERS_PER_PROCESS", "500")
             )
             self.force_single_process = (
                 os.environ.get("FORCE_SINGLE_PROCESS", "false").lower() == "true"
diff --git a/st_engine/engine/core.py b/st_engine/engine/core.py
@@ -28,7 +28,7 @@ class StreamMetrics:
     first_thinking_token_time: Optional[float] = None
     content: str = ""
     reasoning_content: str = ""
-    usage: Optional[Dict[str, Optional[int]]] = field(default=None)
+    usage: Optional[Dict[str, Optional[int]]] = field(default_factory=dict)
 
 
 @dataclass
@@ -66,7 +66,9 @@ class FieldMapping:
     content: str = ""
     reasoning_content: str = ""
     prompt: str = ""
-    usage: str = ""
+    prompt_tokens: str = ""
+    completion_tokens: str = ""
+    total_tokens: str = ""
 
 
 @dataclass
@@ -75,7 +77,7 @@ class TokenStats:
 
     reqs_count: int = 0
     completion_tokens: int = 0
-    all_tokens: int = 0
+    total_tokens: int = 0
 
 
 # === GLOBAL STATE MANAGEMENT ===
@@ -243,10 +245,16 @@ def parse_field_mapping(field_mapping_str: str) -> FieldMapping:
                 stop_flag=mapping_dict.get("stop_flag", "[DONE]"),
                 end_prefix=mapping_dict.get("end_prefix", ""),
                 end_field=mapping_dict.get("end_field", ""),
-                content=mapping_dict.get("content", ""),
-                reasoning_content=mapping_dict.get("reasoning_content", ""),
-                prompt=mapping_dict.get("prompt", ""),
-                usage=mapping_dict.get("usage", ""),
+                content=mapping_dict.get("content", "choices.0.delta.content"),
+                reasoning_content=mapping_dict.get(
+                    "reasoning_content", "choices.0.delta.reasoning_content"
+                ),
+                prompt=mapping_dict.get("prompt", "messages.0.content"),
+                prompt_tokens=mapping_dict.get("prompt_tokens", "usage.prompt_tokens"),
+                completion_tokens=mapping_dict.get(
+                    "completion_tokens", "usage.completion_tokens"
+                ),
+                total_tokens=mapping_dict.get("total_tokens", "usage.total_tokens"),
             )
         except (json.JSONDecodeError, TypeError):
             return FieldMapping()
diff --git a/st_engine/engine/locustfile.py b/st_engine/engine/locustfile.py
diff --git a/st_engine/engine/request_processor.py b/st_engine/engine/request_processor.py
diff --git a/st_engine/utils/common.py b/st_engine/utils/common.py
diff --git a/st_engine/utils/stats_manager.py b/st_engine/utils/stats_manager.py

Original file line number	Diff line number	Diff line change
`@@ -24,7 +24,7 @@ def __init__(self) -> None:`
`24`	`24`	`os.environ.get("MULTIPROCESS_THRESHOLD", "1000")`
`25`	`25`	`)`
`26`	`26`	`self.min_users_per_process = int(`
`27`		`- os.environ.get("MIN_USERS_PER_PROCESS", "600")`
	`27`	`+ os.environ.get("MIN_USERS_PER_PROCESS", "500")`
`28`	`28`	`)`
`29`	`29`	`self.force_single_process = (`
`30`	`30`	`os.environ.get("FORCE_SINGLE_PROCESS", "false").lower() == "true"`