Skip to content

Commit 1bf5b04

Browse files
committed
update app.py
1 parent d4c2ff0 commit 1bf5b04

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

vllm/demo/gradio_demo/app.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -88,7 +88,7 @@ def chat_with_model_streaming(user_input, history):
88 88
first_token_latency = first_token_time - start_time if first_token_time is not None else 0
89 89
elapsed_time = time.time() - first_token_time
90 90
tps = token_count / elapsed_time if elapsed_time > 0 else 0 # ✅ 计算 Tokens Per Second
91-
speed_text = f"⏳ 首字延迟: {first_token_latency:.2f} | ⏱️ 耗时: {elapsed_time:.2f} 秒 | 🔢 Tokens: {token_count} | ⚡ 速度: {tps:.2f} TPS" # ⏳
91+
speed_text = f"⏳ 首字延迟: {first_token_latency:.2f} | ⏱️ 耗时: {elapsed_time:.2f} 秒 | 🔢 Tokens: {token_count} | ⚡ 速度: {tps:.2f} TPS" # ⏳
92 92
yield history + [(user_input, bot_response)], "", speed_text # ✅ 返回推理速度
93 93

94 94
except Exception as e:

0 commit comments

Comments
 (0)