We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a6dae30, commit 1b7b097 (Copy full SHA for 1b7b097)
tools/mock-vllm/app.py
@@ -2,6 +2,7 @@
2
import time
3
from typing import List, Optional
4
5
+import uvicorn
6
from fastapi import FastAPI
7
from pydantic import BaseModel
8
@@ -79,3 +80,7 @@ def estimate_tokens(text: str) -> int:
79
80
# Some SDKs look for token_usage; keep it as an alias for convenience.
81
"token_usage": usage,
82
}
83
+
84
85
+if __name__ == "__main__":
86
+ uvicorn.run(app, host="0.0.0.0", port=8000)
0 commit comments