We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c077c78 commit 262e825 (Copy full SHA for 262e825)
tools/mock-vllm/app.py
@@ -2,6 +2,7 @@
2
import time
3
from typing import List, Optional
4
5
+import uvicorn
6
from fastapi import FastAPI
7
from pydantic import BaseModel
8
@@ -79,3 +80,7 @@ def estimate_tokens(text: str) -> int:
79
80
# Some SDKs look for token_usage; keep it as an alias for convenience.
81
"token_usage": usage,
82
}
83
+
84
85
+if __name__ == "__main__":
86
+ uvicorn.run(app, host="0.0.0.0", port=8000)
0 commit comments