Skip to content

Commit 1baeb9e

Browse files
committed
Resolve conflicts and fix test case
Signed-off-by: Qifan Deng <[email protected]>
1 parent 789a4f2 commit 1baeb9e

File tree

2 files changed

+1
-65
lines changed

2 files changed

+1
-65
lines changed

pkg/dataset/custom_dataset_test.go

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -193,9 +193,8 @@ var _ = Describe("CustomDataset", Ordered, func() {
193193
Prompt: testPrompt,
194194
MaxTokens: &n,
195195
}
196-
tokens, finishReason, err := dataset.GetTokens(req, common.ModeRandom)
196+
tokens, _, err := dataset.GetTokens(req, common.ModeRandom)
197197
Expect(err).NotTo(HaveOccurred())
198-
Expect(finishReason).To(Equal(LengthFinishReason))
199198
Expect(len(tokens)).To(BeNumerically("<=", 2))
200199
})
201200
})

pkg/llm-d-inference-sim/simulator.go

Lines changed: 0 additions & 63 deletions
Original file line number | Diff line number | Diff line change
@@ -259,69 +259,6 @@ func (s *VllmSimulator) initDataset() error {
259259
return nil
260260
}
261261

262-
func (s *VllmSimulator) newListener() (net.Listener, error) {
263-
s.logger.Info("Server starting", "port", s.config.Port)
264-
listener, err := net.Listen("tcp4", fmt.Sprintf(":%d", s.config.Port))
265-
if err != nil {
266-
return nil, err
267-
}
268-
return listener, nil
269-
}
270-
271-
// startServer starts http server on port defined in command line
272-
func (s *VllmSimulator) startServer(ctx context.Context, listener net.Listener) error {
273-
r := fasthttprouter.New()
274-
275-
// support completion APIs
276-
r.POST("/v1/chat/completions", s.HandleChatCompletions)
277-
r.POST("/v1/completions", s.HandleTextCompletions)
278-
// supports /models API
279-
r.GET("/v1/models", s.HandleModels)
280-
// support load/unload of lora adapter
281-
r.POST("/v1/load_lora_adapter", s.HandleLoadLora)
282-
r.POST("/v1/unload_lora_adapter", s.HandleUnloadLora)
283-
// supports /metrics prometheus API
284-
r.GET("/metrics", fasthttpadaptor.NewFastHTTPHandler(promhttp.HandlerFor(s.registry, promhttp.HandlerOpts{})))
285-
// supports standard Kubernetes health and readiness checks
286-
r.GET("/health", s.HandleHealth)
287-
r.GET("/ready", s.HandleReady)
288-
r.POST("/tokenize", s.HandleTokenize)
289-
290-
server := fasthttp.Server{
291-
ErrorHandler: s.HandleError,
292-
Handler: r.Handler,
293-
Logger: s,
294-
}
295-
296-
// Start server in a goroutine
297-
serverErr := make(chan error, 1)
298-
go func() {
299-
s.logger.Info("HTTP server starting")
300-
serverErr <- server.Serve(listener)
301-
}()
302-
303-
// Wait for either context cancellation or server error
304-
select {
305-
case <-ctx.Done():
306-
s.logger.Info("Shutdown signal received, shutting down HTTP server gracefully")
307-
308-
// Gracefully shutdown the server
309-
if err := server.Shutdown(); err != nil {
310-
s.logger.Error(err, "Error during server shutdown")
311-
return err
312-
}
313-
314-
s.logger.Info("HTTP server stopped")
315-
return nil
316-
317-
case err := <-serverErr:
318-
if err != nil {
319-
s.logger.Error(err, "HTTP server failed")
320-
}
321-
return err
322-
}
323-
}
324-
325262
// Printf prints to a log, implementation of fasthttp.Logger
326263
func (s *VllmSimulator) Printf(format string, args ...interface{}) {
327264
s.logger.Info("Server error", "msg", fmt.Sprintf(format, args...))

0 commit comments

Comments
 (0)