You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: pkg/llm-d-inference-sim/simulator_test.go
+32-1Lines changed: 32 additions & 1 deletion
Original file line number
Diff line number
Diff line change
@@ -981,7 +981,7 @@ var _ = Describe("Simulator", func() {
981
981
forlen(simulator.runReqChan) >0 {
982
982
<-simulator.runReqChan
983
983
}
984
-
fori:=0; i<maxNumOfReq; i++ {
984
+
forrangemaxNumOfReq {
985
985
simulator.runReqChan<-1
986
986
}
987
987
@@ -1000,5 +1000,36 @@ var _ = Describe("Simulator", func() {
1000
1000
Entry("factor: 20000.0", 20000.0, 310),
1001
1001
)
1002
1002
1003
+
DescribeTable("when time-factor-under-load is > 1, and the sim is partially loaded, the time to first token should be linear interpolation between time-to-first-token and time-factor-under-load * time-to-first-token",
0 commit comments