Skip to content

Commit 16f4b2e

Browse files
authored
Fix inter token latency test (#274)
Signed-off-by: irar2 <[email protected]>
1 parent 47e69db commit 16f4b2e

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

pkg/llm-d-inference-sim/latencies_test.go

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -75,8 +75,8 @@ var _ = Describe("Check random latencies", Ordered, func() {
75 75
latency += simulator.getInterTokenLatency()
76 76
}
77 77

78-
Expect(latency).To(BeNumerically(">=", int(float32(interTokenLatency)*0.3*float32(numberOfTokens))))
79-
Expect(latency).To(BeNumerically("<=", int(float32(interTokenLatency)*1.7*float32(numberOfTokens))))
78+
Expect(latency).To(BeNumerically(">=", int(float32(interTokenLatency)*0.3*float32(numberOfTokens-1))))
79+
Expect(latency).To(BeNumerically("<=", int(float32(interTokenLatency)*1.7*float32(numberOfTokens-1))))
80 80
},
81 81
func(interTokenLatency int, stddev int, numberOfTokens int) string {
82 82
return fmt.Sprintf("interTokenLatency: %d stddev: %d, numberOfTokens: %d", interTokenLatency,

0 commit comments

Comments
 (0)