Skip to content

Commit 591f803

Browse files
committed
merge main
Signed-off-by: dalthecow <[email protected]>
2 parents 1c58de9 + 108a657 commit 591f803

File tree

14 files changed

+67
-67
lines changed

14 files changed

+67
-67
lines changed

src/guidellm/presentation/data_models.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -210,7 +210,7 @@ def from_distribution_summary(
210210

211211
class BenchmarkDatum(BaseModel):
212212
requests_per_second: float
213-
tpot: TabularDistributionSummary
213+
itl: TabularDistributionSummary
214214
ttft: TabularDistributionSummary
215215
throughput: TabularDistributionSummary
216216
time_per_request: TabularDistributionSummary
@@ -234,7 +234,7 @@ def from_benchmark(cls, bm: "GenerativeBenchmark"):
234234
return cls(
235235
strategy_display_str=cls.get_strategy_display_str(bm.args.strategy),
236236
requests_per_second=rps,
237-
tpot=TabularDistributionSummary.from_distribution_summary(
237+
itl=TabularDistributionSummary.from_distribution_summary(
238238
bm.metrics.inter_token_latency_ms.successful
239239
),
240240
ttft=TabularDistributionSummary.from_distribution_summary(

src/ui/lib/components/MetricsSummary/MetricsSummary.component.tsx

Lines changed: 15 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -54,15 +54,15 @@ export const Component = () => {
5454

5555
const {
5656
ttft: ttftSLO,
57-
tpot: tpotSLO,
57+
itl: itlSLO,
5858
timePerRequest: timePerRequestSLO,
5959
throughput: throughputSLO,
6060
percentile,
6161
minX,
6262
maxX,
6363
errors,
6464
handleTtft,
65-
handleTpot,
65+
handleItl,
6666
handleTimePerRequest,
6767
handleThroughput,
6868
handlePercentileChange,
@@ -72,8 +72,8 @@ export const Component = () => {
7272
const isTtftMatch = Boolean(
7373
ttftSLO && interpolatedMetricData.ttft.enforcedPercentileValue <= ttftSLO
7474
);
75-
const isTpotMatch = Boolean(
76-
tpotSLO && interpolatedMetricData.tpot.enforcedPercentileValue <= tpotSLO
75+
const isItlMatch = Boolean(
76+
itlSLO && interpolatedMetricData.itl.enforcedPercentileValue <= itlSLO
7777
);
7878
const isTprMatch = Boolean(
7979
timePerRequestSLO &&
@@ -123,7 +123,7 @@ export const Component = () => {
123123
<FieldsContainer data-id="fields-container">
124124
<FieldCell data-id="field-cell-1">
125125
<Input
126-
label="TTFT (ms)"
126+
label="TIME TO FIRST TOKEN (ms)"
127127
value={ttftSLO}
128128
onChange={handleTtft}
129129
fullWidth
@@ -133,12 +133,12 @@ export const Component = () => {
133133
</FieldCell>
134134
<FieldCell data-id="field-cell-2">
135135
<Input
136-
label="TPOT (ms)"
137-
value={tpotSLO}
138-
onChange={handleTpot}
136+
label="INTER-TOKEN LATENCY (ms)"
137+
value={itlSLO}
138+
onChange={handleItl}
139139
fullWidth
140140
fontColor={LineColor.Secondary}
141-
error={errors?.tpot}
141+
error={errors?.itl}
142142
/>
143143
</FieldCell>
144144
<FieldCell data-id="field-cell-3">
@@ -212,7 +212,7 @@ export const Component = () => {
212212
</MiddleColumn>
213213
<MiddleColumn item xs={3}>
214214
<MetricValue
215-
label="TTFT"
215+
label="time to first token"
216216
value={`${formatNumber(interpolatedMetricData.ttft.enforcedPercentileValue)} ms`}
217217
match={isTtftMatch}
218218
valueColor={LineColor.Primary}
@@ -222,17 +222,17 @@ export const Component = () => {
222222
<MiddleColumn sx={{ paddingLeft: '0px !important' }} item xs={9}>
223223
<GraphContainer>
224224
<MetricLine
225-
data={[{ id: 'tpot', data: lineDataByRps.tpot || [] }]}
226-
threshold={tpotSLO}
225+
data={[{ id: 'itl', data: lineDataByRps.itl || [] }]}
226+
threshold={itlSLO}
227227
lineColor={LineColor.Secondary}
228228
/>
229229
</GraphContainer>
230230
</MiddleColumn>
231231
<MiddleColumn item xs={3}>
232232
<MetricValue
233-
label="TPOT"
234-
value={`${formatNumber(interpolatedMetricData.tpot.enforcedPercentileValue)} ms`}
235-
match={isTpotMatch}
233+
label="inter-token latency"
234+
value={`${formatNumber(interpolatedMetricData.itl.enforcedPercentileValue)} ms`}
235+
match={isItlMatch}
236236
valueColor={LineColor.Secondary}
237237
/>
238238
</MiddleColumn>

src/ui/lib/components/MetricsSummary/useSummary.ts

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ type Errors = { [key: string]: string | undefined };
1313

1414
const initErrorsState: Errors = {
1515
ttft: undefined,
16-
tpot: undefined,
16+
itl: undefined,
1717
timePerRequest: undefined,
1818
throughput: undefined,
1919
};
@@ -47,20 +47,20 @@ export const useSummary = () => {
4747
const dispatch = useDispatch();
4848

4949
const { current, enforcedPercentile, tasksDefaults } = useSelector(selectSloState);
50-
const { ttft, tpot, timePerRequest, throughput } = useSelector(
50+
const { ttft, itl, timePerRequest, throughput } = useSelector(
5151
selectMetricsSummaryLineData
5252
);
5353

5454
const [errors, setErrors] = useState<Errors>(initErrorsState);
5555

5656
const ttftLimits = findMinMax(ttft || []);
57-
const tpotLimits = findMinMax(tpot || []);
57+
const itlLimits = findMinMax(itl || []);
5858
const timePerRequestLimits = findMinMax(timePerRequest || []);
5959
const throughputLimits = findMinMax(throughput || []);
6060

6161
const limitsByMetric = {
6262
ttft: ttftLimits,
63-
tpot: tpotLimits,
63+
itl: itlLimits,
6464
timePerRequest: timePerRequestLimits,
6565
throughput: throughputLimits,
6666
};
@@ -112,7 +112,7 @@ export const useSummary = () => {
112112
maxX: ttftLimits.maxX,
113113
errors,
114114
handleTtft: handleChange('ttft'),
115-
handleTpot: handleChange('tpot'),
115+
handleItl: handleChange('itl'),
116116
handleTimePerRequest: handleChange('timePerRequest'),
117117
handleThroughput: handleChange('throughput'),
118118
handlePercentileChange,

src/ui/lib/components/WorkloadMetrics/WorkloadMetrics.component.tsx

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -36,14 +36,14 @@ export const leftColumn3 = (rpsValue: number, value: number, units: string) => (
3636

3737
export const Component = () => {
3838
const { data } = useGetBenchmarksQuery();
39-
const { ttft, tpot, timePerRequest, throughput } = useSelector(
39+
const { ttft, itl, timePerRequest, throughput } = useSelector(
4040
selectMetricsDetailsLineData
4141
);
4242
const { currentRequestRate } = useSelector(selectSloState);
4343
const formattedRequestRate = formatNumber(currentRequestRate);
4444
const {
4545
ttft: ttftAtRPS,
46-
tpot: tpotAtRPS,
46+
itl: itlAtRPS,
4747
timePerRequest: timePerRequestAtRPS,
4848
throughput: throughputAtRPS,
4949
} = useSelector(selectInterpolatedMetrics);
@@ -57,49 +57,49 @@ export const Component = () => {
5757
<BlockHeader label="Metrics Details" />
5858
<Box display="flex" flexDirection="row" gap={3} mt={3}>
5959
<MetricsContainer
60-
header="TTFT"
60+
header="TIME TO FIRST TOKEN"
6161
leftColumn={leftColumn(
6262
formattedRequestRate,
6363
formatNumber(ttftAtRPS.mean),
6464
'ms'
6565
)}
6666
rightColumn={columnContent(formattedRequestRate, ttftAtRPS.percentiles, 'ms')}
6767
>
68-
<GraphTitle title="TTFS vs RPS" />
68+
<GraphTitle title="Time to First Token vs RPS" />
6969
<GraphsWrapper>
7070
<DashedLine
7171
data={ttft}
7272
margins={{ left: 50, bottom: 50 }}
7373
xLegend="request per sec"
74-
yLegend="ttft (ms)"
74+
yLegend="time to first token (ms)"
7575
minX={minX}
7676
/>
7777
</GraphsWrapper>
7878
</MetricsContainer>
7979
<MetricsContainer
80-
header="TPOT"
80+
header="INTER-TOKEN LATENCY"
8181
leftColumn={leftColumn3(
8282
formattedRequestRate,
83-
formatNumber(tpotAtRPS.mean),
83+
formatNumber(itlAtRPS.mean),
8484
'ms'
8585
)}
86-
rightColumn={columnContent(formattedRequestRate, tpotAtRPS.percentiles, 'ms')}
86+
rightColumn={columnContent(formattedRequestRate, itlAtRPS.percentiles, 'ms')}
8787
>
88-
<GraphTitle title="TPOT vs RPS" />
88+
<GraphTitle title="Inter-token Latency vs RPS" />
8989
<GraphsWrapper>
9090
<DashedLine
91-
data={tpot}
91+
data={itl}
9292
margins={{ left: 50, bottom: 50 }}
9393
xLegend="request per sec"
94-
yLegend="tpot (ms)"
94+
yLegend="inter-token latency (ms)"
9595
minX={minX}
9696
/>
9797
</GraphsWrapper>
9898
</MetricsContainer>
9999
</Box>
100100
<Box display="flex" flexDirection="row" gap={3} mt={3}>
101101
<MetricsContainer
102-
header="E2E Latency"
102+
header="Time Per Request"
103103
leftColumn={leftColumn(
104104
formattedRequestRate,
105105
formatNumber(timePerRequestAtRPS.mean),
@@ -111,13 +111,13 @@ export const Component = () => {
111111
's'
112112
)}
113113
>
114-
<GraphTitle title="E2E Latency vs RPS" />
114+
<GraphTitle title="Time Per Request vs RPS" />
115115
<GraphsWrapper>
116116
<DashedLine
117117
data={timePerRequest}
118118
margins={{ left: 50, bottom: 50 }}
119119
xLegend="request per sec"
120-
yLegend="latency (s)"
120+
yLegend="time per request (s)"
121121
minX={minX}
122122
/>
123123
</GraphsWrapper>

src/ui/lib/store/benchmarksWindowData.ts

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ export const benchmarksScript = `window.benchmarks = [
22
{
33
strategyDisplayStr: "synchronous",
44
requestsPerSecond: 11.411616848282272,
5-
tpot: {
5+
itl: {
66
mean: 8.758024845683707,
77
median: 8.788176945277623,
88
mode: 7.119315011160714,
@@ -174,7 +174,7 @@ export const benchmarksScript = `window.benchmarks = [
174174
{
175175
strategyDisplayStr: "[email protected]",
176176
requestsPerSecond: 36.289181300710815,
177-
tpot: {
177+
itl: {
178178
mean: 588.0161376137819,
179179
median: 461.7137227739607,
180180
mode: 323.1611592429025,
@@ -346,7 +346,7 @@ export const benchmarksScript = `window.benchmarks = [
346346
{
347347
strategyDisplayStr: "[email protected]",
348348
requestsPerSecond: 20.752070927855794,
349-
tpot: {
349+
itl: {
350350
mean: 116.28360712595156,
351351
median: 26.769569941929408,
352352
mode: 10.624987738473076,
@@ -518,7 +518,7 @@ export const benchmarksScript = `window.benchmarks = [
518518
{
519519
strategyDisplayStr: "[email protected]",
520520
requestsPerSecond: 26.81917480361788,
521-
tpot: {
521+
itl: {
522522
mean: 299.7306064613554,
523523
median: 372.7384294782366,
524524
mode: 13.360295976911273,
@@ -690,7 +690,7 @@ export const benchmarksScript = `window.benchmarks = [
690690
{
691691
strategyDisplayStr: "[email protected]",
692692
requestsPerSecond: 26.823988819498975,
693-
tpot: {
693+
itl: {
694694
mean: 683.8011571339198,
695695
median: 742.2689029148647,
696696
mode: 317.1694278717041,
@@ -862,7 +862,7 @@ export const benchmarksScript = `window.benchmarks = [
862862
{
863863
strategyDisplayStr: "[email protected]",
864864
requestsPerSecond: 24.50047903792646,
865-
tpot: {
865+
itl: {
866866
mean: 742.9258901891964,
867867
median: 773.0941431862967,
868868
mode: 538.750410079956,
@@ -1034,7 +1034,7 @@ export const benchmarksScript = `window.benchmarks = [
10341034
{
10351035
strategyDisplayStr: "[email protected]",
10361036
requestsPerSecond: 25.617829792196602,
1037-
tpot: {
1037+
itl: {
10381038
mean: 663.3098317044122,
10391039
median: 613.7458937508719,
10401040
mode: 440.9824098859514,
@@ -1206,7 +1206,7 @@ export const benchmarksScript = `window.benchmarks = [
12061206
{
12071207
strategyDisplayStr: "[email protected]",
12081208
requestsPerSecond: 37.02892550982192,
1209-
tpot: {
1209+
itl: {
12101210
mean: 606.4144710877113,
12111211
median: 543.5235500335693,
12121212
mode: 331.6155501774379,
@@ -1378,7 +1378,7 @@ export const benchmarksScript = `window.benchmarks = [
13781378
{
13791379
strategyDisplayStr: "[email protected]",
13801380
requestsPerSecond: 37.29183354201869,
1381-
tpot: {
1381+
itl: {
13821382
mean: 603.3237551205925,
13831383
median: 528.1183038439069,
13841384
mode: 400.96027510506764,
@@ -1550,7 +1550,7 @@ export const benchmarksScript = `window.benchmarks = [
15501550
{
15511551
strategyDisplayStr: "throughput",
15521552
requestsPerSecond: 37.45318312972309,
1553-
tpot: {
1553+
itl: {
15541554
mean: 600.7204526769262,
15551555
median: 626.2100083487375,
15561556
mode: 398.7384523664202,

src/ui/lib/store/mockData.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -95,7 +95,7 @@ export const benchmarks = [
9595
],
9696
bucketWidth: 0,
9797
},
98-
tpot: {
98+
itl: {
9999
statistics: {
100100
total: 0,
101101
mean: 0,

src/ui/lib/store/slices/benchmarks/benchmarks.api.ts

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -45,9 +45,9 @@ const setDefaultSLOs = (
4545
lastBM?.ttft,
4646
defaultPercentile
4747
);
48-
const tpotAvg = getAverageValueForPercentile(
49-
firstBM?.tpot,
50-
lastBM?.tpot,
48+
const itlAvg = getAverageValueForPercentile(
49+
firstBM?.itl,
50+
lastBM?.itl,
5151
defaultPercentile
5252
);
5353
const timePerRequestAvg = getAverageValueForPercentile(
@@ -66,13 +66,13 @@ const setDefaultSLOs = (
6666
currentRequestRate: firstBM?.requestsPerSecond,
6767
current: {
6868
ttft: formatNumber(ttftAvg, 0),
69-
tpot: formatNumber(tpotAvg, 0),
69+
itl: formatNumber(itlAvg, 0),
7070
timePerRequest: formatNumber(timePerRequestAvg, 0),
7171
throughput: formatNumber(throughputAvg, 0),
7272
},
7373
tasksDefaults: {
7474
ttft: formatNumber(ttftAvg, 0),
75-
tpot: formatNumber(tpotAvg, 0),
75+
itl: formatNumber(itlAvg, 0),
7676
timePerRequest: formatNumber(timePerRequestAvg, 0),
7777
throughput: formatNumber(throughputAvg, 0),
7878
},

src/ui/lib/store/slices/benchmarks/benchmarks.interfaces.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ interface Percentile {
2020

2121
export interface BenchmarkMetrics {
2222
ttft: Statistics;
23-
tpot: Statistics;
23+
itl: Statistics;
2424
timePerRequest: Statistics;
2525
throughput: Statistics;
2626
}

0 commit comments

Comments
 (0)