We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ef9a3df commit 963ad46 Copy full SHA for 963ad46
cpp/include/tensorrt_llm/batch_manager/llmRequest.h
@@ -1828,9 +1828,10 @@ class GenericLlmRequest
1828
1829
void updatePerfMetrics(executor::IterationType iter)
1830
{
1831
+ auto const currentTokenTime = getSteadyClockNow();
1832
+
1833
if (!mPerfMetrics.firstIter)
1834
- auto const currentTokenTime = getSteadyClockNow();
1835
mPerfMetrics.firstIter = iter;
1836
mPerfMetrics.timingMetrics.firstTokenTime = currentTokenTime;
1837
}
@@ -1839,7 +1840,6 @@ class GenericLlmRequest
1839
1840
1841
if (isFinished())
1842
1843
mPerfMetrics.lastIter = iter;
1844
mPerfMetrics.timingMetrics.lastTokenTime = currentTokenTime;
1845
0 commit comments