@@ -701,25 +701,23 @@ func (s *VllmSimulator) getTimeToFirstToken(nPromptTokens int, nCachedPromptToke
701701		if  s .config .KVCacheTransferLatency  ==  0  &&  s .config .KVCacheTransferLatencyStdDev  ==  0  {
702702			// is disaggregated PD and ttft is calculated using number of prompt tokens 
703703			kvCacheTransT  :=  s .config .KVCacheTransferTimePerToken  *  nPromptTokens 
704- 			return  int ( common .RandomNorm (float64 ( kvCacheTransT ),  float64 ( s .config .KVCacheTransferTimeStdDev )) )
704+ 			return  common .RandomNorm (kvCacheTransT ,  s .config .KVCacheTransferTimeStdDev )
705705		}
706706		// is disaggregated PD and *not* using number of prompt tokens 
707- 		return  int ( common .RandomNorm (float64 ( s .config .KVCacheTransferLatency ),  float64 ( s .config .KVCacheTransferLatencyStdDev )) )
707+ 		return  common .RandomNorm (s .config .KVCacheTransferLatency ,  s .config .KVCacheTransferLatencyStdDev )
708708	}
709709	if  s .config .TimeToFirstToken  ==  0  &&  s .config .TimeToFirstTokenStdDev  ==  0  {
710710		// is aggregated PD and ttft is calculated using number of prompt tokens that are not in kv cache 
711711		prefillTime  :=  s .config .PrefillOverhead  +  (nPromptTokens - nCachedPromptTokens )* s .config .PrefillTimePerToken 
712- 		return  int ( common .RandomNorm (float64 ( prefillTime ),  float64 ( s .config .PrefillTimeStdDev )) )
712+ 		return  common .RandomNorm (prefillTime ,  s .config .PrefillTimeStdDev )
713713	}
714714	// is aggregated PD and *not* using number of prompt tokens 
715- 	return  int ( common .RandomNorm (float64 ( s .config .TimeToFirstToken ),  float64 ( s .config .TimeToFirstTokenStdDev )) )
715+ 	return  common .RandomNorm (s .config .TimeToFirstToken ,  s .config .TimeToFirstTokenStdDev )
716716}
717717
718718// returns inter token latency 
719719func  (s  * VllmSimulator ) getInterTokenLatency () int  {
720- 	mean  :=  float64 (s .config .InterTokenLatency )
721- 	stddev  :=  float64 (s .config .InterTokenLatencyStdDev )
722- 	return  int (common .RandomNorm (mean , stddev ))
720+ 	return  common .RandomNorm (s .config .InterTokenLatency , s .config .InterTokenLatencyStdDev )
723721}
724722
725723// returns total inter token latency for the given number of tokens 
0 commit comments