File tree Expand file tree Collapse file tree 1 file changed +6
-1
lines changed Expand file tree Collapse file tree 1 file changed +6
-1
lines changed Original file line number Diff line number Diff line change @@ -3583,6 +3583,11 @@ export class WhisperTokenizer extends PreTrainedTokenizer {
3583
3583
let chunk = new_chunk ( ) ;
3584
3584
let time_offset = 0.0 ;
3585
3585
const timestamp_begin = this . timestamp_begin ;
3586
+ // Whisper timestamp tokens start from 0.00 and go to timestamp 30.00 in 0.02 increments.
3587
+ // We can calculate the last timestamp token as timestamp_begin plus the number of
3588
+ // 0.02 increments between 0.00 and 30.00, which is 1500.
3589
+ const total_timestamp_tokens = 1500 ; // (30.00 - 0.00) / 0.02
3590
+ const timestamp_end = timestamp_begin + total_timestamp_tokens ;
3586
3591
3587
3592
let previous_tokens = [ ] ;
3588
3593
let previous_token_timestamps = [ ] ;
@@ -3670,7 +3675,7 @@ export class WhisperTokenizer extends PreTrainedTokenizer {
3670
3675
} else {
3671
3676
// 2/ This is a regular special token, ignoring it
3672
3677
}
3673
- } else if ( token >= timestamp_begin ) {
3678
+ } else if ( token >= timestamp_begin && token <= timestamp_end ) {
3674
3679
// 3/ Timestamp token
3675
3680
const time = ( token - timestamp_begin ) * time_precision + time_offset ;
3676
3681
const rounded_time = round ( time , 2 ) ;
You can’t perform that action at this time.
0 commit comments