@@ -91,7 +91,6 @@ class JSUTProcessor(BaseProcessor):
9191 """JSUT processor."""
9292 cleaner_names : str = None
9393 speaker_name : str = "jsut"
94- target_rate : int = 24000
9594 train_f_name : str = "text_kana/basic5000.yaml"
9695
9796 def create_items (self ):
@@ -105,8 +104,6 @@ def create_items(self):
105104 for k , v in data_json .items ():
106105 utt_id = k
107106 phones = v ['phone_level3' ]
108- # phones = phones.replace("I", "i")
109- # phones = phones.replace("U", "u")
110107 phones = phones .split ("-" )
111108 phones = [_sil ] + phones + [_sil ]
112109 wav_path = os .path .join (self .data_dir , "wav" , f"{ utt_id } .wav" )
@@ -129,9 +126,9 @@ def get_one_sample(self, item):
129126 audio , rate = sf .read (wav_path )
130127 audio = audio .astype (np .float32 )
131128
132- if rate != self .target_rate :
133- assert rate > self .target_rate
134- audio = librosa .resample (audio , rate , self .target_rate )
129+ # if rate != self.target_rate:
130+ # assert rate > self.target_rate
131+ # audio = librosa.resample(audio, rate, self.target_rate)
135132
136133 # convert text to ids
137134 text_ids = np .asarray (self .text_to_sequence (text ), np .int32 )
0 commit comments