Skip to content

Commit 68662a9

Browse files
songguocola authored and kevinlin09 committed
feat(model/qwen3-tts-realtime): add sample_rate/volume/speech_rate/format/bit_rate param
1 parent df607b8 commit 68662a9

File tree

2 files changed

+33
-1
lines changed

2 files changed

+33
-1
lines changed

dashscope/audio/qwen_tts_realtime/qwen_tts_realtime.py

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -158,6 +158,12 @@ def update_session(self,
158158
response_format: AudioFormat = AudioFormat.
159159
PCM_24000HZ_MONO_16BIT,
160160
mode: str = 'server_commit',
161+
sample_rate: int = None,
162+
volume: int = None,
163+
speech_rate: float = None,
164+
audio_format: str = None,
165+
pitch_rate: float = None,
166+
bit_rate: int = None,
161167
language_type: str = None,
162168
**kwargs) -> None:
163169
'''
@@ -173,13 +179,38 @@ def update_session(self,
173179
response mode, server_commit or commit
174180
language_type: str
175181
language type for synthesized audio, default is 'auto'
182+
sample_rate: int
183+
sampleRate for tts, range [8000,16000,22050,24000,44100,48000] default is 24000
184+
volume: int
185+
volume for tts, range [0,100] default is 50
186+
speech_rate: float
187+
speech_rate for tts, range [0.5~2.0] default is 1.0
188+
audio_format: str
189+
format for tts, support mp3,wav,pcm,opus, default is 'pcm'
190+
pitch_rate: float
191+
pitch_rate for tts, range [0.5~2.0] default is 1.0
192+
bit_rate: int
193+
bit_rate for tts, support 6~510,default is 128kbps. only work on format: opus/mp3
176194
'''
177195
self.config = {
178196
'voice': voice,
179197
'mode': mode,
180198
'response_format': response_format.format,
181199
'sample_rate': response_format.sample_rate,
182200
}
201+
if sample_rate is not None: # 如果配置,则更新
202+
self.config['sample_rate'] = sample_rate
203+
if volume is not None:
204+
self.config['volume'] = volume
205+
if speech_rate is not None:
206+
self.config['speech_rate'] = speech_rate
207+
if audio_format is not None:
208+
self.config['response_format'] = audio_format # 如果配置,则更新
209+
if pitch_rate is not None:
210+
self.config['pitch_rate'] = pitch_rate
211+
if bit_rate is not None:
212+
self.config['bit_rate'] = bit_rate
213+
183214
if language_type is not None:
184215
self.config['language_type'] = language_type
185216
self.config.update(kwargs)

dashscope/multimodal/multimodal_request_params.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -217,7 +217,8 @@ class ClientInfo:
217217

218218
def to_dict(self):
219219
info = {
220-
"user_id": self.user_id
220+
"user_id": self.user_id,
221+
"sdk": "python"
221222
}
222223
if self.device is not None:
223224
info["device"] = self.device.to_dict()

0 commit comments

Comments
 (0)