spring-ai-alibaba
diff --git a/‎pom.xml‎
Lines changed: 3 additions & 3 deletions b/‎pom.xml‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎spring-ai-alibaba-audio-example/dashscope-audio/README.md‎
Lines changed: 0 additions & 2 deletions b/‎spring-ai-alibaba-audio-example/dashscope-audio/README.md‎
Lines changed: 0 additions & 2 deletions
diff --git a/‎spring-ai-alibaba-audio-example/dashscope-audio/src/main/java/com/alibaba/cloud/ai/example/audio/AudioSpeechController.java‎
Lines changed: 38 additions & 40 deletions b/‎spring-ai-alibaba-audio-example/dashscope-audio/src/main/java/com/alibaba/cloud/ai/example/audio/AudioSpeechController.java‎
Lines changed: 38 additions & 40 deletions
diff --git a/‎spring-ai-alibaba-audio-example/dashscope-audio/src/main/java/com/alibaba/cloud/ai/example/audio/AudioTranscriptionController.java‎
Lines changed: 31 additions & 26 deletions b/‎spring-ai-alibaba-audio-example/dashscope-audio/src/main/java/com/alibaba/cloud/ai/example/audio/AudioTranscriptionController.java‎
Lines changed: 31 additions & 26 deletions
diff --git a/‎spring-ai-alibaba-chat-example/ark-chat/README.md‎
Lines changed: 0 additions & 35 deletions b/‎spring-ai-alibaba-chat-example/ark-chat/README.md‎
Lines changed: 0 additions & 35 deletions
diff --git a/‎spring-ai-alibaba-chat-example/ark-chat/application.yml‎
Lines changed: 0 additions & 32 deletions b/‎spring-ai-alibaba-chat-example/ark-chat/application.yml‎
Lines changed: 0 additions & 32 deletions
diff --git a/‎spring-ai-alibaba-chat-example/dashscope-chat/pom.xml‎
Lines changed: 0 additions & 4 deletions b/‎spring-ai-alibaba-chat-example/dashscope-chat/pom.xml‎
Lines changed: 0 additions & 4 deletions
diff --git a/‎spring-ai-alibaba-chat-example/moonshot-chat/README.md‎
Lines changed: 0 additions & 5 deletions b/‎spring-ai-alibaba-chat-example/moonshot-chat/README.md‎
Lines changed: 0 additions & 5 deletions
@@ -47,8 +47,8 @@
 
 		<!-- Spring AI Alibaba -->
 		<!-- Install Spring AI Alibaba in your local. -->
-		<spring-ai-alibaba.version>1.1.0.0-M5</spring-ai-alibaba.version>
-		<spring-ai-alibaba.extensions.version>1.1.0.0-M5</spring-ai-alibaba.extensions.version>
+		<spring-ai-alibaba.version>1.1.0.0-RC1</spring-ai-alibaba.version>
+		<spring-ai-alibaba-extensions.version>1.1.0.0-RC1</spring-ai-alibaba-extensions.version>
 
 		<!-- maven plugin -->
 		<maven-deploy-plugin.version>3.1.1</maven-deploy-plugin.version>
@@ -109,7 +109,7 @@
             <dependency>
                 <groupId>com.alibaba.cloud.ai</groupId>
                 <artifactId>spring-ai-alibaba-extensions-bom</artifactId>
-                <version>${spring-ai-alibaba.extensions.version}</version>
+                <version>${spring-ai-alibaba-extensions.version}</version>
                 <type>pom</type>
                 <scope>import</scope>
             </dependency>
 
@@ -1,5 +1,3 @@
 # Spring AI Alibaba Audio Example
 
 演示使用阿里通义大模型进行音频处理。包含语音转录和语音合成。
-
-> Tips: 此模块最新示例基于 spring ai alibaba 1.0.0.3，中央仓库未发布，请本地编译安装。
@@ -16,104 +16,102 @@
 
 package com.alibaba.cloud.ai.example.audio;
 
-import com.alibaba.cloud.ai.dashscope.api.DashScopeAudioSpeechApi;
-import com.alibaba.cloud.ai.dashscope.audio.DashScopeAudioSpeechOptions;
-import com.alibaba.cloud.ai.dashscope.audio.synthesis.SpeechSynthesisModel;
-import com.alibaba.cloud.ai.dashscope.audio.synthesis.SpeechSynthesisPrompt;
-import com.alibaba.cloud.ai.dashscope.audio.synthesis.SpeechSynthesisResponse;
+import java.io.File;
+import java.io.FileOutputStream;
+import java.io.IOException;
+import java.util.concurrent.CountDownLatch;
+
 import jakarta.annotation.PreDestroy;
 
+import com.alibaba.cloud.ai.dashscope.audio.DashScopeAudioSpeechModel;
+import com.alibaba.cloud.ai.dashscope.audio.DashScopeAudioSpeechOptions;
 import com.alibaba.cloud.ai.dashscope.spec.DashScopeModel;
 import org.apache.commons.io.FileUtils;
+import org.springframework.ai.audio.tts.TextToSpeechModel;
+import org.springframework.ai.audio.tts.TextToSpeechPrompt;
+import org.springframework.ai.audio.tts.TextToSpeechResponse;
+import org.springframework.beans.factory.annotation.Qualifier;
 import org.springframework.boot.ApplicationArguments;
 import org.springframework.boot.ApplicationRunner;
 import org.springframework.web.bind.annotation.GetMapping;
 import org.springframework.web.bind.annotation.RequestMapping;
 import org.springframework.web.bind.annotation.RestController;
 import reactor.core.publisher.Flux;
 
-import java.io.File;
-import java.io.FileOutputStream;
-import java.io.IOException;
-import java.nio.ByteBuffer;
-import java.util.concurrent.CountDownLatch;
-
 /**
  * 文本转语音（语音合成）
+ * <a href="https://help.aliyun.com/zh/model-studio/text-to-speech">语音合成</a>
+ *
  * @author yuluo
  * @author <a href="mailto:yuluo08290126@gmail.com">yuluo</a>
+ * @see DashScopeAudioSpeechModel
  */
 
 @RestController
 @RequestMapping("/ai/speech")
 public class AudioSpeechController implements ApplicationRunner {
 
-	private final SpeechSynthesisModel speechSynthesisModel;
+	private final TextToSpeechModel speechSynthesisModel;
 
 	private static final String TEXT = "白日依山尽，黄河入海流。这是测试";
 
 	private static final String FILE_PATH = "spring-ai-alibaba-audio-example/dashscope-audio/src/main/resources/gen/tts";
 
-	public AudioSpeechController(SpeechSynthesisModel speechSynthesisModel) {
+	public AudioSpeechController(
+		@Qualifier("dashScopeSpeechSynthesisModel") TextToSpeechModel speechSynthesisModel) {
 
 		this.speechSynthesisModel = speechSynthesisModel;
 	}
 
-	@GetMapping
+	@GetMapping("/call")
 	public void tts() throws IOException {
 
-		SpeechSynthesisResponse response = speechSynthesisModel.call(
-				new SpeechSynthesisPrompt(
-						TEXT,
-						DashScopeAudioSpeechOptions.builder()
-								.model(DashScopeModel.AudioModel.SAMBERT_ZHICHU_V1.getValue())
-								.build()
-						)
+		TextToSpeechResponse response = speechSynthesisModel.call(
+			new TextToSpeechPrompt(
+				TEXT,
+				DashScopeAudioSpeechOptions.builder()
+					.model(DashScopeModel.AudioModel.COSYVOICE_V1.getValue())
+					.build()
+			)
 		);
 
 		File file = new File(FILE_PATH + "/output.mp3");
 		try (FileOutputStream fos = new FileOutputStream(file)) {
-			ByteBuffer byteBuffer = response.getResult().getOutput().getAudio();
-			fos.write(byteBuffer.array());
-		}
-		catch (IOException e) {
+			fos.write(response.getResult().getOutput());
+		} catch (IOException e) {
 			throw new IOException(e.getMessage());
 		}
 	}
 
 	@GetMapping("/stream")
 	public void streamTTS() {
 
-		Flux<SpeechSynthesisResponse> response = speechSynthesisModel.stream(
-				new SpeechSynthesisPrompt(
-						TEXT,
-						DashScopeAudioSpeechOptions.builder()
-								.model(DashScopeModel.AudioModel.SAMBERT_ZHITING_V1.getValue())
-								.build()
-				)
+		Flux<TextToSpeechResponse> response = speechSynthesisModel.stream(
+			new TextToSpeechPrompt(
+				TEXT,
+				DashScopeAudioSpeechOptions.builder()
+					.model(DashScopeModel.AudioModel.SAMBERT_ZHITING_V1.getValue())
+					.build()
+			)
 		);
 
 		CountDownLatch latch = new CountDownLatch(1);
 		File file = new File(FILE_PATH + "/output-stream.mp3");
 		try (FileOutputStream fos = new FileOutputStream(file)) {
 
 			response.doFinally(
-					signal -> latch.countDown()
+				signal -> latch.countDown()
 			).subscribe(synthesisResponse -> {
-				ByteBuffer byteBuffer = synthesisResponse.getResult().getOutput().getAudio();
-				byte[] bytes = new byte[byteBuffer.remaining()];
-				byteBuffer.get(bytes);
+				byte[] bytes = synthesisResponse.getResult().getOutput();
 				try {
 					fos.write(bytes);
-				}
-				catch (IOException e) {
+				} catch (IOException e) {
 					throw new RuntimeException(e);
 				}
 			});
 
 			latch.await();
-		}
-		catch (IOException | InterruptedException e) {
+		} catch (IOException | InterruptedException e) {
 			throw new RuntimeException(e);
 		}
 	}
 
@@ -16,6 +16,12 @@
 
 package com.alibaba.cloud.ai.example.audio;
 
+import java.util.concurrent.Executors;
+import java.util.concurrent.ScheduledExecutorService;
+import java.util.stream.Collectors;
+
+import com.alibaba.cloud.ai.dashscope.api.DashScopeAudioTranscriptionApi;
+import com.alibaba.cloud.ai.dashscope.audio.DashScopeAudioTranscriptionModel;
 import com.alibaba.cloud.ai.dashscope.audio.DashScopeAudioTranscriptionOptions;
 import com.alibaba.cloud.ai.dashscope.audio.transcription.AudioTranscriptionModel;
 import com.alibaba.cloud.ai.dashscope.spec.DashScopeModel;
@@ -32,14 +38,13 @@
 import org.springframework.web.bind.annotation.RestController;
 import reactor.core.publisher.Flux;
 
-import java.util.concurrent.Executors;
-import java.util.concurrent.ScheduledExecutorService;
-import java.util.stream.Collectors;
-
 /**
  * 语音转文本（语音识别）
+ * <a href="https://help.aliyun.com/zh/model-studio/real-time-speech-recognition">语音识别</a>
+ *
  * @author yuluo
  * @author <a href="mailto:yuluo08290126@gmail.com">yuluo</a>
+ * @see DashScopeAudioTranscriptionModel
  */
 
 @RestController
@@ -50,8 +55,8 @@ public class AudioTranscriptionController {
 
 	private static final Logger log = LoggerFactory.getLogger(AudioTranscriptionController.class);
 
-	// 模型列表：https://help.aliyun.com/zh/model-studio/sambert-websocket-api
-	private static final String DEFAULT_MODEL = DashScopeModel.AudioModel.PARAFORMER_V2.getValue();
+	public static final String AUDIO_FILE_URL =
+		"https://dashscope.oss-cn-beijing.aliyuncs.com/samples/audio/paraformer/hello_world_female2.wav";
 
 	private final ScheduledExecutorService scheduler = Executors.newScheduledThreadPool(1);
 
@@ -68,16 +73,15 @@ public String callSTT() {
 
 		// 录音文件支持HTTP / HTTPS协议
 		// 若录音文件存储在阿里云OSS，使用RESTful API方式支持使用以 oss://为前缀的临时 URL
-		Resource resource = new DefaultResourceLoader()
-			.getResource("https://dashscope.oss-cn-beijing.aliyuncs.com/samples/audio/paraformer/hello_world_female2.wav");
+		Resource resource = new DefaultResourceLoader().getResource(AUDIO_FILE_URL);
 
 		AudioTranscriptionResponse response = transcriptionModel.call(
-				new AudioTranscriptionPrompt(
-						resource,
-						DashScopeAudioTranscriptionOptions.builder()
-								.withModel(DEFAULT_MODEL)
-								.build()
-				)
+			new AudioTranscriptionPrompt(
+				resource,
+				DashScopeAudioTranscriptionOptions.builder()
+					.model(DashScopeModel.AudioModel.PARAFORMER_V2.getValue())
+					.build()
+			)
 		);
 
 		return response.getResult().getOutput();
@@ -89,19 +93,20 @@ public String callSTT() {
 	@GetMapping("/stream")
 	public String streamSTT() {
 
-		ClassPathResource audioResource = new ClassPathResource("hello_world_male_16k_16bit_mono.wav");
+		Resource resource = new DefaultResourceLoader().getResource(AUDIO_FILE_URL);
+
 		Flux<AudioTranscriptionResponse> response = transcriptionModel
-				.stream(
-						new AudioTranscriptionPrompt(
-								audioResource,
-								DashScopeAudioTranscriptionOptions.builder()
-										.withModel("paraformer-realtime-v2")
-										.withSampleRate(16000)
-										.withFormat(DashScopeAudioTranscriptionOptions.AudioFormat.WAV)
-										.withDisfluencyRemovalEnabled(false)
-										.build()
-						)
-				);
+			.stream(
+				new AudioTranscriptionPrompt(
+					resource,
+					DashScopeAudioTranscriptionOptions.builder()
+						.model(DashScopeModel.AudioModel.GUMMY_REALTIME_V1.getValue())
+						.sampleRate(16000)
+						.format(DashScopeAudioTranscriptionApi.AudioFormat.WAV)
+						.disfluencyRemovalEnabled(false)
+						.build()
+				)
+			);
 
 		return response.map(AudioTranscriptionResponse::getResult)
 			.map(AudioTranscription::getOutput)
 
@@ -32,10 +32,6 @@
 	<description>Spring AI Alibaba Dashscope Chat Example</description>
 	<name>Spring AI Alibaba Dashscope Chat Examples</name>
 
-	<properties>
-		<spring-ai-alibaba.version>1.0.0.3</spring-ai-alibaba.version>
-	</properties>
-
 	<dependencies>
 		<dependency>
 			<groupId>org.springframework.boot</groupId>