Add pronunciation assessment REST API sample code on Java (#180)

yinhew · web-flow · commit 22df3192c4c9 · 2020-06-12T15:40:24.000+08:00
* Add pronunciation assessment REST API sample code on Java

* Add a comment

* Put a new line at the end of the file

* Make tab alignment
diff --git a/PronunciationAssessment/Java/jre/.classpath b/PronunciationAssessment/Java/jre/.classpath
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<classpath>
+	<classpathentry kind="src" path="src"/>
+	<classpathentry kind="con" path="org.eclipse.jdt.launching.JRE_CONTAINER"/>
+	<classpathentry kind="output" path="bin"/>
+</classpath>
diff --git a/PronunciationAssessment/Java/jre/.project b/PronunciationAssessment/Java/jre/.project
@@ -0,0 +1,17 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<projectDescription>
+	<name>PronunciationAssessment</name>
+	<comment></comment>
+	<projects>
+	</projects>
+	<buildSpec>
+		<buildCommand>
+			<name>org.eclipse.jdt.core.javabuilder</name>
+			<arguments>
+			</arguments>
+		</buildCommand>
+	</buildSpec>
+	<natures>
+		<nature>org.eclipse.jdt.core.javanature</nature>
+	</natures>
+</projectDescription>
diff --git a/PronunciationAssessment/Java/jre/README.md b/PronunciationAssessment/Java/jre/README.md
@@ -0,0 +1,23 @@
+# Pronunciation Assessment - Java Run-Time Environment (JRE) Samples
+
+This sample shows how to call the pronunciation assessment REST API in Java, with chunked (streaming) data uploading.
+
+## Prerequisites
+
+* An Azure subscription with Speech Services enabled. [Get one for free!](https://docs.microsoft.com/azure/cognitive-services/speech-service/get-started)
+* 64-bit JRE/JDK for Java 8.
+* Version 4.15 of [Eclipse](https://www.eclipse.org), 64-bit.
+
+## Code sample
+
+To use this sample, follow these instructions:
+
+* Clone this repository.
+* Open this project in Eclipse.
+* Locate `"{SubscriptionKey}"` and replace it with your Speech Services subscription key.
+* Locate `"{Region}"` and replace it with the region corresponding to your subscription key.
+* Run the project and check the result on the console.
+
+## Resources
+
+* [REST API reference](https://docs.microsoft.com/en-us/azure/cognitive-services/speech-service/rest-speech-to-text)
diff --git a/PronunciationAssessment/Java/jre/src/com/microsoft/cognitiveservices/pronunciationassessment/Sample.java b/PronunciationAssessment/Java/jre/src/com/microsoft/cognitiveservices/pronunciationassessment/Sample.java
@@ -0,0 +1,105 @@
+﻿//
+// Copyright (c) Microsoft. All rights reserved.
+// Licensed under the MIT license.
+//
+// Microsoft Cognitive Services (formerly Project Oxford): https://www.microsoft.com/cognitive-services
+//
+// Microsoft Cognitive Services (formerly Project Oxford) GitHub:
+// https://github.com/Microsoft/Cognitive-Speech-TTS
+//
+// Copyright (c) Microsoft Corporation
+// All rights reserved.
+//
+// MIT License:
+// Permission is hereby granted, free of charge, to any person obtaining
+// a copy of this software and associated documentation files (the
+// "Software"), to deal in the Software without restriction, including
+// without limitation the rights to use, copy, modify, merge, publish,
+// distribute, sublicense, and/or sell copies of the Software, and to
+// permit persons to whom the Software is furnished to do so, subject to
+// the following conditions:
+//
+// The above copyright notice and this permission notice shall be
+// included in all copies or substantial portions of the Software.
+//
+// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+// EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
+// MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+// NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
+// LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
+// OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
+// WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+//
+
+package com.microsoft.cognitiveservices.pronunciationassessment;
+
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.InputStream;
+import java.io.OutputStream;
+import java.net.URL;
+import java.util.Base64;
+
+import javax.net.ssl.HttpsURLConnection;
+
+public class Sample {
+	/**
+	 * Streams a raw PCM file to the Speech REST API in chunks, then prints the pronunciation assessment JSON and the response latency.
+	 * @param args unused
+	 * @throws Exception if the audio file cannot be read, the HTTPS request fails, or the pacing sleep is interrupted
+	 */
+	public static void main(String[] args) throws Exception {
+		String subscriptionKey = "{SubscriptionKey}"; // replace this with your subscription key
+		String region = "{Region}"; // replace this with the region corresponding to your subscription key, e.g. westus, eastasia
+
+		// a common wave header, with zero audio length
+		// the streamed data has no header, but the API needs one to learn the audio format, so post this header as the first chunk of each query
+		final byte[] WaveHeader16K16BitMono = new byte[] { 82, 73, 70, 70, 78, (byte)128, 0, 0, 87, 65, 86, 69, 102, 109, 116, 32, 18, 0, 0, 0, 1, 0, 1, 0, (byte)128, 62, 0, 0, 0, 125, 0, 0, 2, 0, 16, 0, 0, 0, 100, 97, 116, 97, 0, 0, 0, 0 };
+
+		// build pronunciation assessment parameters; the JSON is base64-encoded and sent in a request header
+		String referenceText = "Good morning.";
+		String escapedReferenceText = referenceText.replace("\\", "\\\\").replace("\"", "\\\""); // keeps the JSON valid if the text contains quotes or backslashes
+		String pronAssessmentParamsJson = "{\"ReferenceText\":\"" + escapedReferenceText + "\",\"GradingSystem\":\"HundredMark\",\"Dimension\":\"Comprehensive\"}";
+		String pronAssessmentParams = Base64.getEncoder().encodeToString(pronAssessmentParamsJson.getBytes("utf-8"));
+
+		// build request
+		URL url = new URL("https://" + region + ".stt.speech.microsoft.com/speech/recognition/conversation/cognitiveservices/v1?language=en-us");
+		HttpsURLConnection connection = (HttpsURLConnection) url.openConnection();
+		connection.setRequestMethod("POST");
+		connection.setDoOutput(true);
+		connection.setChunkedStreamingMode(0); // a value of 0 or less selects the default chunk length
+		connection.setRequestProperty("Accept", "application/json;text/xml");
+		connection.setRequestProperty("Content-Type", "audio/wav; codecs=audio/pcm; samplerate=16000");
+		connection.setRequestProperty("Ocp-Apim-Subscription-Key", subscriptionKey);
+		connection.setRequestProperty("Pronunciation-Assessment", pronAssessmentParams);
+
+		// send request with chunked data; try-with-resources closes both streams even if the upload fails part-way
+		File file = new File("../../goodmorning.pcm");
+		byte[] audioChunk = new byte[1024];
+		try (FileInputStream fileStream = new FileInputStream(file); OutputStream outputStream = connection.getOutputStream()) {
+			outputStream.write(WaveHeader16K16BitMono);
+			int chunkSize;
+			while ((chunkSize = fileStream.read(audioChunk)) > 0) {
+				Thread.sleep(chunkSize / 32); // to simulate human speaking rate: 16 kHz 16-bit mono is 32 bytes per millisecond
+				outputStream.write(audioChunk, 0, chunkSize);
+			}
+			outputStream.flush();
+		}
+		long uploadFinishTime = System.currentTimeMillis();
+
+		// receive response: read to end of stream, because the content length is -1 when unknown and one read() call may return only part of the body
+		java.io.ByteArrayOutputStream responseBytes = new java.io.ByteArrayOutputStream();
+		try (InputStream inputStream = connection.getInputStream()) {
+			byte[] responseChunk = new byte[1024];
+			for (int count = inputStream.read(responseChunk); count != -1; count = inputStream.read(responseChunk)) {
+				responseBytes.write(responseChunk, 0, count);
+			}
+		}
+		long getResponseTime = System.currentTimeMillis(); // taken before printing so console output is not counted as latency
+		String result = responseBytes.toString("utf-8"); // the result is a JSON, you can parse it with a JSON library
+
+		System.out.println("Pronunciation assessment result:\n");
+		System.out.println(result);
+		System.out.println("\nLatency: " + (getResponseTime - uploadFinishTime) + "ms");
+	}
+}