test(Text to Speech): Add integration tests for synthesizeUsingWebSocket

lpatino10 · lpatino10 · commit 9214b685a036 · 2018-12-07T14:54:17.000-05:00
diff --git a/text-to-speech/src/test/java/com/ibm/watson/developer_cloud/text_to_speech/v1/TextToSpeechIT.java b/text-to-speech/src/test/java/com/ibm/watson/developer_cloud/text_to_speech/v1/TextToSpeechIT.java
@@ -16,11 +16,16 @@
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.DeleteUserDataOptions;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.GetPronunciationOptions;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.GetVoiceOptions;
+import com.ibm.watson.developer_cloud.text_to_speech.v1.model.MarkTiming;
+import com.ibm.watson.developer_cloud.text_to_speech.v1.model.Marks;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.Pronunciation;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.SynthesizeOptions;
+import com.ibm.watson.developer_cloud.text_to_speech.v1.model.Timings;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.Voice;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.model.Voices;
+import com.ibm.watson.developer_cloud.text_to_speech.v1.model.WordTiming;
 import com.ibm.watson.developer_cloud.text_to_speech.v1.util.WaveUtils;
+import com.ibm.watson.developer_cloud.text_to_speech.v1.websocket.BaseSynthesizeCallback;
 import com.ibm.watson.developer_cloud.util.RetryRunner;
 import org.junit.Assume;
 import org.junit.Before;
@@ -29,10 +34,20 @@
 
 import javax.sound.sampled.AudioSystem;
 import javax.sound.sampled.UnsupportedAudioFileException;
+import java.io.ByteArrayOutputStream;
 import java.io.File;
+import java.io.FileNotFoundException;
+import java.io.FileOutputStream;
 import java.io.IOException;
 import java.io.InputStream;
+import java.io.OutputStream;
+import java.util.ArrayList;
+import java.util.Collections;
+import java.util.List;
+import java.util.concurrent.CountDownLatch;
+import java.util.concurrent.TimeUnit;
 
+import static org.junit.Assert.assertEquals;
 import static org.junit.Assert.assertNotNull;
 import static org.junit.Assert.assertTrue;
 import static org.junit.Assert.fail;
@@ -43,8 +58,13 @@
 @RunWith(RetryRunner.class)
 public class TextToSpeechIT extends WatsonServiceTest {
 
+  private CountDownLatch lock = new CountDownLatch(1);
   private TextToSpeech service;
   private String voiceName;
+  private ByteArrayOutputStream byteArrayOutputStream;
+  private String returnedContentType;
+  private List<Timings> returnedTimings;
+  private List<Marks> returnedMarks;
 
   /*
    * (non-Javadoc)
@@ -63,6 +83,10 @@ public void setUp() throws Exception {
     service.setEndPoint(getProperty("text_to_speech.url"));
     service.setDefaultHeaders(getDefaultHeaders());
     voiceName = getProperty("text_to_speech.voice_name");
+
+    byteArrayOutputStream = new ByteArrayOutputStream();
+    returnedTimings = new ArrayList<>();
+    returnedMarks = new ArrayList<>();
   }
 
   /**
@@ -191,4 +215,99 @@ public void testDeleteUserData() {
       fail(ex.getMessage());
     }
   }
+
+  @Test
+  public void testSynthesizeUsingWebSocket() throws InterruptedException, IOException {
+    String basicText = "One taught me love. One taught me patience, and one taught me pain. Now, I'm so amazing. Say " +
+        "I've loved and I've lost, but that's not what I see. So, look what I got. Look what you taught me. And for " +
+        "that, I say... thank u, next.";
+
+    SynthesizeOptions synthesizeOptions = new SynthesizeOptions.Builder()
+        .text(basicText)
+        .voice(SynthesizeOptions.Voice.EN_US_ALLISONVOICE)
+        .accept(SynthesizeOptions.Accept.AUDIO_OGG_CODECS_OPUS)
+        .timings(Collections.singletonList("words"))
+        .build();
+
+    service.synthesizeUsingWebSocket(synthesizeOptions, new BaseSynthesizeCallback() {
+      @Override
+      public void onContentType(String contentType) {
+        returnedContentType = contentType;
+      }
+
+      @Override
+      public void onAudioStream(byte[] bytes) {
+        // build byte array of synthesized text
+        try {
+          byteArrayOutputStream.write(bytes);
+        } catch (IOException e) {
+          e.printStackTrace();
+        }
+      }
+
+      @Override
+      public void onTimings(Timings timings) {
+        returnedTimings.add(timings);
+      }
+    });
+
+    // wait for synthesis to complete
+    lock.await(5, TimeUnit.SECONDS);
+
+    String filename = "synthesize_websocket_test.ogg";
+    OutputStream fileOutputStream = new FileOutputStream(filename);
+    byteArrayOutputStream.writeTo(fileOutputStream);
+    File createdFile = new File(filename);
+
+    assertTrue(createdFile.exists());
+    assertEquals(SynthesizeOptions.Accept.AUDIO_OGG_CODECS_OPUS, returnedContentType);
+    for (Timings t : returnedTimings) {
+      List<WordTiming> wordTimings = t.getWords();
+      for (WordTiming wordTiming : wordTimings) {
+        assertTrue(basicText.contains(wordTiming.getWord()));
+      }
+    }
+
+    // clean up
+    byteArrayOutputStream.close();
+    fileOutputStream.close();
+    if (createdFile.delete()) {
+      System.out.println("File deleted successfully!");
+    } else {
+      System.out.println("File could not be deleted");
+    }
+  }
+
+  @Test
+  public void testSynthesizeUsingWebSocketWithSsml() throws InterruptedException {
+    List<String> ssmlMarks = new ArrayList<>();
+    ssmlMarks.add("sean");
+    ssmlMarks.add("ricky");
+    String ssmlText = String.format("Thought I'd end up with <mark name=\"%s\" />Sean, <express-as type=\"Apology\"> " +
+        "but he wasn't a match. </express-as> Wrote some songs about <mark name=\"%s\" />Ricky, now I listen and " +
+        "laugh", ssmlMarks.get(0), ssmlMarks.get(1));
+
+    SynthesizeOptions synthesizeOptions = new SynthesizeOptions.Builder()
+        .text(ssmlText)
+        .voice(SynthesizeOptions.Voice.EN_US_ALLISONVOICE)
+        .accept(SynthesizeOptions.Accept.AUDIO_OGG_CODECS_OPUS)
+        .build();
+
+    service.synthesizeUsingWebSocket(synthesizeOptions, new BaseSynthesizeCallback() {
+      @Override
+      public void onMarks(Marks marks) {
+        returnedMarks.add(marks);
+      }
+    });
+
+    // wait for synthesis to complete
+    lock.await(5, TimeUnit.SECONDS);
+
+    for (Marks m : returnedMarks) {
+      List<MarkTiming> markList = m.getMarks();
+      for (MarkTiming markTiming : markList) {
+        assertTrue(ssmlMarks.contains(markTiming.getMark()));
+      }
+    }
+  }
 }