renaming playFile to file for recognizeBlob and correcting documented default

nfriedly · nfriedly · commit 7a31b82c1220 · 2016-02-08T14:03:49.000-05:00
also setting timing stream and format stream as defaults when appropriate
diff --git a/README.md b/README.md
@@ -1,6 +1,8 @@
 IBM Watson Speech To Text Browser Client Library
 ================================================
 
+[![Build Status](https://travis-ci.org/watson-developer-cloud/speech-javascript-sdk.svg?branch=master)](https://travis-ci.org/watson-developer-cloud/speech-javascript-sdk)
+
 Allows you to easily add voice recognition to any web app with minimal code. 
 
 **Warning** This library is still early-stage and may see significant breaking changes.
@@ -102,6 +104,14 @@ For use with `.recognizeBlob({playFile: true})` - slows the results down to matc
 Inherits `.stop()` method and `result` event from the `RecognizeStream`.
 
 
+## Changelog
+
+### v0.7
+* Changed playFile option of recognizeBlob to play to match docs
+* Added options.format to recognize* to pipe text through a FormatStream (default: true)
+* Added close and end events to TimingStream
+
+
 ## todo
 
 * Fix bugs around `.stop()
@@ -116,5 +126,4 @@ Inherits `.stop()` method and `result` event from the `RecognizeStream`.
 * more tests in general
 * update node-sdk to use current version of this lib's RecognizeStream (and also provide the FormatStream + anything else that might be handy)
 * improve docs
-* check for a bug with the timing stream cutting off early
-
+* automatically npm publish on passing tagged build
diff --git a/examples/public/audio-element-programmatic.html b/examples/public/audio-element-programmatic.html
@@ -35,8 +35,7 @@ <h2>Code for this demo:</h2>
                 token: token,
                 element: audioElement
                 // muteSource: true // prevents sound from also playing locally
-            })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
+            });
 
             // each result gets it's own <span> because watson will sometimes go back and change a word as it hears more context
             var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
diff --git a/examples/public/audio-element.html b/examples/public/audio-element.html
@@ -34,8 +34,7 @@ <h2>Code for this demo:</h2>
                 token: token,
                 element: $('#audio-element')[0]
                 // muteSource: true // prevents sound from also playing locally
-            })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
+            });
 
             // each result gets it's own <span> because watson will sometimes go back and change a word as it hears more context
             var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
diff --git a/examples/public/blob-realtime-vs-no-realtime.html b/examples/public/blob-realtime-vs-no-realtime.html
@@ -0,0 +1,87 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <title>Realtime vs. Non-Realtime File Example - Watson Speech to Text</title>
+</head>
+<body>
+
+<section>
+    <h2>Transcribe File, Comparing <code>{realtime: true}</code> to <code>{realtime: false}</code></h2>
+    <input type="file" id="audiofile"> <button id="button">Transcribe and Play</button> <button id="stop">Stop</button>
+    <p><small><i>Supported types are wav, ogg/opus (not ogg/vorbis), and flac. However, most browsers do not support flac.</i></small></p>
+
+    <h2><code>realtime: false</code> Output:</h2>
+    <div id="output">--</div>
+
+    <h2><code>realtime: true</code> Output:</h2>
+    <p><small><i>When transcription results are available faster than real-time (such as when simultaneously uploading and playing a file on a high-bandwidth connection), the TimingStream slows the results down to real-time.</i></small></p>
+    <div id="realtime-output">--</div>
+</section>
+
+<script src="watson-speech.js"></script>
+<script src="http://code.jquery.com/jquery-2.2.0.min.js"></script>
+
+<h2>Code for this demo:</h2>
+<pre><code><script style="display: block;">
+function renderStream(stream, $output) {
+    $output.html('');
+
+    // each result (sentence) gets its own <span> because Watson will sometimes go back and change a word as it hears more context
+    var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
+
+    // a result is approximately equivalent to a sentence
+    stream.on('result', function(result) {
+        // update the text for the current sentence with the default alternative.
+        // there may be multiple alternatives but this example app ignores all but the first.
+        $curSentence.html(result.alternatives[0].transcript);
+        if (result.final) {
+            // if we have the final text for that sentence, start a new one
+            $curSentence = $('<span/>').appendTo($output);
+        }
+    });
+
+    stream.on('error', function(err) {
+        console.log(err);
+    });
+
+    stream.on('playback-error', function(err) {
+        console.log(err);
+    });
+}
+
+
+$(function() {
+
+    var stream;
+
+    $('#button').click(function () {
+        $.get('/token').then(function (token) {
+
+            stream = WatsonSpeech.SpeechToText.recognizeBlob({
+                token: token,
+                data: $('#audiofile')[0].files[0],
+                play: true,
+                max_alternatives: 1, // default is 3, but only the first one includes word timing data
+                realtime: false // defaults to true, but we're going to turn it off and then manually do it in a moment to show the difference
+            });
+
+            renderStream(stream, $('#output'));
+
+            // now do what the realtime option would have done: pipe through a TimingStream
+            var realtimeStream = stream.pipe(new WatsonSpeech.SpeechToText.TimingStream());
+
+            renderStream(realtimeStream, $('#realtime-output'));
+
+        });
+    });
+
+    $('#stop').click(function() {
+        if (stream) {
+            stream.stop();
+        }
+    });
+});
+</script></code></pre>
+</body>
+</html>
diff --git a/examples/public/file-promise.html b/examples/public/file-promise.html
@@ -36,7 +36,6 @@ <h2>Code for this demo:</h2>
                 timestamps: false,
                 max_alternatives: 1
             })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream()) // optional
             .promise()
             .then(function(text) {
                 $output.text(text);
diff --git a/examples/public/file-streaming.html b/examples/public/file-streaming.html
@@ -13,65 +13,50 @@ <h2>Transcribe File, Streaming</h2>
 
     <h2>Output:</h2>
     <div id="output">--</div>
-
-    <h2>TimingStream Output:</h2>
-    <p><small><i>When transcription results are available faster than real-time (such as when simultaneously uploading and playing a file on a high-bandwidth connection), the TimingStream slows them down results to real-time.</i></small></p>
-    <div id="realtime-output">--</div>
 </section>
 
 <script src="watson-speech.js"></script>
 <script src="http://code.jquery.com/jquery-2.2.0.min.js"></script>
 
 <h2>Code for this demo:</h2>
 <pre><code><script style="display: block;">
-function renderStream(stream, $output) {
-    $output.html('');
-
-    // each result (sentence) gets it's own <span> because watson will sometimes go back and change a word as it hears more context
-    var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
-
-    // a result is approximately equivalent to a sentence
-    stream.on('result', function(result) {
-        // update the text for the current sentence with the default alternative.
-        // there may be multiple alternatives but this example app ignores all but the first.
-        $curSentence.html(result.alternatives[0].transcript);
-        if (result.final) {
-            // if we have the final text for that sentence, start a new one
-            $curSentence = $('<span/>').appendTo($output);
-        }
-    });
-
-    stream.on('error', function(err) {
-        console.log(err);
-    });
-
-    stream.on('playback-error', function(err) {
-        console.log(err);
-    });
-}
-
-
 $(function() {
 
-    var stream;
+    var stream, $output = $('#output');
 
     $('#button').click(function () {
+        $output.html('');
+
         $.get('/token').then(function (token) {
 
             stream = WatsonSpeech.SpeechToText.recognizeBlob({
                 token: token,
                 data: $('#audiofile')[0].files[0],
-                playFile: true,
-                max_alternatives: 1 // default is 3, but only the first one includes word timing data
-            })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream());// optional
-
-            renderStream(stream, $('#output'));
-
-            // optional, slows down results to real-time (only useful for recognizeBlob() with playFile: true)
-            var realtimeStream = stream.pipe(new WatsonSpeech.SpeechToText.TimingStream());
-
-            renderStream(realtimeStream, $('#realtime-output'));
+                play: true // play the audio out loud
+            });
+
+            // each result (sentence) gets its own <span> because Watson will sometimes go back and change a word as it hears more context
+            var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
+
+            // a result is approximately equivalent to a sentence
+            stream.on('result', function(result) {
+                // update the text for the current sentence with the default alternative.
+                // there may be multiple alternatives but this example app ignores all but the first.
+                $curSentence.html(result.alternatives[0].transcript);
+                if (result.final) {
+                    // if we have the final text for that sentence, start a new one
+                    $curSentence = $('<span/>').appendTo($output);
+                }
+            });
+
+            stream.on('error', function(err) {
+                console.log(err);
+            });
+
+            // handle file playback errors
+            stream.on('playback-error', function(err) {
+                console.log(err);
+            });
 
         });
     });
@@ -85,3 +70,5 @@ <h2>Code for this demo:</h2>
 </script></code></pre>
 </body>
 </html>
+
+
diff --git a/examples/public/index.html b/examples/public/index.html
@@ -9,6 +9,7 @@
     <li><a href="microphone-streaming.html">Transcribe from Microphone, Streaming</a></li>
     <li><a href="microphone-streaming-auto-stop.html">Transcribe from Microphone, Streaming, automatically stop at first pause</a></li>
     <li><a href="file-streaming.html">Transcribe from file, Streaming</a></li>
+    <li><a href="blob-realtime-vs-no-realtime.html">Transcribe from file, Comparing <code>{realtime: true}</code> to <code>{realtime: false}</code></a></li>
     <li><a href="file-promise.html">Transcribe from file, Promise</a></li>
     <li><a href="audio-element.html">Transcribe from HTML5 &lt;audio&gt; element, Streaming</a></li>
     <li><a href="audio-element-programmatic.html">Transcribe from <code>new Audio()</code>, Streaming</a></li>
diff --git a/examples/public/microphone-streaming-auto-stop.html b/examples/public/microphone-streaming-auto-stop.html
@@ -30,8 +30,7 @@ <h2>Code for this demo:</h2>
             var stream = WatsonSpeech.SpeechToText.recognizeMicrophone({
                 token: token,
                 continuous: false // false = automatically stop transcription the first time a pause is detected
-            })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
+            });
 
             // each result (sentence) gets it's own <span> because Watson will sometimes go back and change a word as it hears more context
             var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
diff --git a/examples/public/microphone-streaming.html b/examples/public/microphone-streaming.html
@@ -30,8 +30,7 @@ <h2>Code for this demo:</h2>
         $.get('/token').then(function (token) {
             var stream = WatsonSpeech.SpeechToText.recognizeMicrophone({
                 token: token
-            })
-            .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
+            });
 
             // each result (sentence) gets it's own <span> because Watson will sometimes go back and change a word as it hears more context
             var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
diff --git a/speech-to-text/recognize-blob.js b/speech-to-text/recognize-blob.js
@@ -18,7 +18,8 @@
 var BlobStream = require('readable-blob-stream');
 var RecognizeStream = require('./recognize-stream.js');
 var FilePlayer = require('./file-player.js');
-
+var FormatStream = require('./format-stream.js');
+var TimingStream = require('./timing-stream.js');
 
 /**
  * Create and return a RecognizeStream from a File or Blob
@@ -27,7 +28,9 @@ var FilePlayer = require('./file-player.js');
  * @param {Object} options - Also passed to {MediaElementAudioStream} and to {RecognizeStream}
  * @param {String} options.token - Auth Token - see https://github.com/watson-developer-cloud/node-sdk#authorization
  * @param {Blob|File} options.data - the raw audio data as a Blob or File instance
- * @param {Boolean} [options.play=true] - If a file is set, play it locally as it's being uploaded
+ * @param {Boolean} [options.play=false] - If a file is set, play it locally as it's being uploaded
+ * @param {Boolean} [options.format=true] - pipe the text through a {FormatStream} which performs light formatting
+ * @param {Boolean} [options.realtime=options.play] - pipe the text through a {TimingStream} which slows the output down to real-time to match the audio playback.
  *
  * @returns {RecognizeStream}
  */
@@ -36,17 +39,26 @@ module.exports = function recognizeBlob(options) {
     throw new Error("WatsonSpeechToText: missing required parameter: opts.token");
   }
 
-  var recognizeStream  = new RecognizeStream(options);
+  var recognizeStream = new RecognizeStream(options);
+  var stream = new BlobStream(options.data).pipe(recognizeStream);
+
+  if (options.format !== false) {
+    stream = stream.pipe(new FormatStream(options));
+  }
+  if (options.realtime || typeof options.realtime === 'undefined' && options.play) {
+    stream = stream.pipe(new TimingStream(options));
+    start = Date.now();
+  }
 
-  if (options.playFile) {
+  if (options.play) {
     FilePlayer.playFile(options.data).then(function (player) {
       recognizeStream.on('stop', player.stop.bind(player));
     }).catch(function (err) {
       recognizeStream.emit('playback-error', err);
     });
   }
 
-  return new BlobStream(options.data).pipe(recognizeStream);
+  return stream;
 };
 
 
diff --git a/speech-to-text/recognize-element.js b/speech-to-text/recognize-element.js
@@ -18,13 +18,15 @@
 var MediaElementAudioStream = require('./media-element-audio-stream');
 var L16 = require('./webaudio-l16-stream');
 var RecognizeStream = require('./recognize-stream.js');
+var FormatStream = require('./format-stream.js');
 
 /**
  * Recognize audio from a <audio> or <video> element
  *
  * @param {Object} options - Also passed to {MediaElementAudioStream} and to {RecognizeStream}
  * @param {String} options.token - Auth Token - see https://github.com/watson-developer-cloud/node-sdk#authorization
  * @param {MediaElement} options.element - the <video> or <audio> element to play
+ * @param {Boolean} [options.format=true] - pipe the text through a {FormatStream} which performs light formatting
  *
  * @returns {RecognizeStream}
  */
@@ -38,11 +40,15 @@ module.exports = function recognizeElement(options) {
 
   var sourceStream = new MediaElementAudioStream(options.element , options);
 
-  sourceStream
+  var stream = sourceStream
     .pipe(new L16())
     .pipe(recognizeStream);
 
+  if (options.format !== false) {
+    stream = stream.pipe(new FormatStream(options));
+  }
+
   recognizeStream.on('stop', sourceStream.stop.bind(sourceStream));
 
-  return recognizeStream;
+  return stream;;
 };
diff --git a/speech-to-text/recognize-microphone.js b/speech-to-text/recognize-microphone.js
@@ -21,13 +21,15 @@ var getUserMedia = require('./getusermedia');
 var MicrophoneStream = require('microphone-stream');
 var RecognizeStream = require('./recognize-stream.js');
 var L16 = require('./webaudio-l16-stream.js');
+var FormatStream = require('./format-stream.js');
 
 /**
  * Create and return a RecognizeStream from the user's microphone
  * If the options.file is set, it is used instead of the microphone
  *
  * @param {Object} options - Also passed to {MediaElementAudioStream} and to {RecognizeStream}
  * @param {String} options.token - Auth Token - see https://github.com/watson-developer-cloud/node-sdk#authorization
+ * @param {Boolean} [options.format=true] - pipe the text through a {FormatStream} which performs light formatting
  *
  * @returns {RecognizeStream}
  */
@@ -51,7 +53,13 @@ module.exports = function recognizeMicrophone(options) {
     recognizeStream.on('stop', micStream.stop.bind(micStream));
   }).catch(recognizeStream.emit.bind(recognizeStream, 'error'));
 
-  return recognizeStream;
+
+  var stream = recognizeStream;
+  if (options.format !== false) {
+    stream = stream.pipe(new FormatStream(options));
+  }
+
+  return stream;
 };