watson-developer-cloud
diff --git a/‎CHANGELOG.md
Lines changed: 9 additions & 0 deletions b/‎CHANGELOG.md
Lines changed: 9 additions & 0 deletions
diff --git a/‎dist/watson-speech.js
Lines changed: 270 additions & 132 deletions b/‎dist/watson-speech.js
Lines changed: 270 additions & 132 deletions
diff --git a/‎examples/static/index.html
Lines changed: 2 additions & 1 deletion b/‎examples/static/index.html
Lines changed: 2 additions & 1 deletion
diff --git a/‎examples/static/microphone-streaming-object-extracted-to-console.html
Lines changed: 56 additions & 0 deletions b/‎examples/static/microphone-streaming-object-extracted-to-console.html
Lines changed: 56 additions & 0 deletions
diff --git a/‎examples/static/microphone-streaming-text-to-console.html
Lines changed: 2 additions & 1 deletion b/‎examples/static/microphone-streaming-text-to-console.html
Lines changed: 2 additions & 1 deletion
diff --git a/‎speech-to-text/format-stream.js
Lines changed: 27 additions & 23 deletions b/‎speech-to-text/format-stream.js
Lines changed: 27 additions & 23 deletions
diff --git a/‎speech-to-text/recognize-file.js
Lines changed: 17 additions & 0 deletions b/‎speech-to-text/recognize-file.js
Lines changed: 17 additions & 0 deletions
diff --git a/‎speech-to-text/recognize-microphone.js
Lines changed: 11 additions & 1 deletion b/‎speech-to-text/recognize-microphone.js
Lines changed: 11 additions & 1 deletion
diff --git a/‎speech-to-text/recognize-stream.js
Lines changed: 39 additions & 45 deletions b/‎speech-to-text/recognize-stream.js
Lines changed: 39 additions & 45 deletions
@@ -1,5 +1,14 @@
 # Changelog
 
+
+### v0.22.0
+* Breaking: RecognizeStream now emits the original JSON message rather than the extracted results objects.
+* New ResultExtractor stream that can provide the old behavior
+* New `extractResults` option on recognizeFile/recognizeMicrophone enables this.
+* Removed deprecated `result` and `results` events from RecognizeStream.
+* Removed `receive-json` event from RecognizeStream because it now duplicates the behavior of the `data` event.
+
+
 ### v0.21.0
 * Made FormatStream formatting methods available outside of streaming interface
 
 
@@ -13,7 +13,8 @@ <h2>Speech to Text</h2>
     <li><a href="microphone-alternatives.html">Transcribe from Microphone, with Alternatives</a></li>
     <li><a href="microphone-word-confidence.html">Transcribe from Microphone, with Word Confidence</a></li>
     <li><a href="microphone-streaming-text-to-console.html">Transcribe from Microphone, send text to console</a></li>
-    <li><a href="microphone-streaming-object-to-console.html">Transcribe from Microphone, send JSON to console (includes text and metadata)</a></li>
+    <li><a href="microphone-streaming-object-to-console.html">Transcribe from Microphone, send JSON to console (includes text and metadata; v0.22+ format)</a></li>
+    <li><a href="microphone-streaming-object-extracted-to-console.html">Transcribe from Microphone, send JSON to console with results extracted (pre-v0.22 format)</a></li>
     <li><a href="microphone-streaming-model.html">Transcribe from Microphone, Streaming with chosen model</a></li>
     <li><a href="file-streaming.html">Transcribe from file, Streaming</a></li>
     <li><a href="file-realtime-vs-no-realtime.html">Transcribe from file, Comparing <code>{realtime: true}</code> to <code>{realtime: false}</code></a></li>
 
@@ -0,0 +1,56 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <title>Watson Speech to Text client example</title>
+</head>
+<body>
+
+<section>
+    <h2>Transcribe from Microphone</h2>
+    <button id="button">Start Microphone Transcription</button>
+    <button id="stop">Stop</button>
+
+    <h2>Output:</h2>
+    <div id="output">Open your browser's console to view the output. The results are simplified by removing the outer JSON (this was the default behavior before v0.22).</div>
+</section>
+
+<script src="watson-speech.js"></script>
+<!-- window.fetch polyfill for IE/Edge & Older Chrome/FireFox -->
+<script src="bower_components/fetch/fetch.js"></script>
+
+<h2>Code for this demo:</h2>
+
+<pre><code><script style="display: block;">
+document.querySelector('#button').onclick = function () {
+
+  fetch('/api/speech-to-text/token')
+  .then(function(response) {
+      return response.text();
+  }).then(function (token) {
+
+    var stream = WatsonSpeech.SpeechToText.recognizeMicrophone({
+        token: token,
+        objectMode: true, // send objects instead of text
+        extractResults: true // convert {results: [{alternatives:[...]}], result_index: 0} to {alternatives: [...], index: 0}
+    });
+
+    stream.on('data', function(data) {
+      console.log(data);
+    });
+
+    stream.on('error', function(err) {
+        console.log(err);
+    });
+
+    document.querySelector('#stop').onclick = stream.stop.bind(stream);
+
+  }).catch(function(error) {
+      console.log(error);
+  });
+};
+
+</script></code></pre>
+
+</body>
+</html>
@@ -30,7 +30,8 @@ <h2>Code for this demo:</h2>
   }).then(function (token) {
 
     var stream = WatsonSpeech.SpeechToText.recognizeMicrophone({
-        token: token
+        token: token,
+        speaker_labels: true
     });
 
     stream.setEncoding('utf8'); // get text instead of Buffers for on data events
 
@@ -113,32 +113,36 @@ FormatStream.prototype.formatString = function(str, isInterim) {
  *
  * May be used outside of Node.js streams
  *
- * @param {Object} result
+ * @param {Object} data
  * @returns {Object}
  */
-FormatStream.prototype.formatResult = function formatResult(result) {
-  result = clone(result);
-  result.alternatives = result.alternatives.map(function(alt) {
-    alt.transcript = this.formatString(alt.transcript, !result.final);
-    if (alt.timestamps) {
-      alt.timestamps = alt.timestamps.map(function(ts, i, arr) {
-        // timestamps is an array of arrays, each sub-array is in the form ["word", startTime, endTime]'
-        ts[0] = this.clean(ts[0]);
-        if (i === 0) {
-          ts[0] = this.capitalize(ts[0]);
+FormatStream.prototype.formatResult = function formatResult(data) {
+  data = clone(data);
+  if (Array.isArray(data.results)) {
+    data.results.forEach(function(result) {
+      result.alternatives = result.alternatives.map(function(alt) {
+        alt.transcript = this.formatString(alt.transcript, !result.final);
+        if (alt.timestamps) {
+          alt.timestamps = alt.timestamps.map(function(ts, i, arr) {
+            // timestamps is an array of arrays, each sub-array is in the form ["word", startTime, endTime]
+            ts[0] = this.clean(ts[0]);
+            if (i === 0) {
+              ts[0] = this.capitalize(ts[0]);
+            }
+            if (i === arr.length - 1 && result.final) {
+              ts[0] = this.period(ts[0]);
+            }
+            return ts;
+          }, this).filter(function(ts) {
+            return ts[0]; // remove any timestamps without a word (due to cleaning out junk words)
+
+          });
         }
-        if (i === arr.length - 1 && result.final) {
-          ts[0] = this.period(ts[0]);
-        }
-        return ts;
-      }, this).filter(function(ts) {
-        return ts[0]; // remove any timestamps without a word (due to cleaning out junk words)
-
-      });
-    }
-    return alt;
-  }, this);
-  return result;
+        return alt;
+      }, this);
+    }, this);
+  }
+  return data;
 };
 
 FormatStream.prototype.promise = require('./to-promise');
 
@@ -22,6 +22,7 @@ var FormatStream = require('./format-stream.js');
 var TimingStream = require('./timing-stream.js');
 var assign = require('object.assign/polyfill')();
 var WritableElementStream = require('./writable-element-stream');
+var ResultExtractor = require('./result-extractor');
 
 /**
  * @module watson-speech/speech-to-text/recognize-file
@@ -38,6 +39,7 @@ var WritableElementStream = require('./writable-element-stream');
  * @param {Boolean} [options.format=true] - pipe the text through a {FormatStream} which performs light formatting. Also controls smart_formatting option unless explicitly set.
  * @param {Boolean} [options.realtime=options.play] - pipe the text through a {TimingStream} which slows the output down to real-time to match the audio playback.
  * @param {String|DOMElement} [options.outputElement] pipe the text to a WriteableElementStream targeting the specified element. Also defaults objectMode to true to enable interim results.
+ * @param {Boolean} [options.extractResults=false] pipe results through a ResultExtractor stream to simplify the objects. (Default behavior before v0.22) Requires objectMode.
  *
  * @returns {RecognizeStream|FormatStream|TimingStream}
  */
@@ -50,6 +52,10 @@ module.exports = function recognizeFile(options) { // eslint-disable-line comple
   if (options.outputElement && options.objectMode !== false) {
     options.objectMode = true;
   }
+  // the ResultExtractor only works in objectMode
+  if (options.extractResults && options.objectMode !== false) {
+    options.objectMode = true;
+  }
 
   // default format to true (capitals and periods)
   // default smart_formatting to options.format value (dates, currency, etc.)
@@ -97,6 +103,17 @@ module.exports = function recognizeFile(options) { // eslint-disable-line comple
     stream.pipe(new WritableElementStream(options));
   }
 
+  if(options.extractResults) {
+    var stop = stream.stop.bind(stream);
+    stream = stream.pipe(new ResultExtractor());
+    stream.stop = stop;
+  }
+
+  // Capture error from original RecognizeStream
+  if (stream !== recognizeStream) {
+    recognizeStream.on('error', stream.emit.bind(stream, 'error'));
+  }
+
   return stream;
 };
 
 
@@ -23,6 +23,7 @@ var FormatStream = require('./format-stream.js');
 var assign = require('object.assign/polyfill')();
 var WritableElementStream = require('./writable-element-stream');
 var Writable = require('stream').Writable;
+var ResultExtractor = require('./result-extractor');
 
 var preservedMicStream;
 var bitBucket = new Writable({
@@ -46,6 +47,7 @@ var bitBucket = new Writable({
  * @param {Boolean} [options.format=true] - pipe the text through a {FormatStream} which performs light formatting. Also controls smart_formatting option unless explicitly set.
  * @param {Boolean} [options.keepMicrophone=false] - keeps an internal reference to the microphone stream to reuse in subsequent calls (prevents multiple permissions dialogs in firefox)
  * @param {String|DOMElement} [options.outputElement] pipe the text to a WriteableElementStream targeting the specified element. Also defaults objectMode to true to enable interim results.
+ * @param {Boolean} [options.extractResults=false] pipe results through a ResultExtractor stream to simplify the objects. (Default behavior before v0.22) Requires objectMode.
  *
  * @returns {RecognizeStream|FormatStream}
  */
@@ -58,6 +60,10 @@ module.exports = function recognizeMicrophone(options) {
   if (options.outputElement && options.objectMode !== false) {
     options.objectMode = true;
   }
+  // the ResultExtractor only works in objectMode
+  if (options.extractResults && options.objectMode !== false) {
+    options.objectMode = true;
+  }
 
   // default format to true (capitals and periods)
   // default smart_formatting to options.format value (dates, currency, etc.)
@@ -97,13 +103,16 @@ module.exports = function recognizeMicrophone(options) {
   var stream = recognizeStream;
   if (options.format) {
     stream = stream.pipe(new FormatStream(options));
-    stream.stop = recognizeStream.stop.bind(recognizeStream);
   }
 
   if (options.outputElement) {
     stream.pipe(new WritableElementStream(options));
   }
 
+  if(options.extractResults) {
+    stream = stream.pipe(new ResultExtractor());
+  }
+
   getMicStream.catch(function(err) {
     stream.emit('error', err);
   });
@@ -144,6 +153,7 @@ module.exports = function recognizeMicrophone(options) {
   // Capture error from original RecognizeStream
   if (stream !== recognizeStream) {
     recognizeStream.on('error', stream.emit.bind(stream, 'error'));
+    stream.stop = recognizeStream.stop.bind(recognizeStream);
   }
 
   return stream;
 
@@ -25,10 +25,27 @@ var contentType = require('./content-type');
 var defaults = require('defaults');
 var qs = require('../util/querystring.js');
 
-var OPENING_MESSAGE_PARAMS_ALLOWED = ['continuous', 'max_alternatives', 'timestamps', 'word_confidence', 'inactivity_timeout',
-  'content-type', 'interim_results', 'keywords', 'keywords_threshold', 'word_alternatives_threshold', 'profanity_filter', 'smart_formatting'];
-
-var QUERY_PARAMS_ALLOWED = ['customization_id','model', 'watson-token']; // , 'X-Watson-Learning-Opt-Out' - should be allowed but currently isn't due to a service bug
+var OPENING_MESSAGE_PARAMS_ALLOWED = [
+  'continuous',
+  'inactivity_timeout',
+  'timestamps',
+  'word_confidence',
+  'content-type',
+  'interim_results',
+  'keywords',
+  'keywords_threshold',
+  'max_alternatives',
+  'word_alternatives_threshold',
+  'profanity_filter',
+  'smart_formatting'
+];
+
+var QUERY_PARAMS_ALLOWED = [
+  'customization_id',
+  'model',
+  'watson-token',
+  'X-Watson-Learning-Opt-Out'
+];
 
 
 /**
@@ -123,7 +140,7 @@ var QUERY_PARAMS_ALLOWED = ['customization_id','model', 'watson-token']; // , 'X
  * @param {Boolean} [options.profanity_filter=false] - set to true to filter out profanity and replace the words with *'s
  * @param {Number} [options.inactivity_timeout=30] - how many seconds of silence before automatically closing the stream (even if continuous is true). use -1 for infinity
  * @param {Boolean} [options.readableObjectMode=false] - emit `result` objects instead of string Buffers for the `data` events. Changes several other defaults.
- * @param {Number} [options.X-WDC-PL-OPT-OUT=0] - set to 1 to opt-out of allowing Watson to use this request to improve it's services
+ * @param {Boolean} [options.X-Watson-Learning-Opt-Out=false] - set to true to opt-out of allowing Watson to use this request to improve its services
  * @param {Boolean} [options.smart_formatting=false] - formats numeric values such as dates, times, currency, etc.
  * @param {String} [options.customization_id] - not yet supported on the public STT service
  *
@@ -278,12 +295,6 @@ RecognizeStream.prototype.initialize = function() {
       return emitError('Invalid JSON received from service:', frame, jsonEx);
     }
 
-    /**
-     * @event RecognizeStream#receive-json
-     * @param {Object} msg - the raw JSON received from Watson - sometimes useful for debugging
-     */
-    self.emit('receive-json', data);
-
     if (data.error) {
       emitError(data.error, frame);
     } else if (data.state === 'listening') {
@@ -296,43 +307,26 @@ RecognizeStream.prototype.initialize = function() {
         self.listening = true;
         self.emit('listening');
       }
-    } else if (data.results) {
-      /**
-       * Object with array of interim or final results, possibly including confidence scores, alternatives, and word timing. May have no results at all for empty audio files.
-       * @event RecognizeStream#results
-       * @param {Object} results
-       * @deprecated - use objectMode and listen for the 'data' event instead
-       */
-      self.emit('results', data.results);
-
-      // note: currently there is always either 0 or 1 entries in the results array. However, this may change in the future.
-      data.results.forEach(function(result) {
-        result.index = data.result_index;
+    } else {
+      if (options.objectMode || options.readableObjectMode) {
         /**
          * Object with interim or final results, possibly including confidence scores, alternatives, and word timing.
-         * @event RecognizeStream#results
-         * @param {Object} results
-         * @deprecated - use objectMode and listen for the 'data' event instead
+         * @event RecognizeStream#data
+         * @param {Object} data
          */
-        self.emit('result', result);
-        if (options.objectMode || options.readableObjectMode) {
-          /**
-           * Object with interim or final results, possibly including confidence scores, alternatives, and word timing.
-           * @event RecognizeStream#data
-           * @param {Object} data
-           */
-          self.push(result);
-        } else if (result.final && result.alternatives) {
-          /**
-           * Finalized text
-           * @event RecognizeStream#data
-           * @param {String} transcript
-           */
-          self.push(result.alternatives[0].transcript, 'utf8');
-        }
-      });
-    } else {
-      emitError('Unrecognised message from server', frame);
+        self.push(data);
+      } else if (Array.isArray(data.results)) {
+        data.results.forEach(function(result) {
+          if (result.final && result.alternatives) {
+            /**
+             * Finalized text
+             * @event RecognizeStream#data
+             * @param {String} transcript
+             */
+            self.push(result.alternatives[0].transcript, 'utf8');
+          }
+        });
+      }
     }
   };