fixed bug with sending audio after stop, added firefox testing, disabled failing integration tests, misc renaming and debug events

nfriedly · nfriedly · commit f59ab62566b1 · 2016-02-01T10:27:25.000-05:00
diff --git a/dist/watson-speech.js b/dist/watson-speech.js
@@ -5972,7 +5972,7 @@ function MediaElementAudioStream(source, opts) {
    * @see https://developer.mozilla.org/en-US/docs/Web/API/ScriptProcessorNode/onaudioprocess
    * @param {AudioProcessingEvent} e https://developer.mozilla.org/en-US/docs/Web/API/AudioProcessingEvent
    */
-  function recorderProcess(e) {
+  function processAudio(e) {
     // onaudioprocess can be called at least once after we've stopped
     if (recording) {
 
@@ -6001,20 +6001,20 @@ function MediaElementAudioStream(source, opts) {
 
   var context = new AudioContext();
   var audioInput = context.createMediaElementSource(source);
-  var recorder = context.createScriptProcessor(opts.bufferSize, inputChannels, outputChannels);
+  var scriptProcessor = context.createScriptProcessor(opts.bufferSize, inputChannels, outputChannels);
 
-  recorder.onaudioprocess = recorderProcess;
+  scriptProcessor.onaudioprocess = processAudio;
 
   if (!opts.muteSource) {
     var gain = context.createGain();
     audioInput.connect(gain);
     gain.connect(context.destination);
   }
 
-  audioInput.connect(recorder);
+  audioInput.connect(scriptProcessor);
 
   // other half of workaround for chrome bugs
-  recorder.connect(context.destination);
+  scriptProcessor.connect(context.destination);
 
   this.stop = function() {
     recording = false;
@@ -6101,7 +6101,7 @@ module.exports = function promise(stream) {
  */
 
 'use strict';
-var fileReaderStream = require('readable-blob-stream');
+var ReadableBlobStream = require('readable-blob-stream');
 var RecognizeStream = require('./recognize-stream.js');
 var FilePlayer = require('./file-player.js');
 
@@ -6132,8 +6132,8 @@ module.exports = function recognizeBlob(options) {
     });
   }
 
-  return fileReaderStream(options.data).pipe(recognizeStream);
-}
+  return new ReadableBlobStream(options.data).pipe(recognizeStream);
+};
 
 
 
@@ -6372,7 +6372,7 @@ RecognizeStream.prototype.initialize = function () {
 
 
   this.socket.onopen = function () {
-    socket.send(JSON.stringify(openingMessage));
+    self.sendJSON(openingMessage);
     self.emit('connect');
   };
 
@@ -6469,6 +6469,15 @@ RecognizeStream.prototype.initialize = function () {
   this.initialized = true;
 };
 
+RecognizeStream.prototype.sendJSON = function sendJSON(msg) {
+  this.emit('send-json', msg);
+  return this.socket.send(JSON.stringify(msg));
+};
+
+RecognizeStream.prototype.sendData = function sendData(data) {
+  this.emit('send-data', data);
+  return this.socket.send(data);
+};
 
 RecognizeStream.prototype._read = function (size) {
   // there's no easy way to control reads from the underlying library
@@ -6477,8 +6486,12 @@ RecognizeStream.prototype._read = function (size) {
 
 RecognizeStream.prototype._write = function (chunk, encoding, callback) {
   var self = this;
+  if (self.finished) {
+    // can't send any more data after the stop message (although this shouldn't happen normally...)
+    return;
+  }
   if (self.listening) {
-    self.socket.send(chunk);
+    self.sendData(chunk);
     this.afterSend(callback);
   } else {
     if (!this.initialized) {
@@ -6488,7 +6501,7 @@ RecognizeStream.prototype._write = function (chunk, encoding, callback) {
       this.initialize();
     }
     this.once('listening', function () {
-      self.socket.send(chunk);
+      self.sendData(chunk);
       this.afterSend(callback);
     });
   }
@@ -6504,13 +6517,9 @@ RecognizeStream.prototype.afterSend = function afterSend(next) {
   }
 };
 
-RecognizeStream.prototype.stop = function (hard) {
+RecognizeStream.prototype.stop = function () {
   this.emit('stop');
-  if (hard) {
-    this.socket.close();
-  } else {
-    this.finish();
-  }
+  this.finish();
 };
 
 RecognizeStream.prototype.finish = function finish() {
@@ -6522,10 +6531,10 @@ RecognizeStream.prototype.finish = function finish() {
   var self = this;
   var closingMessage = {action: 'stop'};
   if (self.socket) {
-    self.socket.send(JSON.stringify(closingMessage));
+    self.sendJSON(closingMessage);
   } else {
     this.once('connect', function () {
-      self.socket.send(JSON.stringify(closingMessage));
+      self.sendJSON(closingMessage);
     });
   }
 };
diff --git a/examples/public/audio-element-programmatic.html b/examples/public/audio-element-programmatic.html
@@ -0,0 +1,63 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <title>Programmatic new Audio() Example - Watson Speech to Text</title>
+</head>
+<body>
+
+<section>
+    <h2>Transcribe Programmatic new Audio(), Streaming</h2>
+    <p><small><i>The browser must be able to decode and play the audio file.</i></small></p>
+
+    <button id="button">Play and Transcribe</button>
+
+    <h2>Output:</h2>
+    <div id="output">--</div>
+</section>
+
+<script src="watson-speech.js"></script>
+<script src="http://code.jquery.com/jquery-2.2.0.min.js"></script>
+
+<h2>Code for this demo:</h2>
+<pre><code><script style="display: block;">
+$(function() {
+    var $output = $('#output');
+
+    $('#button').click(function () {
+        $.get('/token').then(function (token) {
+            $output.html('');
+
+            var audioElement = new Audio(); // document.createElement('video'); also works here
+            audioElement.src = "audio.wav";
+
+            var stream = WatsonSpeech.SpeechToText.recognizeElement({
+                token: token,
+                element: audioElement
+                // muteSource: true // prevents sound from also playing locally
+            })
+            .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
+
+            // each result gets its own <span> because watson will sometimes go back and change a word as it hears more context
+            var $curSentence = $('<span>&nbsp;</span>').appendTo($output);
+
+            // a result is approximately equivalent to a sentence
+            stream.on('result', function(result) {
+                // update the text for the current sentence with the default alternative.
+                // there may be multiple alternatives but this example app ignores all but the first.
+                $curSentence.html(result.alternatives[0].transcript);
+                if (result.final) {
+                    // if we have the final text for that sentence, start a new one
+                    $curSentence = $('<span/>').appendTo($output);
+                }
+            });
+
+            stream.on('error', function(err) {
+                console.log(err);
+            });
+        });
+    });
+});
+</script></code></pre>
+</body>
+</html>
diff --git a/examples/public/audio-element.html b/examples/public/audio-element.html
@@ -12,7 +12,7 @@ <h2>Transcribe &lt;audio&gt; Element, Streaming</h2>
         Your browser does not support the <code>audio</code> element.
     </audio>
     <button id="button">Play and Transcribe</button>
-    <p><small><i>&lt;video&gt; elements should behave the same as &lt;audio&gt; elements.</i></small></p>
+    <p><small><i>&lt;video&gt; elements should behave the same as &lt;audio&gt; elements. The browser must be able to decode and play the file in either case. </i></small></p>
 
     <h2>Output:</h2>
     <div id="output">--</div>
@@ -33,6 +33,7 @@ <h2>Code for this demo:</h2>
             var stream = WatsonSpeech.SpeechToText.recognizeElement({
                 token: token,
                 element: $('#audio-element')[0]
+                // muteSource: true // prevents sound from also playing locally
             })
             .pipe(new WatsonSpeech.SpeechToText.FormatStream()); // optional
 
diff --git a/examples/public/index.html b/examples/public/index.html
@@ -11,6 +11,7 @@
     <li><a href="file-streaming.html">Transcribe from file, Streaming</a></li>
     <li><a href="file-promise.html">Transcribe from file, Promise</a></li>
     <li><a href="audio-element.html">Transcribe from HTML5 &lt;audio&gt; element, Streaming</a></li>
+    <li><a href="audio-element-programmatic.html">Transcribe from <code>new Audio()</code>, Streaming</a></li>
 </ul>
 
 </body>
diff --git a/package.json b/package.json
@@ -20,6 +20,7 @@
   "devDependencies": {
     "browserify": "^13.0.0",
     "concat-stream": "^1.5.1",
+    "envify": "^3.4.0",
     "eslint": "^1.10.3",
     "eslint-config-google": "^0.3.0",
     "expect.js": "^0.3.1",
@@ -28,6 +29,7 @@
     "karma-browserify": "^5.0.1",
     "karma-chrome-launcher": "^0.2.2",
     "karma-express-http-server": "0.0.1",
+    "karma-firefox-launcher": "^0.1.7",
     "karma-mocha": "^0.2.1",
     "mocha": "^2.4.4",
     "serve-static": "^1.10.2",
diff --git a/speech-to-text/media-element-audio-stream.js b/speech-to-text/media-element-audio-stream.js
@@ -41,7 +41,7 @@ function MediaElementAudioStream(source, opts) {
    * @see https://developer.mozilla.org/en-US/docs/Web/API/ScriptProcessorNode/onaudioprocess
    * @param {AudioProcessingEvent} e https://developer.mozilla.org/en-US/docs/Web/API/AudioProcessingEvent
    */
-  function recorderProcess(e) {
+  function processAudio(e) {
     // onaudioprocess can be called at least once after we've stopped
     if (recording) {
 
@@ -70,20 +70,20 @@ function MediaElementAudioStream(source, opts) {
 
   var context = new AudioContext();
   var audioInput = context.createMediaElementSource(source);
-  var recorder = context.createScriptProcessor(opts.bufferSize, inputChannels, outputChannels);
+  var scriptProcessor = context.createScriptProcessor(opts.bufferSize, inputChannels, outputChannels);
 
-  recorder.onaudioprocess = recorderProcess;
+  scriptProcessor.onaudioprocess = processAudio;
 
   if (!opts.muteSource) {
     var gain = context.createGain();
     audioInput.connect(gain);
     gain.connect(context.destination);
   }
 
-  audioInput.connect(recorder);
+  audioInput.connect(scriptProcessor);
 
   // other half of workaround for chrome bugs
-  recorder.connect(context.destination);
+  scriptProcessor.connect(context.destination);
 
   this.stop = function() {
     recording = false;
diff --git a/speech-to-text/recognize-stream.js b/speech-to-text/recognize-stream.js
@@ -124,7 +124,7 @@ RecognizeStream.prototype.initialize = function () {
 
 
   this.socket.onopen = function () {
-    socket.send(JSON.stringify(openingMessage));
+    self.sendJSON(openingMessage);
     self.emit('connect');
   };
 
@@ -221,6 +221,15 @@ RecognizeStream.prototype.initialize = function () {
   this.initialized = true;
 };
 
+RecognizeStream.prototype.sendJSON = function sendJSON(msg) {
+  this.emit('send-json', msg);
+  return this.socket.send(JSON.stringify(msg));
+};
+
+RecognizeStream.prototype.sendData = function sendData(data) {
+  this.emit('send-data', data);
+  return this.socket.send(data);
+};
 
 RecognizeStream.prototype._read = function (size) {
   // there's no easy way to control reads from the underlying library
@@ -229,8 +238,12 @@ RecognizeStream.prototype._read = function (size) {
 
 RecognizeStream.prototype._write = function (chunk, encoding, callback) {
   var self = this;
+  if (self.finished) {
+    // can't send any more data after the stop message (although this shouldn't happen normally...)
+    return;
+  }
   if (self.listening) {
-    self.socket.send(chunk);
+    self.sendData(chunk);
     this.afterSend(callback);
   } else {
     if (!this.initialized) {
@@ -240,7 +253,7 @@ RecognizeStream.prototype._write = function (chunk, encoding, callback) {
       this.initialize();
     }
     this.once('listening', function () {
-      self.socket.send(chunk);
+      self.sendData(chunk);
       this.afterSend(callback);
     });
   }
@@ -256,13 +269,9 @@ RecognizeStream.prototype.afterSend = function afterSend(next) {
   }
 };
 
-RecognizeStream.prototype.stop = function (hard) {
+RecognizeStream.prototype.stop = function () {
   this.emit('stop');
-  if (hard) {
-    this.socket.close();
-  } else {
-    this.finish();
-  }
+  this.finish();
 };
 
 RecognizeStream.prototype.finish = function finish() {
@@ -274,10 +283,10 @@ RecognizeStream.prototype.finish = function finish() {
   var self = this;
   var closingMessage = {action: 'stop'};
   if (self.socket) {
-    self.socket.send(JSON.stringify(closingMessage));
+    self.sendJSON(closingMessage);
   } else {
     this.once('connect', function () {
-      self.socket.send(JSON.stringify(closingMessage));
+      self.sendJSON(closingMessage);
     });
   }
 };
diff --git a/test/resources/karma.conf.js b/test/resources/karma.conf.js
@@ -32,7 +32,10 @@ module.exports = function(config) {
 
     browserify: {
       debug: true,
-      transform: [ ] // 'brfs', 'browserify-shim'
+      // 'brfs' makes fs.read* work
+      // 'browserify-shim' wraps non-browserify modules
+      // 'envify' makes process.env work
+      transform: [ 'envify' ]
     },
 
 
@@ -61,7 +64,7 @@ module.exports = function(config) {
 
     // start these browsers
     // available browser launchers: https://npmjs.org/browse/keyword/karma-launcher
-    browsers: ['ChromeWithPrerecordedMic'],
+    browsers: ['ChromeWithPrerecordedMic', 'FirefoxAutoGUM'],
 
     // you can define custom flags
     // there's a handy list of chrome flags at
@@ -70,6 +73,13 @@ module.exports = function(config) {
         base: 'Chrome',
         // --no-sandbox is required for travis-ci
         flags: ['--use-fake-device-for-media-stream','--use-fake-ui-for-media-stream', '--use-file-for-fake-audio-capture=test/resources/audio.wav', '--no-sandbox']
+      },
+      // automatically approve getUserMedia calls
+      FirefoxAutoGUM: {
+        base: 'Firefox',
+        prefs: {
+          'media.navigator.permission.disabled': true
+        }
       }
     },
 
diff --git a/test/spec.js b/test/spec.js