// This software is released under the MIT License.
// https://opensource.org/licenses/MIT

/*
Crepe Pitch Detection model
https://github.com/marl/crepe/tree/gh-pages
https://marl.github.io/crepe/crepe.js
*/
10
12
import * as tf from '@tensorflow/tfjs' ;
11
13
12
14
class Crepe {
13
- // in here are the functions to make exposed
14
15
constructor ( audioContext , stream ) {
15
16
this . audioContext = audioContext ;
16
17
this . stream = stream ;
17
- this . initTF ( ) ;
18
+ this . loadModel ( ) ;
18
19
}
19
20
20
- async initTF ( ) {
21
- try {
22
- console . log ( 'Loading Keras model...' ) ;
23
- this . model = await tf . loadModel ( 'model/model.json' ) ;
24
- console . log ( 'Model loading complete' ) ;
25
- } catch ( e ) {
26
- console . error ( e ) ;
27
- }
21
+ async loadModel ( ) {
22
+ this . model = await tf . loadModel ( 'model/model.json' ) ;
28
23
this . initAudio ( ) ;
29
24
}
30
25
31
- // perform resampling the audio to 16000 Hz, on which the model is trained.
32
- // setting a sample rate in AudioContext is not supported by most browsers at the moment.
26
+ initAudio ( ) {
27
+ if ( this . audioContext ) {
28
+ try {
29
+ this . processStream ( this . stream ) ;
30
+ } catch ( e ) {
31
+ throw new Error ( `Error: Could not access microphone - ${ e } ` ) ;
32
+ }
33
+ } else {
34
+ throw new Error ( 'Could not access microphone - getUserMedia not available' ) ;
35
+ }
36
+ }
37
+
38
+ processStream ( stream ) {
39
+ const mic = this . audioContext . createMediaStreamSource ( stream ) ;
40
+ const minBufferSize = ( this . audioContext . sampleRate / 16000 ) * 1024 ;
41
+ let bufferSize = 4 ;
42
+ while ( bufferSize < minBufferSize ) bufferSize *= 2 ;
43
+
44
+ const scriptNode = this . audioContext . createScriptProcessor ( bufferSize , 1 , 1 ) ;
45
+ scriptNode . onaudioprocess = this . processMicrophoneBuffer . bind ( this ) ;
46
+ const gain = this . audioContext . createGain ( ) ;
47
+ gain . gain . setValueAtTime ( 0 , this . audioContext . currentTime ) ;
48
+
49
+ mic . connect ( scriptNode ) ;
50
+ scriptNode . connect ( gain ) ;
51
+ gain . connect ( this . audioContext . destination ) ;
52
+
53
+ if ( this . audioContext . state !== 'running' ) {
54
+ console . warn ( 'User gesture needed to start AudioContext, please click' ) ;
55
+ }
56
+ }
57
+
33
58
static resample ( audioBuffer , onComplete ) {
34
59
const interpolate = ( audioBuffer . sampleRate % 16000 !== 0 ) ;
35
60
const multiplier = audioBuffer . sampleRate / 16000 ;
@@ -39,7 +64,6 @@ class Crepe {
39
64
if ( ! interpolate ) {
40
65
subsamples [ i ] = original [ i * multiplier ] ;
41
66
} else {
42
- // simplistic, linear resampling
43
67
const left = Math . floor ( i * multiplier ) ;
44
68
const right = left + 1 ;
45
69
const p = ( i * multiplier ) - left ;
@@ -51,42 +75,32 @@ class Crepe {
51
75
52
76
processMicrophoneBuffer ( event ) {
53
77
this . results = { } ;
54
- // bin number -> cent value mapping
55
78
const centMapping = tf . add ( tf . linspace ( 0 , 7180 , 360 ) , tf . tensor ( 1997.3794084376191 ) ) ;
56
79
Crepe . resample ( event . inputBuffer , ( resampled ) => {
57
80
tf . tidy ( ( ) => {
58
81
this . running = true ;
59
-
60
- // run the prediction on the model
61
82
const frame = tf . tensor ( resampled . slice ( 0 , 1024 ) ) ;
62
83
const zeromean = tf . sub ( frame , tf . mean ( frame ) ) ;
63
84
const framestd = tf . tensor ( tf . norm ( zeromean ) . dataSync ( ) / Math . sqrt ( 1024 ) ) ;
64
85
const normalized = tf . div ( zeromean , framestd ) ;
65
86
const input = normalized . reshape ( [ 1 , 1024 ] ) ;
66
87
const activation = this . model . predict ( [ input ] ) . reshape ( [ 360 ] ) ;
67
-
68
- // the confidence of voicing activity and the argmax bin
69
88
const confidence = activation . max ( ) . dataSync ( ) [ 0 ] ;
70
89
const center = activation . argMax ( ) . dataSync ( ) [ 0 ] ;
71
90
this . results . confidence = confidence . toFixed ( 3 ) ;
72
91
73
- // slice the local neighborhood around the argmax bin
74
92
const start = Math . max ( 0 , center - 4 ) ;
75
93
const end = Math . min ( 360 , center + 5 ) ;
76
94
const weights = activation . slice ( [ start ] , [ end - start ] ) ;
77
95
const cents = centMapping . slice ( [ start ] , [ end - start ] ) ;
78
96
79
- // take the local weighted average to get the predicted pitch
80
97
const products = tf . mul ( weights , cents ) ;
81
98
const productSum = products . dataSync ( ) . reduce ( ( a , b ) => a + b , 0 ) ;
82
99
const weightSum = weights . dataSync ( ) . reduce ( ( a , b ) => a + b , 0 ) ;
83
100
const predictedCent = productSum / weightSum ;
84
101
const predictedHz = 10 * ( ( predictedCent / 1200.0 ) ** 2 ) ;
85
102
86
- // update
87
103
const result = ( confidence > 0.5 ) ? `${ predictedHz . toFixed ( 3 ) } + Hz` : 'no voice' ;
88
- // const strlen = result.length;
89
- // for (let i = 0; i < 11 - strlen; i += 1) result = result;
90
104
this . results . result = result ;
91
105
} ) ;
92
106
} ) ;
@@ -95,55 +109,8 @@ class Crepe {
95
109
getResults ( ) {
96
110
return this . results ;
97
111
}
98
-
99
- processStream ( stream ) {
100
- console . log ( 'Setting up AudioContext ...' ) ;
101
- console . log ( `Audio context sample rate = + ${ this . audioContext . sampleRate } ` ) ;
102
- const mic = this . audioContext . createMediaStreamSource ( stream ) ;
103
-
104
- // We need the buffer size that is a power of two
105
- // and is longer than 1024 samples when resampled to 16000 Hz.
106
- // In most platforms where the sample rate is 44.1 kHz or 48 kHz,
107
- // this will be 4096, giving 10-12 updates/sec.
108
- const minBufferSize = ( this . audioContext . sampleRate / 16000 ) * 1024 ;
109
- let bufferSize = 4 ;
110
- while ( bufferSize < minBufferSize ) bufferSize *= 2 ;
111
- console . log ( `Buffer size = ${ bufferSize } ` ) ;
112
- const scriptNode = this . audioContext . createScriptProcessor ( bufferSize , 1 , 1 ) ;
113
- scriptNode . onaudioprocess = this . processMicrophoneBuffer . bind ( this ) ;
114
- // It seems necessary to connect the stream to a sink
115
- // for the pipeline to work, contrary to documentataions.
116
- // As a workaround, here we create a gain node with zero gain,
117
- // and connect temp to the system audio output.
118
- const gain = this . audioContext . createGain ( ) ;
119
- gain . gain . setValueAtTime ( 0 , this . audioContext . currentTime ) ;
120
-
121
- mic . connect ( scriptNode ) ;
122
- scriptNode . connect ( gain ) ;
123
- gain . connect ( this . audioContext . destination ) ;
124
-
125
- if ( this . audioContext . state === 'running' ) {
126
- console . log ( 'Running ...' ) ;
127
- } else {
128
- console . error ( 'User gesture needed to start AudioContext, please click' ) ;
129
- // user gesture (like click) is required to start AudioContext, in some browser versions
130
- // status('<a href="javascript:crepe.resume();" style="color:red;">*
131
- // Click here to start the demo *</a>')
132
- }
133
- }
134
-
135
- initAudio ( ) {
136
- if ( this . audioContext ) {
137
- console . log ( 'Initializing audio' ) ;
138
- try {
139
- this . processStream ( this . stream ) ;
140
- } catch ( e ) {
141
- console . error ( 'Error: Could not access microphone - ' , e ) ;
142
- }
143
- } else {
144
- console . error ( 'Could not access microphone - getUserMedia not available' ) ;
145
- }
146
- }
147
112
}
148
113
149
/**
 * Factory entry point hiding the Crepe class behind a plain callable.
 *
 * @param {AudioContext} audioContext - Web Audio context used for capture.
 * @param {MediaStream} stream - Microphone input stream.
 * @returns {Crepe} A detector that begins loading its model immediately.
 */
function crepe(audioContext, stream) {
  return new Crepe(audioContext, stream);
}

export default crepe;