ml5js
diff --git a/‎package-lock.json‎
Lines changed: 59 additions & 26 deletions b/‎package-lock.json‎
Lines changed: 59 additions & 26 deletions
diff --git a/‎package.json‎
Lines changed: 4 additions & 3 deletions b/‎package.json‎
Lines changed: 4 additions & 3 deletions
diff --git a/‎src/FeatureExtractor/Mobilenet.js‎
Lines changed: 7 additions & 4 deletions b/‎src/FeatureExtractor/Mobilenet.js‎
Lines changed: 7 additions & 4 deletions
diff --git a/‎src/ImageClassifier/darknet.js‎
Lines changed: 118 additions & 0 deletions b/‎src/ImageClassifier/darknet.js‎
Lines changed: 118 additions & 0 deletions
diff --git a/‎src/ImageClassifier/index.js‎
Lines changed: 18 additions & 7 deletions b/‎src/ImageClassifier/index.js‎
Lines changed: 18 additions & 7 deletions
diff --git a/‎src/PitchDetection/index.js‎
Lines changed: 1 addition & 1 deletion b/‎src/PitchDetection/index.js‎
Lines changed: 1 addition & 1 deletion
@@ -86,9 +86,10 @@
     ]
   },
   "dependencies": {
-    "@tensorflow-models/mobilenet": "0.1.0",
-    "@tensorflow-models/posenet": "0.1.3",
-    "@tensorflow/tfjs": "0.11.4",
+    "@magenta/sketch": "^0.1.2",
+    "@tensorflow-models/mobilenet": "0.2.2",
+    "@tensorflow-models/posenet": "0.2.2",
+    "@tensorflow/tfjs": "0.13.0",
     "events": "^3.0.0"
   }
 }
@@ -95,7 +95,7 @@ class Mobilenet {
     if (inputOrLabel instanceof HTMLImageElement || inputOrLabel instanceof HTMLVideoElement) {
       imgToAdd = inputOrLabel;
     } else if (typeof inputOrLabel === 'object' && (inputOrLabel.elt instanceof HTMLImageElement || inputOrLabel.elt instanceof HTMLVideoElement)) {
-      imgToAdd = inputOrLabel;
+      imgToAdd = inputOrLabel.elt;
     } else if (typeof inputOrLabel === 'string' || typeof inputOrLabel === 'number') {
       imgToAdd = this.video;
       label = inputOrLabel;
@@ -121,7 +121,8 @@ class Mobilenet {
   async addImageInternal(imgToAdd, label) {
     await this.ready;
     tf.tidy(() => {
-      const processedImg = imgToTensor(imgToAdd);
+      const imageResize = (imgToAdd === this.video) ? null : [IMAGESIZE, IMAGESIZE];
+      const processedImg = imgToTensor(imgToAdd, imageResize);
       const prediction = this.mobilenetFeatures.predict(processedImg);
 
       let y;
@@ -243,7 +244,8 @@ class Mobilenet {
     await tf.nextFrame();
     this.isPredicting = true;
     const predictedClass = tf.tidy(() => {
-      const processedImg = imgToTensor(imgToPredict);
+      const imageResize = (imgToPredict === this.video) ? null : [IMAGESIZE, IMAGESIZE];
+      const processedImg = imgToTensor(imgToPredict, imageResize);
       const activation = this.mobilenetFeatures.predict(processedImg);
       const predictions = this.customModel.predict(activation);
       return predictions.as1D().argMax();
@@ -281,7 +283,8 @@ class Mobilenet {
     await tf.nextFrame();
     this.isPredicting = true;
     const predictedClass = tf.tidy(() => {
-      const processedImg = imgToTensor(imgToPredict);
+      const imageResize = (imgToPredict === this.video) ? null : [IMAGESIZE, IMAGESIZE];
+      const processedImg = imgToTensor(imgToPredict, imageResize);
       const activation = this.mobilenetFeatures.predict(processedImg);
       const predictions = this.customModel.predict(activation);
       return predictions.as1D();
 
@@ -0,0 +1,118 @@
+// Copyright (c) 2018 ml5
+//
+// This software is released under the MIT License.
+// https://opensource.org/licenses/MIT
+
+import * as tf from '@tensorflow/tfjs';
+import IMAGENET_CLASSES_DARKNET from '../utils/IMAGENET_CLASSES_DARKNET';
+
+const DEFAULTS = { // Model locations and input sizes for the two Darknet variants.
+  DARKNET_URL: 'https://rawgit.com/ml5js/ml5-data-and-models/master/models/darknetclassifier/darknetreference/model.json', // loaded for version 'reference'. NOTE(review): rawgit.com was announced as retired; confirm this host still resolves.
+  DARKNET_TINY_URL: 'https://rawgit.com/ml5js/ml5-data-and-models/master/models/darknetclassifier/darknettiny/model.json', // loaded for version 'tiny'. NOTE(review): same rawgit.com concern; confirm.
+  IMAGE_SIZE_DARKNET: 256, // input edge length used when version is 'reference'
+  IMAGE_SIZE_DARKNET_TINY: 224, // input edge length used when version is 'tiny'
+};
+
+async function getTopKClasses(logits, topK) {
+  const values = await logits.data();
+  const valuesAndIndices = [];
+  for (let i = 0; i < values.length; i += 1) {
+    valuesAndIndices.push({
+      value: values[i],
+      index: i,
+    });
+  }
+  valuesAndIndices.sort((a, b) => b.value - a.value);
+
+  const topkValues = new Float32Array(topK);
+  const topkIndices = new Int32Array(topK);
+  for (let i = 0; i < topK; i += 1) {
+    topkValues[i] = valuesAndIndices[i].value;
+    topkIndices[i] = valuesAndIndices[i].index;
+  }
+
+  const topClassesAndProbs = [];
+  for (let i = 0; i < topkIndices.length; i += 1) {
+    topClassesAndProbs.push({
+      className: IMAGENET_CLASSES_DARKNET[topkIndices[i]],
+      probability: topkValues[i],
+    });
+  }
+  return topClassesAndProbs;
+}
+
+function preProcess(img, size) {
+  let image;
+  if (!(img instanceof tf.Tensor)) {
+    if (img instanceof HTMLImageElement || img instanceof HTMLVideoElement) {
+      image = tf.fromPixels(img);
+    } else if (typeof img === 'object' && (img.elt instanceof HTMLImageElement || img.elt instanceof HTMLVideoElement)) {
+      image = tf.fromPixels(img.elt); // Handle p5.js image and video.
+    }
+  } else {
+    image = img;
+  }
+  const normalized = image.toFloat().div(tf.scalar(255));
+  let resized = normalized;
+  if (normalized.shape[0] !== size || normalized.shape[1] !== size) {
+    const alignCorners = true;
+    resized = tf.image.resizeBilinear(normalized, [size, size], alignCorners);
+  }
+  const batched = resized.reshape([1, size, size, 3]);
+  return batched;
+}
+
+export class Darknet {
+  constructor(version) {
+    this.version = version;
+    switch (this.version) {
+      case 'reference':
+        this.imgSize = DEFAULTS.IMAGE_SIZE_DARKNET;
+        break;
+      case 'tiny':
+        this.imgSize = DEFAULTS.IMAGE_SIZE_DARKNET_TINY;
+        break;
+      default:
+        break;
+    }
+  }
+
+  async load() {
+    switch (this.version) {
+      case 'reference':
+        this.model = await tf.loadModel(DEFAULTS.DARKNET_URL);
+        break;
+      case 'tiny':
+        this.model = await tf.loadModel(DEFAULTS.DARKNET_TINY_URL);
+        break;
+      default:
+        break;
+    }
+
+    // Warmup the model.
+    const result = tf.tidy(() => this.model.predict(tf.zeros([1, this.imgSize, this.imgSize, 3])));
+    await result.data();
+    result.dispose();
+  }
+
+  async classify(img, topk = 3) {
+    const logits = tf.tidy(() => {
+      const imgData = preProcess(img, this.imgSize);
+      const predictions = this.model.predict(imgData);
+      return tf.softmax(predictions);
+    });
+    const classes = await getTopKClasses(logits, topk);
+    logits.dispose();
+    return classes;
+  }
+}
+
+export async function load(version) {
+  if (version !== 'reference' && version !== 'tiny') {
+    throw new Error('Please select a version: darknet-reference or darknet-tiny');
+  }
+
+  const darknet = new Darknet(version);
+  await darknet.load();
+  return darknet;
+}
@@ -9,6 +9,7 @@ Image Classifier using pre-trained networks
 
 import * as tf from '@tensorflow/tfjs';
 import * as mobilenet from '@tensorflow-models/mobilenet';
+import * as darknet from './darknet';
 import callCallback from '../utils/callcallback';
 
 const DEFAULTS = {
@@ -23,14 +24,24 @@ class ImageClassifier {
   constructor(modelName, video, options, callback) {
     this.modelName = modelName;
     this.video = video;
-    this.version = options.version || DEFAULTS[this.modelName].version;
-    this.alpha = options.alpha || DEFAULTS[this.modelName].alpha;
-    this.topk = options.topk || DEFAULTS[this.modelName].topk;
     this.model = null;
-    if (this.modelName === 'mobilenet') {
-      this.modelToUse = mobilenet;
-    } else {
-      this.modelToUse = null;
+    switch (this.modelName) {
+      case 'mobilenet':
+        this.modelToUse = mobilenet;
+        this.version = options.version || DEFAULTS.mobilenet.version;
+        this.alpha = options.alpha || DEFAULTS.mobilenet.alpha;
+        this.topk = options.topk || DEFAULTS.mobilenet.topk;
+        break;
+      case 'darknet':
+        this.version = 'reference'; // this a 28mb model
+        this.modelToUse = darknet;
+        break;
+      case 'darknet-tiny':
+        this.version = 'tiny'; // this a 4mb model
+        this.modelToUse = darknet;
+        break;
+      default:
+        this.modelToUse = null;
     }
     // Load the model
     this.ready = callCallback(this.loadModel(), callback);
 
@@ -79,7 +79,7 @@ class PitchDetection {
         const productSum = products.dataSync().reduce((a, b) => a + b, 0);
         const weightSum = weights.dataSync().reduce((a, b) => a + b, 0);
         const predictedCent = productSum / weightSum;
-        const predictedHz = 10 * ((predictedCent / 1200.0) ** 2);
+        const predictedHz = 10 * (2 ** (predictedCent / 1200.0));
 
         const frequency = (confidence > 0.5) ? predictedHz : null;
         this.frequency = frequency;
Original file line number	Diff line number	Diff line change
`@@ -86,9 +86,10 @@`
`86`	`86`	`]`
`87`	`87`	`},`
`88`	`88`	`"dependencies": {`
`89`		`- "@tensorflow-models/mobilenet": "0.1.0",`
`90`		`- "@tensorflow-models/posenet": "0.1.3",`
`91`		`- "@tensorflow/tfjs": "0.11.4",`
	`89`	`+ "@magenta/sketch": "^0.1.2",`
	`90`	`+ "@tensorflow-models/mobilenet": "0.2.2",`
	`91`	`+ "@tensorflow-models/posenet": "0.2.2",`
	`92`	`+ "@tensorflow/tfjs": "0.13.0",`
`92`	`93`	`"events": "^3.0.0"`
`93`	`94`	`}`
`94`	`95`	`}`