|
| 1 | +// Copyright (c) 2018 ml5 |
| 2 | +// |
| 3 | +// This software is released under the MIT License. |
| 4 | +// https://opensource.org/licenses/MIT |
| 5 | + |
| 6 | +/* |
| 7 | +PoseDetection |
| 8 | +Ported from pose-detection at Tensorflow.js |
| 9 | +*/ |
| 10 | + |
| 11 | +import EventEmitter from "events"; |
| 12 | +import * as tf from "@tensorflow/tfjs"; |
| 13 | +import * as bodyPoseDetection from "@tensorflow-models/pose-detection"; |
| 14 | +import callCallback from "../utils/callcallback"; |
| 15 | +import handleArguments from "../utils/handleArguments"; |
| 16 | +import { mediaReady } from "../utils/imageUtilities"; |
| 17 | + |
class PoseDetection extends EventEmitter {
  /**
   * @typedef {Object} options
   * @property {string} modelType - Optional. Specify what model variant to load from. Default: 'MULTIPOSE_LIGHTNING'.
   * @property {boolean} enableSmoothing - Optional. Whether to use temporal filter to smooth keypoints across frames. Default: true.
   * @property {string} modelUrl - Optional. A string that specifies custom url of the model. Default to load from tf.hub.
   * @property {number} minPoseScore - Optional. The minimum confidence score for a pose to be detected. Default: 0.25.
   * @property {number} multiPoseMaxDimension - Optional. The target maximum dimension to use as the input to the multi-pose model. Must be a multiple of 32. Default: 256.
   * @property {boolean} enableTracking - Optional. Track each person across the frame with a unique ID. Default: true.
   * @property {string} trackerType - Optional. Specify what type of tracker to use. Default: 'boundingBox'.
   * @property {Object} trackerConfig - Optional. Specify tracker configurations. Use tf.js setting by default.
   */

  /**
   * Create a PoseDetection model.
   * @param {HTMLVideoElement | p5.Video} [video] - Optional. A HTML video element or a p5 video element.
   * @param {options} [options] - Optional. An object describing a model accuracy and performance.
   * @param {function} [callback] - Optional. A function to run once the model has been loaded.
   *    If no callback is provided, it will return a promise that will be resolved once the
   *    model has loaded.
   */
  constructor(video, options, callback) {
    super();

    this.video = video;
    this.model = null;
    this.modelReady = false;
    // Default to an empty object so loadModel() can safely read config
    // properties when the caller omits the (optional) options argument.
    this.config = options ?? {};

    this.ready = callCallback(this.loadModel(), callback);
  }

  /**
   * Load the MoveNet detector model and set it to this.model.
   * Starts the continuous prediction loop if a video was provided.
   * @return {this} the detector model.
   */
  async loadModel() {
    const pipeline = bodyPoseDetection.SupportedModels.MoveNet;
    // Set the config to user defined or default values
    const modelConfig = {
      enableSmoothing: this.config.enableSmoothing ?? true,
      modelUrl: this.config.modelUrl,
      minPoseScore: this.config.minPoseScore ?? 0.25,
      multiPoseMaxDimension: this.config.multiPoseMaxDimension ?? 256,
      enableTracking: this.config.enableTracking ?? true,
      trackerType: this.config.trackerType ?? "boundingBox",
      trackerConfig: this.config.trackerConfig,
    };
    // Use the multi-pose lightning model by default; unrecognized
    // modelType strings also fall through to the default.
    switch (this.config.modelType) {
      case "SINGLEPOSE_LIGHTNING":
        modelConfig.modelType =
          bodyPoseDetection.movenet.modelType.SINGLEPOSE_LIGHTNING;
        break;
      case "SINGLEPOSE_THUNDER":
        modelConfig.modelType =
          bodyPoseDetection.movenet.modelType.SINGLEPOSE_THUNDER;
        break;
      default:
        modelConfig.modelType =
          bodyPoseDetection.movenet.modelType.MULTIPOSE_LIGHTNING;
    }
    // Load the detector model
    await tf.setBackend("webgl");
    this.model = await bodyPoseDetection.createDetector(pipeline, modelConfig);
    this.modelReady = true;

    if (this.video) {
      // NOTE: intentionally not awaited — kicks off the endless
      // frame-by-frame prediction loop for the attached video.
      this.predict();
    }

    return this;
  }

  //TODO: Add named keypoints to a MoveNet pose object

  /**
   * Given an image or video, returns an array of objects containing pose estimations.
   * When a video was attached at construction time, this loops on every frame
   * and emits a "pose" event instead of resolving with a single result.
   * @param {HTMLVideoElement | p5.Video | function} [inputOr] - An HTML or p5.js image, video, or canvas element to run the prediction on.
   * @param {function} [cb] - A callback function to handle the predictions.
   * @return {Promise<Array>} the pose estimation results (single-shot mode only).
   */
  async predict(inputOr, cb) {
    const { image, callback } = handleArguments(this.video, inputOr, cb);
    if (!image) {
      throw new Error("No input image found.");
    }
    // If video is provided, wait for video to be loaded
    await mediaReady(image, false);
    const result = await this.model.estimatePoses(image);

    // TODO: Add named keypoints to each pose object

    this.emit("pose", result);

    if (this.video) {
      // Continuous mode: schedule the next frame and recurse forever.
      return tf.nextFrame().then(() => this.predict());
    }

    if (typeof callback === "function") {
      callback(result);
    }

    return result;
  }
}
| 123 | + |
/**
 * Factory that accepts flexible arguments (video, options, callback in any
 * supported combination) and returns a new PoseDetection instance.
 * @param {...*} inputs - Any mix of a video element, an options object, and a callback.
 * @return {PoseDetection} the new pose detector.
 */
const poseDetection = (...inputs) => {
  const parsed = handleArguments(...inputs);
  // Fall back to an empty config only when options was left undefined,
  // mirroring a destructuring default.
  const config = parsed.options === undefined ? {} : parsed.options;
  return new PoseDetection(parsed.video, config, parsed.callback);
};

export default poseDetection;
0 commit comments