ammogcoder
diff --git a/‎README.md
Lines changed: 87 additions & 12 deletions b/‎README.md
Lines changed: 87 additions & 12 deletions
diff --git a/‎build/FaceDetection.d.ts
Lines changed: 20 additions & 0 deletions b/‎build/FaceDetection.d.ts
Lines changed: 20 additions & 0 deletions
diff --git a/‎build/FaceDetection.js
Lines changed: 68 additions & 0 deletions b/‎build/FaceDetection.js
Lines changed: 68 additions & 0 deletions
diff --git a/‎build/FaceDetection.js.map
Lines changed: 1 addition & 0 deletions b/‎build/FaceDetection.js.map
Lines changed: 1 addition & 0 deletions
diff --git a/‎build/FaceLandmarks.d.ts
Lines changed: 14 additions & 0 deletions b/‎build/FaceLandmarks.d.ts
Lines changed: 14 additions & 0 deletions
diff --git a/‎build/FaceLandmarks.js
Lines changed: 32 additions & 0 deletions b/‎build/FaceLandmarks.js
Lines changed: 32 additions & 0 deletions
diff --git a/‎build/FaceLandmarks.js.map
Lines changed: 1 addition & 0 deletions b/‎build/FaceLandmarks.js.map
Lines changed: 1 addition & 0 deletions
diff --git a/‎build/FullFaceDescription.d.ts
Lines changed: 4 additions & 4 deletions b/‎build/FullFaceDescription.d.ts
Lines changed: 4 additions & 4 deletions
diff --git a/‎build/FullFaceDescription.js.map
Lines changed: 1 addition & 1 deletion b/‎build/FullFaceDescription.js.map
Lines changed: 1 addition & 1 deletion
diff --git a/‎build/NetInput.d.ts
Lines changed: 3 additions & 1 deletion b/‎build/NetInput.d.ts
Lines changed: 3 additions & 1 deletion
@@ -8,14 +8,16 @@ Check out my article **[face-api.js — JavaScript API for Face Recognition
 
 * **[Running the Examples](#running-the-examples)**
 * **[About the Package](#about-the-package)**
-  * **[Face Detection](#about-face-detection)**
+  * **[Face Detection - SSD Mobilenet v1](#about-face-detection-ssd)**
+  * **[Face Detection & 5 Point Face Landmarks - MTCNN](#about-face-detection-mtcnn)**
   * **[Face Recognition](#about-face-recognition)**
-  * **[Face Landmark Detection](#about-face-landmark-detection)**
+  * **[68 Point Face Landmark Detection](#about-face-landmark-detection)**
 * **[Usage](#usage)**
   * **[Loading the Models](#usage-load-models)**
-  * **[Face Detection](#usage-face-detection)**
+  * **[Face Detection - SSD Mobilenet v1](#usage-face-detection-ssd)**
+  * **[Face Detection & 5 Point Face Landmarks - MTCNN](#usage-face-detection-mtcnn)**
   * **[Face Recognition](#usage-face-recognition)**
-  * **[Face Landmark Detection](#usage-face-landmark-detection)**
+  * **[68 Point Face Landmark Detection](#usage-face-landmark-detection)**
   * **[Full Face Detection and Recognition Pipeline](#usage-full-face-detection-and-recognition-pipeline)**
 
 ## Examples
@@ -38,8 +40,14 @@ Check out my article **[face-api.js — JavaScript API for Face Recognition
 
 ### Live Video Face Detection
 
+**SSD Mobilenet v1**
+
 ![preview_video-facedetection](https://user-images.githubusercontent.com/31125521/41238649-bbf10046-6d96-11e8-9041-1de46c6adccd.jpg)
 
+**MTCNN**
+
+![preview_mtcnn_video](https://user-images.githubusercontent.com/31125521/42725487-857adfd4-8784-11e8-8de2-4faae81e7ea2.jpg)
+
 ### Face Alignment
 
 ![preview_face_alignment](https://user-images.githubusercontent.com/31125521/41526994-1a690818-72e6-11e8-8f3c-d2cf31fe517b.jpg)
@@ -60,14 +68,22 @@ Browse to http://localhost:3000/.
 
 ## About the Package
 
-<a name="about-face-detection"></a>
+<a name="about-face-detection-ssd"></a>
 
-### Face Detection
+### Face Detection - SSD Mobilenet v1
 
-For face detection, this project implements a SSD (Single Shot Multibox Detector) based on MobileNetV1. The neural net will compute the locations of each face in an image and will return the bounding boxes together with it's probability for each face.
+For face detection, this project implements an SSD (Single Shot Multibox Detector) based on MobileNetV1. The neural net will compute the location of each face in an image and will return the bounding boxes together with the probability for each face. This face detector aims for high accuracy in detecting face bounding boxes rather than low inference time.
 
 The face detection model has been trained on the [WIDERFACE dataset](http://mmlab.ie.cuhk.edu.hk/projects/WIDERFace/) and the weights are provided by [yeephycho](https://github.com/yeephycho) in [this](https://github.com/yeephycho/tensorflow-face-detection) repo.
 
+<a name="about-face-detection-mtcnn"></a>
+
+### Face Detection & 5 Point Face Landmarks - MTCNN
+
+MTCNN (Multi-task Cascaded Convolutional Neural Networks) represents an alternative to SSD Mobilenet v1, which offers much more room for configuration and is able to achieve much lower processing times. MTCNN is a 3-stage cascaded CNN, which simultaneously returns 5 face landmark points along with the bounding boxes and scores for each face. By limiting the minimum size of faces expected in an image, MTCNN allows you to process frames from your webcam in realtime. Additionally, at 2MB, the weights file is only a third of the size of the quantized SSD Mobilenet v1 model (~6MB).
+
+MTCNN has been presented in the paper [Joint Face Detection and Alignment using Multi-task Cascaded Convolutional Networks](https://kpzhang93.github.io/MTCNN_face_detection_alignment/paper/spl.pdf) by Zhang et al. and the model weights are provided in the official [repo](https://github.com/kpzhang93/MTCNN_face_detection_alignment) of the MTCNN implementation.
+
 <a name="about-face-recognition"></a>
 
 ### Face Recognition
@@ -78,7 +94,7 @@ The neural net is equivalent to the **FaceRecognizerNet** used in [face-recognit
 
 <a name="about-face-landmark-detection"></a>
 
-### Face Landmark Detection
+### 68 Point Face Landmark Detection
 
 This package implements a CNN to detect the 68 point face landmarks for a given face image.
 
@@ -113,6 +129,7 @@ await faceapi.loadFaceDetectionModel('/models')
 // accordingly for the other models:
 // await faceapi.loadFaceLandmarkModel('/models')
 // await faceapi.loadFaceRecognitionModel('/models')
+// await faceapi.loadMtcnnModel('/models')
 ```
 
 As an alternative, you can also create instances of the neural nets:
@@ -122,12 +139,14 @@ const net = new faceapi.FaceDetectionNet()
 // accordingly for the other models:
 // const net = new faceapi.FaceLandmarkNet()
 // const net = new faceapi.FaceRecognitionNet()
+// const net = new faceapi.Mtcnn()
 
 await net.load('/models/face_detection_model-weights_manifest.json')
 // await net.load('/models/face_landmark_68_model-weights_manifest.json')
 // await net.load('/models/face_recognition_model-weights_manifest.json')
+// await net.load('/models/mtcnn_model-weights_manifest.json')
 
-// or simply
+// or simply load all models
 await net.load('/models')
 ```
 
@@ -145,9 +164,9 @@ const weights = new Float32Array(res.data)
 net.load(weights)
 ```
 
-<a name="usage-face-detection"></a>
+<a name="usage-face-detection-ssd"></a>
 
-### Face Detection
+### Face Detection - SSD Mobilenet v1
 
 Detect faces and get the bounding boxes and scores:
 
@@ -178,6 +197,62 @@ You can also obtain the tensors of the unfiltered bounding boxes and scores for
 const { boxes, scores } = await net.forward('myImg')
 ```
 
+<a name="usage-face-detection-mtcnn"></a>
+
+### Face Detection & 5 Point Face Landmarks - MTCNN
+
+Detect faces and get the bounding boxes, scores and 5 point face landmarks:
+
+``` javascript
+// default parameters shown:
+const forwardParams = {
+  // number of scaled versions of the input image passed through the CNN
+  // of the first stage, lower numbers will result in lower inference time,
+  // but will also be less accurate
+  maxNumScales: 10,
+  // scale factor used to calculate the scale steps of the image
+  // pyramid used in stage 1
+  scaleFactor: 0.709,
+  // the score threshold values used to filter the bounding
+  // boxes of stage 1, 2 and 3
+  scoreThresholds: [0.6, 0.7, 0.7],
+  // minimum face size to expect, the higher the faster processing will be,
+  // but smaller faces won't be detected
+  minFaceSize: 20
+}
+
+const results = await faceapi.mtcnn(document.getElementById('myImg'), forwardParams)
+```
+
+Alternatively you can also specify the scale steps manually:
+
+``` javascript
+const forwardParams = {
+  scaleSteps: [0.4, 0.2, 0.1, 0.05]
+}
+
+const results = await faceapi.mtcnn(document.getElementById('myImg'), forwardParams)
+```
+
+Finally you can draw the returned bounding boxes and 5 Point Face Landmarks into a canvas:
+
+``` javascript
+const minConfidence = 0.9
+
+if (results) {
+  results.forEach(({ faceDetection, faceLandmarks }) => {
+
+    // ignore results with low confidence score
+    if (faceDetection.score < minConfidence) {
+      return
+    }
+
+    faceapi.drawDetection('overlay', faceDetection)
+    faceapi.drawLandmarks('overlay', faceLandmarks)
+  })
+}
+```
+
 <a name="usage-face-recognition"></a>
 
 ### Face Recognition
@@ -265,7 +340,7 @@ const fullFaceDescriptions = await faceapi.allFaces(input, minConfidence)
 const fullFaceDescription0 = fullFaceDescriptions[0]
 console.log(fullFaceDescription0.detection) // bounding box & score
 console.log(fullFaceDescription0.landmarks) // 68 point face landmarks
-console.log(fullFaceDescription0.descriptor) // face descriptors
+console.log(fullFaceDescription0.descriptor) // face descriptor
 
 ```
 
 
@@ -0,0 +1,20 @@
+import { Rect } from './Rect';
+import { Dimensions } from './types';
+export declare class FaceDetection {
+    private _score;
+    private _box;
+    private _imageWidth;
+    private _imageHeight;
+    constructor(score: number, relativeBox: Rect, imageDims: Dimensions);
+    readonly score: number;
+    readonly box: Rect;
+    readonly imageWidth: number;
+    readonly imageHeight: number;
+    readonly relativeBox: Rect;
+    getScore(): number;
+    getBox(): Rect;
+    getImageWidth(): number;
+    getImageHeight(): number;
+    getRelativeBox(): Rect;
+    forSize(width: number, height: number): FaceDetection;
+}
@@ -0,0 +1,14 @@
+import { Point } from './Point';
+import { Dimensions } from './types';
+export declare class FaceLandmarks {
+    protected _imageWidth: number;
+    protected _imageHeight: number;
+    protected _shift: Point;
+    protected _faceLandmarks: Point[];
+    constructor(relativeFaceLandmarkPositions: Point[], imageDims: Dimensions, shift?: Point);
+    getShift(): Point;
+    getImageWidth(): number;
+    getImageHeight(): number;
+    getPositions(): Point[];
+    getRelativePositions(): Point[];
+}
@@ -1,12 +1,12 @@
-import { FaceDetection } from './faceDetectionNet/FaceDetection';
-import { FaceLandmarks } from './faceLandmarkNet/FaceLandmarks';
+import { FaceDetection } from './FaceDetection';
+import { FaceLandmarks68 } from './faceLandmarkNet/FaceLandmarks68';
 export declare class FullFaceDescription {
     private _detection;
     private _landmarks;
     private _descriptor;
-    constructor(_detection: FaceDetection, _landmarks: FaceLandmarks, _descriptor: Float32Array);
+    constructor(_detection: FaceDetection, _landmarks: FaceLandmarks68, _descriptor: Float32Array);
     readonly detection: FaceDetection;
-    readonly landmarks: FaceLandmarks;
+    readonly landmarks: FaceLandmarks68;
     readonly descriptor: Float32Array;
     forSize(width: number, height: number): FullFaceDescription;
 }
@@ -3,12 +3,14 @@ import { Point } from './Point';
 import { TResolvedNetInput } from './types';
 export declare class NetInput {
     private _inputs;
+    private _canvases;
     private _isManaged;
     private _isBatchInput;
     private _inputDimensions;
     private _paddings;
-    constructor(inputs: tf.Tensor4D | Array<TResolvedNetInput>, isBatchInput?: boolean);
+    constructor(inputs: tf.Tensor4D | Array<TResolvedNetInput>, isBatchInput?: boolean, keepCanvases?: boolean);
     readonly inputs: tf.Tensor3D[];
+    readonly canvases: HTMLCanvasElement[];
     readonly isManaged: boolean;
     readonly isBatchInput: boolean;
     readonly batchSize: number;