ammogcoder
diff --git a/‎README.md
Lines changed: 8 additions & 13 deletions b/‎README.md
Lines changed: 8 additions & 13 deletions
diff --git a/‎examples/public/styles.css
Lines changed: 6 additions & 0 deletions b/‎examples/public/styles.css
Lines changed: 6 additions & 0 deletions
diff --git a/‎src/faceLandmarkNet/FaceLandmark68Net.ts
Lines changed: 42 additions & 27 deletions b/‎src/faceLandmarkNet/FaceLandmark68Net.ts
Lines changed: 42 additions & 27 deletions
diff --git a/‎src/faceLandmarkNet/FaceLandmark68TinyNet.ts
Lines changed: 71 additions & 0 deletions b/‎src/faceLandmarkNet/FaceLandmark68TinyNet.ts
Lines changed: 71 additions & 0 deletions
diff --git a/‎src/faceLandmarkNet/depthwiseSeparableConv.ts
Lines changed: 14 additions & 0 deletions b/‎src/faceLandmarkNet/depthwiseSeparableConv.ts
Lines changed: 14 additions & 0 deletions
diff --git a/‎src/faceLandmarkNet/extractParams.ts
Lines changed: 11 additions & 25 deletions b/‎src/faceLandmarkNet/extractParams.ts
Lines changed: 11 additions & 25 deletions
diff --git a/‎src/faceLandmarkNet/extractParamsTiny.ts
Lines changed: 33 additions & 0 deletions b/‎src/faceLandmarkNet/extractParamsTiny.ts
Lines changed: 33 additions & 0 deletions
@@ -43,7 +43,8 @@ Table of Contents:
 
 ### Face Landmarks
 
-![preview_face_landmarks_boxes](https://user-images.githubusercontent.com/31125521/41507933-65f9b642-723c-11e8-8f4e-aab13303e7ff.jpg)
+![face_landmarks_boxes_1](https://user-images.githubusercontent.com/31125521/46063403-fff9f480-c16c-11e8-900f-e4b7a3828d1d.jpg)
+![face_landmarks_boxes_2](https://user-images.githubusercontent.com/31125521/46063404-00928b00-c16d-11e8-8f29-e9c50afd2bc8.jpg)
 
 ![preview_face_landmarks](https://user-images.githubusercontent.com/31125521/41507950-e121b05e-723c-11e8-89f2-d8f9348a8e86.png)
 
@@ -57,10 +58,6 @@ Table of Contents:
 
 ![mtcnn-preview](https://user-images.githubusercontent.com/31125521/42756818-0a41edaa-88fe-11e8-9033-8cd141b0fa09.gif)
 
-### Face Alignment
-
-![preview_face_alignment](https://user-images.githubusercontent.com/31125521/41526994-1a690818-72e6-11e8-8f3c-d2cf31fe517b.jpg)
-
 <a name="running-the-examples"></a>
 
 ## Running the Examples
@@ -89,7 +86,7 @@ The face detection model has been trained on the [WIDERFACE dataset](http://mmla
 
 ### Face Detection - Tiny Yolo v2
 
-The Tiny Yolo v2 implementation is a very performant face detector, which can easily adapt to different input image sizes, thus can be used as an alternative to SSD Mobilenet v1 to trade off accuracy for performance (inference time). In general the models ability to locate smaller face bounding boxes is not as accurate as SSD Mobilenet v1. 
+The Tiny Yolo v2 implementation is a very performant face detector, which can easily adapt to different input image sizes and can thus be used as an alternative to SSD Mobilenet v1 to trade off accuracy for performance (inference time). In general, the model's ability to locate smaller face bounding boxes is not as good as that of SSD Mobilenet v1.
 
 The face detector has been trained on a custom dataset of ~10K images labeled with bounding boxes and uses depthwise separable convolutions instead of regular convolutions, which ensures very fast inference and allows to have a quantized model size of only 1.7MB making the model extremely mobile and web friendly. Thus, the Tiny Yolo v2 face detector should be your GO-TO face detector on mobile devices.
 
@@ -113,9 +110,7 @@ The neural net is equivalent to the **FaceRecognizerNet** used in [face-recognit
 
 ### 68 Point Face Landmark Detection
 
-This package implements a CNN to detect the 68 point face landmarks for a given face image.
-
-The model has been trained on a variety of public datasets and the model weights are provided by [yinguobing](https://github.com/yinguobing) in [this](https://github.com/yinguobing/head-pose-estimation) repo.
+This package implements a very lightweight and fast, yet accurate, 68-point face landmark detector. The default model has a size of only 350 kB and the tiny model only 80 kB. Both models employ depthwise separable convolutions as well as densely connected blocks. The models have been trained on a dataset of ~35k face images labeled with 68 face landmark points.
 
 <a name="usage"></a>
 
@@ -145,6 +140,7 @@ Assuming the models reside in **public/models**:
 await faceapi.loadFaceDetectionModel('/models')
 // accordingly for the other models:
 // await faceapi.loadFaceLandmarkModel('/models')
+// await faceapi.loadFaceLandmarkTinyModel('/models')
 // await faceapi.loadFaceRecognitionModel('/models')
 // await faceapi.loadMtcnnModel('/models')
 // await faceapi.loadTinyYolov2Model('/models')
@@ -155,19 +151,18 @@ As an alternative, you can also create instance of the neural nets:
 ``` javascript
 const net = new faceapi.FaceDetectionNet()
 // accordingly for the other models:
-// const net = new faceapi.FaceLandmarkNet()
+// const net = new faceapi.FaceLandmark68Net()
+// const net = new faceapi.FaceLandmark68TinyNet()
 // const net = new faceapi.FaceRecognitionNet()
 // const net = new faceapi.Mtcnn()
 // const net = new faceapi.TinyYolov2()
 
 await net.load('/models/face_detection_model-weights_manifest.json')
 // await net.load('/models/face_landmark_68_model-weights_manifest.json')
+// await net.load('/models/face_landmark_68_tiny_model-weights_manifest.json')
 // await net.load('/models/face_recognition_model-weights_manifest.json')
 // await net.load('/models/mtcnn_model-weights_manifest.json')
 // await net.load('/models/tiny_yolov2_separable_conv_model-weights_manifest.json')
-
-// or simply load all models
-await net.load('/models')
 ```
 
 Using instances, you can also load the weights as a Float32Array (in case you want to use the uncompressed models):
 
@@ -67,6 +67,12 @@
   left: 0;
 }
 
+.overlay { /* absolutely positioned element placed at offset 0/0 from the top-left of its containing block */
+  position: absolute;
+  top: 0;
+  left: 0;
+}
+
 #facesContainer canvas {
   margin: 10px;
 }
@@ -1,60 +1,75 @@
 import * as tf from '@tensorflow/tfjs-core';
-import { NetInput } from 'tfjs-image-recognition-base';
-import { convLayer, ConvParams } from 'tfjs-tiny-yolov2';
+import { NetInput, normalize } from 'tfjs-image-recognition-base';
+import { ConvParams } from 'tfjs-tiny-yolov2';
+import { SeparableConvParams } from 'tfjs-tiny-yolov2/build/tinyYolov2/types';
 
+import { depthwiseSeparableConv } from './depthwiseSeparableConv';
 import { extractParams } from './extractParams';
 import { FaceLandmark68NetBase } from './FaceLandmark68NetBase';
 import { fullyConnectedLayer } from './fullyConnectedLayer';
 import { loadQuantizedParams } from './loadQuantizedParams';
-import { NetParams } from './types';
+import { DenseBlock4Params, NetParams } from './types';
 
-function conv(x: tf.Tensor4D, params: ConvParams): tf.Tensor4D {
-  return convLayer(x, params, 'valid', true)
-}
+function denseBlock( // stride-2 entry conv, then three stride-1 separable convs whose inputs are the relu of the sum of all earlier outputs
+  x: tf.Tensor4D,
+  denseBlockParams: DenseBlock4Params,
+  isFirstLayer: boolean = false // when true, conv0 is applied as a regular tf.conv2d plus bias instead of a separable conv
+): tf.Tensor4D {
+  return tf.tidy(() => {
+    const out1 = tf.relu( // both branches use stride [2, 2]; relu is applied to whichever branch ran
+      isFirstLayer
+        ? tf.add(
+          tf.conv2d(x, (denseBlockParams.conv0 as ConvParams).filters, [2, 2], 'same'),
+          denseBlockParams.conv0.bias
+        )
+        : depthwiseSeparableConv(x, denseBlockParams.conv0 as SeparableConvParams, [2, 2])
+    ) as tf.Tensor4D
+    const out2 = depthwiseSeparableConv(out1, denseBlockParams.conv1, [1, 1]) // no relu on out2 itself; relu is applied to the running sums below
+
+    const in3 = tf.relu(tf.add(out1, out2)) as tf.Tensor4D // in3 = relu(out1 + out2)
+    const out3 = depthwiseSeparableConv(in3, denseBlockParams.conv2, [1, 1])
+
+    const in4 = tf.relu(tf.add(out1, tf.add(out2, out3))) as tf.Tensor4D // in4 = relu(out1 + out2 + out3)
+    const out4 = depthwiseSeparableConv(in4, denseBlockParams.conv3, [1, 1])
 
-function maxPool(x: tf.Tensor4D, strides: [number, number] = [2, 2]): tf.Tensor4D {
-  return tf.maxPool(x, [2, 2], strides, 'valid')
+    return tf.relu(tf.add(out1, tf.add(out2, tf.add(out3, out4)))) as tf.Tensor4D // block output = relu(out1 + out2 + out3 + out4)
+  })
 }
 
 export class FaceLandmark68Net extends FaceLandmark68NetBase<NetParams> {
 
   constructor() {
-    super('FaceLandmark68Net')
+    super('FaceLandmark68LargeNet') // NOTE(review): this name string differs from the class name FaceLandmark68Net — confirm the mismatch is intended
   }
 
   public runNet(input: NetInput): tf.Tensor2D {
 
     const { params } = this
 
     if (!params) {
-      throw new Error('FaceLandmark68Net - load model before inference')
+      throw new Error('FaceLandmark68LargeNet - load model before inference') // thrown when params is falsy; prefix matches the string passed to super()
     }
 
     return tf.tidy(() => {
-      const batchTensor = input.toBatchTensor(128, true).toFloat() as tf.Tensor4D
-
-      let out = conv(batchTensor, params.conv0)
-      out = maxPool(out)
-      out = conv(out, params.conv1)
-      out = conv(out, params.conv2)
-      out = maxPool(out)
-      out = conv(out, params.conv3)
-      out = conv(out, params.conv4)
-      out = maxPool(out)
-      out = conv(out, params.conv5)
-      out = conv(out, params.conv6)
-      out = maxPool(out, [1, 1])
-      out = conv(out, params.conv7)
-      const fc0 = tf.relu(fullyConnectedLayer(out.as2D(out.shape[0], -1), params.fc0))
-
-      return fullyConnectedLayer(fc0, params.fc1)
+      const batchTensor = input.toBatchTensor(112, true) // requests a batch tensor with size argument 112; NOTE(review): meaning of the `true` flag is defined in tfjs-image-recognition-base — confirm
+      const meanRgb = [122.782, 117.001, 104.298] // NOTE(review): presumably per-channel RGB means on a 0-255 scale — confirm against the training setup
+      const normalized = normalize(batchTensor, meanRgb).div(tf.scalar(255)) as tf.Tensor4D // normalize() with meanRgb, then divide by 255
+
+      let out = denseBlock(normalized, params.dense0, true) // only dense0 runs with isFirstLayer = true
+      out = denseBlock(out, params.dense1)
+      out = denseBlock(out, params.dense2)
+      out = denseBlock(out, params.dense3)
+      out = tf.avgPool(out, [7, 7], [2, 2], 'valid') // 7x7 average pool, stride [2, 2], 'valid' padding
+
+      return fullyConnectedLayer(out.as2D(out.shape[0], -1), params.fc) // reshape to 2D keeping the first dimension, then apply the single fc layer
     })
   }
 
   protected loadQuantizedParams(uri: string | undefined) {
     return loadQuantizedParams(uri)
   }
 
+
   protected extractParams(weights: Float32Array) {
     return extractParams(weights)
   }
 
@@ -0,0 +1,71 @@
+import * as tf from '@tensorflow/tfjs-core';
+import { NetInput, normalize } from 'tfjs-image-recognition-base';
+import { ConvParams } from 'tfjs-tiny-yolov2';
+import { SeparableConvParams } from 'tfjs-tiny-yolov2/build/tinyYolov2/types';
+
+import { depthwiseSeparableConv } from './depthwiseSeparableConv';
+import { extractParamsTiny } from './extractParamsTiny';
+import { FaceLandmark68NetBase } from './FaceLandmark68NetBase';
+import { fullyConnectedLayer } from './fullyConnectedLayer';
+import { loadQuantizedParamsTiny } from './loadQuantizedParamsTiny';
+import { DenseBlock3Params, TinyNetParams } from './types';
+
+function denseBlock( // stride-2 entry conv, then two stride-1 separable convs whose inputs are the relu of the sum of all earlier outputs
+  x: tf.Tensor4D,
+  denseBlockParams: DenseBlock3Params,
+  isFirstLayer: boolean = false // when true, conv0 is applied as a regular tf.conv2d plus bias instead of a separable conv
+): tf.Tensor4D {
+  return tf.tidy(() => {
+    const out1 = tf.relu( // both branches use stride [2, 2]; relu is applied to whichever branch ran
+      isFirstLayer
+        ? tf.add(
+          tf.conv2d(x, (denseBlockParams.conv0 as ConvParams).filters, [2, 2], 'same'),
+          denseBlockParams.conv0.bias
+        )
+        : depthwiseSeparableConv(x, denseBlockParams.conv0 as SeparableConvParams, [2, 2])
+    ) as tf.Tensor4D
+    const out2 = depthwiseSeparableConv(out1, denseBlockParams.conv1, [1, 1]) // no relu on out2 itself; relu is applied to the running sums below
+
+    const in3 = tf.relu(tf.add(out1, out2)) as tf.Tensor4D // in3 = relu(out1 + out2)
+    const out3 = depthwiseSeparableConv(in3, denseBlockParams.conv2, [1, 1])
+
+    return tf.relu(tf.add(out1, tf.add(out2, out3))) as tf.Tensor4D // block output = relu(out1 + out2 + out3)
+  })
+}
+
+export class FaceLandmark68TinyNet extends FaceLandmark68NetBase<TinyNetParams> { // landmark net built from three dense blocks plus one fc layer; uses the *Tiny loader and extractor
+
+  constructor() {
+    super('FaceLandmark68TinyNet') // same string is used as the prefix of the error thrown in runNet
+  }
+
+  public runNet(input: NetInput): tf.Tensor2D { // forward pass; throws if no params have been loaded
+
+    const { params } = this
+
+    if (!params) {
+      throw new Error('FaceLandmark68TinyNet - load model before inference')
+    }
+
+    return tf.tidy(() => {
+      const batchTensor = input.toBatchTensor(112, true) // requests a batch tensor with size argument 112; NOTE(review): meaning of the `true` flag is defined in tfjs-image-recognition-base — confirm
+      const meanRgb = [122.782, 117.001, 104.298] // NOTE(review): presumably per-channel RGB means on a 0-255 scale — confirm against the training setup
+      const normalized = normalize(batchTensor, meanRgb).div(tf.scalar(255)) as tf.Tensor4D // normalize() with meanRgb, then divide by 255
+
+      let out = denseBlock(normalized, params.dense0, true) // only dense0 runs with isFirstLayer = true
+      out = denseBlock(out, params.dense1)
+      out = denseBlock(out, params.dense2)
+      out = tf.avgPool(out, [14, 14], [2, 2], 'valid') // 14x14 average pool, stride [2, 2], 'valid' padding
+
+      return fullyConnectedLayer(out.as2D(out.shape[0], -1), params.fc) // reshape to 2D keeping the first dimension, then apply the single fc layer
+    })
+  }
+
+  protected loadQuantizedParams(uri: string | undefined) { // delegates to loadQuantizedParamsTiny
+    return loadQuantizedParamsTiny(uri)
+  }
+
+  protected extractParams(weights: Float32Array) { // delegates to extractParamsTiny
+    return extractParamsTiny(weights)
+  }
+}
@@ -0,0 +1,14 @@
+import * as tf from '@tensorflow/tfjs-core';
+import { SeparableConvParams } from 'tfjs-tiny-yolov2/build/tinyYolov2/types';
+
+export function depthwiseSeparableConv( // tf.separableConv2d with 'same' padding followed by a bias add; no activation is applied here
+  x: tf.Tensor4D,
+  params: SeparableConvParams, // supplies depthwise_filter, pointwise_filter and bias
+  stride: [number, number] // forwarded unchanged as the strides argument of tf.separableConv2d
+): tf.Tensor4D {
+  return tf.tidy(() => {
+    let out = tf.separableConv2d(x, params.depthwise_filter, params.pointwise_filter, stride, 'same')
+    out = tf.add(out, params.bias) // bias is added after the separable convolution
+    return out
+  })
+}
@@ -1,6 +1,6 @@
 import { extractWeightsFactory, ParamMapping } from 'tfjs-image-recognition-base';
-import { extractConvParamsFactory, extractFCParamsFactory } from 'tfjs-tiny-yolov2';
 
+import { extractorsFactory } from './extractorsFactory';
 import { NetParams } from './types';
 
 export function extractParams(weights: Float32Array): { params: NetParams, paramMappings: ParamMapping[] } {
@@ -12,37 +12,23 @@ export function extractParams(weights: Float32Array): { params: NetParams, param
     getRemainingWeights
   } = extractWeightsFactory(weights)
 
-  const extractConvParams = extractConvParamsFactory(extractWeights, paramMappings)
-  const extractFCParams = extractFCParamsFactory(extractWeights, paramMappings)
+  const {
+    extractDenseBlock4Params,
+    extractFCParams
+  } = extractorsFactory(extractWeights, paramMappings)
 
-  const conv0 = extractConvParams(3, 32, 3, 'conv0')
-  const conv1 = extractConvParams(32, 64, 3, 'conv1')
-  const conv2 = extractConvParams(64, 64, 3, 'conv2')
-  const conv3 = extractConvParams(64, 64, 3, 'conv3')
-  const conv4 = extractConvParams(64, 64, 3, 'conv4')
-  const conv5 = extractConvParams(64, 128, 3, 'conv5')
-  const conv6 = extractConvParams(128, 128, 3, 'conv6')
-  const conv7 = extractConvParams(128, 256, 3, 'conv7')
-  const fc0 = extractFCParams(6400, 1024, 'fc0')
-  const fc1 = extractFCParams(1024, 136, 'fc1')
+  const dense0 = extractDenseBlock4Params(3, 32, 'dense0', true)
+  const dense1 = extractDenseBlock4Params(32, 64, 'dense1')
+  const dense2 = extractDenseBlock4Params(64, 128, 'dense2')
+  const dense3 = extractDenseBlock4Params(128, 256, 'dense3')
+  const fc = extractFCParams(256, 136, 'fc')
 
   if (getRemainingWeights().length !== 0) {
     throw new Error(`weights remaing after extract: ${getRemainingWeights().length}`)
   }
 
   return {
     paramMappings,
-    params: {
-      conv0,
-      conv1,
-      conv2,
-      conv3,
-      conv4,
-      conv5,
-      conv6,
-      conv7,
-      fc0,
-      fc1
-    }
+    params: { dense0, dense1, dense2, dense3, fc }
   }
 }
@@ -0,0 +1,33 @@
+import { extractWeightsFactory, ParamMapping } from 'tfjs-image-recognition-base';
+
+import { extractorsFactory } from './extractorsFactory';
+import { TinyNetParams } from './types';
+
+export function extractParamsTiny(weights: Float32Array): { params: TinyNetParams, paramMappings: ParamMapping[] } { // builds dense0..dense2 + fc params from a flat weight array; throws if weights are left over
+
+  const paramMappings: ParamMapping[] = [] // handed to extractorsFactory and returned; NOTE(review): presumably filled in by the extractors — confirm
+
+  const {
+    extractWeights,
+    getRemainingWeights
+  } = extractWeightsFactory(weights)
+
+  const {
+    extractDenseBlock3Params,
+    extractFCParams
+  } = extractorsFactory(extractWeights, paramMappings)
+
+  const dense0 = extractDenseBlock3Params(3, 32, 'dense0', true) // NOTE(review): trailing `true` presumably marks the first block (regular conv0) — confirm in extractorsFactory
+  const dense1 = extractDenseBlock3Params(32, 64, 'dense1')
+  const dense2 = extractDenseBlock3Params(64, 128, 'dense2')
+  const fc = extractFCParams(128, 136, 'fc') // NOTE(review): 136 is presumably 2 x 68 landmark coordinates — confirm
+
+  if (getRemainingWeights().length !== 0) { // every weight must have been consumed by the extractors above
+    throw new Error(`weights remaing after extract: ${getRemainingWeights().length}`) // NOTE(review): "remaing" is a typo for "remaining"; left unchanged because it is a runtime string
+  }
+
+  return {
+    paramMappings,
+    params: { dense0, dense1, dense2, fc }
+  }
+}
Original file line number	Diff line number	Diff line change
`@@ -67,6 +67,12 @@`
`67`	`67`	`left: 0;`
`68`	`68`	`}`
`69`	`69`
	`70`	`+.overlay {`
	`71`	`+ position: absolute;`
	`72`	`+ top: 0;`
	`73`	`+ left: 0;`
	`74`	`+}`
	`75`	`+`
`70`	`76`	`#facesContainer canvas {`
`71`	`77`	`margin: 10px;`
`72`	`78`	`}`