Skip to content

Commit 1c56acb

Browse files
Merge pull request justadudewhohacks#93 from justadudewhohacks/fixes-and-performance-improvements
fixed landmark postprocessing + resize input canvases instead of tensors to net input size, which is much more performant
2 parents f512f8b + 8b1d577 commit 1c56acb

39 files changed

+723
-562
lines changed

examples/views/detectAndDrawFaces.html

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -84,12 +84,9 @@
8484
const detections = await faceapi.locateFaces(input, minConfidence)
8585
faceapi.drawDetection('overlay', detections.map(det => det.forSize(width, height)))
8686

87-
const faceImages = await faceapi.extractFaces(input.inputs[0], detections)
87+
const faceImages = await faceapi.extractFaces(inputImgEl, detections)
8888
$('#facesContainer').empty()
8989
faceImages.forEach(canvas => $('#facesContainer').append(canvas))
90-
91-
// free memory for input tensors
92-
input.dispose()
9390
}
9491

9592
async function onSelectionChanged(uri) {

examples/views/detectAndDrawLandmarks.html

Lines changed: 2 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -89,11 +89,8 @@
8989
const input = await faceapi.toNetInput(inputImgEl)
9090
const locations = await faceapi.locateFaces(input, minConfidence)
9191

92-
const faceTensors = (await faceapi.extractFaceTensors(input, locations))
93-
let landmarksByFace = await Promise.all(faceTensors.map(t => faceapi.detectLandmarks(t)))
94-
95-
// free memory for face image tensors after we computed their descriptors
96-
faceTensors.forEach(t => t.dispose())
92+
const faces = await faceapi.extractFaces(input, locations)
93+
let landmarksByFace = await Promise.all(faces.map(face => faceapi.detectLandmarks(face)))
9794

9895
// shift and scale the face landmarks to the face image position in the canvas
9996
landmarksByFace = landmarksByFace.map((landmarks, i) => {
@@ -103,9 +100,6 @@
103100

104101
faceapi.drawLandmarks(canvas, landmarksByFace, { lineWidth: drawLines ? 2 : 4, drawLines, color: 'red' })
105102
faceapi.drawDetection('overlay', locations.map(det => det.forSize(width, height)))
106-
107-
// free memory for input tensors
108-
input.dispose()
109103
}
110104

111105
async function run() {

examples/views/faceAlignment.html

Lines changed: 5 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -86,26 +86,17 @@
8686
}
8787

8888
async function locateAndAlignFacesWithMtcnn(inputImgEl) {
89-
const input = await faceapi.toNetInput(
90-
inputImgEl,
91-
// dispose input manually
92-
false,
93-
// keep canvases (required for mtcnn)
94-
true
95-
)
89+
const input = await faceapi.toNetInput(inputImgEl)
9690

9791
const results = await faceapi.mtcnn(input, { minFaceSize: 100 })
9892

99-
const unalignedFaceImages = await faceapi.extractFaces(input.inputs[0], results.map(res => res.faceDetection))
93+
const unalignedFaceImages = await faceapi.extractFaces(input.getInput(0), results.map(res => res.faceDetection))
10094

10195
const alignedFaceBoxes = results
10296
.filter(res => res.faceDetection.score > minConfidence)
10397
.map(res => res.faceLandmarks.align())
10498

105-
const alignedFaceImages = await faceapi.extractFaces(input.inputs[0], alignedFaceBoxes)
106-
107-
// free memory for input tensors
108-
input.dispose()
99+
const alignedFaceImages = await faceapi.extractFaces(input.getInput(0), alignedFaceBoxes)
109100

110101
return {
111102
unalignedFaceImages,
@@ -118,7 +109,7 @@
118109

119110
const locations = await faceapi.locateFaces(input, minConfidence)
120111

121-
const unalignedFaceImages = await faceapi.extractFaces(input.inputs[0], locations)
112+
const unalignedFaceImages = await faceapi.extractFaces(input.getInput(0), locations)
122113

123114
// detect landmarks and get the aligned face image bounding boxes
124115
const alignedFaceBoxes = await Promise.all(unalignedFaceImages.map(
@@ -127,10 +118,7 @@
127118
return faceLandmarks.align(locations[i])
128119
}
129120
))
130-
const alignedFaceImages = await faceapi.extractFaces(input.inputs[0], alignedFaceBoxes)
131-
132-
// free memory for input tensors
133-
input.dispose()
121+
const alignedFaceImages = await faceapi.extractFaces(input.getInput(0), alignedFaceBoxes)
134122

135123
return {
136124
unalignedFaceImages,

package-lock.json

Lines changed: 8 additions & 7 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

package.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,8 +22,8 @@
2222
"license": "MIT",
2323
"dependencies": {
2424
"@tensorflow/tfjs-core": "^0.12.14",
25-
"tfjs-image-recognition-base": "^0.0.0",
26-
"tfjs-tiny-yolov2": "0.0.2",
25+
"tfjs-image-recognition-base": "0.1.0",
26+
"tfjs-tiny-yolov2": "0.1.0",
2727
"tslib": "^1.9.3"
2828
},
2929
"devDependencies": {

src/allFacesFactory.ts

Lines changed: 13 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -5,9 +5,9 @@ import { TinyYolov2 } from '.';
55
import { FaceDetection } from './classes/FaceDetection';
66
import { FaceLandmarks68 } from './classes/FaceLandmarks68';
77
import { FullFaceDescription } from './classes/FullFaceDescription';
8-
import { extractFaceTensors } from './dom';
8+
import { extractFaces } from './dom';
99
import { FaceDetectionNet } from './faceDetectionNet/FaceDetectionNet';
10-
import { FaceLandmarkNet } from './faceLandmarkNet/FaceLandmarkNet';
10+
import { FaceLandmark68Net } from './faceLandmarkNet/FaceLandmark68Net';
1111
import { FaceRecognitionNet } from './faceRecognitionNet/FaceRecognitionNet';
1212
import { Mtcnn } from './mtcnn/Mtcnn';
1313
import { MtcnnForwardParams } from './mtcnn/types';
@@ -16,23 +16,21 @@ function computeDescriptorsFactory(
1616
recognitionNet: FaceRecognitionNet
1717
) {
1818
return async function(input: TNetInput, alignedFaceBoxes: Rect[], useBatchProcessing: boolean) {
19-
const alignedFaceTensors = await extractFaceTensors(input, alignedFaceBoxes)
19+
const alignedFaceCanvases = await extractFaces(input, alignedFaceBoxes)
2020

2121
const descriptors = useBatchProcessing
22-
? await recognitionNet.computeFaceDescriptor(alignedFaceTensors) as Float32Array[]
23-
: await Promise.all(alignedFaceTensors.map(
24-
faceTensor => recognitionNet.computeFaceDescriptor(faceTensor)
22+
? await recognitionNet.computeFaceDescriptor(alignedFaceCanvases) as Float32Array[]
23+
: await Promise.all(alignedFaceCanvases.map(
24+
canvas => recognitionNet.computeFaceDescriptor(canvas)
2525
)) as Float32Array[]
2626

27-
alignedFaceTensors.forEach(t => t.dispose())
28-
2927
return descriptors
3028
}
3129
}
3230

3331
function allFacesFactory(
3432
detectFaces: (input: TNetInput) => Promise<FaceDetection[]>,
35-
landmarkNet: FaceLandmarkNet,
33+
landmarkNet: FaceLandmark68Net,
3634
recognitionNet: FaceRecognitionNet
3735
) {
3836
const computeDescriptors = computeDescriptorsFactory(recognitionNet)
@@ -43,15 +41,14 @@ function allFacesFactory(
4341
): Promise<FullFaceDescription[]> {
4442

4543
const detections = await detectFaces(input)
46-
const faceTensors = await extractFaceTensors(input, detections)
44+
const faceCanvases = await extractFaces(input, detections)
4745

4846
const faceLandmarksByFace = useBatchProcessing
49-
? await landmarkNet.detectLandmarks(faceTensors) as FaceLandmarks68[]
50-
: await Promise.all(faceTensors.map(
51-
faceTensor => landmarkNet.detectLandmarks(faceTensor)
47+
? await landmarkNet.detectLandmarks(faceCanvases) as FaceLandmarks68[]
48+
: await Promise.all(faceCanvases.map(
49+
canvas => landmarkNet.detectLandmarks(canvas)
5250
)) as FaceLandmarks68[]
5351

54-
faceTensors.forEach(t => t.dispose())
5552

5653
const alignedFaceBoxes = faceLandmarksByFace.map(
5754
(landmarks, i) => landmarks.align(detections[i].getBox())
@@ -74,7 +71,7 @@ function allFacesFactory(
7471

7572
export function allFacesSsdMobilenetv1Factory(
7673
ssdMobilenetv1: FaceDetectionNet,
77-
landmarkNet: FaceLandmarkNet,
74+
landmarkNet: FaceLandmark68Net,
7875
recognitionNet: FaceRecognitionNet
7976
) {
8077
return async function(
@@ -90,7 +87,7 @@ export function allFacesSsdMobilenetv1Factory(
9087

9188
export function allFacesTinyYolov2Factory(
9289
tinyYolov2: TinyYolov2,
93-
landmarkNet: FaceLandmarkNet,
90+
landmarkNet: FaceLandmark68Net,
9491
recognitionNet: FaceRecognitionNet
9592
) {
9693
return async function(

src/dom/extractFaceTensors.ts

Lines changed: 7 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
import * as tf from '@tensorflow/tfjs-core';
2-
import { Rect, TNetInput, toNetInput } from 'tfjs-image-recognition-base';
2+
import { isTensor4D, Rect } from 'tfjs-image-recognition-base';
33

44
import { FaceDetection } from '../classes/FaceDetection';
55

@@ -9,28 +9,21 @@ import { FaceDetection } from '../classes/FaceDetection';
99
* Using this method is faster than extracting a canvas for each face and
1010
* converting them to tensors individually.
1111
*
12-
* @param input The image that face detection has been performed on.
12+
* @param imageTensor The image tensor that face detection has been performed on.
1313
* @param detections The face detection results or face bounding boxes for that image.
1414
* @returns Tensors of the corresponding image region for each detected face.
1515
*/
1616
export async function extractFaceTensors(
17-
input: TNetInput,
17+
imageTensor: tf.Tensor3D | tf.Tensor4D,
1818
detections: Array<FaceDetection | Rect>
19-
): Promise<tf.Tensor4D[]> {
19+
): Promise<tf.Tensor3D[]> {
2020

21-
const netInput = await toNetInput(input, true)
22-
23-
if (netInput.batchSize > 1) {
24-
if (netInput.isManaged) {
25-
netInput.dispose()
26-
}
21+
if (isTensor4D(imageTensor) && imageTensor.shape[0] > 1) {
2722
throw new Error('extractFaceTensors - batchSize > 1 not supported')
2823
}
2924

3025
return tf.tidy(() => {
31-
const imgTensor = netInput.inputs[0].expandDims().toFloat() as tf.Tensor4D
32-
33-
const [imgHeight, imgWidth, numChannels] = imgTensor.shape.slice(1)
26+
const [imgHeight, imgWidth, numChannels] = imageTensor.shape.slice(isTensor4D(imageTensor) ? 1 : 0)
3427

3528
const boxes = detections.map(
3629
det => det instanceof FaceDetection
@@ -40,12 +33,9 @@ export async function extractFaceTensors(
4033
.map(box => box.clipAtImageBorders(imgWidth, imgHeight))
4134

4235
const faceTensors = boxes.map(({ x, y, width, height }) =>
43-
tf.slice4d(imgTensor, [0, y, x, 0], [1, height, width, numChannels])
36+
tf.slice3d(imageTensor.as3D(imgHeight, imgWidth, numChannels), [y, x, 0], [height, width, numChannels])
4437
)
4538

46-
if (netInput.isManaged) {
47-
netInput.dispose()
48-
}
4939
return faceTensors
5040
})
5141
}

src/dom/extractFaces.ts

Lines changed: 5 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -24,24 +24,19 @@ export async function extractFaces(
2424
let canvas = input as HTMLCanvasElement
2525

2626
if (!(input instanceof HTMLCanvasElement)) {
27-
const netInput = await toNetInput(input, true)
27+
const netInput = await toNetInput(input)
2828

2929
if (netInput.batchSize > 1) {
30-
if (netInput.isManaged) {
31-
netInput.dispose()
32-
}
3330
throw new Error('extractFaces - batchSize > 1 not supported')
3431
}
3532

36-
canvas = await imageTensorToCanvas(netInput.inputs[0])
37-
38-
if (netInput.isManaged) {
39-
netInput.dispose()
40-
}
33+
const tensorOrCanvas = netInput.getInput(0)
34+
canvas = tensorOrCanvas instanceof HTMLCanvasElement
35+
? tensorOrCanvas
36+
: await imageTensorToCanvas(tensorOrCanvas)
4137
}
4238

4339
const ctx = getContext2dOrThrow(canvas)
44-
4540
const boxes = detections.map(
4641
det => det instanceof FaceDetection
4742
? det.forSize(canvas.width, canvas.height).getBox().floor()

src/faceDetectionNet/FaceDetectionNet.ts

Lines changed: 9 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ export class FaceDetectionNet extends NeuralNetwork<NetParams> {
2525
}
2626

2727
return tf.tidy(() => {
28-
const batchTensor = input.toBatchTensor(512, false)
28+
const batchTensor = input.toBatchTensor(512, false).toFloat()
2929

3030
const x = tf.sub(tf.mul(batchTensor, tf.scalar(0.007843137718737125)), tf.scalar(1)) as tf.Tensor4D
3131
const features = mobileNetV1(x, params.mobilenetv1)
@@ -40,7 +40,7 @@ export class FaceDetectionNet extends NeuralNetwork<NetParams> {
4040
}
4141

4242
public async forward(input: TNetInput) {
43-
return this.forwardInput(await toNetInput(input, true))
43+
return this.forwardInput(await toNetInput(input))
4444
}
4545

4646
public async locateFaces(
@@ -49,7 +49,7 @@ export class FaceDetectionNet extends NeuralNetwork<NetParams> {
4949
maxResults: number = 100
5050
): Promise<FaceDetection[]> {
5151

52-
const netInput = await toNetInput(input, true)
52+
const netInput = await toNetInput(input)
5353

5454
const {
5555
boxes: _boxes,
@@ -77,18 +77,21 @@ export class FaceDetectionNet extends NeuralNetwork<NetParams> {
7777
minConfidence
7878
)
7979

80-
const paddings = netInput.getRelativePaddings(0)
80+
const reshapedDims = netInput.getReshapedInputDimensions(0)
81+
const inputSize = netInput.inputSize as number
82+
const padX = inputSize / reshapedDims.width
83+
const padY = inputSize / reshapedDims.height
8184

8285
const results = indices
8386
.map(idx => {
8487
const [top, bottom] = [
8588
Math.max(0, boxes.get(idx, 0)),
8689
Math.min(1.0, boxes.get(idx, 2))
87-
].map(val => val * paddings.y)
90+
].map(val => val * padY)
8891
const [left, right] = [
8992
Math.max(0, boxes.get(idx, 1)),
9093
Math.min(1.0, boxes.get(idx, 3))
91-
].map(val => val * paddings.x)
94+
].map(val => val * padX)
9295
return new FaceDetection(
9396
scoresData[idx],
9497
new Rect(

0 commit comments

Comments
 (0)