allow face alignment before classification

justadudewhohacks · justadudewhohacks · commit 4205fc29085e · 2019-05-03T12:48:21.000+02:00
diff --git a/src/classes/FaceLandmarks.ts b/src/classes/FaceLandmarks.ts
@@ -1,5 +1,6 @@
-import { Dimensions, getCenterPoint, IDimensions, Point, Rect } from 'tfjs-image-recognition-base';
+import { Box, Dimensions, getCenterPoint, IBoundingBox, IDimensions, IRect, Point, Rect } from 'tfjs-image-recognition-base';
 
+import { minBbox } from '../minBbox';
 import { FaceDetection } from './FaceDetection';
 
 // face alignment constants
@@ -71,16 +72,28 @@ export class FaceLandmarks implements IFaceLandmarks {
    * @returns The bounding box of the aligned face.
    */
   public align(
-    detection?: FaceDetection | Rect
-  ): Rect {
+    detection?: FaceDetection | IRect | IBoundingBox | null,
+    options: { useDlibAlignment?: boolean, minBoxPadding?: number } = { }
+  ): Box {
     if (detection) {
       const box = detection instanceof FaceDetection
         ? detection.box.floor()
-        : detection
+        : new Box(detection)
 
-      return this.shiftBy(box.x, box.y).align()
+      return this.shiftBy(box.x, box.y).align(null, options)
     }
 
+    const { useDlibAlignment, minBoxPadding } = Object.assign({}, { useDlibAlignment: false, minBoxPadding: 0.2 }, options)
+
+    if (useDlibAlignment) {
+      return this.alignDlib()
+    }
+
+    return this.alignMinBbox(minBoxPadding)
+  }
+
+  private alignDlib(): Box {
+
     const centers = this.getRefPointsForAlignment()
 
     const [leftEyeCenter, rightEyeCenter, mouthCenter] = centers
@@ -97,6 +110,11 @@ export class FaceLandmarks implements IFaceLandmarks {
     return new Rect(x, y, Math.min(size, this.imageWidth + x), Math.min(size, this.imageHeight + y))
   }
 
+  private alignMinBbox(padding: number): Box {
+    const box = minBbox(this.positions)
+    return box.pad(box.width * padding, box.height * padding)
+  }
+
   protected getRefPointsForAlignment(): Point[] {
     throw new Error('getRefPointsForAlignment not implemented by base class')
   }
diff --git a/src/globalApi/ComputeFaceDescriptorsTasks.ts b/src/globalApi/ComputeFaceDescriptorsTasks.ts
@@ -25,17 +25,17 @@ export class ComputeAllFaceDescriptorsTask<
 
     const parentResults = await this.parentTask
 
-    const alignedRects = parentResults.map(({ alignedRect }) => alignedRect)
-    const alignedFaces: Array<HTMLCanvasElement | tf.Tensor3D> = this.input instanceof tf.Tensor
-      ? await extractFaceTensors(this.input, alignedRects)
-      : await extractFaces(this.input, alignedRects)
+    const dlibAlignedRects = parentResults.map(({ landmarks }) => landmarks.align(null, { useDlibAlignment: true }))
+    const dlibAlignedFaces: Array<HTMLCanvasElement | tf.Tensor3D> = this.input instanceof tf.Tensor
+      ? await extractFaceTensors(this.input, dlibAlignedRects)
+      : await extractFaces(this.input, dlibAlignedRects)
 
     const results = await Promise.all(parentResults.map(async (parentResult, i) => {
-      const descriptor = await nets.faceRecognitionNet.computeFaceDescriptor(alignedFaces[i]) as Float32Array
+      const descriptor = await nets.faceRecognitionNet.computeFaceDescriptor(dlibAlignedFaces[i]) as Float32Array
       return extendWithFaceDescriptor<TSource>(parentResult, descriptor)
     }))
 
-    alignedFaces.forEach(f => f instanceof tf.Tensor && f.dispose())
+    dlibAlignedFaces.forEach(f => f instanceof tf.Tensor && f.dispose())
 
     return results
   }
@@ -52,10 +52,10 @@ export class ComputeSingleFaceDescriptorTask<
       return
     }
 
-    const { alignedRect } = parentResult
+    const dlibAlignedRect = parentResult.landmarks.align(null, { useDlibAlignment: true })
     const alignedFaces: Array<HTMLCanvasElement | tf.Tensor3D> = this.input instanceof tf.Tensor
-      ? await extractFaceTensors(this.input, [alignedRect])
-      : await extractFaces(this.input, [alignedRect])
+      ? await extractFaceTensors(this.input, [dlibAlignedRect])
+      : await extractFaces(this.input, [dlibAlignedRect])
     const descriptor = await nets.faceRecognitionNet.computeFaceDescriptor(alignedFaces[0]) as Float32Array
 
     alignedFaces.forEach(f => f instanceof tf.Tensor && f.dispose())
diff --git a/src/globalApi/DetectFaceLandmarksTasks.ts b/src/globalApi/DetectFaceLandmarksTasks.ts
@@ -10,7 +10,10 @@ import { extendWithFaceLandmarks, WithFaceLandmarks } from '../factories/WithFac
 import { ComposableTask } from './ComposableTask';
 import { ComputeAllFaceDescriptorsTask, ComputeSingleFaceDescriptorTask } from './ComputeFaceDescriptorsTasks';
 import { nets } from './nets';
-import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionTask } from './PredictFaceExpressionsTask';
+import {
+  PredictAllFaceExpressionsWithFaceAlignmentTask,
+  PredictSingleFaceExpressionsWithFaceAlignmentTask,
+} from './PredictFaceExpressionsTask';
 
 export class DetectFaceLandmarksTaskBase<TReturn, TParentReturn> extends ComposableTask<TReturn> {
   constructor(
@@ -52,6 +55,10 @@ export class DetectAllFaceLandmarksTask<
     )
   }
 
+  withFaceExpressions(): PredictAllFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>> {
+    return new PredictAllFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>>(this, this.input)
+  }
+
   withFaceDescriptors(): ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>> {
     return new ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>>(this, this.input)
   }
@@ -80,6 +87,10 @@ export class DetectSingleFaceLandmarksTask<
     return extendWithFaceLandmarks<TSource>(parentResult, landmarks)
   }
 
+  withFaceExpressions(): PredictSingleFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>> {
+    return new PredictSingleFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>>(this, this.input)
+  }
+
   withFaceDescriptor(): ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>> {
     return new ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>>(this, this.input)
   }
diff --git a/src/globalApi/DetectFacesTasks.ts b/src/globalApi/DetectFacesTasks.ts
@@ -8,7 +8,7 @@ import { TinyFaceDetectorOptions } from '../tinyFaceDetector/TinyFaceDetectorOpt
 import { ComposableTask } from './ComposableTask';
 import { DetectAllFaceLandmarksTask, DetectSingleFaceLandmarksTask } from './DetectFaceLandmarksTasks';
 import { nets } from './nets';
-import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionTask } from './PredictFaceExpressionsTask';
+import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionsTask } from './PredictFaceExpressionsTask';
 import { FaceDetectionOptions } from './types';
 
 export class DetectFacesTaskBase<TReturn> extends ComposableTask<TReturn> {
@@ -101,8 +101,8 @@ export class DetectSingleFaceTask extends DetectFacesTaskBase<FaceDetection | un
     )
   }
 
-  withFaceExpressions(): PredictSingleFaceExpressionTask<WithFaceDetection<{}>> {
-    return new PredictSingleFaceExpressionTask<WithFaceDetection<{}>>(
+  withFaceExpressions(): PredictSingleFaceExpressionsTask<WithFaceDetection<{}>> {
+    return new PredictSingleFaceExpressionsTask<WithFaceDetection<{}>>(
       this.runAndExtendWithFaceDetection(),
       this.input
     )
diff --git a/src/globalApi/PredictFaceExpressionsTask.ts b/src/globalApi/PredictFaceExpressionsTask.ts
@@ -5,8 +5,9 @@ import { extractFaces, extractFaceTensors } from '../dom';
 import { FaceExpressions } from '../faceExpressionNet/FaceExpressions';
 import { WithFaceDetection } from '../factories/WithFaceDetection';
 import { extendWithFaceExpressions, WithFaceExpressions } from '../factories/WithFaceExpressions';
+import { isWithFaceLandmarks, WithFaceLandmarks } from '../factories/WithFaceLandmarks';
 import { ComposableTask } from './ComposableTask';
-import { DetectAllFaceLandmarksTask, DetectSingleFaceLandmarksTask } from './DetectFaceLandmarksTasks';
+import { ComputeAllFaceDescriptorsTask, ComputeSingleFaceDescriptorTask } from './ComputeFaceDescriptorsTasks';
 import { nets } from './nets';
 
 export class PredictFaceExpressionsTaskBase<TReturn, TParentReturn> extends ComposableTask<TReturn> {
@@ -26,10 +27,12 @@ export class PredictAllFaceExpressionsTask<
 
     const parentResults = await this.parentTask
 
-    const detections = parentResults.map(parentResult => parentResult.detection)
+    const faceBoxes = parentResults.map(
+      parentResult => isWithFaceLandmarks(parentResult) ? parentResult.alignedRect : parentResult.detection
+    )
     const faces: Array<HTMLCanvasElement | tf.Tensor3D> = this.input instanceof tf.Tensor
-      ? await extractFaceTensors(this.input, detections)
-      : await extractFaces(this.input, detections)
+      ? await extractFaceTensors(this.input, faceBoxes)
+      : await extractFaces(this.input, faceBoxes)
 
     const faceExpressionsByFace = await Promise.all(faces.map(
       face => nets.faceExpressionNet.predictExpressions(face)
@@ -41,13 +44,9 @@ export class PredictAllFaceExpressionsTask<
       (parentResult, i) => extendWithFaceExpressions<TSource>(parentResult, faceExpressionsByFace[i])
     )
   }
-
-  withFaceLandmarks(): DetectAllFaceLandmarksTask<WithFaceExpressions<TSource>> {
-    return new DetectAllFaceLandmarksTask(this, this.input, false)
-  }
 }
 
-export class PredictSingleFaceExpressionTask<
+export class PredictSingleFaceExpressionsTask<
   TSource extends WithFaceDetection<{}>
 >  extends PredictFaceExpressionsTaskBase<WithFaceExpressions<TSource> | undefined, TSource | undefined> {
 
@@ -58,19 +57,33 @@ export class PredictSingleFaceExpressionTask<
       return
     }
 
-    const { detection } = parentResult
+    const faceBox = isWithFaceLandmarks(parentResult) ? parentResult.alignedRect : parentResult.detection
     const faces: Array<HTMLCanvasElement | tf.Tensor3D> = this.input instanceof tf.Tensor
-      ? await extractFaceTensors(this.input, [detection])
-      : await extractFaces(this.input, [detection])
+      ? await extractFaceTensors(this.input, [faceBox])
+      : await extractFaces(this.input, [faceBox])
 
     const faceExpressions = await nets.faceExpressionNet.predictExpressions(faces[0]) as FaceExpressions
 
     faces.forEach(f => f instanceof tf.Tensor && f.dispose())
 
     return extendWithFaceExpressions(parentResult, faceExpressions)
   }
+}
+
+export class PredictAllFaceExpressionsWithFaceAlignmentTask<
+  TSource extends WithFaceLandmarks<WithFaceDetection<{}>>
+> extends PredictAllFaceExpressionsTask<TSource> {
+
+  withFaceDescriptors(): ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>> {
+    return new ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>>(this, this.input)
+  }
+}
+
+export class PredictSingleFaceExpressionsWithFaceAlignmentTask<
+  TSource extends WithFaceLandmarks<WithFaceDetection<{}>>
+> extends PredictSingleFaceExpressionsTask<TSource> {
 
-  withFaceLandmarks(): DetectSingleFaceLandmarksTask<WithFaceExpressions<TSource>> {
-    return new DetectSingleFaceLandmarksTask(this, this.input, false)
+  withFaceDescriptor(): ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>> {
+    return new ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>>(this, this.input)
   }
 }
diff --git a/src/minBbox.ts b/src/minBbox.ts
@@ -0,0 +1,12 @@
+import { BoundingBox, IPoint } from 'tfjs-image-recognition-base';
+
+export function minBbox(pts: IPoint[]): BoundingBox {
+  const xs = pts.map(pt => pt.x)
+  const ys = pts.map(pt => pt.y)
+  const minX = xs.reduce((min, x) => x < min ? x : min, Infinity)
+  const minY = ys.reduce((min, y) => y < min ? y : min, Infinity)
+  const maxX = xs.reduce((max, x) => max < x ? x : max, 0)
+  const maxY = ys.reduce((max, y) => max < y ? y : max, 0)
+
+  return new BoundingBox(minX, minY, maxX, maxY)
+}
diff --git a/src/xception/TinyXception.ts b/src/xception/TinyXception.ts
@@ -10,6 +10,7 @@ import {
 } from 'tfjs-image-recognition-base';
 
 import { depthwiseSeparableConv } from '../common/depthwiseSeparableConv';
+import { bgrToRgbTensor } from '../mtcnn/bgrToRgbTensor';
 import { extractParams } from './extractParams';
 import { extractParamsFromWeigthMap } from './extractParamsFromWeigthMap';
 import { MainBlockParams, ReductionBlockParams, TinyXceptionParams } from './types';
@@ -54,8 +55,9 @@ export class TinyXception extends NeuralNetwork<TinyXceptionParams> {
 
     return tf.tidy(() => {
       const batchTensor = input.toBatchTensor(112, true)
+      const batchTensorRgb = bgrToRgbTensor(batchTensor)
       const meanRgb = [122.782, 117.001, 104.298]
-      const normalized = normalize(batchTensor, meanRgb).div(tf.scalar(255)) as tf.Tensor4D
+      const normalized = normalize(batchTensorRgb, meanRgb).div(tf.scalar(256)) as tf.Tensor4D
 
       let out = tf.relu(conv(normalized, params.entry_flow.conv_in, [2, 2]))
       out = reductionBlock(out, params.entry_flow.reduction_block_0, false)

Original file line number	Diff line number	Diff line change
`@@ -10,7 +10,10 @@ import { extendWithFaceLandmarks, WithFaceLandmarks } from '../factories/WithFac`
`10`	`10`	`import { ComposableTask } from './ComposableTask';`
`11`	`11`	`import { ComputeAllFaceDescriptorsTask, ComputeSingleFaceDescriptorTask } from './ComputeFaceDescriptorsTasks';`
`12`	`12`	`import { nets } from './nets';`
`13`		`-import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionTask } from './PredictFaceExpressionsTask';`
	`13`	`+import {`
	`14`	`+ PredictAllFaceExpressionsWithFaceAlignmentTask,`
	`15`	`+ PredictSingleFaceExpressionsWithFaceAlignmentTask,`
	`16`	`+} from './PredictFaceExpressionsTask';`
`14`	`17`
`15`	`18`	`export class DetectFaceLandmarksTaskBase<TReturn, TParentReturn> extends ComposableTask<TReturn> {`
`16`	`19`	`constructor(`
`@@ -52,6 +55,10 @@ export class DetectAllFaceLandmarksTask<`
`52`	`55`	`)`
`53`	`56`	`}`
`54`	`57`
	`58`	`+ withFaceExpressions(): PredictAllFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>> {`
	`59`	`+ return new PredictAllFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>>(this, this.input)`
	`60`	`+ }`
	`61`	`+`
`55`	`62`	`withFaceDescriptors(): ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>> {`
`56`	`63`	`return new ComputeAllFaceDescriptorsTask<WithFaceLandmarks<TSource>>(this, this.input)`
`57`	`64`	`}`
`@@ -80,6 +87,10 @@ export class DetectSingleFaceLandmarksTask<`
`80`	`87`	`return extendWithFaceLandmarks<TSource>(parentResult, landmarks)`
`81`	`88`	`}`
`82`	`89`
	`90`	`+ withFaceExpressions(): PredictSingleFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>> {`
	`91`	`+ return new PredictSingleFaceExpressionsWithFaceAlignmentTask<WithFaceLandmarks<TSource>>(this, this.input)`
	`92`	`+ }`
	`93`	`+`
`83`	`94`	`withFaceDescriptor(): ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>> {`
`84`	`95`	`return new ComputeSingleFaceDescriptorTask<WithFaceLandmarks<TSource>>(this, this.input)`
`85`	`96`	`}`
Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@ import { TinyFaceDetectorOptions } from '../tinyFaceDetector/TinyFaceDetectorOpt`
`8`	`8`	`import { ComposableTask } from './ComposableTask';`
`9`	`9`	`import { DetectAllFaceLandmarksTask, DetectSingleFaceLandmarksTask } from './DetectFaceLandmarksTasks';`
`10`	`10`	`import { nets } from './nets';`
`11`		`-import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionTask } from './PredictFaceExpressionsTask';`
	`11`	`+import { PredictAllFaceExpressionsTask, PredictSingleFaceExpressionsTask } from './PredictFaceExpressionsTask';`
`12`	`12`	`import { FaceDetectionOptions } from './types';`
`13`	`13`
`14`	`14`	`export class DetectFacesTaskBase<TReturn> extends ComposableTask<TReturn> {`
`@@ -101,8 +101,8 @@ export class DetectSingleFaceTask extends DetectFacesTaskBase<FaceDetection \| un`
`101`	`101`	`)`
`102`	`102`	`}`
`103`	`103`
`104`		`- withFaceExpressions(): PredictSingleFaceExpressionTask<WithFaceDetection<{}>> {`
`105`		`- return new PredictSingleFaceExpressionTask<WithFaceDetection<{}>>(`
	`104`	`+ withFaceExpressions(): PredictSingleFaceExpressionsTask<WithFaceDetection<{}>> {`
	`105`	`+ return new PredictSingleFaceExpressionsTask<WithFaceDetection<{}>>(`
`106`	`106`	`this.runAndExtendWithFaceDetection(),`
`107`	`107`	`this.input`
`108`	`108`	`)`