mirror of https://github.com/vladmandic/human
fix mobilefacenet module

parent 4b526ad53c
commit 39fa2396a1

@@ -9,7 +9,10 @@
## Changelog

-### **HEAD -> main** 2021/11/12 mandic00@live.com
+### **HEAD -> main** 2021/11/13 mandic00@live.com

### **origin/main** 2021/11/12 mandic00@live.com

+- implement optional face masking
+- add similarity score range normalization

TODO.md

@@ -46,9 +46,13 @@ New:
- new optional model `liveness`
  checks if input appears to be a real-world live image or a recording
  best used together with `antispoofing` that checks if input appears to have a realistic face
- new face masking option in `face.config.detector.mask`
  result is shading of face image outside of face area which is useful for increased sensitivity of other modules that rely on detected face as input
- new face crop option in `face.config.detector.cropFactor`
  result is user-definable fine-tuning for other modules that rely on detected face as input

Other:
- Improved **Safari** compatibility
- Improved `similarity` and `match` score range normalization
- Documentation overhaul
- Fixed optional `gear`, `ssrnet`, `mobilefacenet` modules
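
The TODO entries above all map onto the `face` section of the Human configuration. A minimal sketch of what enabling them could look like, modeled on the demo configuration further down in this commit; the import name, the `run()` helper, and reading `face.real`/`face.live` from the result are illustrative assumptions rather than part of the diff:

```ts
import { Human } from '@vladmandic/human'; // import style may differ by version

const human = new Human({
  face: {
    enabled: true,
    detector: { rotation: true, return: true, cropFactor: 1.6, mask: true }, // mask shades pixels outside the detected face area
    description: { enabled: true },  // faceres: age/gender/descriptor
    antispoof: { enabled: true },    // checks that the input contains a realistic face
    liveness: { enabled: true },     // checks that the input looks like a live capture, not a recording
  },
});

async function run(input: HTMLVideoElement) {
  const result = await human.detect(input);      // runs all enabled face modules
  const face = result.face[0];
  if (face) console.log(face.real, face.live);   // assumed antispoof/liveness scores on the face record
}
```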

@@ -78,6 +78,7 @@ var humanConfig = {
    enabled: true,
    detector: { rotation: true, return: true, cropFactor: 1.6, mask: false },
    description: { enabled: true },
+    mobilefacenet: { enabled: false, modelPath: "https://vladmandic.github.io/human-models/models/mobilefacenet.json" },
    iris: { enabled: true },
    emotion: { enabled: false },
    antispoof: { enabled: true },

@@ -88,6 +89,7 @@ var humanConfig = {
  object: { enabled: false },
  gesture: { enabled: true }
};
+var matchOptions = { order: 2, multiplier: 25, min: 0.2, max: 0.8 };
var options = {
  minConfidence: 0.6,
  minSize: 224,

@@ -97,7 +99,8 @@ var options = {
  threshold: 0.5,
  mask: humanConfig.face.detector.mask,
  rotation: humanConfig.face.detector.rotation,
-  cropFactor: humanConfig.face.detector.cropFactor
+  cropFactor: humanConfig.face.detector.cropFactor,
+  ...matchOptions
};
var ok = {
  faceCount: false,

@@ -254,6 +257,7 @@ async function detectFace() {
  (_a = dom.canvas.getContext("2d")) == null ? void 0 : _a.clearRect(0, 0, options.minSize, options.minSize);
  if (!current.face || !current.face.tensor || !current.face.embedding)
    return false;
+  console.log("face record:", current.face);
  human.tf.browser.toPixels(current.face.tensor, dom.canvas);
  if (await count() === 0) {
    log2("face database is empty");

@@ -263,7 +267,7 @@ async function detectFace() {
  }
  const db2 = await load();
  const descriptors = db2.map((rec) => rec.descriptor);
-  const res = await human.match(current.face.embedding, descriptors);
+  const res = await human.match(current.face.embedding, descriptors, matchOptions);
  current.record = db2[res.index] || null;
  if (current.record) {
    log2(`best match: ${current.record.name} | id: ${current.record.id} | similarity: ${Math.round(1e3 * res.similarity) / 10}%`);

@@ -16,7 +16,8 @@ const humanConfig = { // user configuration for human, used to fine-tune behavio
  face: {
    enabled: true,
    detector: { rotation: true, return: true, cropFactor: 1.6, mask: false }, // return tensor is used to get detected face image
-    description: { enabled: true },
+    description: { enabled: true }, // default model for face descriptor extraction is faceres
+    mobilefacenet: { enabled: false, modelPath: 'https://vladmandic.github.io/human-models/models/mobilefacenet.json' }, // alternative model
    iris: { enabled: true }, // needed to determine gaze direction
    emotion: { enabled: false }, // not needed
    antispoof: { enabled: true }, // enable optional antispoof module

@@ -28,6 +29,9 @@ const humanConfig = { // user configuration for human, used to fine-tune behavio
  gesture: { enabled: true }, // parses face and iris gestures
};

+// const matchOptions = { order: 2, multiplier: 1000, min: 0.0, max: 1.0 }; // for embedding model
+const matchOptions = { order: 2, multiplier: 25, min: 0.2, max: 0.8 }; // for faceres model

const options = {
  minConfidence: 0.6, // overal face confidence for box, face, gender, real, live
  minSize: 224, // min input to face descriptor model before degradation

@@ -38,6 +42,7 @@ const options = {
  mask: humanConfig.face.detector.mask,
  rotation: humanConfig.face.detector.rotation,
  cropFactor: humanConfig.face.detector.cropFactor,
+  ...matchOptions,
};

const ok = { // must meet all rules

@@ -194,6 +199,8 @@ async function deleteRecord() {
async function detectFace() {
  dom.canvas.getContext('2d')?.clearRect(0, 0, options.minSize, options.minSize);
  if (!current.face || !current.face.tensor || !current.face.embedding) return false;
+  // eslint-disable-next-line no-console
+  console.log('face record:', current.face);
  human.tf.browser.toPixels(current.face.tensor as unknown as TensorLike, dom.canvas);
  if (await indexDb.count() === 0) {
    log('face database is empty');

@@ -203,7 +210,7 @@ async function detectFace() {
  }
  const db = await indexDb.load();
  const descriptors = db.map((rec) => rec.descriptor);
-  const res = await human.match(current.face.embedding, descriptors);
+  const res = await human.match(current.face.embedding, descriptors, matchOptions);
  current.record = db[res.index] || null;
  if (current.record) {
    log(`best match: ${current.record.name} | id: ${current.record.id} | similarity: ${Math.round(1000 * res.similarity) / 10}%`);
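
For context on this change, `matchOptions` controls how `human.match` turns raw descriptor distance into a normalized similarity score (the `similarity` and `match` score range normalization mentioned in the TODO above). A minimal sketch of the call pattern, following the demo code; `human` is assumed to be in scope as in the demo, and the `findBestMatch` helper, its `enrolled` argument, and the 0.5 cut-off are illustrative assumptions:

```ts
const matchOptions = { order: 2, multiplier: 25, min: 0.2, max: 0.8 }; // values used by the demo for the faceres descriptor

async function findBestMatch(embedding: number[], enrolled: number[][]) {
  // human.match returns the best candidate among the enrolled descriptors:
  // its index plus a similarity score normalized into the 0..1 range
  const res = await human.match(embedding, enrolled, matchOptions);
  const pct = Math.round(1000 * res.similarity) / 10; // same percentage formatting as the demo log
  return res.similarity > 0.5 ? { index: res.index, percent: pct } : null; // assumed acceptance threshold
}
```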

@@ -15,6 +15,7 @@ import * as liveness from './liveness';
import * as gear from '../gear/gear';
import * as ssrnetAge from '../gear/ssrnet-age';
import * as ssrnetGender from '../gear/ssrnet-gender';
+import * as mobilefacenet from './mobilefacenet';
import type { FaceResult } from '../result';
import type { Tensor } from '../tfjs/types';
import type { Human } from '../human';

@@ -28,7 +29,7 @@ export const detectFace = async (parent: Human /* instance of human */, input: T
  let gearRes;
  let genderRes;
  let emotionRes;
-  let embeddingRes;
+  let mobilefacenetRes;
  let antispoofRes;
  let livenessRes;
  let descRes;

@@ -93,7 +94,7 @@ export const detectFace = async (parent: Human /* instance of human */, input: T
      parent.state = 'run:liveness';
      timeStamp = now();
      livenessRes = parent.config.face.liveness?.enabled ? await liveness.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : null;
-      parent.performance.antispoof = env.perfadd ? (parent.performance.antispoof || 0) + Math.trunc(now() - timeStamp) : Math.trunc(now() - timeStamp);
+      parent.performance.liveness = env.perfadd ? (parent.performance.antispoof || 0) + Math.trunc(now() - timeStamp) : Math.trunc(now() - timeStamp);
    }
    parent.analyze('End Liveness:');

@@ -105,7 +106,7 @@ export const detectFace = async (parent: Human /* instance of human */, input: T
      parent.state = 'run:gear';
      timeStamp = now();
      gearRes = parent.config.face['gear']?.enabled ? await gear.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : {};
-      parent.performance.emotion = Math.trunc(now() - timeStamp);
+      parent.performance.gear = Math.trunc(now() - timeStamp);
    }
    parent.analyze('End GEAR:');

@@ -119,10 +120,22 @@ export const detectFace = async (parent: Human /* instance of human */, input: T
      timeStamp = now();
      ageRes = parent.config.face['ssrnet']?.enabled ? await ssrnetAge.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : {};
      genderRes = parent.config.face['ssrnet']?.enabled ? await ssrnetGender.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : {};
-      parent.performance.emotion = Math.trunc(now() - timeStamp);
+      parent.performance.ssrnet = Math.trunc(now() - timeStamp);
    }
    parent.analyze('End SSRNet:');

+    // run gear, inherits face from blazeface
+    parent.analyze('Start MobileFaceNet:');
+    if (parent.config.async) {
+      mobilefacenetRes = parent.config.face['mobilefacenet']?.enabled ? mobilefacenet.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : {};
+    } else {
+      parent.state = 'run:mobilefacenet';
+      timeStamp = now();
+      mobilefacenetRes = parent.config.face['mobilefacenet']?.enabled ? await mobilefacenet.predict(faces[i].tensor || tf.tensor([]), parent.config, i, faces.length) : {};
+      parent.performance.mobilefacenet = Math.trunc(now() - timeStamp);
+    }
+    parent.analyze('End MobileFaceNet:');

    // run emotion, inherits face from blazeface
    parent.analyze('Start Description:');
    if (parent.config.async) {

@@ -137,13 +150,15 @@ export const detectFace = async (parent: Human /* instance of human */, input: T
    // if async wait for results
    if (parent.config.async) {
-      [ageRes, genderRes, emotionRes, embeddingRes, descRes, gearRes, antispoofRes, livenessRes] = await Promise.all([ageRes, genderRes, emotionRes, embeddingRes, descRes, gearRes, antispoofRes, livenessRes]);
+      [ageRes, genderRes, emotionRes, mobilefacenetRes, descRes, gearRes, antispoofRes, livenessRes] = await Promise.all([ageRes, genderRes, emotionRes, mobilefacenetRes, descRes, gearRes, antispoofRes, livenessRes]);
    }
    parent.analyze('Finish Face:');

    // override age/gender if alternative models are used
    if (parent.config.face['ssrnet']?.enabled && ageRes && genderRes) descRes = { age: ageRes.age, gender: genderRes.gender, genderScore: genderRes.genderScore };
    if (parent.config.face['gear']?.enabled && gearRes) descRes = { age: gearRes.age, gender: gearRes.gender, genderScore: gearRes.genderScore, race: gearRes.race };
+    // override descriptor if embedding model is used
+    if (parent.config.face['mobilefacenet']?.enabled && mobilefacenetRes) descRes.descriptor = mobilefacenetRes;

    // calculate iris distance
    // iris: array[ center, left, top, right, bottom]
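
With the wiring above in place, enabling `face['mobilefacenet']` swaps the descriptor stored on the face record while age/gender still come from `faceres`. A rough sketch of using it as the alternative descriptor source; the partial config, the `knownDescriptors` array, the `identify()` helper, and the alternative `matchOptions` values (taken from the commented-out line in the demo) are assumptions, not prescriptions:

```ts
import { Human } from '@vladmandic/human'; // import style may differ by version

const human = new Human({
  face: {
    enabled: true,
    description: { enabled: true }, // faceres still supplies age/gender
    mobilefacenet: { enabled: true, modelPath: 'https://vladmandic.github.io/human-models/models/mobilefacenet.json' },
  },
});
const altMatchOptions = { order: 2, multiplier: 1000, min: 0.0, max: 1.0 }; // suggested in the demo for an embedding-style descriptor

async function identify(input: HTMLImageElement, knownDescriptors: number[][]) {
  const result = await human.detect(input);
  const descriptor = result.face[0]?.embedding || []; // now backed by the mobilefacenet output
  if (descriptor.length === 0) return null;
  return human.match(descriptor, knownDescriptors, altMatchOptions);
}
```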

@@ -0,0 +1,87 @@
/**
 * MobileFaceNet model implementation
 *
 * Based on: [**BecauseofAI MobileFace**](https://github.com/becauseofAI/MobileFace)
 *
 * Obsolete and replaced by `faceres` that performs age/gender/descriptor analysis
 */

import { log, join, now } from '../util/util';
import * as tf from '../../dist/tfjs.esm.js';
import type { Tensor, GraphModel } from '../tfjs/types';
import type { Config } from '../config';
import { env } from '../util/env';

let model: GraphModel | null;
const last: Array<number[]> = [];
let lastCount = 0;
let lastTime = 0;
let skipped = Number.MAX_SAFE_INTEGER;

export async function load(config: Config): Promise<GraphModel> {
  const modelUrl = join(config.modelBasePath, config.face['mobilefacenet'].modelPath);
  if (env.initial) model = null;
  if (!model) {
    model = await tf.loadGraphModel(modelUrl) as unknown as GraphModel;
    if (!model) log('load model failed:', config.face['mobilefacenet'].modelPath);
    else if (config.debug) log('load model:', modelUrl);
  } else if (config.debug) log('cached model:', modelUrl);
  return model;
}

/*
  // convert to black&white to avoid colorization impact
  const rgb = [0.2989, 0.5870, 0.1140]; // factors for red/green/blue colors when converting to grayscale: https://www.mathworks.com/help/matlab/ref/rgb2gray.html
  const [red, green, blue] = tf.split(crop, 3, 3);
  const redNorm = tf.mul(red, rgb[0]);
  const greenNorm = tf.mul(green, rgb[1]);
  const blueNorm = tf.mul(blue, rgb[2]);
  const grayscale = tf.addN([redNorm, greenNorm, blueNorm]);
  const merge = tf.stack([grayscale, grayscale, grayscale], 3).squeeze(4);

  // optional increase image contrast
  // or do it per-channel so mean is done on each channel
  // or do it based on histogram
  const mean = merge.mean();
  const factor = 5;
  const contrast = merge.sub(mean).mul(factor).add(mean);
*/

export async function predict(input: Tensor, config: Config, idx, count): Promise<number[]> {
  if (!model) return [];
  const skipFrame = skipped < (config.face['embedding']?.skipFrames || 0);
  const skipTime = (config.face['embedding']?.skipTime || 0) > (now() - lastTime);
  if (config.skipAllowed && skipTime && skipFrame && (lastCount === count) && last[idx]) {
    skipped++;
    return last[idx];
  }
  return new Promise(async (resolve) => {
    let data: Array<number> = [];
    if (config.face['embedding']?.enabled && model?.inputs[0].shape) {
      const t: Record<string, Tensor> = {};
      t.crop = tf.image.resizeBilinear(input, [model.inputs[0].shape[2], model.inputs[0].shape[1]], false); // just resize to fit the embedding model
      // do a tight crop of image and resize it to fit the model
      // const box = [[0.05, 0.15, 0.85, 0.85]]; // empyrical values for top, left, bottom, right
      // t.crop = tf.image.cropAndResize(input, box, [0], [model.inputs[0].shape[2], model.inputs[0].shape[1]]);
      t.data = model?.execute(t.crop) as Tensor;
      /*
      // optional normalize outputs with l2 normalization
      const scaled = tf.tidy(() => {
        const l2 = res.norm('euclidean');
        const scale = res.div(l2);
        return scale;
      });

      // optional reduce feature vector complexity
      const reshape = tf.reshape(res, [128, 2]); // split 256 vectors into 128 x 2
      const reduce = reshape.logSumExp(1); // reduce 2nd dimension by calculating logSumExp on it
      */
      const output = await t.data.data();
      data = Array.from(output); // convert typed array to simple array
    }
    last[idx] = data;
    lastCount = count;
    lastTime = now();
    resolve(data);
  });
}
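
The module above is normally driven from `face.ts`, but its two exports can also be exercised directly. A sketch under stated assumptions: the partial `config` literal is illustrative (note that `predict()` above reads its enable/skip settings from `config.face['embedding']`, not `['mobilefacenet']`), and the cosine helper is only to show that the output is a plain numeric vector; Human's own `match`/`similarity` use their distance-based scoring instead:

```ts
import * as mobilefacenet from './mobilefacenet';
import type { Tensor } from '../tfjs/types';
import type { Config } from '../config';

// partial config cast for the sketch; field values are assumptions
const config = {
  modelBasePath: 'https://vladmandic.github.io/human-models/models/',
  debug: true,
  skipAllowed: false,
  face: {
    mobilefacenet: { modelPath: 'mobilefacenet.json' },
    embedding: { enabled: true, skipFrames: 0, skipTime: 0 }, // predict() checks this section
  },
} as unknown as Config;

async function describe(faceTensor: Tensor): Promise<number[]> {
  await mobilefacenet.load(config);                        // loads and caches the graph model
  return mobilefacenet.predict(faceTensor, config, 0, 1);  // raw descriptor vector for one face
}

// plain cosine similarity between two descriptors, for illustration only;
// human.match / human.similarity apply their own distance metric and range normalization
function cosine(a: number[], b: number[]): number {
  let dot = 0; let na = 0; let nb = 0;
  for (let i = 0; i < Math.min(a.length, b.length); i++) { dot += a[i] * b[i]; na += a[i] * a[i]; nb += b[i] * b[i]; }
  return (na && nb) ? dot / (Math.sqrt(na) * Math.sqrt(nb)) : 0;
}
```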

@@ -62,6 +62,7 @@ export async function predict(image: Tensor, config: Config, idx, count): Promis
    let age = ageSorted[0][0]; // pick best starting point
    for (let i = 1; i < ageSorted.length; i++) age += ageSorted[i][1] * (ageSorted[i][0] - age); // adjust with each other choice by weight
    obj.age = Math.round(10 * age) / 10;
    Object.keys(t).forEach((tensor) => tf.dispose(t[tensor]));
    last[idx] = obj;
    lastCount = count;
    lastTime = now();
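
The age blend above starts from the most probable age bin and then pulls the estimate toward every remaining candidate in proportion to its weight. The same loop as a standalone helper with a small worked example; the helper name and the sample probabilities are illustrative, and `ageSorted` is assumed to be `[age, probability]` pairs sorted by descending probability, as the surrounding module prepares it:

```ts
function blendAge(ageSorted: Array<[number, number]>): number {
  let age = ageSorted[0][0]; // pick best starting point
  for (let i = 1; i < ageSorted.length; i++) age += ageSorted[i][1] * (ageSorted[i][0] - age); // nudge toward each remaining candidate by its weight
  return Math.round(10 * age) / 10;
}

// example: candidates 30 (p=0.5), 40 (p=0.25), 20 (p=0.25)
// 30 -> 30 + 0.25*(40-30) = 32.5 -> 32.5 + 0.25*(20-32.5) = 29.375 -> rounded 29.4
console.log(blendAge([[30, 0.5], [40, 0.25], [20, 0.25]])); // 29.4
```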

@@ -13,6 +13,7 @@ import * as blazepose from './body/blazepose';
import * as centernet from './object/centernet';
import * as efficientpose from './body/efficientpose';
import * as emotion from './gear/emotion';
+import * as mobilefacenet from './face/mobilefacenet';
import * as facemesh from './face/facemesh';
import * as faceres from './face/faceres';
import * as handpose from './hand/handpose';

@@ -39,7 +40,7 @@ export class Models {
  blazepose: null | GraphModel | Promise<GraphModel> = null;
  centernet: null | GraphModel | Promise<GraphModel> = null;
  efficientpose: null | GraphModel | Promise<GraphModel> = null;
-  embedding: null | GraphModel | Promise<GraphModel> = null;
+  mobilefacenet: null | GraphModel | Promise<GraphModel> = null;
  emotion: null | GraphModel | Promise<GraphModel> = null;
  facedetect: null | GraphModel | Promise<GraphModel> = null;
  faceiris: null | GraphModel | Promise<GraphModel> = null;

@@ -84,6 +85,7 @@ export async function load(instance: Human): Promise<void> {
  if (instance.config.face.enabled && instance.config.face['gear']?.enabled && !instance.models.gear) instance.models.gear = gear.load(instance.config);
  if (instance.config.face.enabled && instance.config.face['ssrnet']?.enabled && !instance.models.ssrnetage) instance.models.ssrnetage = ssrnetAge.load(instance.config);
  if (instance.config.face.enabled && instance.config.face['ssrnet']?.enabled && !instance.models.ssrnetgender) instance.models.ssrnetgender = ssrnetGender.load(instance.config);
+  if (instance.config.face.enabled && instance.config.face['mobilefacenet']?.enabled && !instance.models.mobilefacenet) instance.models.mobilefacenet = mobilefacenet.load(instance.config);
  if (instance.config.hand.enabled && !instance.models.handtrack && instance.config.hand.detector?.modelPath?.includes('handtrack')) instance.models.handtrack = handtrack.loadDetect(instance.config);
  if (instance.config.hand.enabled && instance.config.hand.landmarks && !instance.models.handskeleton && instance.config.hand.detector?.modelPath?.includes('handtrack')) instance.models.handskeleton = handtrack.loadSkeleton(instance.config);
  if (instance.config.object.enabled && !instance.models.centernet && instance.config.object?.modelPath?.includes('centernet')) instance.models.centernet = centernet.load(instance.config);
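
With the loader hook above, enabling the module in config is all that is needed; models are otherwise loaded lazily on first detection, and `human.load()` simply pre-fetches everything enabled up front. A brief sketch; the import name and the `init()` wrapper are assumptions, while `human.models.mobilefacenet` follows the Models class shown above:

```ts
import { Human } from '@vladmandic/human'; // import style may differ by version

const human = new Human({
  face: { enabled: true, mobilefacenet: { enabled: true, modelPath: 'https://vladmandic.github.io/human-models/models/mobilefacenet.json' } },
});

async function init() {
  await human.load(); // pre-loads every model enabled in the configuration
  console.log('mobilefacenet model ready:', !!human.models.mobilefacenet);
}
```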