human/src/face/embedding.ts

113 lines
4.3 KiB
TypeScript
Raw Normal View History

2021-05-25 14:58:20 +02:00
/**
* Face embedding model implementation
*
* Based on: [**BecauseofAI MobileFace**](https://github.com/becauseofAI/MobileFace)
*
* Obsolete and replaced by `faceres` that performs age/gender/descriptor analysis
2021-05-25 14:58:20 +02:00
*/
2021-09-27 19:58:13 +02:00
import { log, join } from '../util/util';
2020-11-18 14:26:28 +01:00
import * as tf from '../../dist/tfjs.esm.js';
2021-09-13 19:28:35 +02:00
import type { Tensor, GraphModel } from '../tfjs/types';
2021-09-27 19:58:13 +02:00
import { env } from '../util/env';
2020-11-13 22:13:35 +01:00
2021-09-17 17:23:00 +02:00
// lazily-loaded embedding graph model; null until load() succeeds and reset to null when env.initial is set
let model: GraphModel | null;
2020-11-13 22:13:35 +01:00
2021-02-08 17:39:09 +01:00
export async function load(config) {
const modelUrl = join(config.modelBasePath, config.face.embedding.modelPath);
2021-09-17 17:23:00 +02:00
if (env.initial) model = null;
2021-02-08 18:47:38 +01:00
if (!model) {
2021-08-17 14:51:17 +02:00
model = await tf.loadGraphModel(modelUrl) as unknown as GraphModel;
if (!model) log('load model failed:', config.face.embedding.modelPath);
else if (config.debug) log('load model:', modelUrl);
} else if (config.debug) log('cached model:', modelUrl);
2021-02-08 18:47:38 +01:00
return model;
2020-11-13 22:13:35 +01:00
}
export function enhance(input): Tensor {
2021-03-12 18:54:08 +01:00
const image = tf.tidy(() => {
// input received from detector is already normalized to 0..1
// input is also assumed to be straightened
// const data = tf.image.resizeBilinear(input, [model.inputs[0].shape[2], model.inputs[0].shape[1]], false); // just resize to fit the embedding model
// do a tight crop of image and resize it to fit the model
const box = [[0.05, 0.15, 0.85, 0.85]]; // empyrical values for top, left, bottom, right
2021-03-12 18:54:08 +01:00
const tensor = input.image || input.tensor;
2021-03-13 19:47:45 +01:00
if (!(tensor instanceof tf.Tensor)) return null;
2021-08-17 14:51:17 +02:00
if (!model || !model.inputs || !model.inputs[0].shape) return null;
const crop = (tensor.shape.length === 3)
2021-03-13 19:47:45 +01:00
? tf.image.cropAndResize(tf.expandDims(tensor, 0), box, [0], [model.inputs[0].shape[2], model.inputs[0].shape[1]]) // add batch dimension if missing
2021-03-12 18:54:08 +01:00
: tf.image.cropAndResize(tensor, box, [0], [model.inputs[0].shape[2], model.inputs[0].shape[1]]);
// convert to black&white to avoid colorization impact
const rgb = [0.2989, 0.5870, 0.1140]; // factors for red/green/blue colors when converting to grayscale: https://www.mathworks.com/help/matlab/ref/rgb2gray.html
const [red, green, blue] = tf.split(crop, 3, 3);
const redNorm = tf.mul(red, rgb[0]);
const greenNorm = tf.mul(green, rgb[1]);
const blueNorm = tf.mul(blue, rgb[2]);
const grayscale = tf.addN([redNorm, greenNorm, blueNorm]);
const merge = tf.stack([grayscale, grayscale, grayscale], 3).squeeze(4);
2021-03-13 17:26:53 +01:00
/*
// optional increase image contrast
// or do it per-channel so mean is done on each channel
// or do it based on histogram
const mean = merge.mean();
const factor = 5;
const contrast = merge.sub(mean).mul(factor).add(mean);
*/
2021-03-12 18:54:08 +01:00
// normalize brightness from 0..1
2021-07-29 22:06:03 +02:00
const darken = tf.sub(merge, merge.min());
const lighten = tf.div(darken, darken.max());
2021-03-12 18:54:08 +01:00
return lighten;
});
return image;
}
export async function predict(input, config): Promise<number[]> {
if (!model) return [];
2020-11-13 22:13:35 +01:00
return new Promise(async (resolve) => {
2021-03-12 18:54:08 +01:00
// let data: Array<[]> = [];
let data: Array<number> = [];
2020-11-13 22:13:35 +01:00
if (config.face.embedding.enabled) {
2021-03-13 17:26:53 +01:00
const image = enhance(input);
2021-11-02 16:07:11 +01:00
const dataT = model?.execute(image) as Tensor;
/*
2021-08-14 17:16:26 +02:00
const dataT = tf.tidy(() => {
2021-04-25 19:16:04 +02:00
/*
// if needed convert from NHWC to NCHW
const nchw = image.transpose([3, 0, 1, 2]);
2021-11-02 16:07:11 +01:00
const res = model.execute(image);
2021-04-25 19:16:04 +02:00
// optionally do it twice with flipped image and average results
2021-11-02 16:07:11 +01:00
const res1 = model.execute(image);
2021-04-25 19:16:04 +02:00
const flipped = tf.image.flipLeftRight(image);
2021-11-02 16:07:11 +01:00
const res2 = model.execute(flipped);
2021-04-25 19:16:04 +02:00
const merge = tf.stack([res1, res2], 2).squeeze();
const res = reshape.logSumExp(1);
// optional normalize outputs with l2 normalization
const scaled = tf.tidy(() => {
const l2 = res.norm('euclidean');
const scale = res.div(l2);
return scale;
2021-03-11 19:31:36 +01:00
});
2021-04-25 19:16:04 +02:00
// optional reduce feature vector complexity
const reshape = tf.reshape(res, [128, 2]); // split 256 vectors into 128 x 2
2021-04-25 19:16:04 +02:00
const reduce = reshape.logSumExp(1); // reduce 2nd dimension by calculating logSumExp on it
2021-08-14 17:16:26 +02:00
return reduce;
2021-04-25 19:16:04 +02:00
});
2021-11-02 16:07:11 +01:00
*/
const output = await dataT.data();
data = Array.from(output); // convert typed array to simple array
2021-08-14 17:16:26 +02:00
tf.dispose(dataT);
tf.dispose(image);
2020-11-13 22:13:35 +01:00
}
resolve(data);
});
}