mirror of https://github.com/vladmandic/human
/**
 * FaceRes model implementation
 *
 * Returns Age, Gender, Descriptor
 * Implements Face similarity function
 *
 * Based on: [**HSE-FaceRes**](https://github.com/HSE-asavchenko/HSE_FaceRec_tf)
 */

import { log, join } from '../util/util';
import * as tf from '../../dist/tfjs.esm.js';
import type { Tensor, GraphModel } from '../tfjs/types';
import type { Config } from '../config';
import { env } from '../util/env';

let model: GraphModel | null;
const last: Array<{ // cache of most recent results per face index, used for frame skipping
  age: number,
  gender: string,
  genderScore: number,
  descriptor: number[],
}> = [];

let lastCount = 0; // number of faces seen during the last full inference
let skipped = Number.MAX_SAFE_INTEGER; // frames skipped since the last full inference

export async function load(config: Config): Promise<GraphModel> {
  const modelUrl = join(config.modelBasePath, config.face.description?.modelPath || '');
  if (env.initial) model = null;
  if (!model) {
    model = await tf.loadGraphModel(modelUrl) as unknown as GraphModel;
    if (!model) log('load model failed:', config.face.description?.modelPath || '');
    else if (config.debug) log('load model:', modelUrl);
  } else if (config.debug) log('cached model:', modelUrl);
  return model;
}
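
/*
  Usage sketch for load() (illustrative; not part of the original file). The config
  keys shown are the ones this module actually reads; 'faceres.json' is a placeholder
  model filename, not a confirmed default.

    const config = {
      modelBasePath: '/models',
      debug: true,
      skipFrame: false,
      face: { description: { enabled: true, modelPath: 'faceres.json', skipFrames: 11, minConfidence: 0.1 } },
    } as unknown as Config;
    const graphModel = await load(config); // downloads on first call, then returns the cached model
*/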

export function enhance(input): Tensor {
  const image = tf.tidy(() => {
    // input received from detector is already normalized to 0..1
    // input is also assumed to be straightened
    const tensor = input.image || input.tensor || input;
    if (!(tensor instanceof tf.Tensor)) return null;
    // do a tight crop of image and resize it to fit the model
    const box = [[0.05, 0.15, 0.85, 0.85]]; // empirical values for top, left, bottom, right
    // const box = [[0.0, 0.0, 1.0, 1.0]]; // basically no crop for test
    if (!model?.inputs[0].shape) return null; // model has no shape so no point continuing
    const crop = (tensor.shape.length === 3)
      ? tf.image.cropAndResize(tf.expandDims(tensor, 0), box, [0], [model.inputs[0].shape[2], model.inputs[0].shape[1]]) // add batch dimension if missing
      : tf.image.cropAndResize(tensor, box, [0], [model.inputs[0].shape[2], model.inputs[0].shape[1]]);

    /*
    // just resize to fit the embedding model instead of cropping
    const crop = tf.image.resizeBilinear(tensor, [model.inputs[0].shape[2], model.inputs[0].shape[1]], false);
    */

    /*
    // convert to black&white to avoid colorization impact
    const rgb = [0.2989, 0.5870, 0.1140]; // factors for red/green/blue colors when converting to grayscale: https://www.mathworks.com/help/matlab/ref/rgb2gray.html
    const [red, green, blue] = tf.split(crop, 3, 3);
    const redNorm = tf.mul(red, rgb[0]);
    const greenNorm = tf.mul(green, rgb[1]);
    const blueNorm = tf.mul(blue, rgb[2]);
    const grayscale = tf.addN([redNorm, greenNorm, blueNorm]);
    const merge = tf.stack([grayscale, grayscale, grayscale], 3).squeeze(4);
    */

    /*
    // increase image pseudo-contrast 100%
    // (or do it per-channel so mean is done on each channel)
    // (or calculate histogram and do it based on histogram)
    const mean = merge.mean();
    const factor = 2;
    const contrast = merge.sub(mean).mul(factor).add(mean);
    */

    /*
    // normalize brightness from 0..1
    // silly way of creating pseudo-hdr of image
    const darken = crop.sub(crop.min());
    const lighten = darken.div(darken.max());
    */

    const norm = tf.mul(crop, 255); // rescale from 0..1 to the 0..255 range the model expects

    return norm;
  });
  return image;
}
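
/*
  Example invocation of enhance() (illustrative; the tensor size is an assumption,
  the real target size is read from the loaded model's input shape). Input may be
  a raw tensor or an object exposing it as .image or .tensor:

    const face = tf.randomUniform([112, 112, 3], 0, 1); // stand-in for a normalized 0..1 face crop
    const ready = enhance(face); // [1, H, W, 3] tensor, tightly cropped and scaled to 0..255
    tf.dispose([face, ready]);
*/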

export async function predict(image: Tensor, config: Config, idx, count) {
  if (!model) return null;
  if ((skipped < (config.face.description?.skipFrames || 0)) && config.skipFrame && (lastCount === count) && last[idx]?.age && (last[idx]?.age > 0)) {
    skipped++;
    return last[idx];
  }
  skipped = 0;
  return new Promise(async (resolve) => {
    const enhanced = enhance(image);

    let resT;
    const obj = {
      age: <number>0,
      gender: <string>'unknown',
      genderScore: <number>0,
      descriptor: <number[]>[],
    };

    if (config.face.description?.enabled) resT = await model?.predict(enhanced);
    tf.dispose(enhanced);

    if (resT) {
      const gender = await resT.find((t) => t.shape[1] === 1).data();
      const confidence = Math.trunc(200 * Math.abs((gender[0] - 0.5))) / 100; // two-decimal confidence: distance of the raw gender output from the 0.5 midpoint, scaled to 0..1
      if (confidence > (config.face.description?.minConfidence || 0)) {
        obj.gender = gender[0] <= 0.5 ? 'female' : 'male';
        obj.genderScore = Math.min(0.99, confidence);
      }
      const argmax = tf.argMax(resT.find((t) => t.shape[1] === 100), 1);
      const age = (await argmax.data())[0];
      tf.dispose(argmax);
      const all = await resT.find((t) => t.shape[1] === 100).data();
      // age head outputs 100 bins; nudge the argmax bin toward its stronger neighbor,
      // e.g. argmax bin 30 with right-neighbor weight 0.2 -> (10 * 30 + 100 * 0.2) / 10 = 32.0
      obj.age = Math.round(all[age - 1] > all[age + 1] ? 10 * age - 100 * all[age - 1] : 10 * age + 100 * all[age + 1]) / 10;

      const desc = resT.find((t) => t.shape[1] === 1024);
      // const reshape = desc.reshape([128, 8]); // reshape large 1024-element descriptor to 128 x 8
      // const reduce = reshape.logSumExp(1); // reduce 2nd dimension by calculating logSumExp on it which leaves us with 128-element descriptor

      const descriptor = await desc.data();
      obj.descriptor = [...descriptor];
      resT.forEach((t) => tf.dispose(t));
    }
    last[idx] = obj;
    lastCount = count;
    resolve(obj);
  });
}
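
/**
 * The header comment advertises a face similarity function which does not appear in
 * this excerpt; the sketch below is an assumption, not the original implementation.
 * It scores two descriptors returned by predict() via a Minkowski distance of the
 * given order, mapped to a 0..1 range (1 = identical descriptors).
 */
export function similarity(descriptor1: number[], descriptor2: number[], order = 2): number {
  if (!descriptor1?.length || descriptor1.length !== descriptor2?.length) return 0;
  const distance = descriptor1
    .map((val, i) => (Math.abs(val - descriptor2[i]) ** order)) // element-wise |a-b|^order
    .reduce((sum, diff) => sum + diff, 0) ** (1 / order); // Minkowski distance of the given order
  return 1 / (1 + distance); // monotone map of distance to a 0..1 similarity score
}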