import human from '../dist/human.esm.js'; import draw from './draw.js'; import Menu from './menu.js'; // ui options const ui = { baseColor: 'rgba(173, 216, 230, 0.3)', // this is 'lightblue', just with alpha channel baseLabel: 'rgba(173, 216, 230, 0.9)', baseFontProto: 'small-caps {size} "Segoe UI"', baseLineWidth: 16, baseLineHeightProto: 2, columns: 2, busy: false, facing: true, useWorker: false, worker: 'worker.js', samples: ['../assets/sample6.jpg', '../assets/sample1.jpg', '../assets/sample4.jpg', '../assets/sample5.jpg', '../assets/sample3.jpg', '../assets/sample2.jpg'], drawBoxes: true, drawPoints: false, drawPolygons: true, fillPolygons: true, useDepth: true, console: true, maxFrames: 10, }; // configuration overrides const config = { backend: 'webgl', // if you want to use 'wasm' backend, enable script load of tf and tf-backend-wasm in index.html face: { enabled: true, detector: { maxFaces: 10, skipFrames: 10, minConfidence: 0.5, iouThreshold: 0.3, scoreThreshold: 0.7 }, mesh: { enabled: true }, iris: { enabled: true }, age: { enabled: true, skipFrames: 10 }, gender: { enabled: true }, emotion: { enabled: true, minConfidence: 0.5, useGrayscale: true }, }, body: { enabled: true, maxDetections: 10, scoreThreshold: 0.7, nmsRadius: 20 }, hand: { enabled: true, skipFrames: 10, minConfidence: 0.5, iouThreshold: 0.3, scoreThreshold: 0.7 }, }; // global variables let menu; let worker; let timeStamp; const fps = []; // helper function: translates json to human readable string function str(...msg) { if (!Array.isArray(msg)) return msg; let line = ''; for (const entry of msg) { if (typeof entry === 'object') line += JSON.stringify(entry).replace(/{|}|"|\[|\]/g, '').replace(/,/g, ', '); else line += entry; } return line; } // helper function: wrapper around console output const log = (...msg) => { // eslint-disable-next-line no-console if (ui.console) console.log(...msg); }; // draws processed results and starts processing of a next frame function drawResults(input, result, canvas) { // update fps fps.push(1000 / (performance.now() - timeStamp)); if (fps.length > ui.maxFrames) fps.shift(); menu.updateChart('FPS', fps); // eslint-disable-next-line no-use-before-define requestAnimationFrame(() => runHumanDetect(input, canvas)); // immediate loop // draw image from video const ctx = canvas.getContext('2d'); ctx.drawImage(input, 0, 0, input.width, input.height, 0, 0, canvas.width, canvas.height); // draw all results draw.face(result.face, canvas, ui, human.facemesh.triangulation); draw.body(result.body, canvas, ui); draw.hand(result.hand, canvas, ui); // update log const engine = human.tf.engine(); const memory = `${engine.state.numBytes.toLocaleString()} bytes ${engine.state.numDataBuffers.toLocaleString()} buffers ${engine.state.numTensors.toLocaleString()} tensors`; const gpu = engine.backendInstance ? `GPU: ${engine.backendInstance.numBytesInGPU.toLocaleString()} bytes` : ''; document.getElementById('log').innerText = ` TFJS Version: ${human.tf.version_core} | Backend: ${human.tf.getBackend()} | Memory: ${memory} ${gpu} Performance: ${str(result.performance)} | Object size: ${(str(result)).length.toLocaleString()} bytes `; } // setup webcam async function setupCamera() { if (ui.busy) return null; ui.busy = true; const video = document.getElementById('video'); const canvas = document.getElementById('canvas'); const output = document.getElementById('log'); const live = video.srcObject ? ((video.srcObject.getVideoTracks()[0].readyState === 'live') && (video.readyState > 2) && (!video.paused)) : false; let msg = `Setting up camera: live: ${live} facing: ${ui.facing ? 'front' : 'back'}`; output.innerText += `\n${msg}`; log(msg); // setup webcam. note that navigator.mediaDevices requires that page is accessed via https if (!navigator.mediaDevices) { msg = 'Camera access not supported'; output.innerText += `\n${msg}`; log(msg); return null; } let stream; try { stream = await navigator.mediaDevices.getUserMedia({ audio: false, video: { facingMode: (ui.facing ? 'user' : 'environment'), width: window.innerWidth, height: window.innerHeight }, }); } catch (err) { output.innerText += '\nCamera permission denied'; log(err); } if (stream) video.srcObject = stream; else return null; return new Promise((resolve) => { video.onloadeddata = async () => { video.width = video.videoWidth; video.height = video.videoHeight; canvas.width = video.videoWidth; canvas.height = video.videoHeight; if (live) video.play(); ui.busy = false; // do once more because onresize events can be delayed or skipped if (video.width > window.innerWidth) await setupCamera(); output.innerText += `\nCamera resolution: ${video.width} x ${video.height}`; resolve(video); }; }); } // wrapper for worker.postmessage that creates worker if one does not exist function webWorker(input, image, canvas) { if (!worker) { // create new webworker and add event handler only once log('Creating worker thread'); worker = new Worker(ui.worker, { type: 'module' }); // after receiving message from webworker, parse&draw results and send new frame for processing worker.addEventListener('message', (msg) => drawResults(input, msg.data, canvas)); } // pass image data as arraybuffer to worker by reference to avoid copy worker.postMessage({ image: image.data.buffer, width: canvas.width, height: canvas.height, config }, [image.data.buffer]); } // main processing function when input is webcam, can use direct invocation or web worker function runHumanDetect(input, canvas) { timeStamp = performance.now(); // perform detect if live video or not video at all if (input.srcObject) { // if video not ready, just redo const live = (input.srcObject.getVideoTracks()[0].readyState === 'live') && (input.readyState > 2) && (!input.paused); if (!live) { if (!input.paused) log(`Video not ready: state: ${input.srcObject.getVideoTracks()[0].readyState} stream state: ${input.readyState}`); setTimeout(() => runHumanDetect(input, canvas), 500); return; } if (ui.useWorker) { // get image data from video as we cannot send html objects to webworker const offscreen = new OffscreenCanvas(canvas.width, canvas.height); const ctx = offscreen.getContext('2d'); ctx.drawImage(input, 0, 0, input.width, input.height, 0, 0, canvas.width, canvas.height); const data = ctx.getImageData(0, 0, canvas.width, canvas.height); // perform detection in worker webWorker(input, data, canvas); } else { human.detect(input, config).then((result) => { if (result.error) log(result.error); else drawResults(input, result, canvas); }); } } } // main processing function when input is image, can use direct invocation or web worker async function processImage(input) { // must be zero for images config.face.detector.skipFrames = 0; config.face.emotion.skipFrames = 0; config.face.age.skipFrames = 0; config.hand.skipFrames = 0; timeStamp = performance.now(); return new Promise((resolve) => { const image = document.getElementById('image'); image.onload = async () => { log('Processing image:', image.src); const canvas = document.getElementById('canvas'); image.width = image.naturalWidth; image.height = image.naturalHeight; canvas.width = image.naturalWidth; canvas.height = image.naturalHeight; const result = await human.detect(image, config); drawResults(image, result, canvas); const thumb = document.createElement('canvas'); thumb.width = (window.innerWidth - menu.width) / (ui.columns + 0.1); thumb.height = canvas.height / (window.innerWidth / thumb.width); thumb.style.margin = '8px'; thumb.style.boxShadow = '4px 4px 4px 0 dimgrey'; const ctx = thumb.getContext('2d'); ctx.drawImage(canvas, 0, 0, canvas.width, canvas.height, 0, 0, thumb.width, thumb.height); document.getElementById('samples').appendChild(thumb); image.src = ''; resolve(true); }; image.src = input; }); } // just initialize everything and call main function async function detectVideo() { document.getElementById('samples').style.display = 'none'; document.getElementById('canvas').style.display = 'block'; const video = document.getElementById('video'); const canvas = document.getElementById('canvas'); ui.baseFont = ui.baseFontProto.replace(/{size}/, '1.2rem'); ui.baseLineHeight = ui.baseLineHeightProto; if ((video.srcObject !== null) && !video.paused) { document.getElementById('log').innerText += '\nPaused ...'; video.pause(); } else { await setupCamera(); document.getElementById('log').innerText += '\nStarting Human Library ...'; video.play(); } runHumanDetect(video, canvas); } // just initialize everything and call main function async function detectSampleImages() { ui.baseFont = ui.baseFontProto.replace(/{size}/, `${ui.columns}rem`); ui.baseLineHeight = ui.baseLineHeightProto * ui.columns; document.getElementById('canvas').style.display = 'none'; document.getElementById('samples').style.display = 'block'; log('Running detection of sample images'); for (const sample of ui.samples) await processImage(sample); } function setupMenu() { menu = new Menu(document.body); menu.addButton('Start Video', 'Pause Video', (evt) => detectVideo(evt)); menu.addButton('Process Images', 'Process Images', () => detectSampleImages()); menu.addHTML('