human/dist/human.js

8054 lines
1.6 MiB
JavaScript
Raw Normal View History

2022-02-10 18:27:21 +01:00
/*
Human
homepage: <https://github.com/vladmandic/human>
author: <https://github.com/vladmandic>
*/
2022-04-14 17:47:08 +02:00
var Human=(()=>{var Vc=Object.defineProperty;var $E=Object.getOwnPropertyDescriptor;var PE=Object.getOwnPropertyNames;var _E=Object.prototype.hasOwnProperty;var zE=(e,t,r)=>t in e?Vc(e,t,{enumerable:!0,configurable:!0,writable:!0,value:r}):e[t]=r;var xs=(e,t)=>{for(var r in t)Vc(e,r,{get:t[r],enumerable:!0})},OE=(e,t,r,n)=>{if(t&&typeof t=="object"||typeof t=="function")for(let a of PE(t))!_E.call(e,a)&&a!==r&&Vc(e,a,{get:()=>t[a],enumerable:!(n=$E(t,a))||n.enumerable});return e};var DE=e=>OE(Vc({},"__esModule",{value:!0}),e);var fe=(e,t,r)=>(zE(e,typeof t!="symbol"?t+"":t,r),r),N3=(e,t,r)=>{if(!t.has(e))throw TypeError("Cannot "+r)};var pp=(e,t,r)=>(N3(e,t,"read from private field"),r?r.call(e):t.get(e)),hp=(e,t,r)=>{if(t.has(e))throw TypeError("Cannot add the same private member more than once");t instanceof WeakSet?t.add(e):t.set(e,r)},cp=(e,t,r,n)=>(N3(e,t,"write to private field"),n?n.call(e,r):t.set(e,r),r);var zAe={};xs(zAe,{Human:()=>s3,default:()=>s3,defaults:()=>bs,draw:()=>J5,env:()=>he,match:()=>a3,models:()=>lg});function ie(...e){let t=new Date,r=`${t.getHours().toString().padStart(2,"0")}:${t.getMinutes().toString().padStart(2,"0")}:${t.getSeconds().toString().padStart(2,"0")}.${t.getMilliseconds().toString().padStart(3,"0")}`;e&&console.log(r,"Human:",...e)}function C3(e,t){let r=e.endsWith("/")?"":"/",a=t.startsWith(".")||t.startsWith("/")||t.startsWith("http:")||t.startsWith("https:")||t.startsWith("file:")?`${t}`:`${e}${r}${t}`;if(!a.toLocaleLowerCase().includes(".json"))throw new Error(`modelpath error: expecting json file: ${a}`);return a}var oe=()=>typeof performance!="undefined"?performance.now():parseInt((Number(process.hrtime.bigint())/1e3/1e3).toString());function G1(e,t,r="config",n=[]){for(let a of Object.keys(t))if(typeof t[a]=="object")G1(e[a],t[a],a,n);else{let s=e&&typeof e[a]!="undefined";s||n.push({reason:"unknown property",where:`${r}.${a} = ${t[a]}`});let i=e&&typeof e[a]==typeof t[a];s&&!i&&n.push({reason:"property type 
mismatch",where:`${r}.${a} = ${t[a]}`,expected:typeof e[a]})}return t.debug&&r==="config"&&n.length>0&&ie("invalid configuration",n),n}function Ut(...e){let t=r=>r&&typeof r=="object";return e.reduce((r,n)=>(Object.keys(n||{}).forEach(a=>{let s=r[a],i=n[a];Array.isArray(s)&&Array.isArray(i)?r[a]=s.concat(...i):t(s)&&t(i)?r[a]=Ut(s,i):r[a]=i}),r),{})}var bs={backend:"",modelBasePath:"",cacheModels:!0,wasmPath:"",wasmPlatformFetch:!1,debug:!0,async:!0,warmup:"full",cacheSensitivity:.7,skipAllowed:!1,deallocate:!1,filter:{enabled:!0,equalization:!1,width:0,height:0,flip:!1,return:!0,brightness:0,contrast:0,sharpness:0,blur:0,saturation:0,hue:0,negative:!1,sepia:!1,vintage:!1,kodachrome:!1,technicolor:!1,polaroid:!1,pixelate:0},gesture:{enabled:!0},face:{enabled:!0,detector:{modelPath:"blazeface.json",rotation:!0,maxDetected:1,skipFrames:99,skipTime:2500,minConfidence:.2,iouThreshold:.1,mask:!1,return:!1},mesh:{enabled:!0,modelPath:"facemesh.json"},attention:{enabled:!1,modelPath:"facemesh-attention.json"},iris:{enabled:!0,modelPath:"iris.json"},emotion:{enabled:!0,minConfidence:.1,skipFrames:99,skipTime:1500,modelPath:"emotion.json"},description:{enabled:!0,modelPath:"faceres.json",skipFrames:99,skipTime:3e3,minConfidence:.1},antispoof:{enabled:!1,skipFrames:99,skipTime:4e3,modelPath:"antispoof.json"},liveness:{enabled:!1,skipFrames:99,skipTime:4e3,modelPath:"liveness.json"}},body:{enabled:!0,modelPath:"movenet-lightning.json",maxDetected:-1,minConfidence:.3,skipFrames:1,skipTime:200},hand:{enabled:!0,rotation:!0,skipFrames:99,skipTime:1e3,minConfidence:.5,iouThreshold:.2,maxDetected:-1,landmarks:!0,detector:{modelPath:"handtrack.json"},skeleton:{modelPath:"handlandmark-full.json"}},object:{enabled:!1,modelPath:"mb3-centernet.json",minConfidence:.2,iouThreshold:.4,maxDetected:10,skipFrames:99,skipTime:2e3},segmentation:{enabled:!1,modelPath:"selfie.json",blur:8}};var 
Ue={};xs(Ue,{Abs:()=>Lo,Acos:()=>Pu,Acosh:()=>_u,AdadeltaOptimizer:()=>Dm,AdagradOptimizer:()=>Lm,AdamOptimizer:()=>Bm,AdamaxOptimizer:()=>Wm,Add:()=>Ya,AddN:()=>qs,All:()=>zu,Any:()=>Ou,ArgMax:()=>Ks,ArgMin
2022-04-01 15:13:32 +02:00
`),V=C=>j.writeSync(2,C+`
2022-04-14 17:47:08 +02:00
`));var ee=p.print||Q,J=p.printErr||V;Object.assign(p,g),g=null,p.arguments&&(y=p.arguments),p.thisProgram&&(A=p.thisProgram),p.quit&&(x=p.quit);var se=4;function Z(C){Z.shown||(Z.shown={}),Z.shown[C]||(Z.shown[C]=1,J(C))}function ae(C,$){if(typeof WebAssembly.Function=="function"){for(var U={i:"i32",j:"i64",f:"f32",d:"f64"},te={parameters:[],results:$[0]=="v"?[]:[U[$[0]]]},ge=1;ge<$.length;++ge)te.parameters.push(U[$[ge]]);return new WebAssembly.Function(te,C)}var xe=[1,0,1,96],Ne=$.slice(0,1),_e=$.slice(1),$t={i:127,j:126,f:125,d:124};xe.push(_e.length);for(var ge=0;ge<_e.length;++ge)xe.push($t[_e[ge]]);Ne=="v"?xe.push(0):xe=xe.concat([1,$t[Ne]]),xe[1]=xe.length-2;var aa=new Uint8Array([0,97,115,109,1,0,0,0].concat(xe,[2,7,1,1,101,1,102,0,0,7,5,1,1,102,0,0])),sa=new WebAssembly.Module(aa),Wc=new WebAssembly.Instance(sa,{e:{f:C}}),dp=Wc.exports.f;return dp}var de=[],Ae;function be(){if(de.length)return de.pop();try{kn.grow(1)}catch(C){throw C instanceof RangeError?"Unable to grow wasm table. 
Set ALLOW_TABLE_GROWTH.":C}return kn.length-1}function Ee(C,$){for(var U=C;U<C+$;U++){var te=Yl(U);te&&Ae.set(te,U)}}var Me=0,De=C=>{Me=C},Be=Atomics.load,Ze=Atomics.store,ot=Atomics.compareExchange,dt;p.wasmBinary&&(dt=p.wasmBinary);var pt=p.noExitRuntime||!0;typeof WebAssembly!="object"&&Kl("no native wasm support detected");var $e,vt,yt=!1,$r;function dr(C,$){C||Kl($)}function Zr(C){var $=p["_"+C];return $}function er(C,$,U,te,ge){var xe={string:function(In){var au=0;if(In!=null&&In!==0){var T3=(In.length<<2)+1;au=nu(T3),ro(In,au,T3)}return au},array:function(In){var au=nu(In.length);return Ua(In,au),au}};function Ne(In){return $==="string"?wn(In):$==="boolean"?Boolean(In):In}var _e=Zr(C),$t=[],aa=0;if(te)for(var sa=0;sa<te.length;sa++){var Wc=xe[U[sa]];Wc?(aa===0&&(aa=V1()),$t[sa]=Wc(te[sa])):$t[sa]=te[sa]}var dp=_e.apply(null,$t);function FE(In){return aa!==0&&Oc(aa),Ne(In)}return dp=FE(dp),dp}function pr(C,$,U,te){U=U||[];var ge=U.every(function(Ne){return Ne==="number"}),xe=$!=="string";return xe&&ge&&!te?Zr(C):function(){return er(C,$,U,arguments,te)}}var Qn=1;function Yr(C){var $=new TextDecoder(C);this.decode=U=>(U.buffer instanceof SharedArrayBuffer&&(U=new Uint8Array(U)),$.decode.call($,U))}var tr=typeof TextDecoder!="undefined"?new Yr("utf8"):void 0;function vn(C,$,U){for(var te=$+U,ge=$;C[ge]&&!(ge>=te);)++ge;if(ge-$>16&&C.subarray&&tr)return tr.decode(C.subarray($,ge));for(var xe="";$<ge;){var Ne=C[$++];if(!(Ne&128)){xe+=String.fromCharCode(Ne);continue}var _e=C[$++]&63;if((Ne&224)==192){xe+=String.fromCharCode((Ne&31)<<6|_e);continue}var $t=C[$++]&63;if((Ne&240)==224?Ne=(Ne&15)<<12|_e<<6|$t:Ne=(Ne&7)<<18|_e<<12|$t<<6|C[$++]&63,Ne<65536)xe+=String.fromCharCode(Ne);else{var aa=Ne-65536;xe+=String.fromCharCode(55296|aa>>10,56320|aa&1023)}}return xe}function wn(C,$){return C?vn(i(),C,$):""}function fs(C,$,U,te){if(!(te>0))return 0;for(var ge=U,xe=U+te-1,Ne=0;Ne<C.length;++Ne){var _e=C.charCodeAt(Ne);if(_e>=55296&&_e<=57343){var 
$t=C.charCodeAt(++Ne);_e=65536+((_e&1023)<<10)|$t&1023}if(_e<=127){if(U>=xe)break;$[U++]=_e}else if(_e<=2047){if(U+1>=xe)break;$[U++]=192|_e>>6,$[U++]=128|_e&63}else if(_e<=65535){if(U+2>=xe)break;$[U++]=224|_e>>12,$[U++]=128|_e>>6&63,$[U++]=128|_e&63}else{if(U+3>=xe)break;$[U++]=240|_e>>18,$[U++]=128|_e>>12&63,$[U++]=128|_e>>6&63,$[U++]=128|_e&63}}return $[U]=0,U-ge}function ro(C,$,U){return fs(C,i(),$,U)}function ic(C){for(var $=0,U=0;U<C.length;++U){var te=C.charCodeAt(U);te>=55296&&te<=57343&&(te=65536+((te&1023)<<10)|C.charCodeAt(++U)&1023),te<=127?++$:te<=2047?$+=2:te<=65535?$+=3:$+=4}return $}var ms=typeof TextDecoder!="undefined"?new Yr("utf-16le"):void 0;function Ua(C,$){s().set(C,$)}function Qd(C,$,U){for(var te=0;te<C.length;++te)s()[$++>>0]=C.charCodeAt(te);U||(s()[$>>0]=0)}function Hl(C,$){return C%$>0&&(C+=$-C%$),C}var Pr,oc,lc,ep,uc,dc,i3,pc,hc;T&&(Pr=p.buffer);function ea(C){Pr=C,p.HEAP8=oc=new Int8Array(C),p.HEAP16=ep=new Int16Array(C),p.HEAP32=dc=new Int32Array(C),p.HEAPU8=lc=new Uint8Array(C),p.HEAPU16=uc=new Uint16Array(C),p.HEAPU32=i3=new Uint32Array(C),p.HEAPF32=pc=new Float
2022-02-10 18:27:21 +01:00
`)),l.join(`
2022-04-14 17:47:08 +02:00
`)}function KR(e,t,r,n){let a=Tt(t),s=n[n.length-1],i=new Array(s).fill(0),o=t.length,l=r==="complex64"?xp(e):e;if(o>1)for(let u=0;u<a/s;u++){let d=u*s;for(let h=0;h<s;h++)i[h]=Math.max(i[h],Ap(l[d+h],0,r).length)}return i}function Ap(e,t,r){let n;return Array.isArray(e)?n=`${parseFloat(e[0].toFixed(H1))} + ${parseFloat(e[1].toFixed(H1))}j`:Ss(e)?n=`'${e}'`:r==="bool"?n=Fw(e):n=parseFloat(e.toFixed(H1)).toString(),Cp(n,t)}function Fw(e){return e===0?"false":"true"}function ef(e,t,r,n,a,s=!0){let i=r==="complex64"?2:1,o=t[0],l=t.length;if(l===0){if(r==="complex64"){let m=xp(e);return[Ap(m[0],0,r)]}return r==="bool"?[Fw(e[0])]:[e[0].toString()]}if(l===1){if(o>F3){let g=fp*i,y=Array.from(e.slice(0,g)),A=Array.from(e.slice((o-fp)*i,o*i));return r==="complex64"&&(y=xp(y),A=xp(A)),["["+y.map((x,b)=>Ap(x,a[b],r)).join(", ")+", ..., "+A.map((x,b)=>Ap(x,a[o-fp+b],r)).join(", ")+"]"]}let m=r==="complex64"?xp(e):Array.from(e);return["["+m.map((g,y)=>Ap(g,a[y],r)).join(", ")+"]"]}let u=t.slice(1),d=n.slice(1),h=n[0]*i,p=[];if(o>F3){for(let m=0;m<fp;m++){let g=m*h,y=g+h;p.push(...ef(e.slice(g,y),u,r,d,a,!1))}p.push("...");for(let m=o-fp;m<o;m++){let g=m*h,y=g+h;p.push(...ef(e.slice(g,y),u,r,d,a,m===o-1))}}else for(let m=0;m<o;m++){let g=m*h,y=g+h;p.push(...ef(e.slice(g,y),u,r,d,a,m===o-1))}let c=l===2?",":"";p[0]="["+p[0]+c;for(let m=1;m<p.length-1;m++)p[m]=" "+p[m]+c;let f=`,
2022-02-10 18:27:21 +01:00
`;for(let m=2;m<l;m++)f+=`
2022-04-14 17:47:08 +02:00
`;return p[p.length-1]=" "+p[p.length-1]+"]"+(s?"":f),p}function xp(e){let t=[];for(let r=0;r<e.length;r+=2)t.push([e[r],e[r+1]]);return t}var ar=class{constructor(e,t,r){if(this.dtype=t,this.shape=e.slice(),this.size=Tt(e),r!=null){let n=r.length;P(n===this.size,()=>`Length of values '${n}' does not match the size inferred by the shape '${this.size}'.`)}if(t==="complex64")throw new Error("complex64 dtype TensorBuffers are not supported. Please create a TensorBuffer for the real and imaginary parts separately and call tf.complex(real, imag).");this.values=r||Aw(t,this.size),this.strides=$u(e)}set(e,...t){t.length===0&&(t=[0]),P(t.length===this.rank,()=>`The number of provided coordinates (${t.length}) must match the rank (${this.rank})`);let r=this.locToIndex(t);this.values[r]=e}get(...e){e.length===0&&(e=[0]);let t=0;for(let n of e){if(n<0||n>=this.shape[t]){let a=`Requested out of range element at ${e}. Buffer shape=${this.shape}`;throw new Error(a)}t++}let r=e[e.length-1];for(let n=0;n<e.length-1;++n)r+=this.strides[n]*e[n];return this.values[r]}locToIndex(e){if(this.rank===0)return 0;if(this.rank===1)return e[0];let t=e[e.length-1];for(let r=0;r<e.length-1;++r)t+=this.strides[r]*e[r];return t}indexToLoc(e){if(this.rank===0)return[];if(this.rank===1)return[e];let t=new Array(this.shape.length);for(let r=0;r<t.length-1;++r)t[r]=Math.floor(e/this.strides[r]),e-=t[r]*this.strides[r];return t[t.length-1]=e,t}get rank(){return this.shape.length}toTensor(){return ia().makeTensor(this.values,this.shape,this.dtype)}},ia=null,du=null,XR=null;function ZR(e){ia=e}function YR(e){du=e}function JR(e){XR=e}var rt=class{constructor(e,t,r,n){this.kept=!1,this.isDisposedInternal=!1,this.shape=e.slice(),this.dtype=t||"float32",this.size=Tt(e),this.strides=$u(e),this.dataId=r,this.id=n,this.rankType=this.rank<5?this.rank.toString():"higher"}get rank(){return this.shape.length}async buffer(){let e=await this.data();return du.buffer(this.shape,this.dtype,e)}bufferSync(){return 
du.buffer(this.shape,this.dtype,this.dataSync())}async array(){let e=await this.data();return cu(this.shape,e,this.dtype==="complex64")}arraySync(){return cu(this.shape,this.dataSync(),this.dtype==="complex64")}async data(){this.throwIfDisposed();let e=ia().read(this.dataId);if(this.dtype==="string"){let t=await e;try{return t.map(r=>Af(r))}catch(r){throw new Error("Failed to decode the string bytes into utf-8. To get the original bytes, call tensor.bytes().")}}return e}dataToGPU(e){return this.throwIfDisposed(),ia().readToGPU(this.dataId,e)}dataSync(){this.throwIfDisposed();let e=ia().readSync(this.dataId);if(this.dtype==="string")try{return e.map(t=>Af(t))}catch(t){throw new Error("Failed to decode the string bytes into utf-8. To get the original bytes, call tensor.bytes().")}return e}async bytes(){this.throwIfDisposed();let e=await ia().read(this.dataId);return this.dtype==="string"?e:new Uint8Array(e.buffer)}dispose(){this.isDisposed||(ia().disposeTensor(this),this.isDisposedInternal=!0)}get isDisposed(){return this.isDisposedInternal}throwIfDisposed(){if(this.isDisposed)throw new Error("Tensor is disposed.")}print(e=!1){return du.print(this,e)}clone(){return this.throwIfDisposed(),du.clone(this)}toString(e=!1){let t=this.dataSync();return qR(t,this.shape,this.dtype,e)}cast(e){return this.throwIfDisposed(),du.cast(this,e)}variable(e=!0,t,r){return this.throwIfDisposed(),ia().makeVariable(this,e,t,r)}};Object.defineProperty(rt,Symbol.hasInstance,{value:e=>!!e&&e.data!=null&&e.dataSync!=null&&e.throwIfDisposed!=null});function QR(){return p2("Tensor",()=>rt)}QR();var Op=class extends rt{constructor(e,t,r,n){super(e.shape,e.dtype,e.dataId,n),this.trainable=t,this.name=r}assign(e){if(e.dtype!==this.dtype)throw new Error(`dtype of the new value (${e.dtype}) and previous value (${this.dtype}) must match`);if(!Hs(e.shape,this.shape))throw new Error(`shape of the new value (${e.shape}) and previous value (${this.shape}) must 
match`);ia().disposeTensor(this),this.dataId=e.dataId,ia().incRef(this,null)}dispose(){ia().disposeVariable(this),this.isDisposedInternal=!0}};Ob
Manifest JSON has weights with names: ${o.join(", ")}.`)}let l=a.reduce((c,f,m)=>(f&&c.push(m),c),[]),u=[];l.forEach(c=>{t[c].paths.forEach(f=>{let m=r+(r.endsWith("/")?"":"/")+f;u.push(m)})});let d=await e(u),h={},p=0;return l.forEach(c=>{let f=t[c].paths.length,m=0;for(let x=0;x<f;x++)m+=d[p+x].byteLength;let g=new ArrayBuffer(m),y=new Uint8Array(g),A=0;for(let x=0;x<f;x++){let b=new Uint8Array(d[p+x]);y.set(b,A),A+=b.byteLength}s[c].forEach(x=>{let b=g.slice(x.groupOffset,x.groupOffset+x.sizeBytes),v=Gw(b,[x.manifestEntry]);for(let S in v)h[S]=v[S]}),p+=f}),h}}var ZM="application/octet-stream",YM="application/json",A2=class{constructor(e,t){if(this.DEFAULT_METHOD="POST",t==null&&(t={}),this.weightPathPrefix=t.weightPathPrefix,this.onProgress=t.onProgress,this.weightUrlConverter=t.weightUrlConverter,t.fetchFunc!=null?(P(typeof t.fetchFunc=="function",()=>"Must pass a function that matches the signature of `fetch` (see https://developer.mozilla.org/en-US/docs/Web/API/Fetch_API)"),this.fetch=t.fetchFunc):this.fetch=Y().platform.fetch,P(e!=null&&e.length>0,()=>"URL path for http must not be null, undefined or empty."),Array.isArray(e)&&P(e.length===2,()=>`URL paths for http must have a length of 2, (actual length is ${e.length}).`),this.path=e,t.requestInit!=null&&t.requestInit.body!=null)throw new Error("requestInit is expected to have no pre-existing body, but has one.");this.requestInit=t.requestInit||{}}async save(e){if(e.modelTopology instanceof ArrayBuffer)throw new Error("BrowserHTTPRequest.save() does not support saving model topology in binary formats yet.");let t=Object.assign({method:this.DEFAULT_METHOD},this.requestInit);t.body=new FormData;let r=[{paths:["./model.weights.bin"],weights:e.weightSpecs}],n=jw(e,r);t.body.append("model.json",new Blob([JSON.stringify(n)],{type:YM}),"model.json"),e.weightData!=null&&t.body.append("model.weights.bin",new Blob([e.weightData],{type:ZM}),"model.weights.bin");let a=await 
this.fetch(this.path,t);if(a.ok)return{modelArtifactsInfo:mh(e),responses:[a]};throw new Error(`BrowserHTTPRequest.save() failed due to HTTP response status ${a.status}.`)}async load(){let e=await this.fetch(this.path,this.requestInit);if(!e.ok)throw new Error(`Request to ${this.path} failed with status code ${e.status}. Please verify this URL points to the model JSON of the model to load.`);let t;try{t=await e.json()}catch(a){let s=`Failed to parse model JSON of response from ${this.path}.`;throw this.path.endsWith(".pb")?s+=" Your path contains a .pb file extension. Support for .pb models have been removed in TensorFlow.js 1.0 in favor of .json models. You can re-convert your Python TensorFlow model using the TensorFlow.js 1.0 conversion scripts or you can convert your.pb models with the 'pb2json'NPM script in the tensorflow/tfjs-converter repository.":s+=" Please make sure the server is serving valid JSON for this request.",new Error(s)}let r=t.modelTopology,n=t.weightsManifest;if(r==null&&n==null)throw new Error(`The JSON from HTTP path ${this.path} contains neither model topology or manifest for weights.`);return y2(t,a=>this.loadWeights(a))}async loadWeights(e){let t=Array.isArray(this.path)?this.path[1]:this.path,[r,n]=JM(t),a=this.weightPathPrefix||r,s=[];for(let u of e)s.push(...u.weights);let i=[],o=[];for(let u of e)for(let d of u.paths)this.weightUrlConverter!=null?o.push(this.weightUrlConverter(d)):i.push(a+d+n);this.weightUrlConverter&&i.push(...await Promise.all(o));let l=await ek(i,{requestInit:this.requestInit,fetchFunc:this.fetch,onProgress:this.onProgress});return[s,g2(l)]}};A2.URL_SCHEME_REGEX=/^https?:\/\//;function JM(e){let t=e.lastIndexOf("/"),r=e.lastIndexOf("?"),n=e.substring(0,t),a=r>t?e.substring(r):"";return[n+"/",a]}function gy(e){return e.match(A2.URL_SCHEME_REGEX)!=null}var rk=(e,t)=>{if(typeof fetch=="undefined"&&(t==null||t.fetchFunc==null))return null;{let r=!0;if(Array.isArray(e)?r=e.every(n=>gy(n)):r=gy(e),r)return 
x2(e,t)}return null};Lt.registerSaveRouter(rk);Lt.registerLoadRouter(rk);function x2(e,t){return new A2(e,t)}function QM(e,t){return x2(e,t)}var X1=class{
2022-04-01 15:13:32 +02:00
Actual: ${a}.
Expected: ${s}.`);for(let i=0;i<s.length;++i){let o=a[i],l=s[i];if(!r(o,l))throw new Error(`Arrays differ: actual[${i}] = ${o}, expected[${i}] = ${l}.
Actual: ${a}.
2022-04-14 17:47:08 +02:00
Expected: ${s}.`)}}function TF(e,t){e().then(()=>t.fail(),()=>t())}function NF(e,t){let r=typeof t=="string"||typeof t=="number"||typeof t=="boolean"?[t]:t;return Ss(e)||Ss(e[0])||Ss(t)||Ss(t[0])?Ay(e,r,(n,a)=>n==a):Ay(e,t,(n,a)=>S2(n,a,0))}function CF(e,t,r){if(r==null&&(r=I2()),!S2(e,t,r))throw new Error(`Numbers differ: actual === ${e}, expected === ${t}`)}function S2(e,t,r){return!isFinite(e)&&!isFinite(t)?!0:!(isNaN(e)||isNaN(t)||Math.abs(e-t)>r)}function EF(e,t,r){for(let n=0;n<e.length;n++)if(e[n]<t||e[n]>r)throw new Error(`Value out of range:${e[n]} low: ${t}, high: ${r}`)}function RF(e,t){let r=new Float32Array(e),n=new Float32Array(t);if(r.length!==n.length)throw new Error(`Expected ArrayBuffer to be of length ${n.length}, but it was ${r.length}`);for(let a=0;a<n.length;a++)if(r[a]!==n[a])throw new Error(`Expected ArrayBuffer value at ${a} to be ${n[a]} but got ${r[a]} instead`)}function vk(e){for(let t=0;t<e.length;t++){let r=e[t];Array.isArray(r)?vk(r):e[t]=hh(r)}return e}var T2="0.0.0";function N2(){Y().set("PROD",!0)}function MF(){Y().set("DEBUG",!0)}function FF(){Y().set("DEPRECATION_WARNINGS_ENABLED",!1),console.warn("TensorFlow.js deprecation warnings have been disabled.")}function C2(e){Y().getBool("DEPRECATION_WARNINGS_ENABLED")&&console.warn(e+" You can disable deprecation warnings with tf.disableDeprecationWarnings().")}JR(C2);function $F(){B.disposeVariables()}function br(){return B}function vf(){return B.memory()}function PF(e){return B.profile(e)}function K(e,t){return B.tidy(e,t)}function re(e){c2(e).forEach(t=>t.dispose())}function cr(e){return B.keep(e)}function _F(e){return B.time(e)}function E2(e){return B.setBackend(e)}function ld(){return B.ready()}function sn(){return B.backendName}function zF(e){B.removeBackend(e)}function R2(e){return B.findBackend(e)}function OF(e){return B.findBackendFactory(e)}function Tl(e,t,r=1){return B.registerBackend(e,t,r)}function jn(){return B.backend}function DF(e,t){Y().setPlatform(e,t)}function 
LF(e,t){let r=F(e,"a","add"),n=F(t,"b","add");[r,n]=Ot(r,n);let a={a:r,b:n};return B.runKernel(Ya,a)}var le=W({add_:LF});function BF(e,t){let r=F(e,"a","floorDiv"),n=F(t,"b","floorDiv");[r,n]=Ot(r,n);let a={a:r,b:n};return B.runKernel(li,a)}var gh=W({floorDiv_:BF});function WF(e,t){let r=F(e,"a","div"),n=F(t,"b","div");if([r,n]=Ot(r,n),r.dtype==="int32"&&n.dtype==="int32")return gh(r,n);let a={a:r,b:n},s={};return B.runKernel(ai,a,s)}var pe=W({div_:WF});function VF(e,t){let r=F(e,"a","mul"),n=F(t,"b","mul");[r,n]=Ot(r,n);let a={a:r,b:n};return B.runKernel(vi,a)}var L=W({mul_:VF});function UF(e){let t=F(e,"x","abs");if(t.dtype==="complex64"){let r={x:t};return B.runKernel(Zp,r)}else{let r={x:t};return B.runKernel(Lo,r)}}var rr=W({abs_:UF});function GF(e){let t={x:F(e,"x","acos")};return B.runKernel(Pu,t)}var wk=W({acos_:GF});function jF(e){let t={x:F(e,"x","acosh")};return B.runKernel(_u,t)}var kk=W({acosh_:jF});function HF(e){P(Array.isArray(e),()=>"The argument passed to tf.addN() must be a list of tensors"),P(e.length>=1,()=>`Must pass at least one tensor to tf.addN(), but got ${e.length}`);let t=e.map((a,s)=>F(a,`tensors${s}`,"addN")),r=t[0];t.forEach(a=>{if(a.dtype!==r.dtype)throw new Error("All tensors passed to tf.addN() must have the same dtype")}),t.forEach(a=>{if(!Hs(a.shape,r.shape))throw new Error("All tensors passed to tf.addN() must have the same shape")});let n=t;return B.runKernel(qs,n)}var ym=W({addN_:HF});function qF(e,t=null,r=!1){let n={x:F(e,"x","all","bool")},a={axis:t,keepDims:r};return B.runKernel(zu,n,a)}var M2=W({all_:qF});function KF(e,t=null,r=!1){let n={x:F(e,"x","any","bool")},a={axis:t,keepDims:r};return B.runKernel(Ou,n,a)}var wf=W({any_:KF});function XF(e,t=0){let r={x:F(e,"x","argMax")},n={axis:t};return B.runKernel(Ks,r,n)}var Cn=W({argMax_:XF});function ZF(e,t=0){let r={x:F(e,"x","argMin")},n={axis:t};return B.runKernel(Du,r,n)}var Ik=W({argMin_:ZF});function YF(e){let t={x:F(e,"x","asin")};return B.runKernel(Lu,t)}var 
Sk=W({asin_:YF});function JF(e){let t={x:F(e,"x","asinh")};return B.runKernel(Bu,t)}var Tk=W({asinh_:JF});function
with dtype ${s.dtype}. `)}),r.length===1)return Br(r[0]);let n=r,a={axis:t};return B.runKernel(Wo,n,a)}var kt=W({concat_:p$});function h$(e){let t={x:F(e,"x","sigmoid","float32")};return B.runKernel(Ri,t)}var Nr=W({sigmoid_:h$});function c$(e,t,r){let n=F(e,"x","slice","string_or_numeric");if(n.rank===0)throw new Error("Slicing scalar is not possible");let a={x:n},s={begin:t,size:r};return B.runKernel(fl,a,s)}var Pe=W({slice_:c$});function f$(e){let t={x:F(e,"x","tanh","float32")};return B.runKernel(zi,t)}var bu=W({tanh_:f$});function m$(e,t,r,n,a,s){let i=F(e,"forgetBias","basicLSTMCell"),o=F(t,"lstmKernel","basicLSTMCell"),l=F(r,"lstmBias","basicLSTMCell"),u=F(n,"data","basicLSTMCell"),d=F(a,"c","basicLSTMCell"),h=F(s,"h","basicLSTMCell"),p=kt([u,h],1),c=Je(p,o),f=le(c,l),m=f.shape[0],g=f.shape[1]/4,y=[m,g],A=Pe(f,[0,0],y),x=Pe(f,[0,g],y),b=Pe(f,[0,g*2],y),v=Pe(f,[0,g*3],y),S=le(L(Nr(A),bu(x)),L(d,Nr(le(i,b)))),T=L(bu(S),Nr(v));return[S,T]}var g$=W({basicLSTMCell_:m$});function y$(e,t,r){let n=F(e,"x","batchToSpaceND"),a=t.reduce((o,l)=>o*l);P(n.rank>=1+t.length,()=>`input rank is ${n.rank} but should be > than blockShape.length ${t.length}`),P(r.length===t.length,()=>`crops.length is ${r.length} but should be equal to blockShape.length ${t.length}`),P(n.shape[0]%a===0,()=>`input tensor batch is ${n.shape[0]} but is not divisible by the product of the elements of blockShape ${t.join(" * ")} === ${a}`);let s={x:n},i={blockShape:t,crops:r};return B.runKernel(Bo,s,i)}var xm=W({batchToSpaceND_:y$});function A$(e){let t;return e.rank===0||e.rank===1?t=G(e,[1,1,1,e.size]):e.rank===2?t=G(e,[1,1,e.shape[0],e.shape[1]]):e.rank===3?t=G(e,[1,e.shape[0],e.shape[1],e.shape[2]]):t=e,t}function x$(e,t,r,n,a,s){s==null&&(s=.001);let i=F(e,"x","batchNorm"),o=F(t,"mean","batchNorm"),l=F(r,"variance","batchNorm"),u;a!=null&&(u=F(a,"scale","batchNorm"));let d;n!=null&&(d=F(n,"offset","batchNorm")),P(o.rank===l.rank,()=>"Batch normalization gradient requires mean and variance to have 
equal ranks."),P(d==null||o.rank===d.rank,()=>"Batch normalization gradient requires mean and offset to have equal ranks."),P(u==null||o.rank===u.rank,()=>"Batch normalization gradient requires mean and scale to have equal ranks.");let h={x:A$(i),scale:u,offset:d,mean:o,variance:l},p={varianceEpsilon:s},c=B.runKernel(ui,h,p);return G(c,i.shape)}var vu=W({batchNorm_:x$});function b$(e,t,r,n,a,s){let i=F(e,"x","batchNorm"),o=F(t,"mean","batchNorm"),l=F(r,"variance","batchNorm"),u;a!=null&&(u=F(a,"scale","batchNorm"));let d;return n!=null&&(d=F(n,"offset","batchNorm")),P(i.rank===2,()=>`Error in batchNorm2D: x must be rank 2 but got rank ${i.rank}.`),P(o.rank===2||o.rank===1,()=>`Error in batchNorm2D: mean must be rank 2 or rank 1 but got rank ${o.rank}.`),P(l.rank===2||l.rank===1,()=>`Error in batchNorm2D: variance must be rank 2 or rank 1 but got rank ${l.rank}.`),u!=null&&P(u.rank===2||u.rank===1,()=>`Error in batchNorm2D: scale must be rank 2 or rank 1 but got rank ${u.rank}.`),d!=null&&P(d.rank===2||d.rank===1,()=>`Error in batchNorm2D: offset must be rank 2 or rank 1 but got rank ${d.rank}.`),vu(i,o,l,d,u,s)}var $k=W({batchNorm2d_:b$});function v$(e,t,r,n,a,s){let i=F(e,"x","batchNorm"),o=F(t,"mean","batchNorm"),l=F(r,"variance","batchNorm"),u;a!=null&&(u=F(a,"scale","batchNorm"));let d;return n!=null&&(d=F(n,"offset","batchNorm")),P(i.rank===3,()=>`Error in batchNorm3D: x must be rank 3 but got rank ${i.rank}.`),P(o.rank===3||o.rank===1,()=>`Error in batchNorm3D: mean must be rank 3 or rank 1 but got rank ${o.rank}.`),P(l.rank===3||l.rank===1,()=>`Error in batchNorm3D: variance must be rank 3 or rank 1 but got rank ${l.rank}.`),u!=null&&P(u.rank===3||u.rank===1,()=>`Error in batchNorm3D: scale must be rank 3 or rank 1 but got rank ${u.rank}.`),d!=null&&P(d.rank===3||d.rank===1,()=>`Error in batchNorm3D: offset must be rank 3 or rank 1 but got rank ${d.rank}.`),vu(i,o,l,d,u,s)}var Pk=W({batchNorm3d_:v$});function w$(e,t,r,n,a,s){let 
i=F(e,"x","batchNorm"),o=F(t,"mean","batchNorm"),l=F(r,"variance","batchNorm"),u;a!=null&&(u=F(a,"scale","batchNor
2022-04-01 15:13:32 +02:00
${a} and ${t} for depthToSpace with input shape
${n.shape}`),P(s*t>=0,()=>`Negative dimension size caused by overflow when multiplying
${s} and ${t} for depthToSpace with input shape
2022-04-14 17:47:08 +02:00
${n.shape}`),P(i%(t*t)===0,()=>`Dimension size must be evenly divisible by ${t*t} but is ${i} for depthToSpace with input shape ${n.shape}`);let o={x:n},l={blockSize:t,dataFormat:r};return B.runKernel(Go,o,l)}var jk=W({depthToSpace_:G$});function j$(e,t,r,n,a="NHWC",s=[1,1],i){let o=F(e,"x","depthwiseConv2d","float32"),l=F(t,"filter","depthwiseConv2d","float32"),u=o,d=!1;o.rank===3&&(d=!0,u=G(o,[1,o.shape[0],o.shape[1],o.shape[2]])),P(u.rank===4,()=>`Error in depthwiseConv2d: input must be rank 4, but got rank ${u.rank}.`),P(l.rank===4,()=>`Error in depthwiseConv2d: filter must be rank 4, but got rank ${l.rank}.`),P(u.shape[3]===l.shape[2],()=>`Error in depthwiseConv2d: number of input channels (${u.shape[3]}) must match the inChannels dimension in filter ${l.shape[2]}.`),Ur("depthwiseConv2d",n,i);let h={x:u,filter:l},p={strides:r,pad:n,dataFormat:a,dilations:s,dimRoundingMode:i},c=B.runKernel(ni,h,p);return d?G(c,[c.shape[1],c.shape[2],c.shape[3]]):c}var Ah=W({depthwiseConv2d_:j$});function H$(e){let t={x:F(e,"x","diag")};return B.runKernel(tm,t)}var q$=W({diag_:H$});function K$(e,t,r,n,a=[1,1],s="NHWC"){let i=F(e,"x","dilation2d"),o=F(t,"filter","dilation2d");P(i.rank===3||i.rank===4,()=>`Error in dilation2d: input must be rank 3 or 4, but got rank ${i.rank}.`),P(o.rank===3,()=>`Error in dilation2d: filter must be rank 3, but got rank ${o.rank}.`),P(s==="NHWC",()=>`Error in dilation2d: Only NHWC is currently supported, but got dataFormat of ${s}`);let l=i,u=!1;i.rank===3&&(l=G(i,[1,i.shape[0],i.shape[1],i.shape[2]]),u=!0);let d={x:l,filter:o},h={strides:r,pad:n,dilations:a},p=B.runKernel(Jp,d,h);return u?G(p,[p.shape[1],p.shape[2],p.shape[3]]):p}var Hk=W({dilation2d_:K$});function X$(e,t){let r=F(e,"a","equal","string_or_numeric"),n=F(t,"b","equal","string_or_numeric");[r,n]=Ot(r,n),bt(r.shape,n.shape);let a={a:r,b:n};return B.runKernel(jo,a)}var En=W({equal_:X$});function Z$(e,t,r){let 
n=F(t,"a","where"),a=F(r,"b","where"),s=F(e,"condition","where","bool"),i=bt(bt(s.shape,n.shape),a.shape),o=Ep(s,i),l=Ep(n,i),u=Ep(a,i),d={condition:o,t:l,e:u};return B.runKernel(cl,d)}var Wr=W({where_:Z$});function Y$(e){let t={x:F(e,"x","zerosLike")};return B.runKernel(kl,t)}var at=W({zerosLike_:Y$});function J$(e,t){let r=F(e,"a","div"),n=F(t,"b","div");[r,n]=Ot(r,n);let a=pe(r,n),s=at(a),i=En(n,s);return Wr(i,s,a)}var qk=W({divNoNan_:J$});function Q$(e,t){let r=F(e,"t1","dot"),n=F(t,"t2","dot");P((r.rank===1||r.rank===2)&&(n.rank===1||n.rank===2),()=>`Error in dot: inputs must all be rank 1 or 2, but got ranks ${r.rank} and ${n.rank}.`);let a=r.rank===1?r.size:r.shape[1],s=n.rank===1?n.size:n.shape[0];if(P(a===s,()=>`Error in dot: inner dimensions of inputs must match, but got ${a} and ${s}.`),r.rank===1&&n.rank===1){let i=G(r,[1,-1]),o=G(n,[-1,1]),l=Je(i,o);return G(l,[])}else if(r.rank===1&&n.rank===2){let i=G(r,[1,-1]),o=G(n,[n.shape[0],n.shape[1]]),l=Je(i,o);return G(l,[l.size])}else if(r.rank===2&&n.rank===1){let i=G(n,[-1,1]),o=Je(r,i);return G(o,[o.size])}else{let i=G(n,[n.shape[0],n.shape[1]]);return Je(r,i)}}var eP=W({dot_:Q$});function tP(e,...t){let r=t.map((a,s)=>F(a,`tensors${s}`,"einsum")),n={equation:e};return B.runKernel(Qp,r,n)}var Kk=W({einsum_:tP});function rP(e){let t={x:F(e,"x","elu","float32")};return B.runKernel(si,t)}var xh=W({elu_:rP});function nP(e){let t=F(e,"x","erf");P(t.dtype==="int32"||t.dtype==="float32",()=>"Input dtype must be `int32` or `float32`."),t.dtype==="int32"&&(t=me(t,"float32"));let r={x:t};return B.runKernel(ju,r)}var Xk=W({erf_:nP});function aP(e){let t={x:F(e,"x","exp")};return B.runKernel(ii,t)}var Rn=W({exp_:aP});function sP(e,t=0){let r=F(e,"x","expandDims","string_or_numeric");P(t<=r.rank,()=>"Axis must be <= rank of the tensor");let n={input:r},a={dim:t};return B.runKernel(Ho,n,a)}var qt=W({expandDims_:sP});function iP(e){let t={x:F(e,"x","expm1")};return B.runKernel(qo,t)}var Zk=W({expm1_:iP});function 
oP(e,t){let r=F(e,"x","tile","string_or_numeric");P(r.rank===t.length,()=>`Error in transpose: rank of input ${r.rank} must match length of reps ${t}.`);let n={x:r},a={reps
rank ${s.rank}.`),P(Au(t),()=>`Error in localResponseNormalization: depthRadius must be an integer but got depthRadius ${t}.`);let i=s,o=!1;s.rank===3&&(o=!0,i=G(s,[1,s.shape[0],s.shape[1],s.shape[2]]));let l={x:i},u={depthRadius:t,bias:r,alpha:n,beta:a},d=B.runKernel(rh,l,u);return o?G(d,[d.shape[1],d.shape[2],d.shape[3]]):d}var Qk=W({localResponseNormalization_:wP});function kP(e){let t={x:F(e,"x","log","float32")};return B.runKernel(ci,t)}var Mn=W({log_:kP});function IP(e){let t={x:F(e,"x","log1p")};return B.runKernel(Zu,t)}var km=W({log1p_:IP});function SP(e){return P(Rs(e),()=>"The f passed in grad(f) must be a function"),(t,r)=>{let n=F(t,"x","tf.grad","string_or_numeric"),a=r!=null?F(r,"dy","tf.grad"):null;return B.tidy(()=>{let{value:s,grads:i}=B.gradients(()=>e(n),[n],a);return a!=null&&Vr(s.shape,a.shape,"The shape of dy passed in grad(f)(x, dy) must match the shape returned by f(x)"),Im(i),i[0]})}}function TP(e){return P(Rs(e),()=>"The f passed in grads(f) must be a function"),(t,r)=>{P(Array.isArray(t),()=>"The args passed in grads(f)(args) must be an array of `Tensor`s or `TensorLike`s");let n=Dp(t,"args","tf.grads","string_or_numeric"),a=r!=null?F(r,"dy","tf.grads"):null;return B.tidy(()=>{let{value:s,grads:i}=B.gradients(()=>e(...n),n,a);return a!=null&&Vr(s.shape,a.shape,"The shape of dy passed in grads(f)([x1,...], dy) must match the shape returned by f([x1,...])"),Im(i),i})}}function NP(e){return P(Rs(e),()=>"The f passed in valueAndGrad(f) must be a function"),(t,r)=>{P(t instanceof rt,()=>"The x passed in valueAndGrad(f)(x) must be a tensor"),P(r==null||r instanceof rt,()=>"The dy passed in valueAndGrad(f)(x, dy) must be a tensor");let{grads:n,value:a}=B.gradients(()=>e(t),[t],r);return Im(n),{grad:n[0],value:a}}}function CP(e){return P(Rs(e),()=>"The f passed in valueAndGrads(f) must be a function"),(t,r)=>{P(Array.isArray(t)&&t.every(a=>a instanceof rt),()=>"The args passed in valueAndGrads(f)(args) must be array of tensors"),P(r==null||r 
instanceof rt,()=>"The dy passed in valueAndGrads(f)(args, dy) must be a tensor");let n=B.gradients(()=>e(...t),t,r);return r!=null&&Vr(n.value.shape,r.shape,"The shape of dy passed in valueAndGrads(f)([x1,...], dy) must match the shape returned by f([x1,...])"),Im(n.grads),n}}function e7(e,t){P(Rs(e),()=>"The f passed in variableGrads(f) must be a function"),P(t==null||Array.isArray(t)&&t.every(u=>u instanceof Op),()=>"The varList passed in variableGrads(f, varList) must be an array of variables");let r=t!=null;if(!r){t=[];for(let u in B.registeredVariables)t.push(B.registeredVariables[u])}let n=r?t.filter(u=>!u.trainable):null,a=t.length;t=t.filter(u=>u.trainable),P(t.length>0,()=>`variableGrads() expects at least one of the input variables to be trainable, but none of the ${a} variables is trainable.`);let s=!0,{value:i,grads:o}=B.gradients(e,t,null,s);P(o.some(u=>u!=null),()=>"Cannot find a connection between any variable and the result of the loss function y=f(x). Please make sure the operations that use variables are inside the function f passed to minimize()."),P(i.rank===0,()=>`The f passed in variableGrads(f) must return a scalar, but it returned a rank-${i.rank} tensor`);let l={};return t.forEach((u,d)=>{o[d]!=null&&(l[u.name]=o[d])}),n!=null&&n.forEach(u=>l[u.name]=null),{value:i,grads:l}}function Fa(e){return B.customGrad(e)}function Im(e){if(e.filter(t=>t==null).length>0)throw new Error(`Cannot compute gradient of y=f(x) with respect to x. Make sure that
the f you passed encloses all operations that lead from x to y.`)}function EP(e){let t={x:F(e,"x","neg")};return B.runKernel(tl,t)}var zt=W({neg_:EP});function RP(e){let t={x:F(e,"x","softplus")};return B.runKernel(sd,t)}var pd=W({softplus_:RP});function MP(e){let t=F(e,"x","logSigmoid");return Fa(r=>({value:zt(pd(zt(r))),gradFunc:n=>L(n,Nr(zt(r)))}))(t)}var FP=W({logSigmoid_:MP});function $P(e,t=null,r=!1){let n={x:F(e,"x","max")},a={reductionIndices:t,keepDims:r};return B.runKernel(fi,n,a)}var mr=W({max_:$P});function PP(e,t){let r=F(e,"a","sub"),n=F(t,"b","sub");[r,n]=Ot(r,n);let a={a:r,b:n};return B.runKernel(_i,a)}var ce=W({sub_:PP});function _P(e,t=null,r=!1){let n=F(e,"x","sum");n.dtype==="bool"&&(n=me(n,"int32"));let a={x:n},s={axis:t,keepDims:r};return B.runKernel(Fi,a,s)}var ke=W({sum_:_P});function zP(e,t=-1){let r=F(e,"logits","logSoftmax");if(t===-1&&(t=r.rank-1),t!==r.rank-1)throw Error(`Log Softmax along a non-last dimension is not yet supported. Logits was rank ${r.rank} and axis was ${t}`);return Fa((n,a)=>{let s=mr(n,t,!0),i=ce(n,s),o=ce(me(i,"float32"),Mn(ke(Rn(i),t,!0)));return a([o]),{value:o,gradFunc:(l,u)=>{let[d]=u,h=!0,p=Rn(d);return ce(l,L(ke(l,t,h),p))}}})(r)}var U2=W({logSoftmax_:zP});function G2(e,t){for(let r=0;r<e.length;++r)if(e[e.length-r-1]!==t-1-r)return!1;return!0}function t7(e,t,r){let n=e.length+t.length,a=[],s=0,i=0;for(let o=0;o<n;o++)r.indexOf(o)===-1?a.push(e[s++]):a.push(t[i++]);return a}function r7(e,t){let r=[],n=e.length;for(let s=0;s<n;s++)t.indexOf(s)===-1&&r.push(e[s]);let a=t.map(s=>e[s]);return[r,a]}function Eo(e,t){let r=t.map(n=>1);return t7(e,r,t)}function OP(e,t,r){P(G2(t,r),()=>`${e} supports only inner-most axes for now. 
Got axes ${t} and rank-${r} input.`)}function n7(e,t){if(G2(e,t))return null;let r=[];for(let n=0;n<t;++n)e.indexOf(n)===-1&&r.push(n);return e.forEach(n=>r.push(n)),r}function j2(e){return e.map((t,r)=>[r,t]).sort((t,r)=>t[1]-r[1]).map(t=>t[0])}function DP(e,t){let r=[];for(let n=t-e;n<t;++n)r.push(n);return r}function LP(e,t=null,r=!1){let n=F(e,"x","logSumExp"),a=Un(t,n.shape),s=mr(n,a,!0),i=ce(n,s),o=Rn(i),l=ke(o,a),u=Mn(l),d=le(G(s,u.shape),u);if(r){let h=Eo(d.shape,a);return G(d,h)}return d}var a7=W({logSumExp_:LP});function BP(e,t){let r=F(e,"a","logicalAnd","bool"),n=F(t,"b","logicalAnd","bool");bt(r.shape,n.shape);let a={a:r,b:n};return B.runKernel(el,a)}var fa=W({logicalAnd_:BP});function WP(e){let t={x:F(e,"x","logicalNot","bool")};return B.runKernel(Yu,t)}var Sm=W({logicalNot_:WP});function VP(e,t){let r=F(e,"a","logicalOr","bool"),n=F(t,"b","logicalOr","bool");bt(r.shape,n.shape);let a={a:r,b:n};return B.runKernel(th,a)}var H2=W({logicalOr_:VP});function UP(e,t){let r=F(e,"a","logicalXor","bool"),n=F(t,"b","logicalXor","bool");return bt(r.shape,n.shape),fa(H2(e,t),Sm(fa(e,t)))}var GP=W({logicalXor_:UP});function jP(e,t,r,n,a){let s=F(e,"x","maxPool"),i=1,o=s,l=!1;s.rank===3&&(l=!0,o=G(s,[1,s.shape[0],s.shape[1],s.shape[2]])),P(o.rank===4,()=>`Error in maxPool: input must be rank 4 but got rank ${o.rank}.`),P(Pa(r,i),()=>`Error in maxPool: Either strides or dilations must be 1. 
Got strides ${r} and dilations '${i}'`),Ur("maxPool",n,a);let u={x:o},d={filterSize:t,strides:r,pad:n,dimRoundingMode:a},h=B.runKernel(gi,u,d);return l?G(h,[h.shape[1],h.shape[2],h.shape[3]]):h}var Tm=W({maxPool_:jP});function HP(e,t=[1,1,1],r,n,a,s="NDHWC"){let i=F(e,"x","maxPool3d"),o=i,l=!1;i.rank===4&&(l=!0,o=G(i,[1,i.shape[0],i.shape[1],i.shape[2],i.shape[3]])),P(o.rank===5,()=>`Error in maxPool3d: x must be rank 5 but got rank ${o.rank}.`),P(s==="NDHWC",()=>`Error in maxPool3d: Only NDHWC is currently supported, but got dataFormat of ${s}`),Ur("maxPool3d",n,a);let u={x:o},d={filterSize:t,strides:r,pad:n,dimRoundingMode:a,dataFormat:s},h=B.runKernel(nh,u,d);return l?G(h,[h.shape[1],h.shape[2],h.shape[3],h.shape[4]]):h}var q2=W({maxPool3d_:HP});function qP(e,t,r,n,a=!1){let s={x:F(e,"x","maxPoolWithArgmax")},i={filterSize:t,strides:r,pad:n,includeBatchInIndex:a},o=B.runKernel(um,s,i);return{result:o[0],indexes:o[1]}}var s7=W({maxPoolWithArgmax_:qP});func
${a.shape}`);if(s.rank!==1)throw new Error(`Values should be Tensor1D but received shape ${s.shape}`);if(i.rank!==1)throw new Error(`Dense shape should be Tensor1D but received shape ${i.shape}`);if(o.rank!==0)throw new Error(`Default value should be a scalar but received shape ${o.shape}`);let l={indices:a,values:s,denseShape:i,defaultValue:o},u=B.runKernel(sh,l);return{outputIndices:u[0],outputValues:u[1],emptyRowIndicator:u[2],reverseIndexMap:u[3]}}var uD=W({sparseFillEmptyRows_:lD});function dD(e,t,r){let n=F(e,"inputIndices","sparseReshape","int32"),a=F(t,"inputShape","sparseReshape","int32"),s=F(r,"newShape","sparseReshape","int32");if(n.rank!==2)throw new Error(`Input indices should be Tensor2D but received shape
${n.shape}`);if(a.rank!==1)throw new Error(`Input shape should be Tensor1D but received shape ${a.shape}`);if(s.rank!==1)throw new Error(`New shape should be Tensor1D but received shape ${s.shape}`);let i={inputIndices:n,inputShape:a,newShape:s},o=B.runKernel(id,i);return{outputIndices:o[0],outputShape:o[1]}}var pD=W({sparseReshape_:dD});function hD(e,t,r){let n=F(e,"data","sparseSegmentMean"),a=F(t,"indices","sparseSegmentMean","int32"),s=F(r,"segmentIds","sparseSegmentMean","int32");if(n.rank<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.rank!==1)throw new Error(`Indices should be Tensor1D but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.rank!==1)throw new Error(`Segment ids should be Tensor1D but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);let i={data:n,indices:a,segmentIds:s};return B.runKernel(ih,i)}var cD=W({sparseSegmentMean_:hD});function fD(e,t,r){let n=F(e,"data","sparseSegmentSum"),a=F(t,"indices","sparseSegmentSum","int32"),s=F(r,"segmentIds","sparseSegmentSum","int32");if(n.rank<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.rank!==1)throw new Error(`Indices should be Tensor1D but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.rank!==1)throw new Error(`Segment ids should be Tensor1D but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);let i={data:n,indices:a,segmentIds:s};return B.runKernel(oh,i)}var mD=W({sparseSegmentSum_:fD});function gD(e,t,r,n,a,s,i,o){let l=F(e,"data","stringNGrams","string");if(l.dtype!=="string")throw new Error("Data must be of datatype string");if(l.shape.length!==1)throw new Error(`Data must be a vector, saw: ${l.shape}`);let u=F(t,"dataSplits","stringNGrams");if(u.dtype!=="int32")throw new Error("Data splits must be of datatype int32");let d={separator:r,nGramWidths:n,leftPad:a,rightPad:s,padWidth:i,preserveShortSequences:o},h={data:l,dataSplits:u},p=B.runKernel(uh,h,d);return{nGrams:p[0],nGramsSplits:p[1]}}var yD=W({stringNGrams_:gD});function AD(e,t,r=!0){let n=F(e,"input","stringSplit","string"),a=F(t,"delimiter","stringSplit","string");if(n.rank!==1)throw new Error(`Input should be Tensor1D but received shape ${n.shape}`);if(a.rank!==0)throw new Error(`Delimiter should be a scalar but received shape ${a.shape}`);let s={skipEmpty:r},i={input:n,delimiter:a},o=B.runKernel(cm,i,s);return{indices:o[0],values:o[1],shape:o[2]}}var xD=W({stringSplit_:AD});function bD(e,t){let r=F(e,"input","stringToHashBucketFast","string"),n={numBuckets:t};if(t<=0)throw new Error("Number of buckets must be at least 1");let a={input:r};return B.runKernel(fm,a,n)}var 
vD=W({stringToHashBucketFast_:bD}),wD={fft:Mm,ifft:Wp,rfft:Fm,irfft:aA},kD={hammingWindow:Yz,hannWindow:T7,frame:N7,stft:tO},Ie={flipLeftRight:sO,grayscaleToRGB:oO,resizeNearestNeighbor:MO,resizeBilinear:EO,rotateWithOffset:uO,cropAndResize:nO,nonMaxSuppression:pO,nonMaxSuppressionAsync:xO,nonMaxSuppressionWithScore:vO,nonMaxSuppressionWithScoreAsync:kO,nonMaxSuppressionPadded:SO,nonMaxSuppressionPaddedAsync:NO,threshold:PO,transform:zO},F7={bandPart:DO,gramSchmidt:BO,qr:VO},ID={absoluteDifference:jO,computeWeightedLoss:ts,cosineDistance:qO,hingeLoss:XO,huberLoss:YO,logLoss:QO,meanSquaredError:tD,sigmoidCrossEntropy:aD,softmaxCrossEntropy:oD},bp={sparseFillEmptyRows:uD,sparseReshape:pD,sparseSegmentMean:cD,sparseSegmentSum:mD},rf={stringNGrams:yD,stringSplit:xD,stringToHashBucketFast:vD},rs=class extends Ak{minimize(e,t=!1,r){let{value:n,grads:a}=this.computeGradients(e,r);if(r!=null){let s=r.map(i=>({name:i.name,tensor:a[i.name]}));this.applyGradients(s)}else this.applyGradients(a);return re(a),t?n:(n.dispose(),null)}get iterations(){return this.iterations_==null&&(this.iterations_=0),this.iterations_}incrementIterations(){this.iterations_=this.iterations+1}computeGradients(e,t){return e7(e,t)}dispose(){this.iterations_!=null&&re(this.iterations_)}async saveIterations(){return this.iterations_==null&&(this.iterations_=0),{name:"iter",tensor:Se(this.iterations_,"int32")}}async getWeights(){throw new Error("getWeights() is not implemented for this optimizer yet.")}async setWeights(e){throw new Error(`setWeights() is not implemented for this optimizer class ${this.getClassName()}`)}async extractIterations(e){return this.iterations_=(await e[0].tensor.data())[0],e.slice(1)}};Object.defineProperty(rs,Symbol.hasInstance,{value:e=>e.minimize!=null&&e.computeGradients!=null&&e.applyGradients!=null});var Dm=class extends 
rs{constructor(e,t,r=null){super(),this.learningRate=e,this.rho=t,this.epsilon=r,this.accumulatedGrads=[],this.accumulatedUpdates=[],r==null&&(this.epsilon=B.backend.epsilon())}applyGradients(e){(Array.isArray(e)?e.map(t=>t.name):Object.keys(e)).forEach((t,r)=>{let n=B.registeredVariables[t],a=!1;this.accumulatedGrads[r]==null&&(this.accumulatedGrads[r]={originalName:`${t}/accum_grad`,variable:K(()=>at(n).variable(a))}),this.accumulatedUpdates[r]==null&&(this.accumulatedUpdates[r]={originalName:`${t}/accum_var`,variable:K(()=>at(n).variable(a))});let s=Array.isArray(e)?e[r].tensor:e[t];if(s==null)return;let i=this.accumulatedGrads[r].variable,o=this.accumulatedUpdates[r].variable;K(()=>{let l=le(L(i,this.rho),L(At(s),1-this.rho)),u=L(pe(Er(le(o,this.epsilon)),Er(le(i,this.epsilon))),s),d=le(L(o,this.rho),L(At(u),1-this.rho));i.assign(l),o.assign(d);let h=le(L(u,-this.learningRate),n);n.assign(h)})}),this.incrementIterations()}dispose(){this.accumulate
indices.shape[0] = ${e}`}function aL(e,t){return`indices(${e}, 0) is invalid: ${t} < 0`}function sL(e,t,r){return`indices(${e}, 0) is invalid: ${t} >= ${r}`}function iL(e,t){return`only one output dimension may be -1, not both ${e} and ${t}`}function oL(e,t){return`size ${e} must be non-negative, not ${t}`}function lL(){return"reshape cannot infer the missing input size for an empty tensor unless all specified input sizes are non-zero"}function uL(e,t){let r=Tt(e),n=Tt(t);return`Input to reshape is a SparseTensor with ${r}
dense values, but the requested shape requires a multiple of ${n}. inputShape=${e} outputShape= ${t}`}function dL(e,t){let r=Tt(e),n=Tt(t);return`Input to reshape is a tensor with ${r} dense values, but the requested shape has ${n}. inputShape=${e} outputShape=${t}`}function pL(){return"segment ids must be >= 0"}function hL(){return"segment ids are not increasing"}function cL(e,t){return`Segment id ${e} out of range [0, ${t}), possibly because segmentIds input is not sorted.`}function fL(e,t,r){return`Bad: indices[${e}] == ${t} out of range [0, ${r})`}var _7={};Le(_7,{collectGatherOpShapeInfo:()=>yL,computeOutShape:()=>gL,segOpComputeOptimalWindowSize:()=>mL});function mL(e,t){let r=!1,n;for(e<=cA?(n=e,r=!0):n=ff(e,Math.floor(Math.sqrt(e)));!r;)n>t||n===e?r=!0:n=ff(e,n+1);return n}function gL(e,t,r){let n=[],a=e.length;for(let s=0;s<a;s++)s!==t?n.push(e[s]):n.push(r);return n}function yL(e,t,r,n){let a=t.shape.length,s=e.shape.length;if(n!==0&&(n<-a||n>a))throw new Error(`Expect batchDims in the range of [-${a}, ${a}], but got ${n}`);if(n<0&&(n+=a),n>s)throw new Error(`batchDims (${n}) must be less than rank(x) (
${s}).`);if(r<n)throw new Error(`batchDims (${n}) must be less than or equal to axis (${r}).`);for(let h=0;h<n;++h)if(e.shape[h]!==t.shape[h])throw new Error(`x.shape[${h}]: ${e.shape[h]} should be equal to indices.shape[${h}]: ${t.shape[h]}.`);let i=e.shape[r],o=[],l=1,u=1,d=1;for(let h=0;h<n;++h)o.push(e.shape[h]),l*=e.shape[h];for(let h=n;h<r;h++)o.push(e.shape[h]),u*=e.shape[h];for(let h=n;h<a;h++)o.push(t.shape[h]);for(let h=r+1;h<s;h++)o.push(e.shape[h]),d*=e.shape[h];return{batchSize:l,sliceSize:d,outerSize:u,dimSize:i,outputShape:o}}function AL(e){try{return e.map(t=>Af(t))}catch(t){throw new Error(`Failed to decode encoded string bytes into utf-8, error: ${t}`)}}function xL(e){return e.map(t=>hh(t))}var qn={};Le(qn,{nonMaxSuppressionV3Impl:()=>C7,nonMaxSuppressionV4Impl:()=>E7,nonMaxSuppressionV5Impl:()=>R7,whereImpl:()=>A7});var z7={kernelName:Lo,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>L(e,wh(me(r,"float32"),-1))}}},bL={kernelName:Pu,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>{let n=At(me(r,"float32")),a=Er(ce(Se(1),n));return zt(pe(e,a))}}}},vL={kernelName:_u,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>{let n=Er(ce(At(me(r,"float32")),1));return pe(e,n)}}}},wL={kernelName:Ya,inputsToSave:["a","b"],gradFunc:(e,t)=>{let[r,n]=t,a=bt(r.shape,n.shape);return{a:()=>{let s=e,i=Zt(r.shape,a);return i.length>0&&(s=ke(s,i)),G(s,r.shape)},b:()=>{let s=e,i=Zt(n.shape,a);return i.length>0&&(s=ke(s,i)),G(s,n.shape)}}}},kL={kernelName:qs,saveAllInputs:!0,gradFunc:(e,t)=>{let r={};return t.forEach((n,a)=>{r[a]=()=>e.clone()}),r}},IL={kernelName:Ks,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>at(r)}}},SL={kernelName:Du,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>at(r)}}},TL={kernelName:Lu,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>pe(e,Er(ce(Se(1),At(me(r,"float32")))))}}},NL={kernelName:Bu,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>{let 
n=Er(le(Se(1),At(me(r,"float32"))));return pe(e,n)}}}},CL={kernelName:Uu,inputsToSave:["a","b"],gradFunc:(e,t)=>{let[r,n]=t,a=bt(r.shape,n.shape);return{a:()=>{let s=le(At(r),At(n)),i=L(e,pe(n,s)),o=Zt(r.shape,a);return o.length>0&&(i=ke(i,o)),G(i,r.shape)},b:()=>{let s=le(At(r),At(n)),i=zt(L(e,pe(r,s))),o=Zt(n.shape,a);return o.length>0&&(i=ke(i,o)),G(i,n.shape)}}}},EL={kernelName:Wu,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>pe(e,le(At(me(r,"float32")),1))}}},RL={kernelName:Vu,inputsToSave:["x"],gradFunc:(e,t)=>{let[r]=t;return{x:()=>pe(e,ce(Se(1),At(me(r,"float32"))))}}};function ML(e,t,r,n,a,s){let i=F(e,"dy","avgPool3dGrad"),o=F(t,"input","avgPool3dGrad"),l=i,u=o,d=!1;o.rank===4&&(d=!0,l=G(i,[1,i.shape[0],i.shape[1],i.shape[2],i.shape[3]]),u=G(o,[1,o.shape[0],o.shape[1],o.shape[2],o.shape[3]])),P(l.rank===5,()=>`Error in avgPool3dGrad: dy must be rank 5 but got rank ${l.rank}.`),P(u.rank===5,()=>`Error in avgPool3dGrad: input must be rank 5 but got rank ${u.rank}.`),Ur("avgPool3dGrad",a,s);let h={dy:l,input:u},p={filterSize:r,strides:n,pad:a,dimRoundingMode:s},c=B.runKernel(Hf,h,p);return d?G(c,[c.shape[1],c.shape[2],c.shape[3],c.shape[4]]):c}var FL=W({avgPool3dGrad_:ML}),$L={kernelName:Kp,inputsToSave:["x"],gradFunc:(e,t,r)=>{let[n]=t,{filterSize:a,strides:s,pad:i,dimRoundingMode:o}=r;return{x:()=>FL(e,n,a,s,i,o)}}};function PL(e,t,r,n,a){let s=F(e,"dy","avgPoolGrad"),i=F(t,"input","avgPoolGrad");P(i.rank===s.rank,()=>`Rank of input (${i.rank}) does not match rank of dy (${s.rank})`);let o=i,l=s,u=!1;i.rank===3&&(u=!0,o=G(i,[1,i.shape[0],i.shape[1],i.shape[2]]),l=G(s,[1,s.shape[0],s.shape[1],s.shape[2]])),P(l.rank===4,()=>`Error in avgPoolGrad: dy must be rank 4 but got rank ${l.rank}.`),P(o.rank===4,()=>`Error in avgPoolGrad: input must be rank 4 but got rank ${o.rank}.`);let d={dy:l,input:o},h={filterSize:r,strides:n,pad:a},p=B.runKernel(jf,d,h);return u?G(p,[p.shape[1],p.shape[2],p.shape[3]]):p}var 
_L=W({avgPoolGrad_:PL}),zL={kernelName:Xs,inputsToSave:["x"],gradFunc:(e,t,r)=>{let[n]=t,{filterSize:a,strides:s,pad:i}=r;return{x:()=>_L(e,n,a,s,i)}}},OL={kernelName:
2022-04-01 15:13:32 +02:00
1. The ${n} is defined in Python, in which case it needs to be ported to TensorFlow.js or your JavaScript code.
2. The custom ${n} is defined in JavaScript, but is not registered properly with tf.serialization.registerClass().`);return i}else{let s=e;if(s.className==null||s.config==null)throw new q(`${n}: Improper config format: ${JSON.stringify(s)}.
2022-04-11 17:45:24 +02:00
'className' and 'config' must set.`);let i=s.className,o,l;if(i in r?[o,l]=r[i]:i in Dn?[o,l]=Dn.className:i in t&&([o,l]=t[i]),o==null)throw new q(`Unknown ${n}: ${i}. This may be due to one of the following reasons:
2022-04-01 15:13:32 +02:00
1. The ${n} is defined in Python, in which case it needs to be ported to TensorFlow.js or your JavaScript code.
2022-04-14 17:47:08 +02:00
2. The custom ${n} is defined in JavaScript, but is not registered properly with tf.serialization.registerClass().`);if(l!=null){let u={};for(let c of Object.keys(Dn))u[c]=Dn[c];for(let c of Object.keys(r))u[c]=r[c];let d=s.config;d.customObjects=u;let h={...Dn};for(let c of Object.keys(r))Dn[c]=r[c];vy(s.config);let p=l(o,s.config,r,a);return Dn={...h},p}else{let u={...Dn};for(let h of Object.keys(r))Dn[h]=r[h];let d=new o(s.config);return Dn={...u},d}}}function vW(e,t){return e<t?-1:e>t?1:0}function Gc(e,t){return-1*vW(e,t)}function Cs(e){if(e==null)return e;let t=[];for(let r of e)t.indexOf(r)===-1&&t.push(r);return t}function wW(e){if(e==null)throw new q(`Invalid value in obj: ${JSON.stringify(e)}`);for(let t in e)if(e.hasOwnProperty(t))return!1;return!0}function Rl(e,t,r){if(r!=null&&e.indexOf(r)<0)throw new q(`${r} is not a valid ${t}. Valid values are ${e} or null/undefined.`)}function mA(e,t,r=0,n=1/0){return Ta(r>=0),Ta(n>=r),Array.isArray(e)&&e.length>=r&&e.length<=n&&e.every(a=>typeof a===t)}function fr(e,t){Array.isArray(e)?(w.assert(e.length>0,()=>`${t} is unexpectedly an empty array.`),e.forEach((r,n)=>fr(r,`element ${n+1} of ${t}`))):w.assert(Number.isInteger(e)&&e>0,()=>`Expected ${t} to be a positive integer, but got ${B7(e)}.`)}function B7(e){return e===null?"null":Array.isArray(e)?"["+e.map(t=>B7(t)).join(",")+"]":typeof e=="string"?`"${e}"`:`${e}`}function kW(e,t,r){let n=r!=null?r():w.now(),a;return(...s)=>{let i=r!=null?r():w.now();return i-n<t||(n=i,a=e(...s)),a}}function W7(e){return e==="relu"?"relu":e==="linear"?"linear":e==="elu"?"elu":null}function gA(e,t){return K(()=>Er(ke(L(e,e),t,!0)))}var Sh=class extends ue.Serializable{getConfig(){return{}}},yA=class extends Sh{constructor(e){super(),this.defaultMaxValue=2,this.defaultAxis=0,this.maxValue=e.maxValue!=null?e.maxValue:this.defaultMaxValue,this.axis=e.axis!=null?e.axis:this.defaultAxis}apply(e){return K(()=>{let t=gA(e,this.axis),r=cn(t,0,this.maxValue);return 
L(e,pe(r,le(nr(),t)))})}getConfig(){return{maxValue:this.maxValue,axis:this.axis}}};yA.className="MaxNorm";ue.registerClass(yA);var AA=class extends Sh{constructor(e){super(),this.defaultAxis=0,this.axis=e.axis!=null?e.axis:this.defaultAxis}apply(e){return K(()=>pe(e,le(nr(),gA(e,this.axis))))}getConfig(){return{axis:this.axis}}};AA.className="UnitNorm";ue.registerClass(AA);var xA=class extends Sh{apply(e){return _a(e)}};xA.className="NonNeg";ue.registerClass(xA);var bA=class extends Sh{constructor(e){super(),this.defaultMinValue=0,this.defaultMaxValue=1,this.defaultRate=1,this.defaultAxis=0,this.minValue=e.minValue!=null?e.minValue:this.defaultMinValue,this.maxValue=e.maxValue!=null?e.maxValue:this.defaultMaxValue,this.rate=e.rate!=null?e.rate:this.defaultRate,this.axis=e.axis!=null?e.axis:this.defaultAxis}apply(e){return K(()=>{let t=gA(e,this.axis),r=le(L(this.rate,cn(t,this.minValue,this.maxValue)),L(1-this.rate,t));return L(e,pe(r,le(nr(),t)))})}getConfig(){return{minValue:this.minValue,maxValue:this.maxValue,rate:this.rate,axis:this.axis}}};bA.className="MinMaxNorm";ue.registerClass(bA);var Y3={maxNorm:"MaxNorm",minMaxNorm:"MinMaxNorm",nonNeg:"NonNeg",unitNorm:"UnitNorm"};function sr(e){return fA(e)}function J3(e,t={}){return Ih(e,ue.SerializationMap.getMap().classNameMap,t,"constraint")}function ir(e){if(e==null)return null;if(typeof e=="string"){let t={className:e in Y3?Y3[e]:e,config:{}};return J3(t)}else return e instanceof Sh?e:J3(e)}function IW(e){return new yA(e)}function SW(e){return new AA(e)}function TW(){return new xA}function NW(e){return new bA(e)}var V7={};Le(V7,{constant:()=>ZW,glorotNormal:()=>nV,glorotUniform:()=>rV,heNormal:()=>aV,heUniform:()=>sV,identity:()=>eV,leCunNormal:()=>iV,leCunUniform:()=>oV,ones:()=>XW,orthogonal:()=>lV,randomNormal:()=>JW,randomUniform:()=>YW,truncatedNormal:()=>QW,varianceScaling:()=>tV,zeros:()=>KW});var 
CW=["channelsFirst","channelsLast"],EW=["nearest","bilinear"],RW=["valid","same","causal"],MW=["max","avg"],FW=["sum","mul","concat","ave"],su=new Map;function Gt(e){Rl(CW,"DataFormat",e)}function $W(e){Rl(EW,"InterpolationForm
2022-04-11 17:45:24 +02:00
because the value dtype is ${t.dtype}, but TensorArray dtype is ${this.dtype}.`);if(this.size()===0&&(this.elementShape==null||this.elementShape.length===0)&&(this.elementShape=t.shape),Ln(this.elementShape,t.shape,`TensorArray ${this.name}: Could not write to TensorArray index ${e}.`),r.read)throw new Error(`TensorArray ${this.name}: Could not write to TensorArray index ${e}, because it has already been read.`);if(r.written)throw new Error(`TensorArray ${this.name}: Could not write to TensorArray index ${e}, because it has already been written.`);r.tensor=t,cr(t),r.written=!0,this.tensors[e]=r}writeMany(e,t){if(e.length!==t.length)throw new Error(`TensorArray ${this.name}: could not write multiple tensors,because the index size: ${e.length} is not the same as tensors size: ${t.length}.`);e.forEach((r,n)=>this.write(r,t[n]))}gather(e,t){if(!!t&&t!==this.dtype)throw new Error(`TensorArray dtype is ${this.dtype} but gather requested dtype ${t}`);if(e)e=e.slice(0,this.size());else{e=[];for(let n=0;n<this.size();n++)e.push(n)}if(e.length===0)return ct([],[0].concat(this.elementShape));let r=this.readMany(e);return Ln(this.elementShape,r[0].shape,"TensorArray shape mismatch: "),or(r,0)}concat(e){if(!!e&&e!==this.dtype)throw new Error(`TensorArray dtype is ${this.dtype} but concat requested dtype ${e}`);if(this.size()===0)return ct([],[0].concat(this.elementShape));let t=[];for(let n=0;n<this.size();n++)t.push(n);let r=this.readMany(t);return Ln(this.elementShape,r[0].shape,`TensorArray shape mismatch: tensor array shape (${this.elementShape}) vs first tensor shape (${r[0].shape})`),kt(r,0)}scatter(e,t){if(t.dtype!==this.dtype)throw new Error(`TensorArray dtype is ${this.dtype} but tensor has dtype ${t.dtype}`);if(e.length!==t.shape[0])throw new Error(`Expected len(indices) == tensor.shape[0], but saw: ${e.length} vs. ${t.shape[0]}`);let r=Math.max(...e);if(!this.dynamicSize&&r>=this.maxSize)throw new Error(`Max index must be < array size (${r} vs. 
${this.maxSize})`);this.writeMany(e,tn(t,0))}split(e,t){if(t.dtype!==this.dtype)throw new Error(`TensorArray dtype is ${this.dtype} but tensor has dtype ${t.dtype}`);let r=0,n=e.map(o=>(r+=o,r));if(r!==t.shape[0])throw new Error(`Expected sum of lengths to be equal to
2022-02-10 18:27:21 +01:00
tensor.shape[0], but sum of lengths is
2022-04-14 17:47:08 +02:00
${r}, and tensor's shape is: ${t.shape}`);if(!this.dynamicSize&&e.length!==this.maxSize)throw new Error(`TensorArray's size is not equal to the size of lengths (${this.maxSize} vs. ${e.length}), and the TensorArray is not marked as dynamically resizeable`);let a=r===0?0:t.size/r,s=[];K(()=>{t=G(t,[1,r,a]);for(let o=0;o<e.length;++o){let l=o===0?0:n[o-1],u=[0,l,0],d=[1,e[o],a];s[o]=G(Pe(t,u,d),this.elementShape)}return s});let i=[];for(let o=0;o<e.length;o++)i[o]=o;this.writeMany(i,s)}},Nu=class{constructor(e,t,r,n=-1){this.tensors=e,this.elementShape=t,this.elementDtype=r,e!=null&&e.forEach(a=>{if(r!==a.dtype)throw new Error(`Invalid data types; op elements ${r}, but list elements ${a.dtype}`);Ln(t,a.shape,"TensorList shape mismatch: "),cr(a)}),this.idTensor=Se(0),this.maxNumElements=n,cr(this.idTensor)}get id(){return this.idTensor.id}copy(){return new Nu([...this.tensors],this.elementShape,this.elementDtype)}clearAndClose(e){this.tensors.forEach(t=>{(e==null||!e.has(t.id))&&t.dispose()}),this.tensors.length=0,this.idTensor.dispose()}size(){return this.tensors.length}stack(e,t,r=-1){if(t!==this.elementDtype)throw new Error(`Invalid data types; op elements ${t}, but list elements ${this.elementDtype}`);if(r!==-1&&this.tensors.length!==r)throw new Error(`Operation expected a list with ${r} elements but got a list with ${this.tensors.length} elements.`);Ln(e,this.elementShape,"TensorList shape mismatch: ");let n=gp(this.elementShape,this.tensors,e);return K(()=>{let a=this.tensors.map(s=>G(s,n));return or(a,0)})}popBack(e,t){if(t!==this.elementDtype)throw new Error(`Invalid data types; op elements ${t}, but list elements ${this.elementDtype}`);if(this.size()===0)throw new Error("Trying to pop from an empty list.");let r=gp(this.elementShape,this.tensors,e),n=this.tensors.pop();return Ln(n.shape,e,"TensorList shape mismatch: "),G(n,r)}pushBack(e){if(e.dtype!==this.elementDtype)throw new Error(`Invalid data types; op elements ${e.dtype}, but list elements 
${this.elementDtype}`);if(Ln(e.shape,this.elementShape,"TensorList shape mismatch: "),this.maxNumElements===this.size())throw new Error("Trying to push element into a full list.");cr(e),this.tensors.push(e)}resize(e){if(e<0)throw new Error(`TensorListResize expects size to be non-negative. Got: ${e}`);if(this.maxNumElements!==-1&&e>this.maxNumElements)throw new Error(`TensorListResize input size ${e} is greater maxNumElement ${this.maxNumElements}.`);let t=new Nu([],this.elementShape,this.elementDtype,this.maxNumElements);t.tensors.length=e;for(let r=0;r<Math.min(this.tensors.length,e);++r)t.tensors[r]=this.tensors[r];return t}getItem(e,t,r){if(r!==this.elementDtype)throw new Error(`Invalid data types; op elements ${r}, but list elements ${this.elementDtype}`);if(e<0||e>this.tensors.length)throw new Error(`Trying to access element ${e} in a list with ${this.tensors.length} elements.`);if(this.tensors[e]==null)throw new Error(`element at index ${e} is null.`);Ln(this.tensors[e].shape,t,"TensorList shape mismatch: ");let n=gp(this.elementShape,this.tensors,t);return G(this.tensors[e],n)}setItem(e,t){if(t.dtype!==this.elementDtype)throw new Error(`Invalid data types; op elements ${t.dtype}, but list elements ${this.elementDtype}`);if(e<0||this.maxNumElements!==-1&&e>=this.maxNumElements)throw new Error(`Trying to set element ${e} in a list with max ${this.maxNumElements} elements.`);Ln(this.elementShape,t.shape,"TensorList shape mismatch: "),cr(t),this.tensors[e]=t}gather(e,t,r){if(t!==this.elementDtype)throw new Error(`Invalid data types; op elements ${t}, but list elements ${this.elementDtype}`);Ln(this.elementShape,r,"TensorList shape mismatch: "),e=e.slice(0,this.size());let n=gp(this.elementShape,this.tensors,r);return e.length===0?ct([],[0].concat(n)):K(()=>{let a=e.map(s=>G(this.tensors[s],n));return or(a,0)})}concat(e,t){if(!!e&&e!==this.elementDtype)throw new Error(`TensorList dtype is ${this.elementDtype} but concat requested dtype 
${e}`);Ln(this.elementShape,t,"TensorList shape mismatch: ");let r=gp(this.elementShape,this.tensors,t);return this.size()===0?c
2022-02-10 18:27:21 +01:00
tensor.shape[0], but sum of lengths is
2022-04-14 17:47:08 +02:00
${n}, and tensor's shape is: ${e.shape}`);let s=e.shape.slice(1),i=Vy(s,r),o=n===0?0:e.size/n,l=K(()=>{let d=[];e=G(e,[1,n,o]);for(let h=0;h<t.length;++h){let p=h===0?0:a[h-1],c=[0,p,0],f=[1,t[h],o];d[h]=G(Pe(e,c,f),i)}return e.dispose(),d}),u=new Nu([],r,e.dtype,t.length);for(let d=0;d<l.length;d++)u.setItem(d,l[d]);return u}var _j=async(e,t,r)=>{switch(e.op){case"If":case"StatelessIf":{let n=k("thenBranch",e,t,r),a=k("elseBranch",e,t,r),s=k("cond",e,t,r),i=k("args",e,t,r);return(await s.data())[0]?r.functionMap[n].executeFunctionAsync(i,r.tensorArrayMap,r.tensorListMap):r.functionMap[a].executeFunctionAsync(i,r.tensorArrayMap,r.tensorListMap)}case"While":case"StatelessWhile":{let n=k("body",e,t,r),a=k("cond",e,t,r),s=k("args",e,t,r),i=await r.functionMap[a].executeFunctionAsync(s,r.tensorArrayMap,r.tensorListMap),o=s.map(d=>d.id),l=await i[0].data();i.forEach(d=>{!d.kept&&o.indexOf(d.id)===-1&&d.dispose()});let u=s;for(;l[0];){let d=u;u=await r.functionMap[n].executeFunctionAsync(u,r.tensorArrayMap,r.tensorListMap);let h=u.map(c=>c.id);d.forEach(c=>{!c.kept&&o.indexOf(c.id)===-1&&h.indexOf(c.id)===-1&&c.dispose()});let p=await r.functionMap[a].executeFunctionAsync(u,r.tensorArrayMap,r.tensorListMap);l=await p[0].data(),p.forEach(c=>{!c.kept&&o.indexOf(c.id)===-1&&h.indexOf(c.id)===-1&&c.dispose()})}return u}case"LoopCond":{let n=k("pred",e,t,r);return[Ha(n)]}case"Switch":{let n=k("pred",e,t,r),a=k("data",e,t,r);return a.kept||(a=Ha(a)),(await n.data())[0]?[void 0,a]:[a,void 0]}case"Merge":{let n=e.inputNames.find(a=>Dr(a,t,r)!==void 0);if(n){let a=Dr(n,t,r);return[Ha(a)]}return}case"Enter":{let n=k("frameName",e,t,r),a=k("tensor",e,t,r);return r.enterFrame(n),[Ha(a)]}case"Exit":{let n=k("tensor",e,t,r);return r.exitFrame(),[Ha(n)]}case"NextIteration":{let n=k("tensor",e,t,r);return r.nextIteration(),[Ha(n)]}case"TensorArrayV3":{let 
n=k("size",e,t,r),a=k("dtype",e,t,r),s=k("elementShape",e,t,r),i=k("dynamicSize",e,t,r),o=k("clearAfterRead",e,t,r),l=k("identicalElementShapes",e,t,r),u=k("name",e,t,r),d=new Rj(u,a,n,s,l,i,o);return r.addTensorArray(d),[d.idTensor,Se(1)]}case"TensorArrayWriteV3":{let n=k("tensorArrayId",e,t,r),a=k("index",e,t,r),s=k("tensor",e,t,r),i=r.getTensorArray(n.id);return i.write(a,s),[i.idTensor]}case"TensorArrayReadV3":{let n=k("tensorArrayId",e,t,r),a=k("index",e,t,r);return[r.getTensorArray(n.id).read(a)]}case"TensorArrayGatherV3":{let n=k("tensorArrayId",e,t,r),a=k("indices",e,t,r),s=k("dtype",e,t,r);return[r.getTensorArray(n.id).gather(a,s)]}case"TensorArrayScatterV3":{let n=k("tensorArrayId",e,t,r),a=k("indices",e,t,r),s=k("tensor",e,t,r),i=r.getTensorArray(n.id);return i.scatter(a,s),[i.idTensor]}case"TensorArrayConcatV3":{let n=k("tensorArrayId",e,t,r),a=r.getTensorArray(n.id),s=k("dtype",e,t,r);return[a.concat(s)]}case"TensorArraySplitV3":{let n=k("tensorArrayId",e,t,r),a=k("tensor",e,t,r),s=k("lengths",e,t,r),i=r.getTensorArray(n.id);return i.split(s,a),[i.idTensor]}case"TensorArraySizeV3":{let n=k("tensorArrayId",e,t,r),a=r.getTensorArray(n.id);return[Se(a.size(),"int32")]}case"TensorArrayCloseV3":{let n=k("tensorArrayId",e,t,r),a=r.getTensorArray(n.id);return a.clearAndClose(),[a.idTensor]}case"TensorListSetItem":{let n=k("tensorListId",e,t,r),a=k("index",e,t,r),s=k("tensor",e,t,r),i=r.getTensorList(n.id);return i.setItem(a,s),[i.idTensor]}case"TensorListGetItem":{let n=k("tensorListId",e,t,r),a=k("index",e,t,r),s=k("elementShape",e,t,r),i=k("elementDType",e,t,r);return[r.getTensorList(n.id).getItem(a,s,i)]}case"TensorListScatterV2":case"TensorListScatter":{let n=k("indices",e,t,r),a=k("tensor",e,t,r),s=k("elementShape",e,t,r),i=k("numElements",e,t,r),o=$j(a,n,s,i);return r.addTensorList(o),[o.idTensor]}case"TensorListReserve":case"EmptyTensorList":{let 
n=k("elementShape",e,t,r),a=k("elementDType",e,t,r),s;e.op==="TensorListReserve"?s="numElements":s="maxNumElements";let i=k(s,e,t,r),o=Fj(n,a,i);return r.addTensorList(o),[o.idTensor]}case"TensorListGather":{let n=k("tensorListId",e,t,r),a=k("indices",e,t,r),s=k("elementShape",e,t,r),i=k("elementDType",e,t,r);return[r.getTensor
${e}`);let n;return this.size===1/0||this.size==null?n=this.size:t?n=Math.ceil(this.size/e):n=Math.floor(this.size/e),un(async()=>(await r.iterator()).columnMajorBatch(e,t,PH),n)}concatenate(e){let t=this,r;return this.size===1/0||e.size===1/0?r=1/0:this.size!=null&&e.size!=null?r=this.size+e.size:r=null,un(async()=>(await t.iterator()).concatenate(await e.iterator()),r)}filter(e){let t=this,r;return this.size===1/0?r=1/0:r=null,un(async()=>(await t.iterator()).filter(n=>K(()=>e(n))),r)}async forEachAsync(e){return(await this.iterator()).forEachAsync(e)}map(e){let t=this;return un(async()=>(await t.iterator()).map(r=>K(()=>e(r))),this.size)}mapAsync(e){let t=this;return un(async()=>(await t.iterator()).mapAsync(e),this.size)}prefetch(e){if(e==null)throw new RangeError("`Dataset.prefetch()` requires bufferSize to be specified.");let t=this;return un(async()=>(await t.iterator()).prefetch(e),this.size)}repeat(e){let t=this,r;return this.size!=null&&e>0?r=this.size*e:e===0?r=0:this.size!=null&&(e===void 0||e<0)?r=1/0:r=null,un(async()=>{let n=Ux(async()=>({value:await t.iterator(),done:!1}));return AH(n.take(e))},r)}skip(e){let t=this,r;return this.size!=null&&e>=0&&this.size>=e?r=this.size-e:this.size!=null&&(this.size<e||e===void 0||e<0)?r=0:r=null,un(async()=>(await t.iterator()).skip(e),r)}shuffle(e,t,r=!0){if(e==null||e<0)throw this.size==null?new RangeError("`Dataset.shuffle()` requires bufferSize to be specified."):new RangeError(`\`Dataset.shuffle()\` requires bufferSize to be specified. 
If your data fits in main memory (for regular JS objects), and/or GPU memory (for \`tf.Tensor\`s), consider setting bufferSize to the dataset size (${this.size} elements)`);let n=this,a=dH.alea(t||w.now().toString());return un(async()=>{let s=a.int32();return r&&(s+=a.int32()),(await n.iterator()).shuffle(e,s.toString())},this.size)}take(e){let t=this,r;return this.size!=null&&this.size>e?r=e:this.size!=null&&this.size<=e?r=this.size:r=null,un(async()=>(await t.iterator()).take(e),r)}async toArray(){if(this.size===1/0)throw new Error("Can not convert infinite data stream to array.");return(await this.iterator()).toArray()}async toArrayForTest(){if(this.size===1/0)throw new Error("Can not convert infinite data stream to array.");return(await this.iterator()).toArrayForTest()}};Ad.MAX_BUFFER_SIZE=1e4;function un(e,t=null){return new class extends Ad{constructor(){super(...arguments),this.size=t}async iterator(){return e()}}}function FH(e){return un(async()=>P6(e),e.length)}function $H(e){if(!Cu(e))throw new Error("The argument to zip() must be an object or array.");let t;if(Array.isArray(e))for(let r=0;r<e.length;r++)t=t==null?e[r].size:Math.min(t,e[r].size);else if(e instanceof Object)for(let r in e)t=t==null?e[r].size:Math.min(t,e[r].size);return un(async()=>{let r=await R6(e,n=>{if(n instanceof Ad)return{value:n.iterator(),recurse:!1};if(Cu(n))return{value:null,recurse:!0};throw new Error("Leaves of the structure passed to zip() must be Datasets, not primitives.")});return xH(r,1)},t)}function PH(e){if(e===null)return null;let t=e[0];return fH(t)?{value:_H(e),recurse:!1}:{value:null,recurse:!0}}function _H(e){if(e.length===0)throw new Error("Can't make a batch of zero elements.");return e[0]instanceof rt?or(e):ct(e)}var D6=class extends Ad{constructor(e){super(),this.input=e}async iterator(){return(await this.input.iterator()).decodeUTF8().split(`
`).map(e=>(e.endsWith("\r")&&(e=e.slice(0,-1)),e))}},Xc='"',yp=Symbol("out"),Tv=Symbol("field"),Zc=Symbol("quote"),ny=Symbol("quoteafterquote"),Nv=Symbol("quoteinquote"),L6=class extends Ad{constructor(e,t){super(),this.input=e,this.hasHeader=!0,this.fullColumnNames=null,this.columnNamesValidated=!1,this.columnConfigs=null,this.configuredColumnsOnly=!1,this.delimiter=",",this.delimWhitespace=!1,this.base=new D6(e),t||(t={}),this.hasHeader=t.hasHeader!==!1,this.fullColumnNames=t.columnNames,this.columnConfigs=t.columnConfigs,this.configuredColumnsOnly=t.configuredColumnsOnly,t.delimWhitespace?(w.assert(t.delimiter==null,()=>"Delimiter should not be provided when delimWhitespace is true."),this.delimWhitespace=!0,this.delimiter=" "):this.delimiter=t.delimiter?t.delimiter:","}async columnNames(){return this.columnNamesValidated||await this.setColumnNames(),this.configuredColumnsOnly?Object.keys(this.columnConfigs):this.fullColumnNames}async setColumnNames(){let e=await this.maybeReadHeaderLine();if(!this.fullColumnNames&&!e)throw new Error("Column names must be provided if there is no header line.");this.fullColumnNames&&e&&w.assert(e.length===this.fullColumnNames.length,()=>"The length of provided columnNames ("+this.fullColumnNames.length.toString()+") does not match the length of the header line read from file ("+e.length.toString()+")."),this.fullColumnNames||(this.fullColumnNames=e);let t=this.fullColumnNames.reduce((n,a)=>(n[a]=n[a]+1||1,n),{}),r=Object.keys(t).filter(n=>t[n]>1);if(w.assert(r.length===0,()=>"Duplicate column names found: "+r.toString()),this.columnConfigs){for(let n of Object.keys(this.columnConfigs))if(this.fullColumnNames.indexOf(n)===-1)throw new Error('The key "'+n+'" provided in columnConfigs does not match any of the column names ('+this.fullColumnNames.toString()+").")}this.columnNamesValidated=!0}async maybeReadHeaderLine(){if(this.hasHeader){let e=await(await this.base.iterator()).next();if(e.done)throw new Error("No data was found for 
CSV parsing.");let t=e.value;return this.parseRow(t,!1)}else return null}async iterator(){this.columnNamesValidated||await this.setColumnNames();let e=await this.base.iterator();return this.hasHeader&&(e=e.skip(1)),e.map(t=>this.makeDataElement(t))}makeDataElement(e){let t=this.parseRow(e),r={},n={};for(let a=0;a<this.fullColumnNames.length;a++){let s=this.fullColumnNames[a],i=this.columnConfigs?this.columnConfigs[s]:null;if(!(this.configuredColumnsOnly&&!i)){let o=t[a],l=null;if(o==="")if(i&&i.default!==void 0)l=i.default;else{if(i&&(i.required||i.isLabel))throw new Error(`Required column ${s} is empty in this line: ${e}`);l=void 0}else{let u=Number(o);if(isNaN(u))i&&i.dtype==="bool"?l=this.getBoolean(o):l=o;else if(!i||!i.dtype)l=u;else switch(i.dtype){case"float32":l=u;break;case"int32":l=Math.floor(u);break;case"bool":l=this.getBoolean(o);break;default:l=u}}i&&i.isLabel?n[s]=l:r[s]=l}}return Object.keys(n).length===0?r:{xs:r,ys:n}}getBoolean(e){return e==="1"||e.toLowerCase()==="true"?1:0}parseRow(e,t=!0){let r=[],n=0,a=e.length,s=yp;for(let i=0;i<a;i++)switch(s){case yp:switch(e.charAt(i)){case Xc:n=i+1,s=Zc;break;case this.delimiter:if(n=i+1,this.delimiter===" "&&this.delimWhitespace)break;r.push(""),s=yp;break;default:s=Tv,n=i;break}break;case Tv:switch(e.charAt(i)){case this.delimiter:r.push(e.substring(n,i)),s=yp,n=i+1;break;default:}break;case Zc:switch(e.charAt(i)){case Xc:s=ny;break;default:}break;case ny:switch(e.charAt(i)){case this.delimiter:r.push(e.substring(n,i-1)),s=yp,n=i+1;break;case Xc:s=Zc;break;default:s=Nv;break}break;case Nv:switch(e.charAt(i)){case Xc:s=Zc;break;default:}break;default:}if(s===ny?r.push(e.substring(n,a-1)):r.push(e.substring(n)),t&&r.length!==this.fullColumnNames.length)throw new Error(`Invalid row in csv file. 
Should have ${this.fullColumnNames.length} elements in a row, but got ${r}`);return r}},B6=class extends yr{constructor(e){super(),this.microphoneConfig=e,this.isClosed=!1,this.fftSize=e.fftSize||1024;let t=Math.log2(this.fftSize);if(this.fftSize<0||t<4||t>14||!Number.isInteger(t))throw new Error(`Invalid fftSi
2022-02-10 18:27:21 +01:00
============================
Hi there \u{1F44B}. Looks like you are running TensorFlow.js in Node.js. To speed things up dramatically, install our node backend, which binds to TensorFlow C++, by running npm i @tensorflow/tfjs-node, or npm i @tensorflow/tfjs-node-gpu if you have CUDA. Then call require('@tensorflow/tfjs-node'); (-gpu suffix for CUDA) at the start of your program. Visit https://github.com/tensorflow/tfjs-node for more details.
2022-04-14 17:47:08 +02:00
============================`));let n={id:this.nextDataId()};return this.data.set(n,{values:e,dtype:r,refCount:1}),n}makeTensorInfo(e,t,r){let n;if(t==="string"&&r!=null&&r.length>0&&w.isString(r[0])){let a=r.map(s=>w.encodeString(s));n=this.write(a,e,t)}else n=this.write(r,e,t);return{dataId:n,shape:e,dtype:t}}refCount(e){return this.data.has(e)?this.data.get(e).refCount:0}incRef(e){let t=this.data.get(e);t.refCount++}decRef(e){if(this.data.has(e)){let t=this.data.get(e);t.refCount--}}move(e,t,r,n,a){this.data.set(e,{values:t,dtype:n,refCount:a})}numDataIds(){return this.data.numDataIds()}async read(e){return this.readSync(e)}readSync(e){let{dtype:t,complexTensorInfos:r}=this.data.get(e);if(t==="complex64"){let n=this.readSync(r.real.dataId),a=this.readSync(r.imag.dataId);return N.mergeRealAndImagArrays(n,a)}return this.data.get(e).values}bufferSync(e){let t=this.readSync(e.dataId),r=t;if(e.dtype==="string")try{r=t.map(n=>w.decodeString(n))}catch(n){throw new Error("Failed to decode encoded string bytes into utf-8")}return We(e.shape,e.dtype,r)}makeOutput(e,t,r){let n=this.write(e,t,r);return br().makeTensorFromDataId(n,t,r,this)}disposeData(e,t=!1){if(this.data.has(e)){if(this.data.get(e).refCount--,!t&&this.data.get(e).refCount>0)return!1;let{complexTensorInfos:r}=this.data.get(e);r!=null&&(this.disposeData(r.real.dataId,!0),this.disposeData(r.imag.dataId,!0)),this.data.delete(e)}return!0}disposeIntermediateTensorInfo(e){this.disposeData(e.dataId)}async time(e){let t=w.now();return e(),{kernelMs:w.now()-t}}memory(){return{unreliable:!0,reasons:["The reported memory is an upper bound. 
Due to automatic garbage collection, the true allocated memory may be less."]}}where(e){Te([e],"where");let t=this.readSync(e.dataId);return XH(e.shape,t)}dispose(){}floatPrecision(){return 32}epsilon(){return super.epsilon()}},jx=K6;jx.nextDataId=0;var c0={};Le(c0,{addImpl:()=>Z6,bincountImpl:()=>qx,bincountReduceImpl:()=>Y6,ceilImpl:()=>J6,concatImpl:()=>Kx,equalImpl:()=>Q6,expImpl:()=>tI,expm1Impl:()=>nI,floorImpl:()=>aI,gatherNdImpl:()=>sI,gatherV2Impl:()=>iI,greaterEqualImpl:()=>lI,greaterImpl:()=>oI,lessEqualImpl:()=>dI,lessImpl:()=>uI,linSpaceImpl:()=>pI,logImpl:()=>hI,maxImpl:()=>cI,maximumImpl:()=>fI,minimumImpl:()=>mI,multiplyImpl:()=>Xx,negImpl:()=>gI,notEqualImpl:()=>yI,prodImpl:()=>AI,rangeImpl:()=>Yx,rsqrtImpl:()=>xI,sigmoidImpl:()=>Oq,simpleAbsImpl:()=>X6,sliceImpl:()=>Pf,sparseFillEmptyRowsImpl:()=>vI,sparseReshapeImpl:()=>wI,sparseSegmentReductionImpl:()=>Jx,sqrtImpl:()=>Bq,squaredDifferenceImpl:()=>kI,stridedSliceImpl:()=>II,stringNGramsImpl:()=>SI,stringSplitImpl:()=>TI,stringToHashBucketFastImpl:()=>NI,subImpl:()=>CI,tileImpl:()=>EI,topKImpl:()=>MI,transposeImpl:()=>Zx,uniqueImpl:()=>FI});function X6(e){let t=new Float32Array(e.length);for(let r=0;r<e.length;++r)t[r]=Math.abs(e[r]);return t}var ZH=e=>{let{x:t}=e.inputs,r=e.backend;Te(t,"abs");let n=new Float32Array(w.sizeFromShape(t.shape)),a=r.data.get(t.dataId).values;return n=X6(a),r.makeOutput(n,t.shape,t.dtype)},YH={kernelName:Lo,backendName:"cpu",kernelFunc:ZH};function Yt(e){return(t,r,n,a,s)=>{let i=N.assertAndGetBroadcastShape(t,r),o=i.length,l=w.computeStrides(i),u=w.sizeFromShape(i),d=w.getTypedArrayFromDType(s,u),h=t.length,p=r.length,c=w.computeStrides(t),f=w.computeStrides(r),m=N.getBroadcastDims(t,i),g=N.getBroadcastDims(r,i);if(m.length+g.length===0)for(let y=0;y<d.length;++y)d[y]=e(n[y%n.length],a[y%a.length]);else for(let y=0;y<d.length;++y){let A=w.indexToLoc(y,o,l),x=A.slice(-h);m.forEach(T=>x[T]=0);let b=w.locToIndex(x,h,c),v=A.slice(-p);g.forEach(T=>v[T]=0);let 
S=w.locToIndex(v,p,f);d[y]=e(n[b],a[S])}return[d,i]}}function pn(e){let{inputs:t,backend:r}=e,{real:n,imag:a}=t,s=r.data.get(n.dataId).values,i=r.data.get(a.dataId).values,o=r.makeTensorInfo(n.shape,"complex64"),l=r.data.get(o.dataId);return l.complexTensorInfos={real:r.makeTensorInfo(n.shape,"float32",s),imag:r.makeTensorInfo(a.shape,"float32",i)},o}var JH={kernelName:Xp,backendName:"cpu",kernelFunc:pn};function $f(e,t,r="float32"){if(r==="complex64"){let a=$f(e,t,"float32"),s=$f(e,t,"flo
2022-04-01 15:13:32 +02:00
${s.shape}`);if(n.shape.length!==2)throw new Error(`Indices must be a matrix, saw:
${n.shape}`);if(a.shape.length!==1)throw new Error(`Values must be a vector, saw:
${a.shape}`);if(i.shape.length!==0)throw new Error(`Default value must be a scalar, saw:
2022-04-14 17:47:08 +02:00
${i.shape}`);let o=r.data.get(n.dataId).values,l=r.data.get(a.dataId).values,u=r.data.get(s.dataId).values,d=r.data.get(i.dataId).values[0],[h,p,c,f,m]=vI(o,n.shape,n.dtype,l,a.dtype,u,d);return[r.makeTensorInfo(p,n.dtype,h),r.makeTensorInfo([p[0]],a.dtype,c),r.makeTensorInfo([f.length],"bool",new Uint8Array(f.map(g=>Number(g)))),r.makeTensorInfo([m.length],n.dtype,new Int32Array(m))]}var dJ={kernelName:sh,backendName:"cpu",kernelFunc:uJ};function pJ(e){let{inputs:t,backend:r}=e,{inputIndices:n,inputShape:a,newShape:s}=t;if(n.shape.length!==2)throw new Error(`Input indices should be a matrix but received shape
2022-04-01 15:13:32 +02:00
${n.shape}`);if(a.shape.length!==1)throw new Error(`Input shape should be a vector but received shape
2022-04-14 17:47:08 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Target shape should be a vector but received shape ${s.shape}`);let i=Array.from(r.data.get(a.dataId).values),o=r.data.get(n.dataId).values,l=Array.from(r.data.get(s.dataId).values),[u,d,h]=wI(o,n.shape,n.dtype,i,l);return[r.makeTensorInfo(d,n.dtype,u),r.makeTensorInfo([h.length],s.dtype,new Int32Array(h))]}var hJ={kernelName:id,backendName:"cpu",kernelFunc:pJ};function cJ(e){let{inputs:t,backend:r}=e,{data:n,indices:a,segmentIds:s}=t;if(n.shape.length<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.shape.length!==1)throw new Error(`Indices should be a vector but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Segment ids should be a vector but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);if(a.shape[0]!==s.shape[0])throw new Error("segmentIds and indices should have same size.");let i=r.data.get(n.dataId).values,o=r.data.get(a.dataId).values,l=r.data.get(s.dataId).values,[u,d]=Jx(i,n.shape,n.dtype,o,l,!0);return r.makeTensorInfo(d,n.dtype,u)}var fJ={kernelName:ih,backendName:"cpu",kernelFunc:cJ};function mJ(e){let{inputs:t,backend:r}=e,{data:n,indices:a,segmentIds:s}=t;if(n.shape.length<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.shape.length!==1)throw new Error(`Indices should be a vector but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Segment ids should be a vector but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);if(a.shape[0]!==s.shape[0])throw new Error("segmentIds and indices should have same size.");let i=r.data.get(n.dataId).values,o=r.data.get(a.dataId).values,l=r.data.get(s.dataId).values,[u,d]=Jx(i,n.shape,n.dtype,o,l);return r.makeTensorInfo(d,n.dtype,u)}var gJ={kernelName:oh,backendName:"cpu",kernelFunc:mJ};function yJ(e){let{inputs:t,backend:r,attrs:n}=e,{sparseIndices:a,sparseValues:s,defaultValue:i}=t,{outputShape:o}=n,{sliceRank:l,numUpdates:u,sliceSize:d,strides:h,outputSize:p}=N.calculateShapes(s,a,o),c=!1,f=r.bufferSync(a),m=r.bufferSync(s),g=r.data.get(i.dataId).values[0],y=XI(f,m,o,p,d,u,l,h,g,c);return r.makeTensorInfo(o,y.dtype,y.values)}var AJ={kernelName:lh,backendName:"cpu",kernelFunc:yJ};function xJ(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{numOrSizeSplits:s,axis:i}=n,o=w.parseAxisParam(i,a.shape)[0],l=N.prepareSplitSize(a,s,o),u=new Array(a.shape.length).fill(0),d=a.shape.slice();return l.map(h=>{let p=[...d];p[o]=h;let c=$o({inputs:{x:a},backend:r,attrs:{begin:u,size:p}});return u[o]+=h,c})}var bJ={kernelName:yl,backendName:"cpu",kernelFunc:xJ},vJ={kernelName:od,backendName:"cpu",kernelFunc:({inputs:e,backend:t})=>{let{x:r}=e,n=t;Te(r,"square");let a=n.data.get(r.dataId).values,s=new Float32Array(a.length);for(let i=0;i<a.length;++i){let o=a[i];s[i]=o*o}return{dataId:n.write(s,r.shape,r.dtype),shape:r.shape,dtype:r.dtype}}},wJ=mt(Di,(e,t)=>{let r=t;return isNaN(e)?NaN:e>0?1:r.alpha}),kJ={kernelName:Di,backendName:"cpu",kernelFunc:wJ};function IJ(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{begin:s,end:i,strides:o,beginMask:l,endMask:u,ellipsisMask:d,newAxisMask:h,shrinkAxisMask:p}=n;Te(a,"stridedSlice");let{finalShapeSparse:c,finalShape:f,isIdentity:m,sliceDim0:g,isSimpleSlice:y,begin:A,end:x,strides:b}=_t.sliceInfo(a.shape,s,i,o,l,u,d,h,p),v;if(m)v=Mt({inputs:{x:a},backend:r,attrs:{shape:f}});else if(g||y){w.assert(a.shape.length>=1,()=>`Input must have rank at least 1, got: ${a.shape.length}`);let 
S=_t.computeOutShape(A,x,b),T=$o({inputs:{x:a},backend:r,attrs:{begin:A,size:S}});v=Mt({inputs:{x:T},backend:r,attrs:{shape:f}}),r.disposeIntermediateTensorInfo(T)}else{let S=r.bufferSync(a),T=II(c,S,b,A);v=r.makeTensorInfo(f,T.dtype,T.values)}return v}var SJ={kernelName:Al,backendName:"cpu",kernelFunc:IJ};function TJ(e){let{inputs:t,backend:r,attrs:n}=e,{separator:a,nGramWidths:s,leftPad:i,rightPad:o,padWidth:l,preserveShortSequences:u}=n,{data:d,dataSplits:h}=t,p=r.data.get(d.dataId).values,c=r.data.get(h.dataId).values,[f,m]=SI(p,c,a,s,i,o,l,u);return[r.makeTensorInfo([f.length],"string",f),r.makeTensorInfo(h.shape,"int32",m)]}var NJ={kernelName:uh,backendName:"cpu",kernelFunc:TJ};function CJ(e){let{inputs:t,backend:r,attrs:n}=e,{skipEmpty:a}=n,{input:s,delimiter:i}=t;if(s.dtype!=="string")throw new Error("Input must be of datatype string");if(s.shape.length!==1)throw new Error(`Input must be a vector, got shape: ${s.shape}`);if(i.shape.length!==0)throw new Error(`Delimiter must be a scalar, got shape: ${i.shape}`);let o=r.data.get(s.dataId).values,l=r.data.get(i.dataId).values[0],[u,d,h]=TI(o,l,a),p=d.length;return[r.makeTensorInfo([p,2],"int32",u),r.makeTensorInfo([p],"string",d),r.makeTensorInfo([2],"int32",new Int32Array(h))]}var EJ={kernelName:cm,backendName:"cpu",kernelFunc:CJ};function RJ(e){let{inputs:t,backend:r,attrs:n}=e,{numBuckets:a}=n,{input:s}=t;if(s.dtype!=="string")throw new Error("Input must be of datatype string");if(a<=0)throw new Error("Number of buckets must be at least 1");let i=r.data.get(s.dataId).values,o=NI(i,a);return r.makeTensorInfo(s.shape,"int32",o)}var MJ={kernelName:fm,backendName:"cpu",kernelFunc:RJ},FJ=mt(xl,e=>Math.tan(e)),$J={kernelName:xl,backendName:"cpu",kernelFunc:FJ},PJ=mt(zi,e=>Math.tanh(e)),_J={kernelName:zi,backendName:"cpu",kernelFunc:PJ};function zJ(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{reps:s}=n;Te(a,"tile");let i=EI(r.bufferSync(a),s);return r.makeTensorInfo(i.shape,i.dtype,i.values)}var 
OJ={kernelName:Qa,backendName:"cpu",kernelFunc:zJ};function DJ(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{k:s,sorted:i}=n;Te(a,"topk
2022-04-11 17:45:24 +02:00
`),s=a.length.toString().length+2,i=a.map((h,p)=>w.rightPad((p+1).toString(),s)+h),o=0;for(let h=0;h<i.length;h++)o=Math.max(i[h].length,o);let l=i.slice(0,n-1),u=i.slice(n-1,n),d=i.slice(n);console.log(l.join(`
2022-02-10 18:27:21 +01:00
`)),console.log(t.split(`
2022-04-11 17:45:24 +02:00
`)[0]),console.log(`%c ${w.rightPad(u[0],o)}`,"border:1px solid red; background-color:#e3d2d2; color:#a61717"),console.log(d.join(`
2022-04-14 17:47:08 +02:00
`))}function tS(e){return as(e,()=>e.createProgram(),"Unable to create WebGLProgram.")}function rS(e,t){if(we(e,()=>e.linkProgram(t)),!Y().get("ENGINE_COMPILE_ONLY")&&e.getProgramParameter(t,e.LINK_STATUS)===!1)throw console.log(e.getProgramInfoLog(t)),new Error("Failed to link vertex and fragment shaders.")}function af(e,t){if(we(e,()=>e.validateProgram(t)),e.getProgramParameter(t,e.VALIDATE_STATUS)===!1)throw console.log(e.getProgramInfoLog(t)),new Error("Shader program validation failed.")}function nS(e,t){let r=as(e,()=>e.createBuffer(),"Unable to create WebGLBuffer");return we(e,()=>e.bindBuffer(e.ARRAY_BUFFER,r)),we(e,()=>e.bufferData(e.ARRAY_BUFFER,t,e.STATIC_DRAW)),r}function aS(e,t){let r=as(e,()=>e.createBuffer(),"Unable to create WebGLBuffer");return we(e,()=>e.bindBuffer(e.ELEMENT_ARRAY_BUFFER,r)),we(e,()=>e.bufferData(e.ELEMENT_ARRAY_BUFFER,t,e.STATIC_DRAW)),r}function uQ(){return Y().getNumber("WEBGL_VERSION")===2?1:4}function sS(e){return as(e,()=>e.createTexture(),"Unable to create WebGLTexture.")}function iS(e,t){let r=Y().getNumber("WEBGL_MAX_TEXTURE_SIZE");if(e<=0||t<=0){let n=`[${e}x${t}]`;throw new Error("Requested texture size "+n+" is invalid.")}if(e>r||t>r){let n=`[${e}x${t}]`,a=`[${r}x${r}]`;throw new Error("Requested texture size "+n+" greater than WebGL maximum on this browser / GPU "+a+".")}}function oS(e){return as(e,()=>e.createFramebuffer(),"Unable to create WebGLFramebuffer.")}function Hy(e,t,r,n,a,s,i){let o=e.getAttribLocation(t,r);return o===-1?!1:(we(e,()=>e.bindBuffer(e.ARRAY_BUFFER,n)),we(e,()=>e.vertexAttribPointer(o,a,e.FLOAT,!1,s,i)),we(e,()=>e.enableVertexAttribArray(o)),!0)}function lS(e,t,r){cS(e,r),we(e,()=>e.activeTexture(e.TEXTURE0+r)),we(e,()=>e.bindTexture(e.TEXTURE_2D,t))}function dQ(e,t){cS(e,t),we(e,()=>e.activeTexture(e.TEXTURE0+t)),we(e,()=>e.bindTexture(e.TEXTURE_2D,null))}function uS(e,t,r){return as(e,()=>e.getUniformLocation(t,r),'uniform "'+r+'" not present in program.')}function dS(e,t,r){return 
e.getUniformLocation(t,r)}function pS(e,t,r,n){we(e,()=>lS(e,t,n)),we(e,()=>e.uniform1i(r,n))}function pQ(e){we(e,()=>e.bindFramebuffer(e.FRAMEBUFFER,null)),we(e,()=>e.viewport(0,0,e.canvas.width,e.canvas.height)),we(e,()=>e.scissor(0,0,e.canvas.width,e.canvas.height))}function sf(e,t,r){we(e,()=>e.bindFramebuffer(e.FRAMEBUFFER,r)),we(e,()=>e.framebufferTexture2D(e.FRAMEBUFFER,e.COLOR_ATTACHMENT0,e.TEXTURE_2D,t,0))}function qy(e,t){we(e,()=>e.bindFramebuffer(e.FRAMEBUFFER,t)),we(e,()=>e.framebufferTexture2D(e.FRAMEBUFFER,e.COLOR_ATTACHMENT0,e.TEXTURE_2D,null,0))}function Tp(e){let t=e.checkFramebufferStatus(e.FRAMEBUFFER);if(t!==e.FRAMEBUFFER_COMPLETE)throw new Error("Error binding framebuffer: "+hS(e,t))}function hS(e,t){switch(t){case e.FRAMEBUFFER_INCOMPLETE_ATTACHMENT:return"FRAMEBUFFER_INCOMPLETE_ATTACHMENT";case e.FRAMEBUFFER_INCOMPLETE_MISSING_ATTACHMENT:return"FRAMEBUFFER_INCOMPLETE_MISSING_ATTACHMENT";case e.FRAMEBUFFER_INCOMPLETE_DIMENSIONS:return"FRAMEBUFFER_INCOMPLETE_DIMENSIONS";case e.FRAMEBUFFER_UNSUPPORTED:return"FRAMEBUFFER_UNSUPPORTED";default:return`unknown error ${t}`}}function as(e,t,r){let n=we(e,()=>t());if(n==null)throw new Error(r);return n}function cS(e,t){let r=e.MAX_COMBINED_TEXTURE_IMAGE_UNITS-1,n=t+e.TEXTURE0;if(n<e.TEXTURE0||n>r){let a=`[gl.TEXTURE0, gl.TEXTURE${r}]`;throw new Error(`textureUnit must be in ${a}.`)}}function Po(e,t=2){return w.sizeFromShape(e.slice(0,e.length-t))}function _o(e){if(e.length===0)throw Error("Cannot get rows and columns of an empty shape array.");return[e.length>1?e[e.length-2]:1,e[e.length-1]]}function of(e){let t=[1,1,1];return e.length===0||e.length===1&&e[0]===1||(t=[Po(e),..._o(e)]),t}function fS(e,t=!1){let r=Y().getNumber("WEBGL_MAX_TEXTURE_SIZE");t&&(r=r*2,e=e.map((a,s)=>s>=e.length-2?w.nearestLargerEven(e[s]):e[s]),e.length===1&&(e=[2,e[0]])),e.length!==2&&(e=w.squeezeShape(e).newShape);let n=w.sizeFromShape(e);if(e.length<=1&&n<=r)return[1,n];if(e.length===2&&e[0]<=r&&e[1]<=r)return 
e;if(e.length===3&&e[0]*e[1]<=r&&e[2]<=r)return[e[0]*e[1],e[2]];if(e.length===3&&e[0]<=r&&e[1]*e[2]<=r)return[e[0],e[1]
2022-02-10 18:27:21 +01:00
bool isnan_custom(float val) {
2022-03-07 19:24:06 +01:00
uint floatToUint = floatBitsToUint(val);
return (floatToUint & 0x7fffffffu) > 0x7f800000u;
2022-02-10 18:27:21 +01:00
}
bvec4 isnan_custom(vec4 val) {
return bvec4(isnan_custom(val.x),
isnan_custom(val.y), isnan_custom(val.z), isnan_custom(val.w));
}
#define isnan(value) isnan_custom(value)
2022-02-17 14:15:57 +01:00
`,l="",u=`
2022-02-10 18:27:21 +01:00
#define round(value) newRound(value)
int newRound(float value) {
return int(floor(value + 0.5));
}
ivec4 newRound(vec4 value) {
return ivec4(floor(value + vec4(0.5)));
}
2022-04-01 15:13:32 +02:00
`):(e="",t="attribute",r="varying",n="varying",a="texture2D",s="gl_FragColor",i="",o=`
2022-02-10 18:27:21 +01:00
#define isnan(value) isnan_custom(value)
bool isnan_custom(float val) {
return (val > 0. || val < 1. || val == 0.) ? false : true;
}
bvec4 isnan_custom(vec4 val) {
return bvec4(isnan(val.x), isnan(val.y), isnan(val.z), isnan(val.w));
}
`,l=`
uniform float INFINITY;
bool isinf(float val) {
return abs(val) == INFINITY;
}
bvec4 isinf(vec4 val) {
return equal(abs(val), vec4(INFINITY));
}
2022-02-17 14:15:57 +01:00
`,u=`
2022-02-10 18:27:21 +01:00
int round(float value) {
return int(floor(value + 0.5));
}
ivec4 round(vec4 value) {
return ivec4(floor(value + vec4(0.5)));
}
2022-04-14 17:47:08 +02:00
`),{version:e,attribute:t,varyingVs:r,varyingFs:n,texture2D:a,output:s,defineOutput:i,defineSpecialNaN:o,defineSpecialInf:l,defineRound:u}}function $l(e,t,r="index"){let n=w.computeStrides(t);return n.map((a,s)=>{let i=`int ${e[s]} = ${r} / ${a}`,o=s===n.length-1?`int ${e[s+1]} = ${r} - ${e[s]} * ${a}`:`index -= ${e[s]} * ${a}`;return`${i}; ${o};`}).join("")}function g0(e,t,r="index"){let n=w.computeStrides(t);return n.map((a,s)=>{let i=`int ${e[s]} = ${r} / outShapeStrides[${s}]`,o=s===n.length-1?`int ${e[s+1]} = ${r} - ${e[s]} * outShapeStrides[${s}]`:`index -= ${e[s]} * outShapeStrides[${s}]`;return`${i}; ${o};`}).join("")}function mQ(e,t){let r=e.length,n=e.map(s=>`${t}[${s}]`),a=new Array(r-1);a[r-2]=n[r-1];for(let s=r-3;s>=0;--s)a[s]=`(${a[s+1]} * ${n[s+1]})`;return a}function gQ(e,t,r="index"){let n=e.map((s,i)=>i),a=mQ(n,t);return a.map((s,i)=>{let o=`int ${e[i]} = ${r} / ${a[i]}`,l=i===a.length-1?`int ${e[i+1]} = ${r} - ${e[i]} * ${a[i]}`:`index -= ${e[i]} * ${a[i]}`;return`${o}; ${l};`}).join("")}function ib(e){let t=w.computeStrides(e).map(r=>r.toString());return`
2022-02-10 18:27:21 +01:00
int getFlatIndex(ivec3 coords) {
return coords.x * ${t[0]} + coords.y * ${t[1]} + coords.z;
}
2022-04-14 17:47:08 +02:00
`}function ob(){return`
2022-02-10 18:27:21 +01:00
int getFlatIndex(ivec3 coords) {
return coords.x * outShapeStrides[0] + coords.y * outShapeStrides[1] + coords.z;
}
2022-04-14 17:47:08 +02:00
`}var vS=`
2022-02-10 18:27:21 +01:00
const float FLOAT_MAX = 1.70141184e38;
const float FLOAT_MIN = 1.17549435e-38;
lowp vec4 encode_float(highp float v) {
if (isnan(v)) {
return vec4(255, 255, 255, 255);
}
highp float av = abs(v);
if(av < FLOAT_MIN) {
return vec4(0.0, 0.0, 0.0, 0.0);
} else if(v > FLOAT_MAX) {
return vec4(0.0, 0.0, 128.0, 127.0) / 255.0;
} else if(v < -FLOAT_MAX) {
return vec4(0.0, 0.0, 128.0, 255.0) / 255.0;
}
highp vec4 c = vec4(0,0,0,0);
highp float e = floor(log2(av));
highp float m = exp2(fract(log2(av))) - 1.0;
c[2] = floor(128.0 * m);
m -= c[2] / 128.0;
c[1] = floor(32768.0 * m);
m -= c[1] / 32768.0;
c[0] = floor(8388608.0 * m);
highp float ebias = e + 127.0;
c[3] = floor(ebias / 2.0);
ebias -= c[3] * 2.0;
c[2] += floor(ebias) * 128.0;
c[3] += 128.0 * step(0.0, -v);
return c / 255.0;
}
2022-04-14 17:47:08 +02:00
`,{getBroadcastDims:wS}=N;function yQ(e,t,r){let n=[];if(e.forEach(p=>{let c=w.sizeFromShape(p.shapeInfo.logicalShape);if(p.shapeInfo.isUniform?n.push(`uniform float ${p.name}${c>1?`[${c}]`:""};`):(n.push(`uniform sampler2D ${p.name};`),n.push(`uniform int offset${p.name};`)),r.enableShapeUniforms){let{uniformShape:f}=lb(r.packedInputs,p.shapeInfo.logicalShape,p.shapeInfo.texShape);switch(f.length){case 1:n.push(`uniform int ${p.name}Shape;`);break;case 2:n.push(`uniform ivec2 ${p.name}Shape;`);break;case 3:n.push(`uniform ivec3 ${p.name}Shape;`);break;case 4:n.push(`uniform ivec4 ${p.name}Shape;`);break;default:break}n.push(`uniform ivec2 ${p.name}TexShape;`)}}),r.enableShapeUniforms){switch(t.logicalShape.length){case 1:n.push("uniform int outShape;");break;case 2:n.push("uniform ivec2 outShape;"),n.push("uniform int outShapeStrides;");break;case 3:n.push("uniform ivec3 outShape;"),n.push("uniform ivec2 outShapeStrides;");break;case 4:n.push("uniform ivec4 outShape;"),n.push("uniform ivec3 outShapeStrides;");break;default:break}n.push("uniform ivec2 outTexShape;")}r.customUniforms&&r.customUniforms.forEach(p=>{n.push(`uniform ${p.type} ${p.name}${p.arrayIndex?`[${p.arrayIndex}]`:""};`)});let a=n.join(`
`),s=e.map(p=>AQ(p,t,r.packedInputs,r.enableShapeUniforms)).join(`
`),i=t.texShape,o=Gr(),l=vQ(o),u,d,h=IQ(o);return t.isPacked?(u=xQ(t.logicalShape,i,r.enableShapeUniforms),d=kQ(o)):(u=bQ(t.logicalShape,i,r.enableShapeUniforms),d=wQ(o)),r.packedInputs&&(h+=CQ),[h,l,d,a,u,s,r.userCode].join(`
`)}function wd(e,t=!1){let r=e.shapeInfo.logicalShape;switch(r.length){case 0:return BQ(e,t);case 1:return VQ(e,t);case 2:return GQ(e,t);case 3:return HQ(e,t);case 4:return KQ(e,t);case 5:return XQ(e);case 6:return ZQ(e);default:throw new Error(`${r.length}-D input sampling is not yet supported`)}}function kS(e,t){switch(e.shapeInfo.logicalShape.length){case 0:return LQ(e);case 1:return WQ(e,t);case 2:return UQ(e,t);case 3:return jQ(e,t);default:return qQ(e,t)}}function AQ(e,t,r=!1,n){let a="";r?a+=kS(e,n):a+=wd(e,n);let s=e.shapeInfo.logicalShape,i=t.logicalShape;return s.length<=i.length&&(r?a+=YQ(e,t):a+=JQ(e,t)),a}function xQ(e,t,r){switch(e.length){case 0:return IS();case 1:return EQ(e,t,r);case 2:return OQ(e,t,r);case 3:return MQ(e,t,r);default:return $Q(e,t,r)}}function bQ(e,t,r){switch(e.length){case 0:return IS();case 1:return RQ(e,t,r);case 2:return DQ(e,t,r);case 3:return FQ(e,t,r);case 4:return PQ(e,t,r);case 5:return _Q(e,t);case 6:return zQ(e,t);default:throw new Error(`${e.length}-D output sampling is not yet supported`)}}function vQ(e){return`
2022-02-10 18:27:21 +01:00
float sampleTexture(sampler2D textureSampler, vec2 uv) {
return ${e.texture2D}(textureSampler, uv).r;
}
2022-04-14 17:47:08 +02:00
`}function wQ(e){return`
2022-02-10 18:27:21 +01:00
void setOutput(float val) {
${e.output} = vec4(val, 0, 0, 0);
}
2022-04-14 17:47:08 +02:00
`}function kQ(e){return`
2022-02-10 18:27:21 +01:00
void setOutput(vec4 val) {
${e.output} = val;
}
2022-04-14 17:47:08 +02:00
`}function IQ(e){return`${e.version}
2022-02-10 18:27:21 +01:00
precision highp float;
precision highp int;
precision highp sampler2D;
${e.varyingFs} vec2 resultUV;
${e.defineOutput}
const vec2 halfCR = vec2(0.5, 0.5);
struct ivec5
{
int x;
int y;
int z;
int w;
int u;
};
struct ivec6
{
int x;
int y;
int z;
int w;
int u;
int v;
};
uniform float NAN;
${e.defineSpecialNaN}
${e.defineSpecialInf}
${e.defineRound}
int imod(int x, int y) {
return x - y * (x / y);
}
int idiv(int a, int b, float sign) {
int res = a / b;
int mod = imod(a, b);
if (sign < 0. && mod != 0) {
res -= 1;
}
return res;
}
//Based on the work of Dave Hoskins
//https://www.shadertoy.com/view/4djSRW
#define HASHSCALE1 443.8975
float random(float seed){
vec2 p = resultUV * seed;
vec3 p3 = fract(vec3(p.xyx) * HASHSCALE1);
p3 += dot(p3, p3.yzx + 19.19);
return fract((p3.x + p3.y) * p3.z);
}
2022-04-11 17:45:24 +02:00
${SQ}
${TQ}
2022-04-14 17:47:08 +02:00
${NQ}
`}var SQ=`
2022-02-10 18:27:21 +01:00
vec2 uvFromFlat(int texNumR, int texNumC, int index) {
int texR = index / texNumC;
int texC = index - texR * texNumC;
return (vec2(texC, texR) + halfCR) / vec2(texNumC, texNumR);
}
vec2 packedUVfrom1D(int texNumR, int texNumC, int index) {
int texelIndex = index / 2;
int texR = texelIndex / texNumC;
int texC = texelIndex - texR * texNumC;
return (vec2(texC, texR) + halfCR) / vec2(texNumC, texNumR);
}
2022-04-14 17:47:08 +02:00
`,TQ=`
2022-02-10 18:27:21 +01:00
vec2 packedUVfrom2D(int texelsInLogicalRow, int texNumR,
int texNumC, int row, int col) {
int texelIndex = (row / 2) * texelsInLogicalRow + (col / 2);
int texR = texelIndex / texNumC;
int texC = texelIndex - texR * texNumC;
return (vec2(texC, texR) + halfCR) / vec2(texNumC, texNumR);
}
2022-04-14 17:47:08 +02:00
`,NQ=`
2022-02-10 18:27:21 +01:00
vec2 packedUVfrom3D(int texNumR, int texNumC,
int texelsInBatch, int texelsInLogicalRow, int b,
int row, int col) {
int index = b * texelsInBatch + (row / 2) * texelsInLogicalRow + (col / 2);
int texR = index / texNumC;
int texC = index - texR * texNumC;
return (vec2(texC, texR) + halfCR) / vec2(texNumC, texNumR);
}
2022-04-14 17:47:08 +02:00
`,CQ=`
2022-02-10 18:27:21 +01:00
float getChannel(vec4 frag, vec2 innerDims) {
vec2 modCoord = mod(innerDims, 2.);
return modCoord.x == 0. ?
(modCoord.y == 0. ? frag.r : frag.g) :
(modCoord.y == 0. ? frag.b : frag.a);
}
float getChannel(vec4 frag, int dim) {
float modCoord = mod(float(dim), 2.);
return modCoord == 0. ? frag.r : frag.g;
}
2022-04-14 17:47:08 +02:00
`;function IS(){return`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
return 0;
}
2022-04-14 17:47:08 +02:00
`}function EQ(e,t,r){let n=[Math.ceil(t[0]/2),Math.ceil(t[1]/2)];return n[0]===1?r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
return 2 * int(resultUV.x * ceil(float(outTexShape[1]) / 2.0));
}
`:`
int getOutputCoords() {
2022-04-01 15:13:32 +02:00
return 2 * int(resultUV.x * ${n[1]}.0);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`:n[1]===1?r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
return 2 * int(resultUV.y * ceil(float(outTexShape[0]) / 2.0));
}
`:`
int getOutputCoords() {
2022-04-01 15:13:32 +02:00
return 2 * int(resultUV.y * ${n[0]}.0);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`:r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
ivec2 packedTexShape = ivec2(ceil(float(outTexShape[0]) / 2.0), ceil(float(outTexShape[1]) / 2.0));
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(packedTexShape[0], packedTexShape[1]));
return 2 * (resTexRC.x * packedTexShape[1] + resTexRC.y);
}
`:`
int getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
2022-04-01 15:13:32 +02:00
vec2(${n[0]}, ${n[1]}));
return 2 * (resTexRC.x * ${n[1]} + resTexRC.y);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function RQ(e,t,r){return t[0]===1?r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
return int(resultUV.x * float(outTexShape[1]));
}
`:`
int getOutputCoords() {
return int(resultUV.x * ${t[1]}.0);
}
2022-04-01 15:13:32 +02:00
`:t[1]===1?r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
return int(resultUV.y * float(outTexShape[0]));
}
`:`
int getOutputCoords() {
return int(resultUV.y * ${t[0]}.0);
}
2022-04-01 15:13:32 +02:00
`:r?`
2022-02-10 18:27:21 +01:00
int getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
return resTexRC.x * outTexShape[1] + resTexRC.y;
}
`:`
int getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
return resTexRC.x * ${t[1]} + resTexRC.y;
}
2022-04-14 17:47:08 +02:00
`}function MQ(e,t,r){if(r)return`
2022-02-10 18:27:21 +01:00
ivec3 getOutputCoords() {
ivec2 packedTexShape = ivec2(ceil(float(outTexShape[0]) / 2.0), ceil(float(outTexShape[1]) / 2.0));
int texelsInLogicalRow = int(ceil(float(outShape[2]) / 2.0));
int texelsInBatch = texelsInLogicalRow * int(ceil(float(outShape[1]) / 2.0));
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(packedTexShape[0], packedTexShape[1]));
int index = resTexRC.x * packedTexShape[1] + resTexRC.y;
int b = index / texelsInBatch;
index -= b * texelsInBatch;
int r = 2 * (index / texelsInLogicalRow);
int c = imod(index, texelsInLogicalRow) * 2;
return ivec3(b, r, c);
}
2022-04-01 15:13:32 +02:00
`;let n=[Math.ceil(t[0]/2),Math.ceil(t[1]/2)],a=Math.ceil(e[2]/2),s=a*Math.ceil(e[1]/2);return`
2022-02-10 18:27:21 +01:00
ivec3 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
2022-04-01 15:13:32 +02:00
vec2(${n[0]}, ${n[1]}));
int index = resTexRC.x * ${n[1]} + resTexRC.y;
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
int b = index / ${s};
index -= b * ${s};
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
int r = 2 * (index / ${a});
int c = imod(index, ${a}) * 2;
2022-02-10 18:27:21 +01:00
return ivec3(b, r, c);
}
2022-04-14 17:47:08 +02:00
`}function FQ(e,t,r){if(r)return`
2022-02-10 18:27:21 +01:00
ivec3 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
int index = resTexRC.x * outTexShape[1] + resTexRC.y;
2022-04-14 17:47:08 +02:00
${g0(["r","c","d"],e)}
2022-02-10 18:27:21 +01:00
return ivec3(r, c, d);
}
2022-04-14 17:47:08 +02:00
`;let n=$l(["r","c","d"],e);return`
2022-02-10 18:27:21 +01:00
ivec3 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
return ivec3(r, c, d);
}
2022-04-14 17:47:08 +02:00
`}function $Q(e,t,r){if(r)return`
2022-02-10 18:27:21 +01:00
ivec4 getOutputCoords() {
ivec2 packedTexShape = ivec2(ceil(float(outTexShape[0]) / 2.0), ceil(float(outTexShape[1]) / 2.0));
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(packedTexShape[0], packedTexShape[1]));
int index = resTexRC.x * packedTexShape[1] + resTexRC.y;
int texelsInLogicalRow = int(ceil(float(outShape[3]) / 2.0));
int texelsInBatch = texelsInLogicalRow * int(ceil(float(outShape[2]) / 2.0));
int texelsInBatchN = texelsInBatch * outShape[1];
int b2 = index / texelsInBatchN;
index -= b2 * texelsInBatchN;
int b = index / texelsInBatch;
index -= b * texelsInBatch;
int r = 2 * (index / texelsInLogicalRow);
int c = imod(index, texelsInLogicalRow) * 2;
return ivec4(b2, b, r, c);
}
2022-04-01 15:13:32 +02:00
`;let n=[Math.ceil(t[0]/2),Math.ceil(t[1]/2)],a=Math.ceil(e[e.length-1]/2),s=a*Math.ceil(e[e.length-2]/2),i=s,o="",l="b, r, c";for(let u=2;u<e.length-1;u++)i*=e[e.length-u-1],o=`
int b${u} = index / ${i};
index -= b${u} * ${i};
`+o,l=`b${u}, `+l;return`
2022-02-10 18:27:21 +01:00
ivec${e.length} getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
2022-04-01 15:13:32 +02:00
vec2(${n[0]}, ${n[1]}));
int index = resTexRC.x * ${n[1]} + resTexRC.y;
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${o}
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
int b = index / ${s};
index -= b * ${s};
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
int r = 2 * (index / ${a});
int c = imod(index, ${a}) * 2;
2022-02-10 18:27:21 +01:00
return ivec${e.length}(${l});
}
2022-04-14 17:47:08 +02:00
`}function PQ(e,t,r){if(r)return`
2022-02-10 18:27:21 +01:00
ivec4 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
int index = resTexRC.x * outTexShape[1] + resTexRC.y;
2022-04-14 17:47:08 +02:00
${g0(["r","c","d","d2"],e)}
2022-02-10 18:27:21 +01:00
return ivec4(r, c, d, d2);
}
2022-04-14 17:47:08 +02:00
`;let n=$l(["r","c","d","d2"],e);return`
2022-02-10 18:27:21 +01:00
ivec4 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
return ivec4(r, c, d, d2);
}
2022-04-14 17:47:08 +02:00
`}function _Q(e,t){let r=$l(["r","c","d","d2","d3"],e);return`
2022-02-10 18:27:21 +01:00
ivec5 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx * vec2(${t[0]},
${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
ivec5 outShape = ivec5(r, c, d, d2, d3);
return outShape;
}
2022-04-14 17:47:08 +02:00
`}function zQ(e,t){let r=$l(["r","c","d","d2","d3","d4"],e);return`
2022-02-10 18:27:21 +01:00
ivec6 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
ivec6 result = ivec6(r, c, d, d2, d3, d4);
return result;
}
2022-04-14 17:47:08 +02:00
`}function OQ(e,t,r){let n=[Math.ceil(t[0]/2),Math.ceil(t[1]/2)];if(w.arraysEqual(e,t))return r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
ivec2 packedTexShape = ivec2(ceil(float(outTexShape[0]) / 2.0), ceil(float(outTexShape[1]) / 2.0));
return 2 * ivec2(resultUV.yx * vec2(packedTexShape[0], packedTexShape[1]));
}
`:`
ivec2 getOutputCoords() {
2022-04-01 15:13:32 +02:00
return 2 * ivec2(resultUV.yx * vec2(${n[0]}, ${n[1]}));
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let a=Math.ceil(e[1]/2);return r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
ivec2 packedTexShape = ivec2(ceil(float(outTexShape[0]) / 2.0), ceil(float(outTexShape[1]) / 2.0));
int texelsInLogicalRow = int(ceil(float(outShape[1]) / 2.0));
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(packedTexShape[0], packedTexShape[1]));
int index = resTexRC.x * packedTexShape[1] + resTexRC.y;
int r = 2 * (index / texelsInLogicalRow);
int c = imod(index, texelsInLogicalRow) * 2;
return ivec2(r, c);
}
`:`
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
2022-04-01 15:13:32 +02:00
vec2(${n[0]}, ${n[1]}));
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
int index = resTexRC.x * ${n[1]} + resTexRC.y;
int r = 2 * (index / ${a});
int c = imod(index, ${a}) * 2;
2022-02-10 18:27:21 +01:00
return ivec2(r, c);
}
2022-04-14 17:47:08 +02:00
`}function DQ(e,t,r){return w.arraysEqual(e,t)?r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
return ivec2(resultUV.yx * vec2(outTexShape[0], outTexShape[1]));
}
`:`
ivec2 getOutputCoords() {
return ivec2(resultUV.yx * vec2(${t[0]}, ${t[1]}));
}
2022-04-01 15:13:32 +02:00
`:e[1]===1?r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
int index = resTexRC.x * outTexShape[1] + resTexRC.y;
return ivec2(index, 0);
}
`:`
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
return ivec2(index, 0);
}
2022-04-01 15:13:32 +02:00
`:e[0]===1?r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
int index = resTexRC.x * outTexShape[1] + resTexRC.y;
return ivec2(0, index);
}
`:`
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
return ivec2(0, index);
}
2022-04-01 15:13:32 +02:00
`:r?`
2022-02-10 18:27:21 +01:00
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(outTexShape[0], outTexShape[1]));
int index = resTexRC.x * outTexShape[1] + resTexRC.y;
int r = index / outShape[1];
int c = index - r * outShape[1];
return ivec2(r, c);
}
`:`
ivec2 getOutputCoords() {
ivec2 resTexRC = ivec2(resultUV.yx *
vec2(${t[0]}, ${t[1]}));
int index = resTexRC.x * ${t[1]} + resTexRC.y;
int r = index / ${e[1]};
int c = index - r * ${e[1]};
return ivec2(r, c);
}
2022-04-14 17:47:08 +02:00
`}function Pl(e){return`offset${e}`}function LQ(e){let t=e.name,r="get"+t.charAt(0).toUpperCase()+t.slice(1),n=Gr();return`
2022-04-01 15:13:32 +02:00
vec4 ${r}() {
return ${n.texture2D}(${t}, halfCR);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function BQ(e,t){let r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1);if(e.shapeInfo.isUniform)return`float ${n}() {return ${r};}`;let[a,s]=e.shapeInfo.texShape;if(a===1&&s===1)return`
2022-04-01 15:13:32 +02:00
float ${n}() {
return sampleTexture(${r}, halfCR);
}
2022-04-14 17:47:08 +02:00
`;let i=Pl(r);if(t)return`
2022-04-01 15:13:32 +02:00
float ${n}() {
vec2 uv = uvFromFlat(${r}TexShape[0], ${r}TexShape[1], ${i});
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let[o,l]=e.shapeInfo.texShape;return`
float ${n}() {
vec2 uv = uvFromFlat(${o}, ${l}, ${i});
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function WQ(e,t){let r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1),a=e.shapeInfo.texShape,s=Gr();if(t)return`
2022-04-01 15:13:32 +02:00
vec4 ${n}(int index) {
ivec2 packedTexShape = ivec2(ceil(float(${r}TexShape[0]) / 2.0), ceil(float(${r}TexShape[1]) / 2.0));
2022-02-10 18:27:21 +01:00
vec2 uv = packedUVfrom1D(
packedTexShape[0], packedTexShape[1], index);
2022-04-01 15:13:32 +02:00
return ${s.texture2D}(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let i=[Math.ceil(a[0]/2),Math.ceil(a[1]/2)];return`
vec4 ${n}(int index) {
2022-02-10 18:27:21 +01:00
vec2 uv = packedUVfrom1D(
2022-04-01 15:13:32 +02:00
${i[0]}, ${i[1]}, index);
return ${s.texture2D}(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function VQ(e,t){let r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1);if(e.shapeInfo.isUniform)return`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let a=e.shapeInfo.texShape,s=a[0],i=a[1];if(i===1&&s===1)return`
float ${n}(int index) {
return sampleTexture(${r}, halfCR);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let o=Pl(r);return i===1?t?`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
vec2 uv = vec2(0.5, (float(index + ${o}) + 0.5) / float(${r}TexShape[0]));
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
vec2 uv = vec2(0.5, (float(index + ${o}) + 0.5) / ${s}.0);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`:s===1?t?`
float ${n}(int index) {
vec2 uv = vec2((float(index + ${o}) + 0.5) / float(${r}TexShape[1]), 0.5);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
vec2 uv = vec2((float(index + ${o}) + 0.5) / ${i}.0, 0.5);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
`:t?`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
vec2 uv = uvFromFlat(${r}TexShape[0], ${r}TexShape[1], index + ${o});
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${n}(int index) {
vec2 uv = uvFromFlat(${s}, ${i}, index + ${o});
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function UQ(e,t){let r=e.shapeInfo.logicalShape,n=e.name,a="get"+n.charAt(0).toUpperCase()+n.slice(1),s=e.shapeInfo.texShape,i=s[0],o=s[1],l=Gr();if(s!=null&&w.arraysEqual(r,s))return t?`
2022-04-01 15:13:32 +02:00
vec4 ${a}(int row, int col) {
vec2 uv = (vec2(col, row) + halfCR) / vec2(${n}TexShape[1], ${n}TexShape[0]);
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
return ${l.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
vec4 ${a}(int row, int col) {
vec2 uv = (vec2(col, row) + halfCR) / vec2(${o}.0, ${i}.0);
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
return ${l.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`;if(t)return`
2022-04-01 15:13:32 +02:00
vec4 ${a}(int row, int col) {
ivec2 packedTexShape = ivec2(ceil(float(${n}TexShape[0]) / 2.0), ceil(float(${n}TexShape[1]) / 2.0));
int valuesPerRow = int(ceil(float(${n}Shape[1]) / 2.0));
2022-02-10 18:27:21 +01:00
vec2 uv = packedUVfrom2D(valuesPerRow, packedTexShape[0], packedTexShape[1], row, col);
2022-04-01 15:13:32 +02:00
return ${l.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let u=[Math.ceil(s[0]/2),Math.ceil(s[1]/2)],d=Math.ceil(r[1]/2);return`
vec4 ${a}(int row, int col) {
vec2 uv = packedUVfrom2D(${d}, ${u[0]}, ${u[1]}, row, col);
return ${l.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function GQ(e,t){let r=e.shapeInfo.logicalShape,n=e.name,a="get"+n.charAt(0).toUpperCase()+n.slice(1),s=e.shapeInfo.texShape;if(s!=null&&w.arraysEqual(r,s)){if(t)return`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
vec2 uv = (vec2(col, row) + halfCR) / vec2(${n}TexShape[1], ${n}TexShape[0]);
return sampleTexture(${n}, uv);
}
`;let p=s[0],c=s[1];return`
float ${a}(int row, int col) {
vec2 uv = (vec2(col, row) + halfCR) / vec2(${c}.0, ${p}.0);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}let{newShape:i,keptDims:o}=w.squeezeShape(r),l=i;if(l.length<r.length){let p=Id(e,l),c=["row","col"];return`
${wd(p,t)}
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
2022-04-14 17:47:08 +02:00
return ${a}(${Sd(c,o)});
2022-02-10 18:27:21 +01:00
}
`}if(e.shapeInfo.isUniform)return`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
int index = round(dot(vec2(row, col), vec2(${r[1]}, 1)));
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-04-01 15:13:32 +02:00
}
2022-04-14 17:47:08 +02:00
`;let u=s[0],d=s[1],h=Pl(n);return d===1?t?`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
float index = dot(vec3(row, col, ${h}), vec3(${n}Shape[1], 1, 1));
vec2 uv = vec2(0.5, (index + 0.5) / float(${n}TexShape[0]));
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
float index = dot(vec3(row, col, ${h}), vec3(${r[1]}, 1, 1));
2022-02-17 14:15:57 +01:00
vec2 uv = vec2(0.5, (index + 0.5) / ${u}.0);
2022-04-01 15:13:32 +02:00
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-02-17 14:15:57 +01:00
`:u===1?t?`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
float index = dot(vec3(row, col, ${h}), vec3(${n}Shape[1], 1, 1));
vec2 uv = vec2((index + 0.5) / float(${n}TexShape[1]), 0.5);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
float index = dot(vec3(row, col, ${h}), vec3(${r[1]}, 1, 1));
vec2 uv = vec2((index + 0.5) / ${d}.0, 0.5);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:t?`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${n}Shape[1] + col + ${h};
vec2 uv = uvFromFlat(${n}TexShape[0], ${n}TexShape[1], index);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${r[1]} + col + ${h};
vec2 uv = uvFromFlat(${u}, ${d}, index);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function jQ(e,t){let r=e.shapeInfo.logicalShape,n=e.name,a="get"+n.charAt(0).toUpperCase()+n.slice(1),s=e.shapeInfo.texShape,i=[Math.ceil(s[0]/2),Math.ceil(s[1]/2)];if(r[0]===1){let p=r.slice(1),c=[1,2],f=Id(e,p),m=["b","row","col"];return`
${kS(f,t)}
2022-04-01 15:13:32 +02:00
vec4 ${a}(int b, int row, int col) {
2022-04-14 17:47:08 +02:00
return ${a}(${Sd(m,c)});
2022-04-01 15:13:32 +02:00
}
2022-04-11 17:45:24 +02:00
`}let o=Gr();if(t)return`
2022-04-01 15:13:32 +02:00
vec4 ${a}(int b, int row, int col) {
ivec2 packedTexShape = ivec2(ceil(float(${n}TexShape[0]) / 2.0), ceil(float(${n}TexShape[1]) / 2.0));
int valuesPerRow = int(ceil(float(${n}Shape[2]) / 2.0));
int texelsInBatch = valuesPerRow * int(ceil(float(${n}Shape[1]) / 2.0));
2022-02-10 18:27:21 +01:00
vec2 uv = packedUVfrom3D(
packedTexShape[0], packedTexShape[1], texelsInBatch, valuesPerRow, b, row, col);
2022-04-01 15:13:32 +02:00
return ${o.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let l=i[0],u=i[1],d=Math.ceil(r[2]/2),h=d*Math.ceil(r[1]/2);return`
vec4 ${a}(int b, int row, int col) {
2022-02-10 18:27:21 +01:00
vec2 uv = packedUVfrom3D(
2022-04-01 15:13:32 +02:00
${l}, ${u}, ${h}, ${d}, b, row, col);
return ${o.texture2D}(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function HQ(e,t){let r=e.shapeInfo.logicalShape,n=e.name,a="get"+n.charAt(0).toUpperCase()+n.slice(1),s=r[1]*r[2],i=r[2],{newShape:o,keptDims:l}=w.squeezeShape(r),u=o;if(u.length<r.length){let m=Id(e,u),g=["row","col","depth"];return`
${wd(m,t)}
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
2022-04-14 17:47:08 +02:00
return ${a}(${Sd(g,l)});
2022-02-10 18:27:21 +01:00
}
`}if(e.shapeInfo.isUniform)return`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
2022-02-10 18:27:21 +01:00
int index = round(dot(vec3(row, col, depth),
2022-04-01 15:13:32 +02:00
vec3(${s}, ${i}, 1)));
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let d=e.shapeInfo.texShape,h=d[0],p=d[1],c=e.shapeInfo.flatOffset;if(p===s&&c==null)return t?`
float ${a}(int row, int col, int depth) {
int stride1 = ${n}Shape[2];
2022-02-10 18:27:21 +01:00
float texR = float(row);
float texC = dot(vec2(col, depth), vec2(stride1, 1));
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${n}TexShape[1], ${n}TexShape[0]);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
2022-02-10 18:27:21 +01:00
float texR = float(row);
2022-04-01 15:13:32 +02:00
float texC = dot(vec2(col, depth), vec2(${i}, 1));
2022-02-10 18:27:21 +01:00
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${p}.0, ${h}.0);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;if(p===i&&c==null)return t?`
float ${a}(int row, int col, int depth) {
float texR = dot(vec2(row, col), vec2(${n}Shape[1], 1));
2022-02-10 18:27:21 +01:00
float texC = float(depth);
2022-04-01 15:13:32 +02:00
vec2 uv = (vec2(texC, texR) + halfCR) / vec2(${n}TexShape[1], ${n}TexShape[0]);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
float texR = dot(vec2(row, col), vec2(${r[1]}, 1));
2022-02-10 18:27:21 +01:00
float texC = float(depth);
2022-04-01 15:13:32 +02:00
vec2 uv = (vec2(texC, texR) + halfCR) / vec2(${p}.0, ${h}.0);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let f=Pl(n);return t?`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int stride0 = ${n}Shape[1] * ${n}Shape[2];
int stride1 = ${n}Shape[2];
int index = row * ${s} + col * ${i} + depth + ${f};
vec2 uv = uvFromFlat(${n}TexShape[0], ${n}TexShape[1], index);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${s} + col * ${i} + depth + ${f};
vec2 uv = uvFromFlat(${h}, ${p}, index);
return sampleTexture(${n}, uv);
}
2022-04-14 17:47:08 +02:00
`}function qQ(e,t){let r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1),a=Gr();if(t)return`
2022-04-01 15:13:32 +02:00
vec4 ${n}(int b2, int b, int row, int col) {
int valuesPerRow = int(ceil(float(${r}Shape[3]) / 2.0));
int texelsInBatch = valuesPerRow * int(ceil(float(${r}Shape[2]) / 2.0));
2022-02-10 18:27:21 +01:00
int index = b * texelsInBatch + (row / 2) * valuesPerRow + (col / 2);
2022-04-01 15:13:32 +02:00
texelsInBatch *= ${r}Shape[1];
2022-02-10 18:27:21 +01:00
index = b2 * texelsInBatch + index;
2022-04-01 15:13:32 +02:00
ivec2 packedTexShape = ivec2(ceil(float(${r}TexShape[0]) / 2.0), ceil(float(${r}TexShape[1]) / 2.0));
2022-02-10 18:27:21 +01:00
int texR = index / packedTexShape[1];
int texC = index - texR * packedTexShape[1];
2022-04-01 15:13:32 +02:00
vec2 uv = (vec2(texC, texR) + halfCR) / vec2(packedTexShape[1], packedTexShape[0]); return ${a.texture2D}(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let s=e.shapeInfo.logicalShape,i=s.length,o=e.shapeInfo.texShape,l=[Math.ceil(o[0]/2),Math.ceil(o[1]/2)],u=l[0],d=l[1],h=Math.ceil(s[i-1]/2),p=h*Math.ceil(s[i-2]/2),c="int b, int row, int col",f=`b * ${p} + (row / 2) * ${h} + (col / 2)`;for(let m=2;m<i-1;m++)c=`int b${m}, `+c,p*=s[i-m-1],f=`b${m} * ${p} + `+f;return`
vec4 ${n}(${c}) {
2022-02-10 18:27:21 +01:00
int index = ${f};
2022-04-01 15:13:32 +02:00
int texR = index / ${d};
int texC = index - texR * ${d};
vec2 uv = (vec2(texC, texR) + halfCR) / vec2(${d}, ${u});
return ${a.texture2D}(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function KQ(e,t){let r=e.shapeInfo.logicalShape,n=e.name,a="get"+n.charAt(0).toUpperCase()+n.slice(1),s=r[3],i=r[2]*s,o=r[1]*i,{newShape:l,keptDims:u}=w.squeezeShape(r);if(l.length<r.length){let A=Id(e,l),x=["row","col","depth","depth2"];return`
${wd(A,t)}
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-04-14 17:47:08 +02:00
return ${a}(${Sd(x,u)});
2022-02-10 18:27:21 +01:00
}
`}if(e.shapeInfo.isUniform)return`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
int index = round(dot(vec4(row, col, depth, depth2),
2022-04-01 15:13:32 +02:00
vec4(${o}, ${i}, ${s}, 1)));
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let d=e.shapeInfo.flatOffset,h=e.shapeInfo.texShape,p=h[0],c=h[1],f=`int stride2 = ${n}Shape[3];`,m=`int stride1 = ${n}Shape[2] * stride2;`,g=`int stride0 = ${n}Shape[1] * stride1;`;if(c===o&&d==null)return t?`
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
${f}
${m}
float texR = float(row);
float texC =
dot(vec3(col, depth, depth2),
vec3(stride1, stride2, 1));
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${n}TexShape[1], ${n}TexShape[0]);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
float texR = float(row);
float texC =
dot(vec3(col, depth, depth2),
2022-04-01 15:13:32 +02:00
vec3(${i}, ${s}, 1));
2022-02-10 18:27:21 +01:00
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${c}.0, ${p}.0);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;if(c===s&&d==null)return t?`
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
float texR = dot(vec3(row, col, depth),
2022-04-01 15:13:32 +02:00
vec3(${n}Shape[1] * ${n}Shape[2], ${n}Shape[2], 1));
2022-02-10 18:27:21 +01:00
float texC = float(depth2);
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${n}TexShape[1], ${n}TexShape[0]);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
float texR = dot(vec3(row, col, depth),
2022-04-01 15:13:32 +02:00
vec3(${r[1]*r[2]}, ${r[2]}, 1));
2022-02-10 18:27:21 +01:00
float texC = float(depth2);
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${c}.0, ${p}.0);
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let y=Pl(n);return t?`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
${f}
${m}
${g}
int index = row * stride0 + col * stride1 +
depth * stride2 + depth2;
2022-04-01 15:13:32 +02:00
vec2 uv = uvFromFlat(${n}TexShape[0], ${n}TexShape[1], index + ${y});
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
float ${a}(int row, int col, int depth, int depth2) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${o} + col * ${i} +
depth * ${s} + depth2;
vec2 uv = uvFromFlat(${p}, ${c}, index + ${y});
return sampleTexture(${n}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function XQ(e){let t=e.shapeInfo.logicalShape,r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1),a=t[4],s=t[3]*a,i=t[2]*s,o=t[1]*i,{newShape:l,keptDims:u}=w.squeezeShape(t);if(l.length<t.length){let m=Id(e,l),g=["row","col","depth","depth2","depth3"];return`
${wd(m)}
2022-04-01 15:13:32 +02:00
float ${n}(int row, int col, int depth, int depth2, int depth3) {
2022-04-14 17:47:08 +02:00
return ${n}(${Sd(g,u)});
2022-02-10 18:27:21 +01:00
}
`}if(e.shapeInfo.isUniform)return`
2022-04-01 15:13:32 +02:00
float ${n}(int row, int col, int depth, int depth2, int depth3) {
2022-02-10 18:27:21 +01:00
float index = dot(
vec4(row, col, depth, depth2),
2022-04-01 15:13:32 +02:00
vec4(${o}, ${i}, ${s}, ${a})) +
2022-02-10 18:27:21 +01:00
depth3;
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let d=e.shapeInfo.flatOffset,h=e.shapeInfo.texShape,p=h[0],c=h[1];if(c===o&&d==null)return`
float ${n}(int row, int col, int depth, int depth2, int depth3) {
2022-02-10 18:27:21 +01:00
int texR = row;
float texC = dot(vec4(col, depth, depth2, depth3),
2022-04-01 15:13:32 +02:00
vec4(${i}, ${s}, ${a}, 1));
2022-02-10 18:27:21 +01:00
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${c}.0, ${p}.0);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;if(c===a&&d==null)return`
float ${n}(int row, int col, int depth, int depth2, int depth3) {
2022-02-10 18:27:21 +01:00
float texR = dot(
vec4(row, col, depth, depth2),
vec4(${t[1]*t[2]*t[3]},
${t[2]*t[3]}, ${t[3]}, 1));
int texC = depth3;
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${c}.0, ${p}.0);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let f=Pl(r);return`
2022-04-01 15:13:32 +02:00
float ${n}(int row, int col, int depth, int depth2, int depth3) {
2022-02-10 18:27:21 +01:00
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${o} + col * ${i} + depth * ${s} +
depth2 * ${a} + depth3 + ${f};
vec2 uv = uvFromFlat(${p}, ${c}, index);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function ZQ(e){let t=e.shapeInfo.logicalShape,r=e.name,n="get"+r.charAt(0).toUpperCase()+r.slice(1),{newShape:a,keptDims:s}=w.squeezeShape(t);if(a.length<t.length){let g=Id(e,a),y=["row","col","depth","depth2","depth3","depth4"];return`
${wd(g)}
2022-04-01 15:13:32 +02:00
float ${n}(int row, int col, int depth,
2022-02-10 18:27:21 +01:00
int depth2, int depth3, int depth4) {
2022-04-14 17:47:08 +02:00
return ${n}(${Sd(y,s)});
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`}let i=t[5],o=t[4]*i,l=t[3]*o,u=t[2]*l,d=t[1]*u;if(e.shapeInfo.isUniform)return`
float ${n}(int row, int col, int depth,
2022-02-10 18:27:21 +01:00
int depth2, int depth3, int depth4) {
int index = round(dot(
vec4(row, col, depth, depth2),
2022-04-01 15:13:32 +02:00
vec4(${d}, ${u}, ${l}, ${o})) +
2022-02-10 18:27:21 +01:00
dot(
vec2(depth3, depth4),
2022-04-01 15:13:32 +02:00
vec2(${i}, 1)));
2022-04-14 17:47:08 +02:00
${kd(e)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let h=e.shapeInfo.flatOffset,p=e.shapeInfo.texShape,c=p[0],f=p[1];if(f===d&&h==null)return`
float ${n}(int row, int col, int depth,
2022-02-10 18:27:21 +01:00
int depth2, int depth3, int depth4) {
int texR = row;
float texC = dot(vec4(col, depth, depth2, depth3),
2022-04-01 15:13:32 +02:00
vec4(${u}, ${l}, ${o}, ${i})) +
2022-02-10 18:27:21 +01:00
float(depth4);
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${f}.0, ${c}.0);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;if(f===i&&h==null)return`
float ${n}(int row, int col, int depth,
2022-02-10 18:27:21 +01:00
int depth2, int depth3, int depth4) {
float texR = dot(vec4(row, col, depth, depth2),
vec4(${t[1]*t[2]*t[3]*t[4]},
${t[2]*t[3]*t[4]},
${t[3]*t[4]},
${t[4]})) + float(depth3);
int texC = depth4;
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${f}.0, ${c}.0);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let m=Pl(r);return`
2022-04-01 15:13:32 +02:00
float ${n}(int row, int col, int depth,
2022-02-10 18:27:21 +01:00
int depth2, int depth3, int depth4) {
// Explicitly use integer operations as dot() only works on floats.
2022-04-01 15:13:32 +02:00
int index = row * ${d} + col * ${u} + depth * ${l} +
depth2 * ${o} + depth3 * ${i} + depth4 + ${m};
vec2 uv = uvFromFlat(${c}, ${f}, index);
return sampleTexture(${r}, uv);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function kd(e){let t=e.name,r=w.sizeFromShape(e.shapeInfo.logicalShape);return r<2?`return ${t};`:`
2022-04-01 15:13:32 +02:00
for (int i = 0; i < ${r}; i++) {
2022-02-10 18:27:21 +01:00
if (i == index) {
return ${t}[i];
}
}
2022-04-14 17:47:08 +02:00
`}function YQ(e,t){let r=e.name,n=r.charAt(0).toUpperCase()+r.slice(1),a="get"+n+"AtOutCoords",s=e.shapeInfo.logicalShape.length,i=t.logicalShape.length,o=wS(e.shapeInfo.logicalShape,t.logicalShape),l=gt(i),u=i-s,d,h=["x","y","z","w","u","v"];s===0?d="":i<2&&o.length>=1?d="coords = 0;":d=o.map(g=>`coords.${h[g+u]} = 0;`).join(`
2022-04-11 17:45:24 +02:00
`);let p="";i<2&&s>0?p="coords":p=e.shapeInfo.logicalShape.map((g,y)=>`coords.${h[y+u]}`).join(", ");let c="return outputValue;",f=w.sizeFromShape(e.shapeInfo.logicalShape)===1,m=w.sizeFromShape(t.logicalShape)===1;if(s===1&&!f&&!m)c=`
2022-02-10 18:27:21 +01:00
return vec4(outputValue.xy, outputValue.xy);
2022-04-01 15:13:32 +02:00
`;else if(f&&!m)i===1?c=`
2022-02-10 18:27:21 +01:00
return vec4(outputValue.x, outputValue.x, 0., 0.);
2022-04-01 15:13:32 +02:00
`:c=`
2022-02-10 18:27:21 +01:00
return vec4(outputValue.x);
2022-04-01 15:13:32 +02:00
`;else if(o.length){let g=s-2,y=s-1;o.indexOf(g)>-1&&o.indexOf(y)>-1?c="return vec4(outputValue.x);":o.indexOf(g)>-1?c="return vec4(outputValue.x, outputValue.y, outputValue.x, outputValue.y);":o.indexOf(y)>-1&&(c="return vec4(outputValue.xx, outputValue.zz);")}return`
vec4 ${a}() {
2022-02-10 18:27:21 +01:00
${l} coords = getOutputCoords();
2022-04-01 15:13:32 +02:00
${d}
vec4 outputValue = get${n}(${p});
2022-02-10 18:27:21 +01:00
${c}
}
2022-04-14 17:47:08 +02:00
`}function JQ(e,t){let r=e.name,n=r.charAt(0).toUpperCase()+r.slice(1),a="get"+n+"AtOutCoords",s=t.texShape,i=e.shapeInfo.texShape,o=e.shapeInfo.logicalShape.length,l=t.logicalShape.length;if(!e.shapeInfo.isUniform&&o===l&&e.shapeInfo.flatOffset==null&&w.arraysEqual(i,s))return`
2022-04-01 15:13:32 +02:00
float ${a}() {
return sampleTexture(${r}, resultUV);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;let u=gt(l),d=wS(e.shapeInfo.logicalShape,t.logicalShape),h=l-o,p,c=["x","y","z","w","u","v"];o===0?p="":l<2&&d.length>=1?p="coords = 0;":p=d.map(m=>`coords.${c[m+h]} = 0;`).join(`
2022-04-01 15:13:32 +02:00
`);let f="";return l<2&&o>0?f="coords":f=e.shapeInfo.logicalShape.map((m,g)=>`coords.${c[g+h]}`).join(", "),`
float ${a}() {
2022-02-17 14:15:57 +01:00
${u} coords = getOutputCoords();
2022-04-01 15:13:32 +02:00
${p}
return get${n}(${f});
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}function gt(e){if(e<=1)return"int";if(e===2)return"ivec2";if(e===3)return"ivec3";if(e===4)return"ivec4";if(e===5)return"ivec5";if(e===6)return"ivec6";throw Error(`GPU for rank ${e} is not yet supported`)}function lb(e,t,r){let{newShape:n,keptDims:a}=w.squeezeShape(t),s=t.length,i=e&&s===3&&t[0]===1,o=i?t.slice(1):n,l=!e&&s>1&&!w.arraysEqual(t,r)&&n.length<s||i;return{useSqueezeShape:l,uniformShape:l?o:t,keptDims:a}}function Id(e,t){let r=JSON.parse(JSON.stringify(e));return r.shapeInfo.logicalShape=t,r}function Sd(e,t){return t.map(r=>e[r]).join(", ")}function QQ(e,t,r,n){let a=r.map((d,h)=>{let p={logicalShape:d.shape,texShape:d.isUniform?null:d.texData.texShape,isUniform:d.isUniform,isPacked:d.isUniform?!1:d.texData.isPacked,flatOffset:null};return d.texData!=null&&d.texData.slice!=null&&d.texData.slice.flatOffset>0&&(p.flatOffset=d.texData.slice.flatOffset),{name:t.variableNames[h],shapeInfo:p}}),s=a.map(d=>d.shapeInfo),i={logicalShape:n.shape,texShape:n.texData.texShape,isUniform:!1,isPacked:n.texData.isPacked,flatOffset:null},o=yQ(a,i,t),l=eS(e.gl,o),u=e.createProgram(l);return Y().get("ENGINE_COMPILE_ONLY")?{program:t,fragmentShader:l,source:o,webGLProgram:u,inShapeInfos:s,outShapeInfo:i,uniformLocations:null,customUniformLocations:null,infLoc:null,nanLoc:null,inShapesLocations:null,inTexShapesLocations:null,outShapeLocation:null,outShapeStridesLocation:null,outTexShapeLocation:null}:{program:t,fragmentShader:l,source:o,webGLProgram:u,inShapeInfos:s,outShapeInfo:i,...SS(e,t,u)}}function SS(e,t,r){let n={},a={},s={},i=[],o,l,u,d=null,h=null;h=e.getUniformLocation(r,"NAN",!1),Y().getNumber("WEBGL_VERSION")===1&&(d=e.getUniformLocation(r,"INFINITY",!1));let p=!1;for(let c=0;c<t.variableNames.length;c++){let f=t.variableNames[c];n[f]=e.getUniformLocation(r,f,p),n[`offset${f}`]=e.getUniformLocation(r,`offset${f}`,p),t.enableShapeUniforms&&(a[`${f}Shape`]=e.getUniformLocation(r,`${f}Shape`,p),s[`${f}TexShape`]=e.getUniformLocation(r,`${f}TexShape`,p))}return 
t.enableShapeUniforms&&(o=e.getUniformLocation(r,"outShape",p),u=e.getUniformLocation(r,"outShapeStrides",p),l=e.getUniformLocation(r,"outTexShape",p)),t.customUniforms&&t.customUniforms.forEach((c,f)=>{i[f]=e.getUniformLocation(r,c.name,p)}),{uniformLocations:n,customUniformLocations:i,infLoc:d,nanLoc:h,inShapesLocations:a,inTexShapesLocations:s,outShapeLocation:o,outShapeStridesLocation:u,outTexShapeLocation:l}}function Rv(e,t){if(e.length!==t.length)throw Error(`Binary was compiled with ${e.length} inputs, but was executed with ${t.length} inputs`);e.forEach((r,n)=>{let a=r.logicalShape,s=t[n],i=s.shape;if(!w.arraysEqual(a,i))throw Error(`Binary was compiled with different shapes than the current args. Shapes ${a} and ${i} must match`);if(r.isUniform&&s.isUniform)return;let o=r.texShape,l=s.isUniform?null:s.texData.texShape;if(!w.arraysEqual(o,l))throw Error(`Binary was compiled with different texture shapes than the current args. Shape ${o} and ${l} must match`)})}function eee(e,t,r,n,a){t.program.enableShapeUniforms||(Rv(t.inShapeInfos,r),Rv([t.outShapeInfo],[n]));let s=n.texData.texture,i=n.texData.texShape;n.texData.isPacked?e.setOutputPackedMatrixTexture(s.texture,i[0],i[1]):e.setOutputMatrixTexture(s.texture,i[0],i[1]),e.setProgram(t.webGLProgram),Y().getNumber("WEBGL_VERSION")===1&&t.infLoc!==null&&e.gl.uniform1f(t.infLoc,1/0),t.nanLoc!==null&&e.gl.uniform1f(t.nanLoc,NaN),r.forEach((l,u)=>{let d=t.program.variableNames[u],h=t.uniformLocations[d],p=t.uniformLocations[`offset${d}`],c=t.inShapesLocations[`${d}Shape`],f=t.inTexShapesLocations[`${d}TexShape`];if(c){let{uniformShape:m}=lb(t.program.packedInputs,l.shape,l.texData.texShape);switch(m.length){case 1:e.gl.uniform1iv(c,new Int32Array(m));break;case 2:e.gl.uniform2iv(c,new Int32Array(m));break;case 3:e.gl.uniform3iv(c,new Int32Array(m));break;case 4:e.gl.uniform4iv(c,new 
Int32Array(m));break;default:break}}if(f&&e.gl.uniform2i(f,l.texData.texShape[0],l.texData.texShape[1]),h!=null){if(l.isUniform){if(w.sizeFromShape(l.shape)<2)e.gl.uniform1f(h,l.uniformValues[0]);else{let m=l.uniformValues;m instan
2022-02-10 18:27:21 +01:00
ivec3 outCoordsFromFlatIndex(int index) {
2022-04-14 17:47:08 +02:00
${this.enableShapeUniforms?g0(["r","c","d"],e):$l(["r","c","d"],e)}
2022-02-10 18:27:21 +01:00
return ivec3(r, c, d);
}
void main() {
ivec2 resTexRC = ivec2(resultUV.yx * vec2(texShape[0], texShape[1]));
int index = 4 * (resTexRC.x * texShape[1] + resTexRC.y);
vec4 result = vec4(0.);
for (int i=0; i<4; i++) {
int flatIndex = index + i;
ivec3 rc = outCoordsFromFlatIndex(flatIndex);
result[i] = getA(rc.x, rc.y, rc.z);
}
${t.output} = result;
}
2022-04-14 17:47:08 +02:00
`}},nee=class{constructor(e){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.outPackingScheme=0,this.customUniforms=[{name:"texShape",type:"ivec2"}];let t=Gr();this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length),this.userCode=`
2022-02-10 18:27:21 +01:00
ivec3 outCoordsFromFlatIndex(int index) {
2022-04-14 17:47:08 +02:00
${this.enableShapeUniforms?g0(["r","c","d"],e):$l(["r","c","d"],e)}
2022-02-10 18:27:21 +01:00
return ivec3(r, c, d);
}
void main() {
ivec2 resTexRC = ivec2(resultUV.yx * vec2(texShape[0], texShape[1]));
int index = 4 * (resTexRC.x * texShape[1] + resTexRC.y);
vec4 result = vec4(0.);
for (int i=0; i<4; i++) {
int flatIndex = index + i;
ivec3 rc = outCoordsFromFlatIndex(flatIndex);
result[i] = getChannel(getA(rc.x, rc.y, rc.z), vec2(rc.y, rc.z));
}
${t.output} = result;
}
2022-04-14 17:47:08 +02:00
`}},aee=class{constructor(e){this.variableNames=["A"],this.outTexUsage=3;let t=Gr();this.outputShape=e,this.userCode=`
${vS}
2022-02-10 18:27:21 +01:00
void main() {
float x = getAAtOutCoords();
${t.output} = encode_float(x);
}
2022-04-14 17:47:08 +02:00
`}},see=class{constructor(e){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!1,this.outTexUsage=3;let t=Gr();this.outputShape=e,this.userCode=`
${vS}
2022-02-10 18:27:21 +01:00
void main() {
ivec3 coords = getOutputCoords();
float x = getChannel(getAAtOutCoords(), vec2(coords.y, coords.z));
${t.output} = encode_float(x);
}
2022-04-14 17:47:08 +02:00
`}},iee=class{constructor(e,t=!1){this.variableNames=["A"],this.customUniforms=[{name:"texShape",type:"ivec2"}];let r=Gr();this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length);let n="result";t&&(n="floor(result * 255. + 0.5)"),this.userCode=`
${this.enableShapeUniforms?ob():ib(e)}
2022-02-10 18:27:21 +01:00
void main() {
ivec3 coords = getOutputCoords();
int flatIndex = getFlatIndex(coords);
int offset = imod(flatIndex, 4);
flatIndex = idiv(flatIndex, 4, 1.);
int r = flatIndex / texShape[1];
int c = imod(flatIndex, texShape[1]);
vec2 uv = (vec2(c, r) + halfCR) / vec2(texShape[1], texShape[0]);
2022-04-01 15:13:32 +02:00
vec4 values = ${r.texture2D}(A, uv);
2022-02-10 18:27:21 +01:00
float result;
if(offset == 0) {
result = values[0];
} else if(offset == 1) {
result = values[1];
} else if(offset == 2) {
result = values[2];
} else {
result = values[3];
}
2022-04-01 15:13:32 +02:00
${r.output} = vec4(${n}, 0., 0., 0.);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},oee=class{constructor(e,t=!1){this.variableNames=["A"],this.packedInputs=!1,this.packedOutput=!0,this.customUniforms=[{name:"texShape",type:"ivec2"}];let r=Gr();this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length);let n="",a="result";t&&(a="floor(result * 255. + 0.5)");for(let s=0;s<=1;s++)for(let i=0;i<=1;i++){let o=s*2+i;n+=`
2022-02-10 18:27:21 +01:00
localCoords = coords;
2022-04-01 15:13:32 +02:00
if(localCoords[2] + ${i} < ${this.enableShapeUniforms?"outShape[2]":`${e[2]}`}) {
localCoords[2] += ${i};
if (localCoords[1] + ${s} < ${this.enableShapeUniforms?"outShape[1]":`${e[1]}`}) {
localCoords[1] += ${s};
2022-02-10 18:27:21 +01:00
flatIndex = getFlatIndex(localCoords);
offset = imod(flatIndex, 4);
flatIndex = idiv(flatIndex, 4, 1.);
int r = flatIndex / texShape[1];
int c = imod(flatIndex, texShape[1]);
vec2 uv = (vec2(c, r) + halfCR) / vec2(texShape[1], texShape[0]);
2022-04-01 15:13:32 +02:00
values = ${r.texture2D}(A, uv);
2022-02-10 18:27:21 +01:00
if (offset == 0) {
2022-04-01 15:13:32 +02:00
result[${o}] = values[0];
2022-02-10 18:27:21 +01:00
} else if (offset == 1) {
2022-04-01 15:13:32 +02:00
result[${o}] = values[1];
2022-02-10 18:27:21 +01:00
} else if (offset == 2) {
2022-04-01 15:13:32 +02:00
result[${o}] = values[2];
2022-02-10 18:27:21 +01:00
} else {
2022-04-01 15:13:32 +02:00
result[${o}] = values[3];
2022-02-10 18:27:21 +01:00
}
}
}
`}this.userCode=`
2022-04-14 17:47:08 +02:00
${this.enableShapeUniforms?ob():ib(e)}
2022-02-10 18:27:21 +01:00
void main() {
ivec3 coords = getOutputCoords();
vec4 result = vec4(0.);
int flatIndex, r, c, offset;
ivec3 localCoords;
vec2 uv;
vec4 values;
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${r.output} = ${a};
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},TS={};Le(TS,{bindVertexProgramAttributeStreams:()=>_S,createBufferFromOutputTexture:()=>DS,createFloat16MatrixTexture:()=>MS,createFloat16PackedMatrixTexture:()=>PS,createFloat32MatrixTexture:()=>RS,createIndexBuffer:()=>ES,createPackedMatrixTexture:()=>$S,createUnsignedBytesMatrixTexture:()=>FS,createVertexBuffer:()=>CS,createVertexShader:()=>NS,downloadByteEncodedFloatMatrixFromOutputTexture:()=>BS,downloadFloat32MatrixFromBuffer:()=>LS,downloadMatrixFromPackedOutputTexture:()=>VS,downloadPackedMatrixFromBuffer:()=>WS,getInternalFormatForFloat16MatrixTexture:()=>db,getInternalFormatForFloat16PackedMatrixTexture:()=>cb,getInternalFormatForFloat32MatrixTexture:()=>ub,getInternalFormatForPackedMatrixTexture:()=>hb,getInternalFormatForUnsignedBytesMatrixTexture:()=>pb,uploadDenseMatrixToTexture:()=>zS,uploadPixelDataToTexture:()=>OS});function NS(e){let t=Gr(),r=`${t.version}
2022-02-10 18:27:21 +01:00
precision highp float;
${t.attribute} vec3 clipSpacePos;
${t.attribute} vec2 uv;
${t.varyingVs} vec2 resultUV;
void main() {
gl_Position = vec4(clipSpacePos, 1);
resultUV = uv;
2022-04-14 17:47:08 +02:00
}`;return QI(e,r)}function CS(e){let t=new Float32Array([-1,1,0,0,1,-1,-1,0,0,0,1,1,0,1,1,1,-1,0,1,0]);return nS(e,t)}function ES(e){let t=new Uint16Array([0,1,2,2,1,3]);return aS(e,t)}function zh(e,t,r,n,a,s){iS(t,r);let i=sS(e),o=e.TEXTURE_2D;return we(e,()=>e.bindTexture(o,i)),we(e,()=>e.texParameteri(o,e.TEXTURE_WRAP_S,e.CLAMP_TO_EDGE)),we(e,()=>e.texParameteri(o,e.TEXTURE_WRAP_T,e.CLAMP_TO_EDGE)),we(e,()=>e.texParameteri(o,e.TEXTURE_MIN_FILTER,e.NEAREST)),we(e,()=>e.texParameteri(o,e.TEXTURE_MAG_FILTER,e.NEAREST)),Y().getNumber("WEBGL_VERSION")===1?we(e,()=>e.texImage2D(o,0,n,t,r,0,a,s,null)):we(e,()=>e.texStorage2D(o,1,n,t,r)),we(e,()=>e.bindTexture(e.TEXTURE_2D,null)),{texture:i,texShape:[r,t]}}function ub(e){return e.internalFormatFloat}function RS(e,t,r,n){let[a,s]=_h(t,r);return zh(e,a,s,ub(n),n.textureFormatFloat,e.FLOAT)}function db(e){return e.internalFormatHalfFloat}function MS(e,t,r,n){let[a,s]=_h(t,r);return zh(e,a,s,db(n),n.textureFormatFloat,n.textureTypeHalfFloat)}function pb(e){return e.downloadTextureFormat}function FS(e,t,r,n){let[a,s]=_h(t,r);return zh(e,a,s,pb(n),e.RGBA,e.UNSIGNED_BYTE)}function hb(e){return e.internalFormatPackedFloat}function $S(e,t,r,n){let[a,s]=bd(t,r);return zh(e,a,s,hb(n),e.RGBA,e.FLOAT)}function cb(e){return e.internalFormatPackedHalfFloat}function PS(e,t,r,n){let[a,s]=bd(t,r);return zh(e,a,s,cb(n),e.RGBA,n.textureTypeHalfFloat)}function _S(e,t,r){return we(e,()=>e.bindBuffer(e.ARRAY_BUFFER,r)),Hy(e,t,"clipSpacePos",r,3,20,0)&&Hy(e,t,"uv",r,2,20,12)}function zS(e,t,r,n,a,s){we(e,()=>e.bindTexture(e.TEXTURE_2D,t));let i,o,l;a instanceof Uint8Array?(i=new Uint8Array(r*n*4),o=e.UNSIGNED_BYTE,l=e.RGBA):(i=new Float32Array(r*n*4),o=e.FLOAT,l=s.internalFormatPackedFloat),i.set(a),Y().getNumber("WEBGL_VERSION")===2?we(e,()=>e.texSubImage2D(e.TEXTURE_2D,0,0,0,r,n,e.RGBA,o,i)):we(e,()=>e.texImage2D(e.TEXTURE_2D,0,l,r,n,0,e.RGBA,o,i)),we(e,()=>e.bindTexture(e.TEXTURE_2D,null))}function 
OS(e,t,r){we(e,()=>e.bindTexture(e.TEXTURE_2D,t)),r.data instanceof Uint8Array?Y().getNumber("WEBGL_VERSION")===2?we(e,()=>e.texSubImage2D(e.TEXTURE_2D,0,0,0,r.width,r.height,e.RGBA,e.UNSIGNED_BYTE,r.data)):we(e,()=>e.texImage2D(e.TEXTURE_2D,0,e.RGBA,r.width,r.height,0,e.RGBA,e.UNSIGNED_BYTE,r.data)):Y().getNumber("WEBGL_VERSION")===2?we(e,()=>e.texSubImage2D(e.TEXTURE_2D,0,0,0,e.RGBA,e.UNSIGNED_BYTE,r)):we(e,()=>e.texImage2D(e.TEXTURE_2D,0,e.RGBA,e.RGBA,e.UNSIGNED_BYTE,r)),we(e,()=>e.bindTexture(e.TEXTURE_2D,null))}function DS(e,t,r,n){let a=e.createBuffer();we(e,()=>e.bindBuffer(e.PIXEL_PACK_BUFFER,a));let s=4*4*t*r;return we(e,()=>e.bufferData(e.PIXEL_PACK_BUFFER,s,e.STREAM_READ)),we(e,()=>e.readPixels(0,0,r,t,e.RGBA,e.FLOAT,0)),we(e,()=>e.bindBuffer(e.PIXEL_PACK_BUFFER,null)),a}function LS(e,t,r){let n=e,a=new Float32Array(r);return n.bindBuffer(n.PIXEL_PACK_BUFFER,t),n.getBufferSubData(n.PIXEL_PACK_BUFFER,0,a),n.bindBuffer(n.PIXEL_PACK_BUFFER,null),a}function BS(e,t,r,n){let[a,s]=_h(t,r),i=4,o=new Uint8Array(nQ(t*r,i));return we(e,()=>e.readPixels(0,0,a,s,n.downloadTextureFormat,e.UNSIGNED_BYTE,o)),new Float32Array(o.buffer)}function WS(e,t,r,n,a,s,i,o){let l=e,u=new Float32Array(aQ(s,i));return l.bindBuffer(l.PIXEL_PACK_BUFFER,t),l.getBufferSubData(l.PIXEL_PACK_BUFFER,0,u),l.bindBuffer(l.PIXEL_PACK_BUFFER,null),u}function VS(e,t,r){let n=new Float32Array(t*r*4);return we(e,()=>e.readPixels(0,0,r,t,e.RGBA,e.FLOAT,n)),n}var yu=class{constructor(e){this.outputTexture=null,this.program=null,this.disposed=!1,this.vertexAttrsAreBound=!1,this.itemsToPoll=[];let t=Y().getNumber("WEBGL_VERSION");e!=null?(this.gl=e,m0(t,e)):this.gl=ya(t);let r="WEBGL_color_buffer_float",n="EXT_color_buffer_half_float";if(this.parallelCompilationExtension=this.gl.getExtension("KHR_parallel_shader_compile"),Y().getNumber("WEBGL_VERSION")===1){let 
a="OES_texture_float",s="OES_texture_half_float";if(this.textureFloatExtension=Sp(this.gl,a),Nn(this.gl,s))this.textureHalfFloatExtension=Sp(this.gl,s);else if(Y().get("WEBGL_FORCE_F16_TEXTURES"))throw new Error("GL context does not support half float textures, yet the environm
2022-02-10 18:27:21 +01:00
void main() {
setOutput(vec4(getA(), 0., 0., 0.));
}
2022-04-11 17:45:24 +02:00
`;else{let t=Lr("rc",this.rank),r=gt(this.rank),n=this.getOutOfBoundsCondition(t),a=this.getSetup(t),s=this.getOutput(t);this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${r} rc = getOutputCoords();
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
if(${n}) {
2022-02-10 18:27:21 +01:00
setOutput(vec4(0));
} else {
2022-04-01 15:13:32 +02:00
${a}
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
setOutput(vec4(${s}));
2022-02-10 18:27:21 +01:00
}
}
2022-04-01 15:13:32 +02:00
`}}getSourceCoordsArr(e){let t=[];for(let r=0;r<=1;r++)for(let n=0;n<=1;n++){let a=`${r===0?"r":"rp1"}, ${n===0?"c":"cp1"}`;for(let s=2;s<this.rank;s++)a=`${e[e.length-1-s]},`+a;t.push(a)}return t}getOutOfBoundsCondition(e){if(this.rank===1)return`rc > ${this.enableShapeUniforms?"outShape":this.outputShape[0]}`;let t="";for(let r=this.rank-2;r<this.rank;r++)t+=`${e[r]} >= ${this.enableShapeUniforms?`outShape[${r}]`:this.outputShape[r]}`,r<this.rank-1&&(t+="||");return t}getSetup(e){if(this.rank===1)return"";let t=e.slice(-2),r=this.enableShapeUniforms?`outShape[${this.rank} - 1]`:this.outputShape[this.rank-1],n=this.enableShapeUniforms?`outShape[${this.rank} - 2]`:this.outputShape[this.rank-2];return`
2022-02-10 18:27:21 +01:00
int r = ${t[0]};
int c = ${t[1]};
int rp1 = r + 1;
int cp1 = c + 1;
2022-04-01 15:13:32 +02:00
bool cEdge = cp1 >= ${r};
bool rEdge = rp1 >= ${n};
2022-02-10 18:27:21 +01:00
`}getOutput(e){let t=this.getSourceCoordsArr(e);return this.rank===1?`getA(rc), (rc + 1 >= ${this.enableShapeUniforms?"outShape":this.outputShape[0]} ? 0. : getA(rc + 1)), 0, 0`:`getA(${t[0]}),
cEdge ? 0. : getA(${t[1]}),
rEdge ? 0. : getA(${t[2]}),
2022-04-14 17:47:08 +02:00
rEdge || cEdge ? 0. : getA(${t[3]})`}},qS=class{constructor(e,t){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.customUniforms=[{name:"inputShape",type:"ivec3"}],this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length);let r="";for(let n=0;n<4;n++){let a="thisRC = rc;";n%2===1&&(a+="thisRC.z += 1;"),n>1&&(a+="thisRC.y += 1;"),r+=`
2022-04-01 15:13:32 +02:00
${a}
${n>0?"if(thisRC.y < rows && thisRC.z < cols){":""}
2022-02-10 18:27:21 +01:00
int flatIndex = getFlatIndex(thisRC);
ivec3 inputRC = inputCoordsFromReshapedOutCoords(flatIndex);
vec2 inputRCInnerDims = vec2(float(inputRC.y),float(inputRC.z));
2022-04-01 15:13:32 +02:00
result[${n}] =
2022-02-10 18:27:21 +01:00
getChannel(getA(inputRC.x, inputRC.y, inputRC.z), inputRCInnerDims);
2022-04-01 15:13:32 +02:00
${n>0?"}":""}
2022-02-10 18:27:21 +01:00
`}this.userCode=`
2022-04-14 17:47:08 +02:00
${Xee(t,this.enableShapeUniforms)}
${this.enableShapeUniforms?ob():ib(e)}
2022-02-10 18:27:21 +01:00
void main() {
ivec3 rc = getOutputCoords();
vec4 result = vec4(0.);
ivec3 thisRC;
int rows = ${this.enableShapeUniforms?"outShape[1]":e[1]};
int cols = ${this.enableShapeUniforms?"outShape[2]":e[2]};
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function Xee(e,t){return`
2022-02-10 18:27:21 +01:00
ivec3 inputCoordsFromReshapedOutCoords(int index) {
2022-04-14 17:47:08 +02:00
${t?gQ(["r","c","d"],"inputShape"):$l(["r","c","d"],e)}
2022-02-10 18:27:21 +01:00
return ivec3(r, c, d);
}
2022-04-14 17:47:08 +02:00
`}var Zee=class{constructor(e){this.gpgpu=e,this.numUsedTextures=0,this.numFreeTextures=0,this._numBytesAllocated=0,this._numBytesFree=0,this.freeTextures={},this.logEnabled=!1,this.usedTextures={}}acquireTexture(e,t,r){let n=Fv(t,r),a=$v(e,n,r);a in this.freeTextures||(this.freeTextures[a]=[]),a in this.usedTextures||(this.usedTextures[a]=[]);let s=Mv(e,n,this.gpgpu.gl,this.gpgpu.textureConfig,r);if(this.freeTextures[a].length>0){this.numFreeTextures--,this.numUsedTextures++,this._numBytesFree-=s,this.log();let o=this.freeTextures[a].shift();return this.usedTextures[a].push(o),o}let i;return n===3?i=this.gpgpu.createPackedMatrixTexture(e[0],e[1]):n===4?i=this.gpgpu.createFloat16PackedMatrixTexture(e[0],e[1]):n===1?i=this.gpgpu.createFloat32MatrixTexture(e[0],e[1]):n===0?i=this.gpgpu.createFloat16MatrixTexture(e[0],e[1]):n===2&&(i=this.gpgpu.createUnsignedBytesMatrixTexture(e[0],e[1])),this.usedTextures[a].push(i),this.numUsedTextures++,this._numBytesAllocated+=s,this.log(),i}releaseTexture(e,t,r,n){if(this.freeTextures==null)return;let a=Fv(r,n),s=$v(t,a,n);s in this.freeTextures||(this.freeTextures[s]=[]);let i=Mv(t,a,this.gpgpu.gl,this.gpgpu.textureConfig,n),o=Y().get("WEBGL_DELETE_TEXTURE_THRESHOLD");o!==-1&&this._numBytesAllocated>o?(this.gpgpu.deleteMatrixTexture(e.texture),this._numBytesAllocated-=i):(this.freeTextures[s].push(e),this.numFreeTextures++,this._numBytesFree+=i),this.numUsedTextures--;let l=this.usedTextures[s],u=l.indexOf(e);if(u<0)throw new Error("Cannot release a texture that was never provided by this texture manager");l.splice(u,1),this.log()}log(){if(!this.logEnabled)return;let e=this.numFreeTextures+this.numUsedTextures;console.log("Free/Used",`${this.numFreeTextures} / ${this.numUsedTextures}`,`(${e})`);let t=this._numBytesFree/this._numBytesAllocated;console.log(`Bytes allocated: ${this._numBytesAllocated}`),console.log(`Bytes unused: ${this._numBytesFree} (${Math.round(100*t)}%)`)}get numBytesAllocated(){return 
this._numBytesAllocated}get numBytesFree(){return this._numBytesFree}getNumUsedTextures(){return this.numUsedTextures}getNumFreeTextures(){return this.numFreeTextures}dispose(){if(this.freeTextures!=null){for(let e in this.freeTextures)this.freeTextures[e].forEach(t=>{this.gpgpu.deleteMatrixTexture(t.texture)});for(let e in this.usedTextures)this.usedTextures[e].forEach(t=>{this.gpgpu.deleteMatrixTexture(t.texture)});this.freeTextures=null,this.usedTextures=null,this.numUsedTextures=0,this.numFreeTextures=0,this._numBytesAllocated=0,this._numBytesFree=0}}};function Yee(e,t){let r=e;if(t===r.R32F)return 4;if(t===r.R16F)return 2;if(t===r.RGBA32F||t===e.RGBA)return 16;if(t===r.RGBA16F)return 8;if(t===r.RGBA8)return 4;throw new Error(`Unknown internal format ${t}`)}function Mv(e,t,r,n,a){let s=Jee(t,n),i;if(a){let[l,u]=bd(e[0],e[1]);i=l*u}else{let[l,u]=_h(e[0],e[1]);i=l*u}let o=Yee(r,s);return i*o}function Jee(e,t){switch(e){case 3:return hb(t);case 4:return cb(t);case 1:return ub(t);case 0:return db(t);case 2:return pb(t);default:throw new Error(`Unknown physical texture type ${e}`)}}function Qee(e){return Y().getBool("WEBGL_RENDER_FLOAT32_ENABLED")?e?3:1:e?4:0}function Fv(e,t){if(e===1)return 3;if(e===0||e==null)return Qee(t);if(e===3||e===2)return 2;throw new Error(`Unknown logical texture type ${e}`)}function $v(e,t,r){return`${e[0]}_${e[1]}_${t}_${r}`}var Ka=class{constructor(e,t){this.variableNames=["A"],this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length),this.userCode=`
2022-02-10 18:27:21 +01:00
float unaryOperation(float x) {
${t}
}
void main() {
float x = getAAtOutCoords();
float y = unaryOperation(x);
setOutput(y);
}
2022-04-14 17:47:08 +02:00
`}},Xn="if (isnan(x)) return x;",ete="return x;",Pv="return abs(x);",tte="return (x >= 0.0) ? x : (exp(x) - 1.0);",rte=Xn+`
2022-02-10 18:27:21 +01:00
return (x < 0.0) ? 0.0 : x;
2022-04-14 17:47:08 +02:00
`,nte=Xn+`
2022-02-10 18:27:21 +01:00
return (x < 0.0) ? 0.0 : min(6.0, x);
2022-04-14 17:47:08 +02:00
`,iu="return x;",ate="return 1.0 / (1.0 + exp(-1.0 * x));",ste="return x;",ite=`
2022-02-10 18:27:21 +01:00
vec4 result;
result.r = (x.r >= 0.0) ? x.r : (exp(x.r) - 1.0);
result.g = (x.g >= 0.0) ? x.g : (exp(x.g) - 1.0);
result.b = (x.b >= 0.0) ? x.b : (exp(x.b) - 1.0);
result.a = (x.a >= 0.0) ? x.a : (exp(x.a) - 1.0);
return result;
2022-04-14 17:47:08 +02:00
`,ote=`
2022-02-10 18:27:21 +01:00
vec4 result = x * vec4(greaterThanEqual(x, vec4(0.0)));
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,lte=`
2022-02-10 18:27:21 +01:00
vec4 result = min(x, vec4(6.)) * vec4(greaterThanEqual(x, vec4(0.0)));
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,ute="return 1.0 / (1.0 + exp(-1.0 * x));",vo=class{constructor(e,t){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length),this.userCode=`
2022-02-10 18:27:21 +01:00
vec4 unaryOperation(vec4 x) {
${t}
}
void main() {
vec4 x = getAAtOutCoords();
vec4 y = unaryOperation(x);
setOutput(y);
}
2022-04-14 17:47:08 +02:00
`}},dte=class{constructor(e){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!1,this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length);let t=e.length,r=Lr("rc",t),n=gt(t),a=qee(t,r),s=r.slice(-2),i=t<=1?"rc":`vec2(${s.join(",")})`;this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${n} rc = getOutputCoords();
vec4 packedInput = getA(${a});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
setOutput(getChannel(packedInput, ${i}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},pte=qn.whereImpl,hte=1e-7,cte=1e-4,sy={};function fte(e){return e in sy||(sy[e]={}),sy[e]}var mte=Y().getNumber("CPU_HANDOFF_SIZE_THRESHOLD"),gte=600;function yte(){return Y().global.screen==null?1024:Y().global.screen.height*Y().global.screen.width*window.devicePixelRatio*gte/1024/1024}var KS=class extends Fu{constructor(e){if(super(),this.pendingRead=new WeakMap,this.pendingDisposal=new WeakSet,this.dataRefCount=new WeakMap,this.numBytesInGPU=0,this.uploadWaitMs=0,this.downloadWaitMs=0,this.lastGlFlushTime=0,this.warnedAboutMemory=!1,this.pendingDeletes=0,this.disposed=!1,!Y().getBool("HAS_WEBGL"))throw new Error("WebGL is not supported on this device");let t;if(e!=null){if(e instanceof yu)t=e;else{let r=ya(Y().getNumber("WEBGL_VERSION"),e);t=new yu(r)}this.binaryCache={},this.gpgpuCreatedLocally=!1}else{let r=ya(Y().getNumber("WEBGL_VERSION"));t=new yu(r),this.binaryCache=fte(Y().getNumber("WEBGL_VERSION")),this.gpgpuCreatedLocally=!0}this.gpgpu=t,this.canvas=this.gpgpu.gl.canvas,this.textureManager=new Zee(this.gpgpu),this.numMBBeforeWarning=yte(),this.texData=new qp(this,br())}nextDataId(){return KS.nextDataId++}numDataIds(){return this.texData.numDataIds()-this.pendingDeletes}write(e,t,r){if((Y().getBool("WEBGL_CHECK_NUMERICAL_PROBLEMS")||Y().getBool("DEBUG"))&&this.checkNumericalProblems(e),r==="complex64"&&e!=null)throw new Error("Cannot write to a complex64 dtype. Please use tf.complex(real, imag).");let n={id:this.nextDataId()};return this.texData.set(n,{shape:t,dtype:r,values:e,usage:1,refCount:1}),n}refCount(e){return this.texData.has(e)?this.texData.get(e).refCount:0}incRef(e){let t=this.texData.get(e);t.refCount++}decRef(e){if(this.texData.has(e)){let t=this.texData.get(e);t.refCount--}}move(e,t,r,n,a){if(Y().getBool("DEBUG")&&this.checkNumericalProblems(t),n==="complex64")throw new Error("Cannot write to a complex64 dtype. 
Please use tf.complex(real, imag).");this.texData.set(e,{shape:r,dtype:n,values:t,usage:1,refCount:a})}disposeIntermediateTensorInfo(e){this.disposeData(e.dataId)}readSync(e){let t=this.texData.get(e),{values:r,dtype:n,complexTensorInfos:a,slice:s,shape:i,isPacked:o}=t;if(s!=null){let h;o?h=new vo(i,iu):h=new Ka(i,iu);let p=this.runWebGLProgram(h,[{dataId:e,shape:i,dtype:n}],n),c=this.readSync(p.dataId);return this.disposeIntermediateTensorInfo(p),c}if(r!=null)return this.convertAndCacheOnCPU(e);if(n==="string")return r;let l=this.activeTimers!=null,u;l&&(u=w.now());let d;if(n==="complex64"){let h=this.readSync(a.real.dataId),p=this.readSync(a.imag.dataId);d=N.mergeRealAndImagArrays(h,p)}else d=this.getValuesFromTexture(e);return l&&(this.downloadWaitMs+=w.now()-u),this.convertAndCacheOnCPU(e,d)}async read(e){if(this.pendingRead.has(e)){let c=this.pendingRead.get(e);return new Promise(f=>c.push(f))}let t=this.texData.get(e),{values:r,shape:n,slice:a,dtype:s,complexTensorInfos:i,isPacked:o}=t;if(a!=null){let c;o?c=new vo(n,iu):c=new Ka(n,iu);let f=this.runWebGLProgram(c,[{dataId:e,shape:n,dtype:s}],s),m=this.read(f.dataId);return this.disposeIntermediateTensorInfo(f),m}if(r!=null)return this.convertAndCacheOnCPU(e);if(Y().getBool("DEBUG")&&!Y().getBool("WEBGL_DOWNLOAD_FLOAT_ENABLED")&&Y().getNumber("WEBGL_VERSION")===2)throw new Error("tensor.data() with WEBGL_DOWNLOAD_FLOAT_ENABLED=false and WEBGL_VERSION=2 not yet supported.");let l=null,u;if(s!=="complex64"&&Y().get("WEBGL_BUFFER_SUPPORTED")){u=this.decode(e);let c=this.texData.get(u.dataId);l=this.gpgpu.createBufferFromTexture(c.texture.texture,...Yc(n))}this.pendingRead.set(e,[]),s!=="complex64"&&await this.gpgpu.createAndWaitForFence();let d;if(s==="complex64"){let c=await Promise.all([this.read(i.real.dataId),this.read(i.imag.dataId)]),f=c[0],m=c[1];d=N.mergeRealAndImagArrays(f,m)}else if(l==null)d=this.getValuesFromTexture(e);else{let 
c=w.sizeFromShape(n);d=this.gpgpu.downloadFloat32MatrixFromBuffer(l,c)}if(u!=null&&this.disposeIntermediateTensorInfo(u),l!=null){let c=this.gpgpu.gl;we(c,()=>c.deleteBuffer(l))}let h=this.convertAndCacheOnCPU(e,d),p=this.pendingRead.get(e);return this.pendingRead.delete(e),p.forEach(c=>c(h)
2022-02-10 18:27:21 +01:00
if (isnan(a)) return a;
if (isnan(b)) return b;
2022-04-14 17:47:08 +02:00
`,Mu=class{constructor(e,t,r){this.variableNames=["A","B"],this.outputShape=N.assertAndGetBroadcastShape(t,r),this.enableShapeUniforms=ln(this.outputShape.length),this.userCode=`
2022-02-10 18:27:21 +01:00
float binaryOperation(float a, float b) {
${e}
}
void main() {
float a = getAAtOutCoords();
float b = getBAtOutCoords();
setOutput(binaryOperation(a, b));
}
2022-04-14 17:47:08 +02:00
`}},y0=`
2022-02-10 18:27:21 +01:00
result.r = isNaN.r > 0. ? NAN : result.r;
result.g = isNaN.g > 0. ? NAN : result.g;
result.b = isNaN.b > 0. ? NAN : result.b;
result.a = isNaN.a > 0. ? NAN : result.a;
2022-04-14 17:47:08 +02:00
`,Dh=class{constructor(e,t,r,n=!1){this.variableNames=["A","B"],this.supportsBroadcasting=!0,this.packedInputs=!0,this.packedOutput=!0,this.outputShape=N.assertAndGetBroadcastShape(t,r);let a=this.outputShape.length;this.enableShapeUniforms=ln(a);let s="";if(n)if(a===0||w.sizeFromShape(this.outputShape)===1)s=`
2022-02-10 18:27:21 +01:00
result.y = 0.;
result.z = 0.;
result.w = 0.;
2022-04-01 15:13:32 +02:00
`;else if(s=`
${gt(a)} coords = getOutputCoords();
`,a===1)this.enableShapeUniforms?s+=`
2022-02-10 18:27:21 +01:00
result.y = (coords + 1) >= outShape ? 0. : result.y;
result.z = 0.;
result.w = 0.;
2022-04-01 15:13:32 +02:00
`:s+=`
2022-02-10 18:27:21 +01:00
result.y = (coords + 1) >= ${this.outputShape[0]} ? 0. : result.y;
result.z = 0.;
result.w = 0.;
2022-04-11 17:45:24 +02:00
`;else{let i=Lr("coords",a);this.enableShapeUniforms?s+=`
2022-02-10 18:27:21 +01:00
bool nextRowOutOfBounds =
2022-04-01 15:13:32 +02:00
(${i[a-2]} + 1) >= outShape[${a} - 2];
2022-02-10 18:27:21 +01:00
bool nextColOutOfBounds =
2022-04-01 15:13:32 +02:00
(${i[a-1]} + 1) >= outShape[${a} - 1];
2022-02-10 18:27:21 +01:00
result.y = nextColOutOfBounds ? 0. : result.y;
result.z = nextRowOutOfBounds ? 0. : result.z;
result.w = nextColOutOfBounds || nextRowOutOfBounds ? 0. : result.w;
2022-04-01 15:13:32 +02:00
`:s+=`
2022-02-10 18:27:21 +01:00
bool nextRowOutOfBounds =
2022-04-01 15:13:32 +02:00
(${i[a-2]} + 1) >= ${this.outputShape[a-2]};
2022-02-10 18:27:21 +01:00
bool nextColOutOfBounds =
2022-04-01 15:13:32 +02:00
(${i[a-1]} + 1) >= ${this.outputShape[a-1]};
2022-02-10 18:27:21 +01:00
result.y = nextColOutOfBounds ? 0. : result.y;
result.z = nextRowOutOfBounds ? 0. : result.z;
result.w = nextColOutOfBounds || nextRowOutOfBounds ? 0. : result.w;
`}this.userCode=`
vec4 binaryOperation(vec4 a, vec4 b) {
${e}
}
void main() {
vec4 a = getAAtOutCoords();
vec4 b = getBAtOutCoords();
vec4 result = binaryOperation(a, b);
2022-04-01 15:13:32 +02:00
${s}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function an(e){let{inputs:t,backend:r}=e,{x:n}=t;return r.incRef(n.dataId),{dataId:n.dataId,shape:n.shape,dtype:n.dtype}}var vte={kernelName:pi,backendName:"webgl",kernelFunc:an};function Vi(e){let{inputs:t,backend:r}=e,{real:n,imag:a}=t,s=r.makeTensorInfo(n.shape,"complex64"),i=r.texData.get(s.dataId),o=an({inputs:{x:n},backend:r}),l=an({inputs:{x:a},backend:r});return i.complexTensorInfos={real:o,imag:l},s}var wte={kernelName:Xp,backendName:"webgl",kernelFunc:Vi},YS="return (a < 0.) ? b * a : a;",JS=`
2022-02-10 18:27:21 +01:00
vec4 aLessThanZero = vec4(lessThan(a, vec4(0.)));
return (aLessThanZero * (b * a)) + ((vec4(1.0) - aLessThanZero) * a);
2022-04-14 17:47:08 +02:00
`;function kte(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{alpha:s}=n,i=r.makeTensorInfo([],"float32",w.createScalarValue(s,"float32")),o=Y().getBool("WEBGL_PACK_BINARY_OPERATIONS")?new Dh(JS,a.shape,i.shape):new Mu(YS,a.shape,i.shape),l=r.runWebGLProgram(o,[a,i],"float32");return r.disposeIntermediateTensorInfo(i),l}var Ite={kernelName:hi,backendName:"webgl",kernelFunc:kte},QS="return (a < 0.) ? b * a : a;",e8=`
2022-02-10 18:27:21 +01:00
vec4 aLessThanZero = vec4(lessThan(a, vec4(0.)));
return (aLessThanZero * (b * a)) + ((vec4(1.0) - aLessThanZero) * a);
2022-04-14 17:47:08 +02:00
`;function Ste(e){let{inputs:t,backend:r}=e,{x:n,alpha:a}=t,s=Y().getBool("WEBGL_PACK_BINARY_OPERATIONS")?new Dh(e8,n.shape,a.shape):new Mu(QS,n.shape,a.shape);return r.runWebGLProgram(s,[n,a],"float32")}var Tte={kernelName:Ii,backendName:"webgl",kernelFunc:Ste},Td="if (isnan(x)) return x;",Nte=`
2022-02-10 18:27:21 +01:00
if (isnan(a)) return a;
if (isnan(b)) return b;
2022-04-14 17:47:08 +02:00
`,Cte=`
2022-02-10 18:27:21 +01:00
result.r = isNaN.r > 0. ? NAN : result.r;
result.g = isNaN.g > 0. ? NAN : result.g;
result.b = isNaN.b > 0. ? NAN : result.b;
result.a = isNaN.a > 0. ? NAN : result.a;
2022-04-14 17:47:08 +02:00
`;function it({opSnippet:e,packedOpSnippet:t,cpuKernelImpl:r,dtype:n}){return({inputs:a,backend:s})=>{let{x:i}=a,o=s,l=n||i.dtype;if(o.shouldExecuteOnCPU([i])&&r!=null){let h=o.texData.get(i.dataId),p=r(h.values,l);return o.makeTensorInfo(i.shape,l,p)}let u=Y().getBool("WEBGL_PACK_UNARY_OPERATIONS")&&t!=null,d;return u?d=new vo(i.shape,t):d=new Ka(i.shape,e),o.runWebGLProgram(d,[i],l)}}function wr({opSnippet:e,packedOpSnippet:t,checkOutOfBounds:r=!1,supportsComplex:n=!1,cpuKernelImpl:a,dtype:s}){return({inputs:i,backend:o})=>{let{a:l,b:u}=i,d=o;if(n&&l.dtype==="complex64"){let f=d.texData.get(l.dataId),m=d.texData.get(u.dataId),[g,y]=[[f.complexTensorInfos.real,m.complexTensorInfos.real],[f.complexTensorInfos.imag,m.complexTensorInfos.imag]].map(x=>{let[b,v]=x,S={dataId:b.dataId,dtype:b.dtype,shape:l.shape},T={dataId:v.dataId,dtype:v.dtype,shape:u.shape},E=new Mu(e,l.shape,u.shape);return d.runWebGLProgram(E,[S,T],Cr(b.dtype,v.dtype))}),A=Vi({inputs:{real:g,imag:y},backend:d});return d.disposeIntermediateTensorInfo(g),d.disposeIntermediateTensorInfo(y),A}let h=s||Cr(l.dtype,u.dtype);if((l.dtype==="string"||u.dtype==="string"||d.shouldExecuteOnCPU([l,u]))&&a!=null){let f=d.texData.get(l.dataId).values,m=d.texData.get(u.dataId).values,g=l.dtype==="string"?N.fromUint8ToStringArray(f):f,y=l.dtype==="string"?N.fromUint8ToStringArray(m):m,[A,x]=a(l.shape,u.shape,g,y,h),b=d.makeTensorInfo(x,h),v=d.texData.get(b.dataId);return v.values=A,b}let p=Y().getBool("WEBGL_PACK_BINARY_OPERATIONS")&&t!=null,c;return p?c=new Dh(t,l.shape,u.shape,r):c=new Mu(e,l.shape,u.shape),d.runWebGLProgram(c,[l,u],h)}}function A0(e,t=!1){if(e==="linear")return t?ste:ete;if(e==="relu")return t?ote:rte;if(e==="elu")return t?ite:tte;if(e==="relu6")return t?lte:nte;if(e==="prelu")return t?e8:QS;if(e==="leakyrelu")return t?JS:YS;if(e==="sigmoid")return t?ute:ate;throw new Error(`Activation ${e} has not been implemented for the WebGL backend.`)}var 
t8=class{constructor(e,t,r,n=!1,a=!1,s=!1,i=null,o=!1,l=!1){this.variableNames=["matrixA","matrixB"],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=r,this.enableShapeUniforms=ln(this.outputShape.length);let u=n?e[1]:e[2],d=Math.ceil(u/2),h=n?"i * 2, rc.y":"rc.y, i * 2",p=a?"rc.z, i * 2":"i * 2, rc.z",c=n?["a.xxyy","a.zzww"]:["a.xxzz","a.yyww"],f=a?["b.xzxz","b.ywyw"]:["b.xyxy","b.zwzw"],m="",g="";i&&(o?m=`vec4 activation(vec4 a) {
2022-02-10 18:27:21 +01:00
vec4 b = getPreluActivationWeightsAtOutCoords();
2022-04-01 15:13:32 +02:00
${i}
2022-02-10 18:27:21 +01:00
}`:l?m=`vec4 activation(vec4 a) {
vec4 b = getLeakyreluAlphaAtOutCoords();
2022-04-01 15:13:32 +02:00
${i}
2022-02-10 18:27:21 +01:00
}`:m=`vec4 activation(vec4 x) {
2022-04-01 15:13:32 +02:00
${i}
}`,g="result = activation(result);");let y=s?"result += getBiasAtOutCoords();":"";s&&this.variableNames.push("bias"),o&&this.variableNames.push("preluActivationWeights"),l&&this.variableNames.push("leakyreluAlpha");let A="rc.x",x="rc.x";e[0]<t[0]?A=`int(min(float(rc.x), ${e[0]-1}.))`:t[0]<e[0]&&(x=`int(min(float(rc.x), ${t[0]-1}.))`),this.userCode=`
2022-02-10 18:27:21 +01:00
${m}
// Don't use uniform for sharedDimensionPacked for performance.
2022-04-01 15:13:32 +02:00
const float sharedDimension = ${d}.0;
2022-02-10 18:27:21 +01:00
vec4 dot2x2ARowBCol(ivec3 rc) {
vec4 result = vec4(0);
2022-04-01 15:13:32 +02:00
for (int i = 0; i < ${d}; i++) {
int batchA = ${A};
int batchB = ${x};
vec4 a = getMatrixA(batchA, ${h});
vec4 b = getMatrixB(batchB, ${p});
2022-02-10 18:27:21 +01:00
// These swizzled products need to be separately added.
// See: https://github.com/tensorflow/tfjs/issues/1735
2022-04-01 15:13:32 +02:00
result += (${c[0]} * ${f[0]});
result += (${c[1]} * ${f[1]});
2022-02-10 18:27:21 +01:00
}
return result;
}
void main() {
ivec3 rc = getOutputCoords();
vec4 result = dot2x2ARowBCol(rc);
${y}
${g}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},_v={REAL:"return areal * breal - aimag * bimag;",IMAG:"return areal * bimag + aimag * breal;"},zv=class{constructor(e,t,r){this.variableNames=["AReal","AImag","BReal","BImag"],this.outputShape=N.assertAndGetBroadcastShape(t,r),this.userCode=`
2022-02-10 18:27:21 +01:00
float binaryOpComplex(
float areal, float aimag, float breal, float bimag) {
${e}
}
void main() {
float areal = getARealAtOutCoords();
float aimag = getAImagAtOutCoords();
float breal = getBRealAtOutCoords();
float bimag = getBImagAtOutCoords();
setOutput(binaryOpComplex(areal, aimag, breal, bimag));
}
2022-04-14 17:47:08 +02:00
`}},Ov="return a * b;";function mb(e){let{inputs:t,backend:r}=e,{a:n,b:a}=t,s=N.upcastType(n.dtype,a.dtype);if(n.dtype==="complex64"){let o=r.texData.get(n.dataId),l=r.texData.get(a.dataId),u=new zv(_v.REAL,n.shape,a.shape),d=new zv(_v.IMAG,n.shape,a.shape),h=[{dataId:o.complexTensorInfos.real.dataId,dtype:o.complexTensorInfos.real.dtype,shape:n.shape},{dataId:o.complexTensorInfos.imag.dataId,dtype:o.complexTensorInfos.imag.dtype,shape:n.shape},{dataId:l.complexTensorInfos.real.dataId,dtype:l.complexTensorInfos.real.dtype,shape:a.shape},{dataId:l.complexTensorInfos.imag.dataId,dtype:l.complexTensorInfos.imag.dtype,shape:a.shape}],p=r.runWebGLProgram(u,h,"float32"),c=r.runWebGLProgram(d,h,"float32"),f=Vi({inputs:{real:p,imag:c},backend:r});return r.disposeIntermediateTensorInfo(p),r.disposeIntermediateTensorInfo(c),f}if(r.shouldExecuteOnCPU([n,a])){let o=r.texData.get(n.dataId),l=r.texData.get(a.dataId),[u,d]=Cee(n.shape,a.shape,o.values,l.values,s),h=r.makeTensorInfo(d,s),p=r.texData.get(h.dataId);return p.values=u,h}let i;return Y().getBool("WEBGL_PACK_BINARY_OPERATIONS")?i=new Dh(Ov,n.shape,a.shape):i=new Mu(Ov,n.shape,a.shape),r.runWebGLProgram(i,[n,a],s)}var Ete={kernelName:vi,backendName:"webgl",kernelFunc:mb};function Rte(e,t,r){let n=[Po(e.shape),..._o(e.shape)],a={dtype:e.dtype,shape:n,dataId:e.dataId},s=[Po(t),..._o(t)],i=new qS(s,n),o=!0,l=[n],u=r.runWebGLProgram(i,[a],e.dtype,l,o);return{dataId:u.dataId,shape:t,dtype:u.dtype}}function ve(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{shape:s}=n,i=r,o=w.sizeFromShape(a.shape),l=w.inferFromImplicitShape(s,o),u=w.sizeFromShape(l);w.assert(o===u,()=>`The new shape (${l}) has ${u} elements and the old shape (${a.shape}) has ${o} elements. 
The new shape and old shape must have the same number of elements.`);let d=i.texData.get(a.dataId);return d.isPacked&&!jp(a.shape,l)&&!(d.texture!==null&&jp(d.shape,l))?Rte(a,l,i):(i.incRef(a.dataId),{dataId:a.dataId,shape:l,dtype:a.dtype})}var Mte={kernelName:ul,backendName:"webgl",kernelFunc:ve},Dv=class{constructor(e,t){this.variableNames=["x"];let{windowSize:r,batchSize:n,inSize:a,outSize:s}=e;this.outputShape=[n,s];let i=Math.floor(r/4)*4,o=r%4,l="sumValue += dot(values, ones);";if(t!=null){let d=1/t;l=`sumValue += dot(values * ${w.isInt(d)?d.toPrecision(2):d}, ones);`}let u="";a%r>0&&(u=`
2022-04-01 15:13:32 +02:00
if (inIdx < 0 || inIdx >= ${a}) {
2022-02-10 18:27:21 +01:00
return 0.0;
}
`),this.userCode=`
const vec4 ones = vec4(1.0, 1.0, 1.0, 1.0);
float getValue(int batch, int inIdx) {
2022-02-17 14:15:57 +01:00
${u}
2022-02-10 18:27:21 +01:00
return getX(batch, inIdx);
}
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
int outIdx = coords[1];
2022-04-01 15:13:32 +02:00
int inOffset = outIdx * ${r};
2022-02-10 18:27:21 +01:00
float sumValue = 0.0;
2022-04-01 15:13:32 +02:00
for (int i = 0; i < ${i}; i += 4) {
2022-02-10 18:27:21 +01:00
int inIdx = inOffset + i;
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2),
getValue(batch, inIdx + 3)
);
${l}
}
2022-04-01 15:13:32 +02:00
int inIdx = inOffset + ${i};
if (${o===1}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(getValue(batch, inIdx), 0.0, 0.0, 0.0);
${l}
2022-04-01 15:13:32 +02:00
} else if (${o===2}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1), 0.0, 0.0);
${l}
2022-04-01 15:13:32 +02:00
} else if (${o===3}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2), 0.0);
${l}
}
setOutput(sumValue);
}
2022-04-14 17:47:08 +02:00
`}},Fte=class{constructor(e,t){this.variableNames=["x"];let{windowSize:r,batchSize:n,inSize:a,outSize:s}=e;this.outputShape=[n,s];let i="0.0",o="";t==="prod"?i="1.0":t==="min"?(i="1.0 / 1e-20",o="min"):t==="max"&&(i="-1.0 / 1e-20",o="max");let l=`${t}(${t}(${t}(minMaxValue[0], minMaxValue[1]), minMaxValue[2]), minMaxValue[3])`;t==="sum"?l="sumValue":t==="prod"?l="prodValue":t==="all"?l="allValue":t==="any"&&(l="anyValue");let u=Math.floor(r/4)*4,d=r%4,h=`
2022-02-10 18:27:21 +01:00
if (${t==="sum"}) {
sumValue += dot(values, ones);
} else if (${t==="prod"}) {
vec2 tmp = vec2(values[0], values[1]) * vec2(values[2], values[3]);
prodValue *= tmp[0] * tmp[1];
} else {
2022-04-01 15:13:32 +02:00
minMaxValue = ${o}(values, minMaxValue);
2022-02-10 18:27:21 +01:00
if (${t==="min"} || ${t==="max"}) {
2022-04-01 15:13:32 +02:00
minMaxValue = ${o}(values, minMaxValue);
2022-02-10 18:27:21 +01:00
bvec4 isNaN = isnan(values);
if (isNaN.r || isNaN.g || isNaN.b || isNaN.a) {
minMaxValue = vec4(NAN);
}
}
}
2022-04-01 15:13:32 +02:00
`,p="vec4";t==="all"?(i="1.0",h=`
2022-02-10 18:27:21 +01:00
bool reducedAllValue = all(values);
float floatedReducedAllValue = float(reducedAllValue);
allValue = float(allValue >= 1.0 && floatedReducedAllValue >= 1.0);
2022-04-01 15:13:32 +02:00
`,p="bvec4"):t==="any"&&(i="0.0",h=`
2022-02-10 18:27:21 +01:00
bool reducedAnyValue = any(values);
float floatedReducedAnyValue = float(reducedAnyValue);
anyValue = float(anyValue >= 1.0 || floatedReducedAnyValue >= 1.0);
2022-04-01 15:13:32 +02:00
`,p="bvec4");let c="";a%r>0&&(c=`
if (inIdx < 0 || inIdx >= ${a}) {
2022-02-10 18:27:21 +01:00
return initializationValue;
}
`),this.userCode=`
2022-04-01 15:13:32 +02:00
const float initializationValue = ${i};
2022-02-10 18:27:21 +01:00
const vec4 ones = vec4(1.0, 1.0, 1.0, 1.0);
float getValue(int batch, int inIdx) {
2022-04-01 15:13:32 +02:00
${c}
2022-02-10 18:27:21 +01:00
return getX(batch, inIdx);
}
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
int outIdx = coords[1];
2022-04-01 15:13:32 +02:00
int inOffset = outIdx * ${r};
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
vec4 minMaxValue = vec4(${i});
2022-02-10 18:27:21 +01:00
float prodValue = 1.0;
float sumValue = 0.0;
float allValue = 1.0;
float anyValue = 0.0;
2022-02-17 14:15:57 +01:00
for (int i = 0; i < ${u}; i += 4) {
2022-02-10 18:27:21 +01:00
int inIdx = inOffset + i;
2022-04-01 15:13:32 +02:00
${p} values = ${p}(
2022-02-10 18:27:21 +01:00
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2),
getValue(batch, inIdx + 3)
);
2022-04-01 15:13:32 +02:00
${h}
2022-02-10 18:27:21 +01:00
}
2022-02-17 14:15:57 +01:00
int inIdx = inOffset + ${u};
2022-04-01 15:13:32 +02:00
if (${d===1}) {
${p} values = ${p}(
2022-02-10 18:27:21 +01:00
getValue(batch, inIdx),
initializationValue,
initializationValue,
initializationValue
);
2022-04-01 15:13:32 +02:00
${h}
} else if (${d===2}) {
${p} values = ${p}(
2022-02-10 18:27:21 +01:00
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
initializationValue,
initializationValue
);
2022-04-01 15:13:32 +02:00
${h}
} else if (${d===3}) {
${p} values = ${p}(
2022-02-10 18:27:21 +01:00
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2),
initializationValue
);
2022-04-01 15:13:32 +02:00
${h}
2022-02-10 18:27:21 +01:00
}
setOutput(${l});
}
2022-04-14 17:47:08 +02:00
`}};function $te(e){let t=[];for(;t.length===0||t[t.length-1].outSize!==1;){let r=t.length?t[t.length-1].outSize:e[1],n=N.computeOptimalWindowSize(r);t.push({inSize:r,windowSize:n,outSize:Math.ceil(r/n)})}return t}function _l(e,t,r,n){let a=$te(e.shape),s=e;for(let i=0;i<a.length;i++){let{inSize:o,windowSize:l,outSize:u}=a[i],d,h;r==="mean"?d=i===0?new Dv({windowSize:l,inSize:o,batchSize:e.shape[0],outSize:u},o):new Dv({windowSize:l,inSize:o,batchSize:e.shape[0],outSize:u}):d=new Fte({windowSize:l,inSize:o,batchSize:e.shape[0],outSize:u},r),h=s,s=n.runWebGLProgram(d,[s],t),h.dataId!==e.dataId&&n.disposeIntermediateTensorInfo(h)}return s}var Pte=class{constructor(e,t){this.variableNames=["A"];let r=new Array(e.length);for(let s=0;s<r.length;s++)r[s]=e[t[s]];this.outputShape=r,this.rank=r.length;let n=gt(this.rank),a=_te(t);this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${n} resRC = getOutputCoords();
setOutput(getA(${a}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}};function _te(e){let t=e.length;if(t>6)throw Error(`Transpose for rank ${t} is not yet supported`);let r=["resRC.x","resRC.y","resRC.z","resRC.w","resRC.u","resRC.v"],n=new Array(t);for(let a=0;a<e.length;a++)n[e[a]]=r[a];return n.join()}var zte=class{constructor(e,t){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0;let r=new Array(e.length);for(let u=0;u<r.length;u++)r[u]=e[t[u]];if(this.outputShape=r,this.rank=r.length,this.rank>6)throw Error(`Packed transpose for rank ${this.rank} is not yet supported.`);let n=gt(this.rank),a=HS("rc",this.rank),s=new Array(this.rank);for(let u=0;u<t.length;u++)s[t[u]]=a[u];let i=`vec2(${s.slice(-2).join()})`,o=`++${a[this.rank-1]} < ${r[this.rank-1]}`,l=`getChannel(getA(${s.join()}), ${i})`;this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${n} rc = getOutputCoords();
2022-02-10 18:27:21 +01:00
vec4 result = vec4(0.);
result[0] = ${l};
2022-04-01 15:13:32 +02:00
if(${o}) {
2022-02-10 18:27:21 +01:00
result[1] = ${l};
}
2022-04-01 15:13:32 +02:00
--${a[this.rank-1]};
if(++${a[this.rank-2]} < ${r[this.rank-2]}) {
2022-02-10 18:27:21 +01:00
result[2] = ${l};
2022-04-01 15:13:32 +02:00
if(${o}) {
2022-02-10 18:27:21 +01:00
result[3] = ${l};
}
}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function x0(e,t,r){let n=Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")?new zte(e.shape,t):new Pte(e.shape,t);return r.runWebGLProgram(n,[e],e.dtype)}function Ote(e,t,r,n){let a=t,s=e.shape.length,i=w.parseAxisParam(a,e.shape),o=i,l=N.getAxesPermutation(o,s),u=l!=null,d=e;u&&(d=x0(e,l,n),o=N.getInnerMostAxes(o.length,s)),N.assertAxesAreInnerMostDims("sum",o,s);let[h,p]=N.computeOutAndReduceShapes(d.shape,o),c=h;r&&(c=N.expandShapeToKeepDim(h,i));let f=w.sizeFromShape(p),m=w.sizeFromShape(e.shape)/f,g=ve({inputs:{x:d},attrs:{shape:[m,f]},backend:n}),y=ch(e.dtype),A=_l(g,y,"sum",n),x=ve({inputs:{x:A},attrs:{shape:c},backend:n});return n.disposeIntermediateTensorInfo(g),n.disposeIntermediateTensorInfo(A),u&&n.disposeIntermediateTensorInfo(d),x}function b0(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n;return Ote(a,s,i,r)}var Dte={kernelName:Fi,backendName:"webgl",kernelFunc:b0};function vr(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{perm:s}=n,i=r,o=a.shape.length,l=new Array(o);for(let d=0;d<l.length;d++)l[d]=a.shape[s[d]];let u;if(i.shouldExecuteOnCPU([a])){let d=i.texData.get(a.dataId).values,h=fb(d,a.shape,a.dtype,s,l);u=i.makeTensorInfo(l,a.dtype);let p=i.texData.get(u.dataId);p.values=h}else u=x0(a,s,i);return u}var Lte={kernelName:Oi,backendName:"webgl",kernelFunc:vr},r8=1e3;function Of({a:e,b:t,transposeA:r,transposeB:n,backend:a,bias:s=null,preluActivationWeights:i=null,leakyreluAlpha:o=0,activation:l=null}){let u=e.shape.length,d=t.shape.length,h=r?e.shape[u-2]:e.shape[u-1],p=n?t.shape[d-1]:t.shape[d-2],c=r?e.shape[u-1]:e.shape[u-2],f=n?t.shape[d-2]:t.shape[d-1],m=e.shape.slice(0,-2),g=t.shape.slice(0,-2),y=w.sizeFromShape(m),A=w.sizeFromShape(g),x=Sl.assertAndGetBroadcastShape(e.shape.slice(0,-2),t.shape.slice(0,-2)).concat([c,f]);w.assert(h===p,()=>`Error in matMul: inner shapes (${h}) and (${p}) of Tensors with shapes ${e.shape} and ${t.shape} and transposeA=${r} and transposeB=${n} must match.`);let 
b=r?[y,h,c]:[y,c,h],v=n?[A,f,p]:[A,p,f],S=ve({inputs:{x:e},backend:a,attrs:{shape:b}}),T=ve({inputs:{x:t},backend:a,attrs:{shape:v}}),E=[S,T],R=Math.max(y,A),_=r?S.shape[1]:S.shape[2],M=s!=null,I=i!=null,z=l==="leakyrelu",O=l!=null?A0(l,!0):null,j=M||I||z||O!=null,X;if((c===1||f===1)&&_>r8&&j===!1){let Q=S,V=T;r&&(Q=vr({inputs:{x:S},backend:a,attrs:{perm:[0,2,1]}}),E.push(Q)),n&&(V=vr({inputs:{x:T},backend:a,attrs:{perm:[0,2,1]}}),E.push(V));let ee=f!==1,J=f===1,se=Q;ee&&(se=ve({inputs:{x:Q},backend:a,attrs:{shape:[R,_,1]}}),E.push(se));let Z=f===1?2:1,ae=V;J&&(ae=ve({inputs:{x:V},backend:a,attrs:{shape:[R,1,_]}}),E.push(ae));let de=mb({inputs:{a:se,b:ae},backend:a});X=b0({inputs:{x:de},backend:a,attrs:{axis:Z,keepDims:!0}}),E.push(de)}else{let Q=Cr(e.dtype,t.dtype),V=new t8(b,v,[R,c,f],r,n,M,O,I,z),ee=[S,T];if(s!=null&&ee.push(s),I&&ee.push(i),z){let J=a.makeTensorInfo([],"float32",w.createScalarValue(o,"float32"));ee.push(J),E.push(J)}X=a.runWebGLProgram(V,ee,Q)}let D=ve({inputs:{x:X},backend:a,attrs:{shape:x}});E.push(X);for(let Q of E)a.disposeIntermediateTensorInfo(Q);return D}function Bte(e){let{inputs:t,backend:r,attrs:n}=e,{a,b:s,bias:i,preluActivationWeights:o}=t,{transposeA:l,transposeB:u,activation:d,leakyreluAlpha:h}=n;return Of({a,b:s,transposeA:l,transposeB:u,backend:r,bias:i,preluActivationWeights:o,leakyreluAlpha:h,activation:d})}var Wte={kernelName:Ms,backendName:"webgl",kernelFunc:Bte},Lv="return abs(x);";function Vte(e){let{inputs:t,backend:r}=e,{x:n}=t;if(r.shouldExecuteOnCPU([n])&&n.dtype!=="complex64"){let s=r.texData.get(n.dataId),i=GS(s.values);return r.makeTensorInfo(n.shape,n.dtype,i)}let a;return Y().getBool("WEBGL_PACK_UNARY_OPERATIONS")?a=new vo(n.shape,Lv):a=new Ka(n.shape,Lv),r.runWebGLProgram(a,[n],n.dtype)}var Ute={kernelName:Lo,backendName:"webgl",kernelFunc:Vte},Gte=Xn+`
2022-02-10 18:27:21 +01:00
if (abs(x) > 1.) {
return NAN;
}
return acos(x);
2022-04-14 17:47:08 +02:00
`,jte=it({opSnippet:Gte}),Hte={kernelName:Pu,backendName:"webgl",kernelFunc:jte},qte=Xn+`
2022-02-10 18:27:21 +01:00
if (x < 1.0) return NAN;
2022-04-14 17:47:08 +02:00
return log(x + sqrt(x * x - 1.0));`,Kte=it({opSnippet:qte}),Xte={kernelName:_u,backendName:"webgl",kernelFunc:Kte},Bv="return a + b;",Zte=wr({opSnippet:Bv,packedOpSnippet:Bv,supportsComplex:!0,cpuKernelImpl:uee}),Yte={kernelName:Ya,backendName:"webgl",kernelFunc:Zte},Jte=class{constructor(e,t){this.outputShape=[],this.outputShape=e,this.variableNames=t.map((a,s)=>`T${s}`);let r=[];this.variableNames.forEach(a=>{r.push(`float v${a} = get${a}AtOutCoords();`)});let n=this.variableNames.map(a=>`v${a}`).join(" + ");this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${r.join(`
2022-02-10 18:27:21 +01:00
`)}
2022-04-01 15:13:32 +02:00
float result = ${n};
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},Qte=class{constructor(e,t){this.outputShape=[],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=e,this.variableNames=t.map((a,s)=>`T${s}`);let r=[];this.variableNames.forEach(a=>{r.push(`vec4 v${a} = get${a}AtOutCoords();`)});let n=this.variableNames.map(a=>`v${a}`).join(" + ");this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${r.join(`
2022-02-10 18:27:21 +01:00
`)}
2022-04-01 15:13:32 +02:00
vec4 result = ${n};
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function df(e){let{inputs:t,backend:r}=e,n=t;if(n.length===1)return an({inputs:{x:n[0]},backend:r});if(n.length>Y().get("WEBGL_MAX_TEXTURES_IN_SHADER")){let o=Math.floor(n.length/2),l=df({inputs:n.slice(0,o),backend:r}),u=df({inputs:n.slice(o),backend:r});return df({inputs:[l,u],backend:r})}let a=n.map(o=>o.dtype).reduce((o,l)=>Cr(o,l)),s=n.map(o=>o.shape),i=Y().getBool("WEBGL_PACK")?new Qte(n[0].shape,s):new Jte(n[0].shape,s);return r.runWebGLProgram(i,n,a)}var ere={kernelName:qs,backendName:"webgl",kernelFunc:df};function tre(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n,o=a.shape.length,l=w.parseAxisParam(s,a.shape),u=l,d=N.getAxesPermutation(u,o),h=a;d!=null&&(h=vr({inputs:{x:a},backend:r,attrs:{perm:d}}),u=N.getInnerMostAxes(u.length,o)),N.assertAxesAreInnerMostDims("all",u,o);let[p,c]=N.computeOutAndReduceShapes(h.shape,u),f=w.sizeFromShape(c),m=ve({inputs:{x:h},backend:r,attrs:{shape:[-1,f]}}),g=_l(m,m.dtype,"all",r),y;if(i){let A=N.expandShapeToKeepDim(p,l);y=ve({inputs:{x:g},backend:r,attrs:{shape:A}})}else y=ve({inputs:{x:g},backend:r,attrs:{shape:p}});return r.disposeIntermediateTensorInfo(m),r.disposeIntermediateTensorInfo(g),d!=null&&r.disposeIntermediateTensorInfo(h),y}var rre={kernelName:zu,backendName:"webgl",kernelFunc:tre};function nre(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n,o=a.shape.length,l=w.parseAxisParam(s,a.shape),u=l,d=N.getAxesPermutation(u,o),h=a;d!=null&&(h=vr({inputs:{x:a},backend:r,attrs:{perm:d}}),u=N.getInnerMostAxes(u.length,o)),N.assertAxesAreInnerMostDims("any",u,o);let[p,c]=N.computeOutAndReduceShapes(h.shape,u),f=w.sizeFromShape(c),m=ve({inputs:{x:h},backend:r,attrs:{shape:[-1,f]}}),g=_l(m,m.dtype,"any",r),y;if(i){let A=N.expandShapeToKeepDim(p,l);y=ve({inputs:{x:g},backend:r,attrs:{shape:A}})}else y=ve({inputs:{x:g},backend:r,attrs:{shape:p}});return r.disposeIntermediateTensorInfo(m),r.disposeIntermediateTensorInfo(g),d!=null&&r.disposeIntermediateTensorInfo(h),y}var 
are={kernelName:Ou,backendName:"webgl",kernelFunc:nre},sre=class{constructor(e,t,r){this.variableNames=["A"];let{windowSize:n,batchSize:a,outSize:s}=e;r||this.variableNames.push("bestIndicesA"),this.outputShape=[a,s];let i=t==="max"?">":"<",o=r?"inOffset + i;":"round(getBestIndicesA(batch, inOffset + i));";this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
int outIdx = coords[1];
2022-04-01 15:13:32 +02:00
int inOffset = outIdx * ${n};
2022-02-10 18:27:21 +01:00
int bestIndex = inOffset;
float bestValue = getA(batch, bestIndex);
2022-04-01 15:13:32 +02:00
for (int i = 0; i < ${n}; i++) {
int inIdx = ${o};
2022-02-10 18:27:21 +01:00
float candidate = getA(batch, inIdx);
2022-04-01 15:13:32 +02:00
if (candidate ${i} bestValue) {
2022-02-10 18:27:21 +01:00
bestValue = candidate;
bestIndex = inIdx;
}
}
setOutput(float(bestIndex));
}
2022-04-14 17:47:08 +02:00
`}},ire=class{constructor(e,t,r,n){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,w.assert(e.length>2,()=>`Packed arg${r.charAt(0).toUpperCase()+r.slice(1)} supports only inputs with rank above 2.`);let a=e[e.length-1],s=Math.ceil(a/t);this.outputShape=e.slice(0,-1),s>1&&this.outputShape.push(s),n||this.variableNames.push("bestIndicesA");let i=this.outputShape,o=i.length,l=gt(o),u=Lr("coords",o),d,h;if(s===1){h=o+1;let T=gt(h);d=`
2022-04-11 17:45:24 +02:00
${T} sourceLocR = ${T}(${u.join()}, 0);
2022-04-01 15:13:32 +02:00
++${u[o-1]};
2022-04-11 17:45:24 +02:00
${T} sourceLocG = ${T}(${u.join()}, 0);
2022-04-01 15:13:32 +02:00
++${u[o-2]};
2022-04-11 17:45:24 +02:00
${T} sourceLocA = ${T}(${u.join()}, 0);
2022-04-01 15:13:32 +02:00
--${u[o-1]};
2022-04-11 17:45:24 +02:00
${T} sourceLocB = ${T}(${u.join()}, 0);
2022-04-01 15:13:32 +02:00
--${u[o-2]};`}else h=o,d=`
2022-02-10 18:27:21 +01:00
${l} sourceLocR = coords;
2022-04-01 15:13:32 +02:00
++${u[o-1]};
2022-02-10 18:27:21 +01:00
${l} sourceLocG = coords;
2022-04-01 15:13:32 +02:00
++${u[o-2]};
2022-02-10 18:27:21 +01:00
${l} sourceLocA = coords;
2022-04-01 15:13:32 +02:00
--${u[o-1]};
2022-02-10 18:27:21 +01:00
${l} sourceLocB = coords;
2022-04-11 17:45:24 +02:00
--${u[o-2]};`;let p=["x","y","z","w","u","v"].slice(0,h),c="."+p[h-1],f=p.map(T=>"int "+T),m=Lr("sourceLocR",h-1).concat("inIdx.r"),g=Lr("sourceLocG",h-1).concat("inIdx.g"),y=Lr("sourceLocB",h-1).concat("inIdx.b"),A=Lr("sourceLocA",h-1).concat("inIdx.a"),x=r==="max"?"greaterThan":"lessThan",b=n?"":`
2022-02-10 18:27:21 +01:00
inIdx = round(vec4(getBestIndicesAChannel(${m.join()}),
getBestIndicesAChannel(${g.join()}),
getBestIndicesAChannel(${y.join()}),
2022-04-11 17:45:24 +02:00
getBestIndicesAChannel(${A.join()})));`,v=`vec4(
2022-02-10 18:27:21 +01:00
getAChannel(${m.join()}),
hasNextCol ? getAChannel(${g.join()}) : 0.,
hasNextRow ? getAChannel(${y.join()}) : 0.,
2022-04-11 17:45:24 +02:00
hasNextRow && hasNextCol ? getAChannel(${A.join()}) : 0.)`,S=n?"":`
2022-02-10 18:27:21 +01:00
float getBestIndicesAChannel(${f.join()}) {
2022-04-01 15:13:32 +02:00
return getChannel(getBestIndicesA(${p.join()}),
vec2(${p.slice(-2).join()}));
2022-02-10 18:27:21 +01:00
}`;this.userCode=`
float getAChannel(${f.join()}) {
2022-04-01 15:13:32 +02:00
return getChannel(getA(${p.join()}),
vec2(${p.slice(-2).join()}));
2022-02-10 18:27:21 +01:00
}
2022-04-11 17:45:24 +02:00
${S}
2022-02-10 18:27:21 +01:00
void main() {
${l} coords = getOutputCoords();
2022-04-01 15:13:32 +02:00
bool hasNextCol = ${u[o-1]} < ${i[o-1]-1};
bool hasNextRow = ${u[o-2]} < ${i[o-2]-1};
${d}
ivec4 srcIdx = ivec4(sourceLocR${c}, sourceLocG${c},
sourceLocB${c}, sourceLocA${c}) * ${t};
2022-02-10 18:27:21 +01:00
ivec4 inIdx = srcIdx;
vec4 bestIndex = vec4(inIdx);
2022-04-11 17:45:24 +02:00
vec4 bestValue = ${v};
2022-02-10 18:27:21 +01:00
for (int i = 0; i < ${t}; i++) {
inIdx = srcIdx;
${b}
2022-04-11 17:45:24 +02:00
vec4 candidate = ${v};
2022-02-10 18:27:21 +01:00
bvec4 nan = isnan(candidate);
bvec4 replace = bvec4(
2022-04-01 15:13:32 +02:00
vec4(${x}(candidate, bestValue)) * (vec4(1.0) - vec4(nan)));
2022-02-10 18:27:21 +01:00
bestValue = vec4(replace.x ? candidate.x : bestValue.x,
replace.y ? candidate.y : bestValue.y,
replace.z ? candidate.z : bestValue.z,
replace.w ? candidate.w : bestValue.w);
bestIndex = mix(bestIndex, vec4(inIdx), vec4(replace));
srcIdx++;
}
setOutput(bestIndex);
}
2022-04-14 17:47:08 +02:00
`}};function n8(e,t,r,n=null){let a=t.shape[0],s=t.shape[1];n!=null&&(a=n.shape[0],s=n.shape[1]);let i=N.computeOptimalWindowSize(s),o={windowSize:i,inSize:s,batchSize:a,outSize:Math.ceil(s/i)},l=new sre(o,r,n==null),u=[t];n!=null&&u.push(n);let d=e.runWebGLProgram(l,u,"int32");if(d.shape[1]===1)return d;let h=n8(e,t,r,d);return e.disposeIntermediateTensorInfo(d),h}function a8(e,t,r,n=null){let a=n!=null?n.shape:t.shape,s=a[a.length-1],i=N.computeOptimalWindowSize(s),o=new ire(a,i,r,n==null),l=n==null?[t]:[t,n],u=e.runWebGLProgram(o,l,"int32");if(u.shape.length===t.shape.length){let d=a8(e,t,r,u);return e.disposeIntermediateTensorInfo(u),d}return u}function s8(e,t,r,n){let a=[r];if(N.assertAxesAreInnerMostDims("arg"+n.charAt(0).toUpperCase()+n.slice(1),a,t.shape.length),!Y().getBool("WEBGL_PACK_REDUCE")||t.shape.length<=2){let s=[],i=e.texData.get(t.dataId),o=i!==null&&i.isPacked,l=t;o&&(l=e.unpackTensor(t),s.push(l));let[u,d]=N.computeOutAndReduceShapes(l.shape,a),h=w.sizeFromShape(d),p=ve({inputs:{x:l},backend:e,attrs:{shape:[-1,h]}});s.push(p);let c=n8(e,p,n);s.push(c);let f=ve({inputs:{x:c},backend:e,attrs:{shape:u}});return s.forEach(m=>e.disposeIntermediateTensorInfo(m)),f}return a8(e,t,n)}function ore(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s}=n,i=w.parseAxisParam(s,a.shape),o=N.getAxesPermutation(i,a.shape.length),l=a,u=[];o!=null&&(l=vr({inputs:{x:a},backend:r,attrs:{perm:o}}),u.push(l),i=N.getInnerMostAxes(i.length,l.shape.length)),N.assertAxesAreInnerMostDims("argMax",[i[0]],l.shape.length);let d=s8(r,l,i[0],"max");return u.forEach(h=>r.disposeIntermediateTensorInfo(h)),d}var lre={kernelName:Ks,backendName:"webgl",kernelFunc:ore};function 
ure(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s}=n,i=w.parseAxisParam(s,a.shape),o=N.getAxesPermutation(i,a.shape.length),l=a,u=[];o!=null&&(l=vr({inputs:{x:a},backend:r,attrs:{perm:o}}),u.push(l),i=N.getInnerMostAxes(i.length,l.shape.length)),N.assertAxesAreInnerMostDims("argMin",[i[0]],l.shape.length);let d=s8(r,l,i[0],"min");return u.forEach(h=>r.disposeIntermediateTensorInfo(h)),d}var dre={kernelName:Du,backendName:"webgl",kernelFunc:ure},pre=Xn+`
2022-02-10 18:27:21 +01:00
if (abs(x) > 1.) {
return NAN;
}
return asin(x);
2022-04-14 17:47:08 +02:00
`,hre=it({opSnippet:pre}),cre={kernelName:Lu,backendName:"webgl",kernelFunc:hre},fre=Xn+"return log(x + sqrt(x * x + 1.0));",mre=it({opSnippet:fre}),gre={kernelName:Bu,backendName:"webgl",kernelFunc:mre},yre=Xn+`
2022-02-10 18:27:21 +01:00
return atan(x);
2022-04-14 17:47:08 +02:00
`,Are=it({opSnippet:yre}),xre={kernelName:Wu,backendName:"webgl",kernelFunc:Are},bre=Nte+`
2022-02-10 18:27:21 +01:00
return atan(a, b);
2022-04-14 17:47:08 +02:00
`,vre=`
2022-02-10 18:27:21 +01:00
vec4 result = atan(a, b);
vec4 isNaN = min(vec4(isnan(a)) + vec4(isnan(b)), vec4(1.0));
2022-04-14 17:47:08 +02:00
`+Cte+`
2022-02-10 18:27:21 +01:00
return result;
2022-04-14 17:47:08 +02:00
`,wre=wr({opSnippet:bre,packedOpSnippet:vre}),kre={kernelName:Uu,backendName:"webgl",kernelFunc:wre},Ire=Xn+`
2022-02-10 18:27:21 +01:00
if ((x < -1.0) || (x > 1.0)) return NAN;
2022-04-14 17:47:08 +02:00
return (log(1.0 + x) - log(1.0 - x)) / 2.0;`,Sre=it({opSnippet:Ire}),Tre={kernelName:Vu,backendName:"webgl",kernelFunc:Sre},Hp=class{constructor(e,t,r,n=!1,a=!1){if(this.variableNames=["x"],t==="avg"&&r)throw new Error("Cannot compute positions for average pool.");let s=e.filterWidth,i=e.strideHeight,o=e.strideWidth,l=e.dilationHeight,u=e.dilationWidth,d=e.effectiveFilterHeight,h=e.effectiveFilterWidth,p=e.padInfo.top,c=e.padInfo.left;this.outputShape=e.outShape;let f=t==="avg",m=`((batch * ${e.inHeight} + xR) * ${e.inWidth} + xC) * ${e.inChannels} + d`,g=`(xR * ${e.inWidth} + xC) * ${e.inChannels} + d`,y="0.0";if(f||(y="-1.0 / 1e-20"),r){let T=">=";this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 strides = ivec2(${i}, ${o});
const ivec2 pads = ivec2(${p}, ${c});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int batch = coords[0];
int d = coords[3];
ivec2 xRCCorner = coords.yz * strides - pads;
int xRCorner = xRCCorner.x;
int xCCorner = xRCCorner.y;
// max/min x(?, ?, d) to get y(yR, yC, d).
// ? = to be determined
float minMaxValue = 0.0;
float minMaxValueFound = 0.0;
int minMaxPosition = 0;
float avgValue = 0.0;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${d};
2022-02-10 18:27:21 +01:00
wR += ${l}) {
int xR = xRCorner + wR;
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${h};
2022-02-17 14:15:57 +01:00
wC += ${u}) {
2022-02-10 18:27:21 +01:00
int xC = xCCorner + wC;
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
float value = getX(batch, xR, xC, d);
// If a min / max value has already been found, use it. If not,
// use the current value.
float currMinMaxValue = mix(
value, minMaxValue, minMaxValueFound);
2022-04-11 17:45:24 +02:00
if (value ${T} currMinMaxValue) {
2022-02-10 18:27:21 +01:00
minMaxValue = value;
minMaxValueFound = 1.0;
2022-04-01 15:13:32 +02:00
minMaxPosition = ${n?a?m:g:`wR * ${h} + wC`};
2022-02-10 18:27:21 +01:00
}
}
}
setOutput(float(minMaxPosition));
}
2022-04-11 17:45:24 +02:00
`;return}let A="max",x=`${t}(${t}(${t}(minMaxValue[0], minMaxValue[1]), minMaxValue[2]), minMaxValue[3])`;t==="avg"&&(x="avgValue / count");let b=Math.floor(s/4)*4,v=s%4,S=`
2022-02-10 18:27:21 +01:00
if (${f}) {
avgValue += dot(values, ones);
} else {
2022-04-01 15:13:32 +02:00
minMaxValue = ${A}(values, minMaxValue);
2022-02-10 18:27:21 +01:00
}
`;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 strides = ivec2(${i}, ${o});
const ivec2 pads = ivec2(${p}, ${c});
2022-02-10 18:27:21 +01:00
const float initializationValue = ${y};
const vec4 ones = vec4(1.0, 1.0, 1.0, 1.0);
float count = 0.0;
float getValue(int batch, int xR, int xC, int d) {
if (xC < 0 || xC >= ${e.inWidth}) {
return initializationValue;
}
count += 1.0;
return getX(batch, xR, xC, d);
}
void main() {
ivec4 coords = getOutputCoords();
int batch = coords[0];
int d = coords[3];
ivec2 xRCCorner = coords.yz * strides - pads;
int xRCorner = xRCCorner.x;
int xCCorner = xRCCorner.y;
// max/min x(?, ?, d) to get y(yR, yC, d).
// ? = to be determined
vec4 minMaxValue = vec4(${y});
float avgValue = 0.0;
count = 0.0;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${d};
2022-02-10 18:27:21 +01:00
wR += ${l}) {
int xR = xRCorner + wR;
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
for (int wC = 0; wC < ${b}; wC += 4) {
2022-02-17 14:15:57 +01:00
int xC = xCCorner + wC * ${u};
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xR, xC, d),
2022-02-17 14:15:57 +01:00
getValue(batch, xR, xC + ${u}, d),
getValue(batch, xR, xC + 2 * ${u}, d),
getValue(batch, xR, xC + 3 * ${u}, d)
2022-02-10 18:27:21 +01:00
);
2022-04-11 17:45:24 +02:00
${S}
2022-02-10 18:27:21 +01:00
}
int xC = xCCorner + ${b};
2022-04-11 17:45:24 +02:00
if (${v===1}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xR, xC, d),
initializationValue,
initializationValue,
initializationValue
);
2022-04-11 17:45:24 +02:00
${S}
} else if (${v===2}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xR, xC, d),
2022-02-17 14:15:57 +01:00
getValue(batch, xR, xC + ${u}, d),
2022-02-10 18:27:21 +01:00
initializationValue,
initializationValue
);
2022-04-11 17:45:24 +02:00
${S}
} else if (${v===3}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xR, xC, d),
2022-02-17 14:15:57 +01:00
getValue(batch, xR, xC + ${u}, d),
getValue(batch, xR, xC + 2 * ${u}, d),
2022-02-10 18:27:21 +01:00
initializationValue
);
2022-04-11 17:45:24 +02:00
${S}
2022-02-10 18:27:21 +01:00
}
}
2022-04-01 15:13:32 +02:00
setOutput(${x});
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},gb=class{constructor(e,t,r,n=!1,a=!1){if(this.variableNames=["x"],t==="avg"&&r)throw new Error("Cannot compute positions for average pool.");let s=e.filterWidth,i=e.strideDepth,o=e.strideHeight,l=e.strideWidth,u=e.dilationDepth,d=e.dilationHeight,h=e.dilationWidth,p=e.effectiveFilterDepth,c=e.effectiveFilterHeight,f=e.effectiveFilterWidth,m=e.padInfo.front,g=e.padInfo.top,y=e.padInfo.left;this.outputShape=e.outShape;let A=t==="avg",x="0.0";if(A||(x="-1.0 / 1e-20"),r){let R=">=";this.userCode=`
2022-02-10 18:27:21 +01:00
const ivec3 strides =
2022-04-01 15:13:32 +02:00
ivec3(${i}, ${o}, ${l});
2022-02-10 18:27:21 +01:00
const ivec3 pads = ivec3(${m}, ${g}, ${y});
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int ch = coords.u;
ivec3 xCorner = ivec3(coords.y, coords.z, coords.w) * strides - pads;
int xDCorner = xCorner.x;
int xRCorner = xCorner.y;
int xCCorner = xCorner.z;
// max/min x(?, ?, ?, ch) to get y(yD, yR, yC, ch).
// ? = to be determined
float minMaxValue = 0.0;
float minMaxValueFound = 0.0;
int minMaxPosition = 0;
2022-04-01 15:13:32 +02:00
for (int wD = 0; wD < ${p};
2022-02-17 14:15:57 +01:00
wD += ${u}) {
2022-02-10 18:27:21 +01:00
int xD = xDCorner + wD;
if (xD < 0 || xD >= ${e.inDepth}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${c};
wR += ${d}) {
2022-02-10 18:27:21 +01:00
int xR = xRCorner + wR;
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
for (int wC = 0; wC < ${f};
2022-04-01 15:13:32 +02:00
wC += ${h}) {
2022-02-10 18:27:21 +01:00
int xC = xCCorner + wC;
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
float value = getX(batch, xD, xR, xC, ch);
// If a min / max value has already been found, use it. If not,
// use the current value.
float currMinMaxValue = mix(
value, minMaxValue, minMaxValueFound);
if (value ${R} currMinMaxValue) {
minMaxValue = value;
minMaxValueFound = 1.0;
2022-04-01 15:13:32 +02:00
minMaxPosition = ${n?a?`(((batch * ${e.inDepth} + xD) * ${e.inHeight} + xR) * ${e.inWidth} + xC) * ${e.inChannels} + ch`:`((xD * ${e.inHeight} + xR) * ${e.inWidth} + xC) * ${e.inChannels} + ch`:`wD * ${c} * ${f} +
2022-02-10 18:27:21 +01:00
wR * ${f} + wC`};
}
}
}
}
setOutput(float(minMaxPosition));
}
2022-04-11 17:45:24 +02:00
`;return}let b="max",v=`${t}(${t}(${t}(minMaxValue[0], minMaxValue[1]), minMaxValue[2]), minMaxValue[3])`;t==="avg"&&(v="avgValue / count");let S=Math.floor(s/4)*4,T=s%4,E=`
2022-04-01 15:13:32 +02:00
if (${A}) {
2022-02-10 18:27:21 +01:00
avgValue += dot(values, ones);
} else {
minMaxValue = ${b}(values, minMaxValue);
}
`;this.userCode=`
const ivec3 strides =
2022-04-01 15:13:32 +02:00
ivec3(${i}, ${o}, ${l});
2022-02-10 18:27:21 +01:00
const ivec3 pads = ivec3(${m}, ${g}, ${y});
2022-04-01 15:13:32 +02:00
const float initializationValue = ${x};
2022-02-10 18:27:21 +01:00
const vec4 ones = vec4(1.0, 1.0, 1.0, 1.0);
float count = 0.0;
float getValue(int batch, int xD, int xR, int xC, int ch) {
if (xC < 0 || xC >= ${e.inWidth}) {
return initializationValue;
}
count += 1.0;
return getX(batch, xD, xR, xC, ch);
}
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int ch = coords.u;
ivec3 xCorner = ivec3(coords.y, coords.z, coords.w) * strides - pads;
int xDCorner = xCorner.x;
int xRCorner = xCorner.y;
int xCCorner = xCorner.z;
// max/min x(?, ?, ?, d) to get y(yD, yR, yC, ch).
// ? = to be determined
2022-04-01 15:13:32 +02:00
vec4 minMaxValue = vec4(${x});
2022-02-10 18:27:21 +01:00
float avgValue = 0.0;
count = 0.0;
2022-04-01 15:13:32 +02:00
for (int wD = 0; wD < ${p};
2022-02-17 14:15:57 +01:00
wD += ${u}) {
2022-02-10 18:27:21 +01:00
int xD = xDCorner + wD;
if (xD < 0 || xD >= ${e.inDepth}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${c};
wR += ${d}) {
2022-02-10 18:27:21 +01:00
int xR = xRCorner + wR;
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
2022-04-11 17:45:24 +02:00
for (int wC = 0; wC < ${S}; wC += 4) {
2022-04-01 15:13:32 +02:00
int xC = xCCorner + wC * ${h};
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xD, xR, xC, ch),
2022-04-01 15:13:32 +02:00
getValue(batch, xD, xR, xC + ${h}, ch),
getValue(batch, xD, xR, xC + 2 * ${h}, ch),
getValue(batch, xD, xR, xC + 3 * ${h}, ch)
2022-02-10 18:27:21 +01:00
);
${E}
}
2022-04-11 17:45:24 +02:00
int xC = xCCorner + ${S};
if (${T===1}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xD, xR, xC, ch),
initializationValue,
initializationValue,
initializationValue
);
${E}
2022-04-11 17:45:24 +02:00
} else if (${T===2}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xD, xR, xC, ch),
2022-04-01 15:13:32 +02:00
getValue(batch, xD, xR, xC + ${h}, ch),
2022-02-10 18:27:21 +01:00
initializationValue,
initializationValue
);
${E}
2022-04-11 17:45:24 +02:00
} else if (${T===3}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, xD, xR, xC, ch),
2022-04-01 15:13:32 +02:00
getValue(batch, xD, xR, xC + ${h}, ch),
getValue(batch, xD, xR, xC + 2 * ${h}, ch),
2022-02-10 18:27:21 +01:00
initializationValue
);
${E}
}
}
2022-04-11 17:45:24 +02:00
setOutput(${v});
2022-02-10 18:27:21 +01:00
}
}
2022-04-14 17:47:08 +02:00
`}};function Nre(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t;vd(a,"avgPool");let{filterSize:s,strides:i,pad:o,dimRoundingMode:l}=n,u=1;w.assert(N.eitherStridesOrDilationsAreOne(i,u),()=>`Error in avgPool: Either strides or dilations must be 1. Got strides ${i} and dilations '${u}'`);let d=N.computePool2DInfo(a.shape,s,i,u,o,l);if(d.filterWidth===1&&d.filterHeight===1&&w.arraysEqual(d.inShape,d.outShape))return an({inputs:{x:a},backend:r});let h=new Hp(d,"avg",!1);return r.runWebGLProgram(h,[a],"float32")}var Cre={kernelName:Xs,backendName:"webgl",kernelFunc:Nre};function Ere(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{filterSize:s,strides:i,pad:o,dimRoundingMode:l,dataFormat:u}=n,d=[1,1,1],h=N.computePool3DInfo(a.shape,s,i,d,o,l,u),p=new gb(h,"avg",!1);return r.runWebGLProgram(p,[a],"float32")}var Rre={kernelName:Kp,backendName:"webgl",kernelFunc:Ere},Mre=class{constructor(e){this.variableNames=["dy"],this.outputShape=e.inShape;let t=e.filterHeight,r=e.filterWidth,n=e.strideHeight,a=e.strideWidth,s=e.dilationHeight,i=e.dilationWidth,o=e.effectiveFilterHeight,l=e.effectiveFilterWidth,u=o-1-e.padInfo.top,d=l-1-e.padInfo.left,h=1/(t*r);this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 pads = ivec2(${u}, ${d});
const float avgMultiplier = float(${h});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
ivec2 dyRCCorner = coords.yz - pads;
int dyRCorner = dyRCCorner.x;
int dyCCorner = dyRCCorner.y;
// Convolve dy(?, ?, d) with pos mask(:, :, d) to get dx(xR, xC, d).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${o};
wR += ${s}) {
float dyR = float(dyRCorner + wR) / ${n}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 || fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
for (int wC = 0; wC < ${l};
2022-04-01 15:13:32 +02:00
wC+= ${i}) {
float dyC = float(dyCCorner + wC) / ${a}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
float dyValue = getDy(b, idyR, idyC, d);
dotProd += dyValue * avgMultiplier;
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},Fre=class{constructor(e){this.variableNames=["dy"],this.outputShape=e.inShape;let t=e.filterDepth,r=e.filterHeight,n=e.filterWidth,a=e.strideDepth,s=e.strideHeight,i=e.strideWidth,o=e.dilationDepth,l=e.dilationHeight,u=e.dilationWidth,d=e.effectiveFilterDepth,h=e.effectiveFilterHeight,p=e.effectiveFilterWidth,c=d-1-e.padInfo.front,f=h-1-e.padInfo.top,m=p-1-e.padInfo.left,g=1/(t*r*n);this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec3 pads = ivec3(${c}, ${f}, ${m});
2022-02-10 18:27:21 +01:00
const float avgMultiplier = float(${g});
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int ch = coords.u;
ivec3 dyCorner = ivec3(coords.y, coords.z, coords.w) - pads;
int dyDCorner = dyCorner.x;
int dyRCorner = dyCorner.y;
int dyCCorner = dyCorner.z;
// Convolve dy(?, ?, ?, d) with pos mask(:, :, :, ch) to get
// dx(xD, xR, xC, ch).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wD = 0; wD < ${d};
wD += ${o}) {
float dyD = float(dyDCorner + wD) / ${a}.0;
2022-02-10 18:27:21 +01:00
if (dyD < 0.0 || dyD >= ${e.outDepth}.0 || fract(dyD) > 0.0) {
continue;
}
int idyD = int(dyD);
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${h};
2022-02-10 18:27:21 +01:00
wR += ${l}) {
2022-04-01 15:13:32 +02:00
float dyR = float(dyRCorner + wR) / ${s}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 ||
fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${p};
2022-02-17 14:15:57 +01:00
wC += ${u}) {
2022-04-01 15:13:32 +02:00
float dyC = float(dyCCorner + wC) / ${i}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
float dyValue = getDy(batch, idyD, idyR, idyC, ch);
dotProd += dyValue * avgMultiplier;
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}};function $re(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,input:s}=t,i=s,{filterSize:o,strides:l,pad:u,dimRoundingMode:d}=n,h=[1,1,1],p=N.computePool3DInfo(i.shape,o,l,h,u,d),c=new Fre(p);return r.runWebGLProgram(c,[a],i.dtype)}var Pre={kernelName:Hf,backendName:"webgl",kernelFunc:$re};function _re(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,input:s}=t,i=s;vd([a,s],"avgPoolGrad");let{filterSize:o,strides:l,pad:u}=n,d=N.computePool2DInfo(i.shape,o,l,1,u),h=new Mre(d);return r.runWebGLProgram(h,[a],i.dtype)}var zre={kernelName:jf,backendName:"webgl",kernelFunc:_re};function Ore(e){let{inputs:t,backend:r,attrs:n}=e,{a,b:s}=t,{transposeA:i,transposeB:o}=n;return Of({a,b:s,transposeA:i,transposeB:o,backend:r})}var Dre={kernelName:Zs,backendName:"webgl",kernelFunc:Ore},Lre=class{constructor(e,t,r,n,a,s){this.outputShape=[],this.variableNames=["x","mean","variance"],N.assertAndGetBroadcastShape(e,t),N.assertAndGetBroadcastShape(e,r);let i="0.0";n!=null&&(N.assertAndGetBroadcastShape(e,n),this.variableNames.push("offset"),i="getOffsetAtOutCoords()");let o="1.0";a!=null&&(N.assertAndGetBroadcastShape(e,a),this.variableNames.push("scale"),o="getScaleAtOutCoords()"),this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
float x = getXAtOutCoords();
float mean = getMeanAtOutCoords();
float variance = getVarianceAtOutCoords();
2022-04-01 15:13:32 +02:00
float offset = ${i};
float scale = ${o};
float inv = scale * inversesqrt(variance + float(${s}));
2022-02-10 18:27:21 +01:00
setOutput(dot(vec3(x, -mean, offset), vec3(inv, inv, 1)));
}
2022-04-14 17:47:08 +02:00
`}},Bre=class{constructor(e,t,r,n,a,s){this.packedInputs=!0,this.packedOutput=!0,this.variableNames=["x","mean","variance"],N.assertAndGetBroadcastShape(e,t),N.assertAndGetBroadcastShape(e,r);let i="vec4(0.0)";n!=null&&(N.assertAndGetBroadcastShape(e,n),this.variableNames.push("offset"),i="getOffsetAtOutCoords()");let o="vec4(1.0)";a!=null&&(N.assertAndGetBroadcastShape(e,a),this.variableNames.push("scale"),o="getScaleAtOutCoords()"),this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
vec4 offset = ${i};
vec4 scale = ${o};
2022-02-10 18:27:21 +01:00
vec4 x = getXAtOutCoords();
vec4 mean = getMeanAtOutCoords();
vec4 variance = getVarianceAtOutCoords();
2022-04-01 15:13:32 +02:00
vec4 inv = scale * inversesqrt(variance + vec4(${s}));
2022-02-10 18:27:21 +01:00
setOutput((x - mean) * inv + offset);
}
2022-04-14 17:47:08 +02:00
`}},Wre=({inputs:e,backend:t,attrs:r})=>{let{x:n,mean:a,variance:s,offset:i,scale:o}=e;w.assert(a.shape.length===s.shape.length,()=>"Batch normalization gradient requires mean and variance to have equal ranks."),w.assert(i==null||a.shape.length===i.shape.length,()=>"Batch normalization gradient requires mean and offset to have equal ranks."),w.assert(o==null||a.shape.length===o.shape.length,()=>"Batch normalization gradient requires mean and scale to have equal ranks.");let{varianceEpsilon:l}=r;l==null&&(l=.001);let u=[n,a,s],d=null;i!=null&&(d=i.shape,u.push(i));let h=null;o!=null&&(h=o.shape,u.push(o));let p=Y().getBool("WEBGL_PACK_NORMALIZATION")?new Bre(n.shape,a.shape,s.shape,d,h,l):new Lre(n.shape,a.shape,s.shape,d,h,l);return t.runWebGLProgram(p,u,u[0].dtype)},Vre={kernelName:ui,backendName:"webgl",kernelFunc:Wre},Ure=class{constructor(e){this.variableNames=["source"],this.outputShape=e,this.rank=e.length;let t=gt(this.rank);this.customUniforms=[{name:"start",arrayIndex:this.rank,type:"int"}];let r=Gre(this.rank),n,a=e.map((s,i)=>`sourceLoc.${Zy[i]} = start[${i}] + coords.${Zy[i]};`);n=`
2022-02-10 18:27:21 +01:00
${t} sourceLoc;
${t} coords = getOutputCoords();
2022-04-01 15:13:32 +02:00
${a.join(`
2022-02-10 18:27:21 +01:00
`)}
`,this.userCode=`
void main() {
2022-04-01 15:13:32 +02:00
${n}
setOutput(getSource(${r}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},Zy=["x","y","z","w","u","v"];function Gre(e){if(e===1)return"sourceLoc";if(e<=6)return Zy.slice(0,e).map(t=>"sourceLoc."+t).join(",");throw Error(`Slicing for rank ${e} is not yet supported`)}var jre=class{constructor(e){this.variableNames=["source"],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=e,this.rank=e.length,this.customUniforms=[{name:"start",arrayIndex:this.rank,type:"int"}];let t=gt(this.rank),r=Lr("coords",this.rank),n=Lr("sourceLoc",this.rank),a=this.rank===1?"sourceLoc":`vec2(${n.slice(-2).join()})`,s=`getChannel(getSource(${n.join()}), ${a})`,i=`
2022-04-01 15:13:32 +02:00
result.x = ${s};
if (++${r[this.rank-1]} < ${e[this.rank-1]}) {
++${n[this.rank-1]};
result.y = ${s};
--${n[this.rank-1]};
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,o=this.rank===1?"":`
--${r[this.rank-1]};
if (++${r[this.rank-2]} < ${e[this.rank-2]}) {
++${n[this.rank-2]};
result.z = ${s};
if (++${r[this.rank-1]} < ${e[this.rank-1]}) {
++${n[this.rank-1]};
result.w = ${s};
2022-02-10 18:27:21 +01:00
}
}
`,l=this.rank<=4?`sourceLoc = coords +
2022-04-01 15:13:32 +02:00
${t}(${e.map((u,d)=>`start[${d}]`).join()});`:e.map((u,d)=>`${n[d]} = ${r[d]} + start[${d}];`).join(`
2022-02-10 18:27:21 +01:00
`);this.userCode=`
void main() {
${t} coords = getOutputCoords();
${t} sourceLoc;
${l}
vec4 result = vec4(0.);
2022-04-01 15:12:04 +02:00
${i}
2022-04-01 15:13:32 +02:00
${o}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function Hre(e,t,r,n){let a=n.texData.get(e.dataId),s=n.makeTensorInfo(r,e.dtype),i=n.texData.get(s.dataId);Object.assign(i,a),i.refCount=1,i.shape=r,i.dtype=e.dtype;let o=_t.computeFlatOffset(t,w.computeStrides(e.shape));a.slice&&(o+=a.slice.flatOffset),i.slice={flatOffset:o,origDataId:a.slice&&a.slice.origDataId||e.dataId};let l=n.dataRefCount.get(i.slice.origDataId)||1;return n.dataRefCount.set(i.slice.origDataId,l+1),s}function Nd(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{begin:s,size:i}=n,[o,l]=_t.parseSliceParams(a,s,i);if(_t.assertParamsValid(a,o,l),w.sizeFromShape(l)===0)return r.makeTensorInfo(l,a.dtype,[]);if(r.shouldExecuteOnCPU([a])||a.dtype==="string"){let h=r.texData.get(a.dataId),p=_ee(h.values,o,l,a.shape,a.dtype);return r.makeTensorInfo(l,a.dtype,p)}let{isPacked:u}=r.texData.get(a.dataId),d=_t.isSliceContinous(a.shape,o,l);if(u||!d){let h=Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")?new jre(l):new Ure(l),p=[o];return r.runWebGLProgram(h,[a],a.dtype,p)}return r.uploadToGPU(a.dataId),Hre(a,o,l,r)}var qre={kernelName:fl,backendName:"webgl",kernelFunc:Nd},Kre=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockShape:s,crops:i}=n;w.assert(a.shape.length<=4,()=>"batchToSpaceND for rank > 4 with a WebGL backend not implemented yet");let o=s.reduce((A,x)=>A*x),l=N.getReshaped(a.shape,s,o),u=N.getPermuted(l.length,s.length),d=N.getReshapedPermuted(a.shape,s,o),h=N.getSliceBeginCoords(i,s.length),p=N.getSliceSize(d,i,s.length),c=[],f=ve({inputs:{x:a},backend:r,attrs:{shape:l}}),m=vr({inputs:{x:f},backend:r,attrs:{perm:u}}),g=ve({inputs:{x:m},backend:r,attrs:{shape:d}}),y=Nd({inputs:{x:g},backend:r,attrs:{begin:h,size:p}});return c.push(f),c.push(m),c.push(g),c.forEach(A=>r.disposeIntermediateTensorInfo(A)),y},Xre={kernelName:Bo,backendName:"webgl",kernelFunc:Kre};function Zre(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,weights:s}=t,{size:i}=n,o=r.readSync(a.dataId),l=r.readSync(s.dataId),u=US(o,l,s.dtype,s.shape,i);return 
r.makeTensorInfo([i],s.dtype,u)}var Yre={kernelName:qf,backendName:"webgl",kernelFunc:Zre};function Jre(e){let{inputs:t,backend:r}=e,{s0:n,s1:a}=t,s=r.readSync(n.dataId),i=r.readSync(a.dataId),o=N.assertAndGetBroadcastShape(Array.from(s),Array.from(i));return r.makeTensorInfo([o.length],"int32",Int32Array.from(o))}var Qre={kernelName:Kf,backendName:"webgl",kernelFunc:Jre},ene="return float(a != b);",i8=wr({opSnippet:ene,cpuKernelImpl:Ree,dtype:"bool"}),tne={kernelName:rl,backendName:"webgl",kernelFunc:i8};function Lh(e){let{inputs:t,backend:r}=e,{input:n}=t,a=r.texData.get(n.dataId);return an({inputs:{x:a.complexTensorInfos.real},backend:r})}var rne={kernelName:ah,backendName:"webgl",kernelFunc:Lh},nne="return float(int(x));";function ane(e,t){let r=new Ka(e.shape,nne),n=t.runWebGLProgram(r,[e],"int32");return{dataId:n.dataId,shape:n.shape,dtype:n.dtype}}function Yy(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{dtype:s}=n;if(s==="complex64"){if(a.dtype==="complex64")return an({inputs:{x:a},backend:r});let i=Wt(a.shape),o=Yy({inputs:{x:a},backend:r,attrs:{dtype:"float32"}}),l=Vi({inputs:{real:o,imag:i},backend:r});return i.dispose(),r.disposeIntermediateTensorInfo(o),l}if(a.dtype==="complex64"){let i=Lh({inputs:{input:a},backend:r}),o=Yy({inputs:{x:i},backend:r,attrs:{dtype:s}});return r.disposeIntermediateTensorInfo(i),o}if(!w.hasEncodingLoss(a.dtype,s)){let i=an({inputs:{x:a},backend:r});return{dataId:i.dataId,shape:i.shape,dtype:s}}if(s==="int32")return ane(a,r);if(s==="bool"){let i=r.makeTensorInfo([],"bool",w.getTypedArrayFromDType("bool",1)),o=i8({inputs:{a,b:i},backend:r});return r.disposeIntermediateTensorInfo(i),o}throw new Error(`Error in Cast: failed to cast ${a.dtype} to ${s}`)}var sne={kernelName:Ys,backendName:"webgl",kernelFunc:Yy},Wv="return 
ceil(x);",ine=it({opSnippet:Wv,packedOpSnippet:Wv,cpuKernelImpl:pee}),one={kernelName:Js,backendName:"webgl",kernelFunc:ine},lne=class{constructor(e){this.variableNames=["A"],this.customUniforms=[{name:"minVal",type:"float"},{name:"maxVal",type:"float"}],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
float value = getAAtOutCoords();
if (isnan(value)) {
setOutput(value);
return;
}
setOutput(clamp(value, minVal, maxVal));
}
2022-04-14 17:47:08 +02:00
`}},une=class{constructor(e){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.customUniforms=[{name:"minVal",type:"float"},{name:"maxVal",type:"float"}],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
vec4 value = getAAtOutCoords();
if (any(isnan(value))) {
setOutput(value);
return;
}
setOutput(clamp(value, vec4(minVal), vec4(maxVal)));
}
2022-04-14 17:47:08 +02:00
`}};function dne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{clipValueMin:s,clipValueMax:i}=n,o;Y().getBool("WEBGL_PACK_CLIP")?o=new une(a.shape):o=new lne(a.shape);let l=[[s],[i]];return r.runWebGLProgram(o,[a],a.dtype,l)}var pne={kernelName:Ja,backendName:"webgl",kernelFunc:dne},hne=class{constructor(e){this.variableNames=["real","imag"],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
float re = abs(getRealAtOutCoords());
float im = abs(getImagAtOutCoords());
float mx = max(re, im);
// sadly the length function in glsl is not underflow-safe
// (at least not on Intel GPUs). So the safe solution is
// to ensure underflow-safety in all cases.
setOutput(
mx == 0.0 ? 0.0 : mx * length(vec2(1, min(re, im)/mx))
);
}
2022-04-14 17:47:08 +02:00
`}};function Vv(e,t){return{dataId:t.dataId,dtype:t.dtype,shape:e.shape}}function cne(e){let{inputs:t,backend:r}=e,{x:n}=t,a=r.texData.get(n.dataId),s=new hne(n.shape),i=[Vv(n,a.complexTensorInfos.real),Vv(n,a.complexTensorInfos.imag)];return r.runWebGLProgram(s,i,i[0].dtype)}var fne={kernelName:Zp,backendName:"webgl",kernelFunc:cne},mne=class{constructor(e){this.outputShape=[],this.outputShape=N.computeOutShape(e,1),this.variableNames=e.map((s,i)=>`T${i}`);let t=new Array(e.length-1);t[0]=e[0][1];for(let s=1;s<t.length;s++)t[s]=t[s-1]+e[s][1];let r=[`if (yC < ${t[0]}) setOutput(getT0(yR, yC));`];for(let s=1;s<t.length;s++){let i=t[s-1];r.push(`else if (yC < ${t[s]}) setOutput(getT${s}(yR, yC-${i}));`)}let n=t.length,a=t[t.length-1];r.push(`else setOutput(getT${n}(yR, yC-${a}));`),this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec2 coords = getOutputCoords();
int yR = coords.x;
int yC = coords.y;
2022-04-01 15:13:32 +02:00
${r.join(`
2022-02-10 18:27:21 +01:00
`)}
}
2022-04-14 17:47:08 +02:00
`}},gne=class{constructor(e,t){this.packedInputs=!0,this.packedOutput=!0,this.outputShape=[],this.outputShape=N.computeOutShape(e,t);let r=this.outputShape,n=r.length,a=gt(n),s=Lr("coords",n),i=["x","y","z","w","u","v"].slice(0,n);this.variableNames=e.map((f,m)=>`T${m}`);let o=new Array(e.length-1);o[0]=e[0][t];for(let f=1;f<o.length;f++)o[f]=o[f-1]+e[f][t];let l=i[t],u=i.slice(-2),d=i.join(),h=`if (${l} < ${o[0]}) {
2022-02-10 18:27:21 +01:00
return getChannel(
2022-04-01 15:13:32 +02:00
getT0(${d}), vec2(${u.join()}));
}`;for(let f=1;f<o.length;f++){let m=o[f-1];h+=`
if (${l} < ${o[f]} && ${l} >= ${o[f-1]}) {
2022-02-10 18:27:21 +01:00
return getChannel(
2022-04-14 17:47:08 +02:00
getT${f}(${Qc(i,l,m)}),
vec2(${Qc(u,l,m)}));
2022-04-01 15:13:32 +02:00
}`}let p=o.length,c=o[o.length-1];h+=`
2022-02-10 18:27:21 +01:00
return getChannel(
2022-04-14 17:47:08 +02:00
getT${p}(${Qc(i,l,c)}),
vec2(${Qc(u,l,c)}));`,this.userCode=`
2022-04-01 15:13:32 +02:00
float getValue(${i.map(f=>"int "+f)}) {
${h}
2022-02-10 18:27:21 +01:00
}
void main() {
2022-04-01 15:13:32 +02:00
${a} coords = getOutputCoords();
vec4 result = vec4(getValue(${s}), 0., 0., 0.);
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${s[n-1]} = ${s[n-1]} + 1;
if (${s[n-1]} < ${r[n-1]}) {
result.g = getValue(${s});
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${s[n-2]} = ${s[n-2]} + 1;
if (${s[n-2]} < ${r[n-2]}) {
result.a = getValue(${s});
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${s[n-1]} = ${s[n-1]} - 1;
if (${s[n-2]} < ${r[n-2]} &&
${s[n-1]} < ${r[n-1]}) {
result.b = getValue(${s});
2022-02-10 18:27:21 +01:00
}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function Qc(e,t,r){let n=e.indexOf(t);return e.map((a,s)=>s===n?`${a} - ${r}`:a).join()}function v0(e){let{inputs:t,backend:r}=e,{input:n}=t,a=r.texData.get(n.dataId);return an({inputs:{x:a.complexTensorInfos.imag},backend:r})}var yne={kernelName:eh,backendName:"webgl",kernelFunc:v0};function hu(e,t,r){let n=e[0].dtype;if(n==="complex64"){let d=e.map(m=>Lh({inputs:{input:m},backend:r})),h=e.map(m=>v0({inputs:{input:m},backend:r})),p=hu(d,t,r),c=hu(h,t,r),f=Vi({inputs:{real:p,imag:c},backend:r});return d.forEach(m=>r.disposeIntermediateTensorInfo(m)),h.forEach(m=>r.disposeIntermediateTensorInfo(m)),r.disposeIntermediateTensorInfo(p),r.disposeIntermediateTensorInfo(c),f}let a=r.shouldExecuteOnCPU(e);if(n==="string"&&(a=!0),a){let d=e.map(y=>{let A=w.sizeFromShape(y.shape.slice(t));return ve({inputs:{x:y},backend:r,attrs:{shape:[-1,A]}})}),h=d.map(y=>({vals:r.readSync(y.dataId),shape:y.shape})),p=N.computeOutShape(d.map(y=>y.shape),1),c=d[0].shape[0]===1,f=hee(h,p,n,c),m=N.computeOutShape(e.map(y=>y.shape),t),g=r.makeTensorInfo(m,n,f);return d.forEach(y=>r.disposeIntermediateTensorInfo(y)),g}if(e.length>Y().getNumber("WEBGL_MAX_TEXTURES_IN_SHADER")){let d=Math.floor(e.length/2),h=hu(e.slice(0,d),t,r),p=hu(e.slice(d),t,r),c=hu([h,p],t,r);return r.disposeIntermediateTensorInfo(h),r.disposeIntermediateTensorInfo(p),c}if(Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")&&e[0].shape.length>1){let d=new gne(e.map(h=>h.shape),t);return r.runWebGLProgram(d,e,n)}let{tensors2D:s,outShape:i}=Ane(e,t,r),o=new mne(s.map(d=>d.shape)),l=r.runWebGLProgram(o,s,n);s.forEach(d=>r.disposeIntermediateTensorInfo(d));let u=ve({inputs:{x:l},attrs:{shape:i},backend:r});return r.disposeIntermediateTensorInfo(l),u}function Ane(e,t,r){let n=N.computeOutShape(e.map(a=>a.shape),t);return{tensors2D:e.map(a=>ve({inputs:{x:a},attrs:{shape:[-1,w.sizeFromShape(a.shape.slice(t))]},backend:r})),outShape:n}}function 
o8(e){let{inputs:t,backend:r,attrs:n}=e,{axis:a}=n,s=w.parseAxisParam(a,t[0].shape)[0],i=N.computeOutShape(t.map(u=>u.shape),s);if(w.sizeFromShape(i)===0)return r.makeTensorInfo(i,t[0].dtype,[]);let o=t.filter(u=>w.sizeFromShape(u.shape)>0);if(o.length===1)return an({inputs:{x:o[0]},backend:r});let l=o.map(u=>u.shape);return N.assertParamsConsistent(l,s),hu(o,s,r)}var xne={kernelName:Wo,backendName:"webgl",kernelFunc:o8},l8=class{constructor(e,t=!1,r=null,n=!1,a=!1){this.variableNames=["x","W"],this.outputShape=e.outShape;let s=e.padInfo.top,i=e.padInfo.left,o=e.strideHeight,l=e.strideWidth,u=e.dilationHeight,d=e.dilationWidth,h=e.filterHeight,p=e.filterWidth,c=Math.floor(e.inChannels/4)*4,f=e.inChannels%4,m=e.dataFormat==="channelsLast",g=m?1:2,y=m?2:3,A=m?3:1,x="",b="";r&&(n?x=`float activation(float a) {
2022-02-10 18:27:21 +01:00
float b = getPreluActivationWeightsAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
}`:a?x=`float activation(float a) {
2022-02-10 18:27:21 +01:00
float b = getLeakyreluAlphaAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
}`:x=`
2022-02-10 18:27:21 +01:00
float activation(float x) {
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
}
2022-04-11 17:45:24 +02:00
`,b="result = activation(result);");let v=t?"result += getBiasAtOutCoords();":"";t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),a&&this.variableNames.push("leakyreluAlpha"),this.userCode=`
2022-04-01 15:13:32 +02:00
${x}
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
const ivec2 strides = ivec2(${o}, ${l});
const ivec2 pads = ivec2(${s}, ${i});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int batch = coords[0];
2022-04-01 15:13:32 +02:00
int d2 = coords[${A}];
2022-02-10 18:27:21 +01:00
ivec2 xRCCorner =
ivec2(coords[${g}], coords[${y}]) * strides - pads;
int xRCorner = xRCCorner.x;
int xCCorner = xRCCorner.y;
// Convolve x(?, ?, d1) with w(:, :, d1, d2) to get y(yR, yC, d2).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${h}; wR++) {
2022-02-17 14:15:57 +01:00
int xR = xRCorner + wR * ${u};
2022-02-10 18:27:21 +01:00
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${p}; wC++) {
int xC = xCCorner + wC * ${d};
2022-02-10 18:27:21 +01:00
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int d1 = 0; d1 < ${c}; d1 += 4) {
2022-02-10 18:27:21 +01:00
vec4 wValues = vec4(
getW(wR, wC, d1, d2),
getW(wR, wC, d1 + 1, d2),
getW(wR, wC, d1 + 2, d2),
getW(wR, wC, d1 + 3, d2)
);
if (${m}) {
vec4 xValues = vec4(
getX(batch, xR, xC, d1),
getX(batch, xR, xC, d1 + 1),
getX(batch, xR, xC, d1 + 2),
getX(batch, xR, xC, d1 + 3)
);
dotProd += dot(xValues, wValues);
} else {
vec4 xValues = vec4(
getX(batch, d1, xR, xC),
getX(batch, d1 + 1, xR, xC),
getX(batch, d1 + 2, xR, xC),
getX(batch, d1 + 3, xR, xC)
);
dotProd += dot(xValues, wValues);
}
}
if (${f===1}) {
if (${m}) {
dotProd +=
2022-04-01 15:13:32 +02:00
getX(batch, xR, xC, ${c}) *
getW(wR, wC, ${c}, d2);
2022-02-10 18:27:21 +01:00
} else {
dotProd +=
2022-04-01 15:13:32 +02:00
getX(batch, ${c}, xR, xC) *
getW(wR, wC, ${c}, d2);
2022-02-10 18:27:21 +01:00
}
} else if (${f===2}) {
vec2 wValues = vec2(
2022-04-01 15:13:32 +02:00
getW(wR, wC, ${c}, d2),
getW(wR, wC, ${c} + 1, d2)
2022-02-10 18:27:21 +01:00
);
if (${m}) {
vec2 xValues = vec2(
2022-04-01 15:13:32 +02:00
getX(batch, xR, xC, ${c}),
getX(batch, xR, xC, ${c} + 1)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
} else {
vec2 xValues = vec2(
2022-04-01 15:13:32 +02:00
getX(batch, ${c}, xR, xC),
getX(batch, ${c} + 1, xR, xC)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
}
} else if (${f===3}) {
vec3 wValues = vec3(
2022-04-01 15:13:32 +02:00
getW(wR, wC, ${c}, d2),
getW(wR, wC, ${c} + 1, d2),
getW(wR, wC, ${c} + 2, d2)
2022-02-10 18:27:21 +01:00
);
if (${m}) {
vec3 xValues = vec3(
2022-04-01 15:13:32 +02:00
getX(batch, xR, xC, ${c}),
getX(batch, xR, xC, ${c} + 1),
getX(batch, xR, xC, ${c} + 2)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
} else {
vec3 xValues = vec3(
2022-04-01 15:13:32 +02:00
getX(batch, ${c}, xR, xC),
getX(batch, ${c} + 1, xR, xC),
getX(batch, ${c} + 2, xR, xC)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
}
}
}
}
float result = dotProd;
2022-04-11 17:45:24 +02:00
${v}
2022-02-10 18:27:21 +01:00
${b}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},bne=class{constructor(e){this.variableNames=["x","W"],this.outputShape=e.outShape;let t=e.padInfo.front,r=e.padInfo.top,n=e.padInfo.left,a=e.strideDepth,s=e.strideHeight,i=e.strideWidth,o=e.dilationDepth,l=e.dilationHeight,u=e.dilationWidth,d=e.filterDepth,h=e.filterHeight,p=e.filterWidth,c=Math.floor(e.inChannels/4)*4,f=e.inChannels%4;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec3 strides = ivec3(${a}, ${s}, ${i});
const ivec3 pads = ivec3(${t}, ${r}, ${n});
2022-02-10 18:27:21 +01:00
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int d2 = coords.u;
ivec3 xFRCCorner = ivec3(coords.y, coords.z, coords.w) * strides - pads;
int xFCorner = xFRCCorner.x;
int xRCorner = xFRCCorner.y;
int xCCorner = xFRCCorner.z;
// Convolve x(?, ?, ?, d1) with w(:, :, :, d1, d2) to get
// y(yF, yR, yC, d2). ? = to be determined. : = across all
// values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wF = 0; wF < ${d}; wF++) {
int xF = xFCorner + wF * ${o};
2022-02-10 18:27:21 +01:00
if (xF < 0 || xF >= ${e.inDepth}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${h}; wR++) {
2022-02-10 18:27:21 +01:00
int xR = xRCorner + wR * ${l};
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${p}; wC++) {
2022-02-17 14:15:57 +01:00
int xC = xCCorner + wC * ${u};
2022-02-10 18:27:21 +01:00
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int d1 = 0; d1 < ${c}; d1 += 4) {
2022-02-10 18:27:21 +01:00
vec4 xValues = vec4(
getX(batch, xF, xR, xC, d1),
getX(batch, xF, xR, xC, d1 + 1),
getX(batch, xF, xR, xC, d1 + 2),
getX(batch, xF, xR, xC, d1 + 3)
);
vec4 wValues = vec4(
getW(wF, wR, wC, d1, d2),
getW(wF, wR, wC, d1 + 1, d2),
getW(wF, wR, wC, d1 + 2, d2),
getW(wF, wR, wC, d1 + 3, d2)
);
dotProd += dot(xValues, wValues);
}
if (${f===1}) {
dotProd +=
2022-04-01 15:13:32 +02:00
getX(batch, xF, xR, xC, ${c}) *
getW(wF, wR, wC, ${c}, d2);
2022-02-10 18:27:21 +01:00
} else if (${f===2}) {
vec2 xValues = vec2(
2022-04-01 15:13:32 +02:00
getX(batch, xF, xR, xC, ${c}),
getX(batch, xF, xR, xC, ${c} + 1)
2022-02-10 18:27:21 +01:00
);
vec2 wValues = vec2(
2022-04-01 15:13:32 +02:00
getW(wF, wR, wC, ${c}, d2),
getW(wF, wR, wC, ${c} + 1, d2)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
} else if (${f===3}) {
vec3 xValues = vec3(
2022-04-01 15:13:32 +02:00
getX(batch, xF, xR, xC, ${c}),
getX(batch, xF, xR, xC, ${c} + 1),
getX(batch, xF, xR, xC, ${c} + 2)
2022-02-10 18:27:21 +01:00
);
vec3 wValues = vec3(
2022-04-01 15:13:32 +02:00
getW(wF, wR, wC, ${c}, d2),
getW(wF, wR, wC, ${c} + 1, d2),
getW(wF, wR, wC, ${c} + 2, d2)
2022-02-10 18:27:21 +01:00
);
dotProd += dot(xValues, wValues);
}
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},vne=class{constructor(e,t){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.customUniforms=[{name:"inputShape",type:"ivec3"},{name:"pad",type:"ivec2"},{name:"stride",type:"ivec2"},{name:"dilation",type:"ivec2"},{name:"inChannels",type:"int"},{name:"itemsPerBlockRow",type:"int"},{name:"outWidth",type:"int"}],this.outputShape=e,this.enableShapeUniforms=ln(this.outputShape.length);let{dataFormat:r}=t,n=Gr(),a=r==="channelsLast",s=a?0:1,i=a?1:2,o=this.enableShapeUniforms?"if(blockIndex < outShape[1] && pos < outShape[0]) {":`if(blockIndex < ${e[1]} && pos < ${e[0]}) {`,l="";for(let u=0;u<=1;u++)for(let d=0;d<=1;d++)l+=`
2022-04-01 15:13:32 +02:00
blockIndex = rc.y + ${d};
2022-02-17 14:15:57 +01:00
pos = rc.x + ${u};
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${o}
2022-02-10 18:27:21 +01:00
offsetY = int(blockIndex / outWidth) * stride[0] - pad[0];
d0 = offsetY + dilation[0] * (pos / itemsPerBlockRow);
2022-04-01 15:13:32 +02:00
if(d0 < inputShape[${s}] && d0 >= 0) {
2022-02-10 18:27:21 +01:00
// Use custom imod instead mod. On Intel GPU, mod may generate
// unexpected value.
// https://github.com/tensorflow/tfjs/issues/5447
offsetX = imod(blockIndex, outWidth) * stride[1] - pad[1];
d1 = offsetX + dilation[1] * (imod(pos, itemsPerBlockRow) /
inChannels);
2022-04-01 15:13:32 +02:00
if(d1 < inputShape[${i}] && d1 >= 0) {
2022-02-10 18:27:21 +01:00
ch = imod(pos, inChannels);
2022-04-01 15:13:32 +02:00
if (${a}) {
2022-02-10 18:27:21 +01:00
innerDims = vec2(d1, ch);
2022-04-01 15:13:32 +02:00
result[${u*2+d}] = getChannel(
2022-02-10 18:27:21 +01:00
getA(d0, int(innerDims.x),
int(innerDims.y)), innerDims);
} else {
innerDims = vec2(d0, d1);
2022-04-01 15:13:32 +02:00
result[${u*2+d}] = getChannel(
2022-02-10 18:27:21 +01:00
getA(ch, int(innerDims.x),
int(innerDims.y)), innerDims);
}
}
}
}
`;this.userCode=`
void main() {
ivec2 rc = getOutputCoords();
vec4 result = vec4(0);
int blockIndex, pos, offsetY, d0, offsetX, d1, ch;
vec2 innerDims;
${l}
2022-04-01 15:13:32 +02:00
${n.output} = result;
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}};function u8({x:e,filter:t,convInfo:r,backend:n,bias:a=null,preluActivationWeights:s=null,leakyreluAlpha:i=0,activation:o=null}){let l=e.shape,u=n.texData.get(e.dataId),d=r.inChannels,h=l[0]*l[1]*l[2],p=r.outChannels,c=r.dataFormat==="channelsLast",f=!1,m=!1,g,y=[];if(!((h===1||p===1)&&d>r8)&&u.isPacked&&c&&u.texture!=null&&l[2]%2!==0&&w.arraysEqual(u.shape.slice(-3),l.slice(-3))){let A=l[0]*l[1]*(l[2]+1),x={dataId:e.dataId,shape:[1,A,r.inChannels],dtype:e.dtype},b=u.shape;u.shape=u.shape.slice(),u.shape[u.shape.length-2]++,w.assert(jp(u.shape,x.shape),()=>`packed reshape ${u.shape} to ${x.shape} isn't free`);let v=ve({inputs:{x:t},backend:n,attrs:{shape:[1,r.inChannels,r.outChannels]}});y.push(v);let S=Of({a:x,b:v,backend:n,transposeA:f,transposeB:m,bias:a,activation:o,preluActivationWeights:s,leakyreluAlpha:i}),T=n.texData.get(S.dataId);w.assert(T.isPacked,()=>"batchMatMul result is expected to be packed"),u.shape=b,T.shape=r.outShape,g=an({inputs:{x:S},backend:n}),g.shape=r.outShape,y.push(S)}else{let A=c?l[0]*l[1]*l[2]:l[0]*l[2]*l[3],x=ve({inputs:{x:e},backend:n,attrs:{shape:[1,A,r.inChannels]}}),b=ve({inputs:{x:t},backend:n,attrs:{shape:[1,r.inChannels,r.outChannels]}}),v=Of({a:x,b,transposeA:f,transposeB:m,backend:n,bias:a,activation:o,preluActivationWeights:s,leakyreluAlpha:i});g=ve({inputs:{x:v},backend:n,attrs:{shape:r.outShape}}),y.push(x),y.push(b),y.push(v)}for(let A of y)n.disposeIntermediateTensorInfo(A);return g}function d8({x:e,filter:t,convInfo:r,backend:n,bias:a=null,preluActivationWeights:s=null,leakyreluAlpha:i=0,activation:o=null}){let{filterWidth:l,filterHeight:u,inChannels:d,outWidth:h,outHeight:p,dataFormat:c}=r,f=c==="channelsLast",m=l*u*d,g=p*h,y=[m,g],A=!0,x=!1,b=[],v=ve({inputs:{x:e},backend:n,attrs:{shape:e.shape.slice(1)}}),S=ve({inputs:{x:t},backend:n,attrs:{shape:[1,m,w.sizeFromShape(t.shape)/m]}});b.push(v),b.push(S);let T=new 
vne(y,r),E=[v.shape,[r.padInfo.top,r.padInfo.left],[r.strideHeight,r.strideWidth],[r.dilationHeight,r.dilationWidth],[r.inChannels],[r.filterWidth*r.inChannels],[r.outWidth]],R=n.runWebGLProgram(T,[v],"float32",E),_=ve({inputs:{x:R},backend:n,attrs:{shape:[1,y[0],y[1]]}});b.push(R),b.push(_);let M=a!=null,I=s!=null,z=o==="leakyrelu",O=o?A0(o,!0):null,j=new t8(_.shape,S.shape,[1,g,r.outChannels],A,x,M,O,I,z),X=[_,S];if(a&&X.push(a),I&&X.push(s),z){let ee=n.makeTensorInfo([],"float32",w.createScalarValue(i,"float32"));X.push(ee),b.push(ee)}let D=n.runWebGLProgram(j,X,"float32"),Q=f?[1,p,h,r.outChannels]:[1,r.outChannels,p,h],V=ve({inputs:{x:D},backend:n,attrs:{shape:Q}});b.push(D);for(let ee of b)n.disposeIntermediateTensorInfo(ee);return V}function wne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dataFormat:l,dilations:u,dimRoundingMode:d}=n,h=N.convertConv2DDataFormat(l),p=N.computeConv2DInfo(a.shape,s.shape,i,u,o,d,!1,h),c;if(p.filterHeight===1&&p.filterWidth===1&&p.dilationHeight===1&&p.dilationWidth===1&&p.strideHeight===1&&p.strideWidth===1&&(p.padInfo.type==="SAME"||p.padInfo.type==="VALID"))c=u8({x:a,filter:s,convInfo:p,backend:r});else if(Y().getBool("WEBGL_CONV_IM2COL")&&a.shape[0]===1)c=d8({x:a,filter:s,convInfo:p,backend:r});else{let m=new l8(p);c=r.runWebGLProgram(m,[a,s],"float32")}let f=ve({inputs:{x:c},backend:r,attrs:{shape:p.outShape}});return r.disposeIntermediateTensorInfo(c),f}var kne={kernelName:Qs,backendName:"webgl",kernelFunc:wne},Ine=class{constructor(e){this.variableNames=["x","dy"],this.outputShape=e.filterShape;let t=e.strideHeight,r=e.strideWidth,n=e.padInfo.top,a=e.padInfo.left,s=e.dataFormat==="channelsLast";this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int wR = coords.x;
int wC = coords.y;
int d1 = coords.z;
int d2 = coords.w;
// Convolve x(?, ?, d1) with dy(:, :, d2) to get dw(wR, wC, d1, d2).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
for (int b = 0; b < ${e.batchSize}; b++) {
for (int yR = 0; yR < ${e.outHeight}; yR++) {
2022-04-01 15:13:32 +02:00
int xR = wR + yR * ${t} - ${n};
2022-02-10 18:27:21 +01:00
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
for (int yC = 0; yC < ${e.outWidth}; yC++) {
2022-04-01 15:13:32 +02:00
int xC = wC + yC * ${r} - ${a};
2022-02-10 18:27:21 +01:00
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
2022-04-01 15:13:32 +02:00
if (${s}) {
2022-02-10 18:27:21 +01:00
float dyValue = getDy(b, yR, yC, d2);
float xValue = getX(b, xR, xC, d1);
dotProd += (xValue * dyValue);
} else {
float dyValue = getDy(b, d2, yR, yC);
float xValue = getX(b, d1, xR, xC);
dotProd += (xValue * dyValue);
}
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},Sne=class{constructor(e){this.variableNames=["dy","W"],this.outputShape=e.inShape;let t=e.filterHeight,r=e.filterWidth,n=e.strideHeight,a=e.strideWidth,s=e.dataFormat==="channelsLast",i=t-1-e.padInfo.top,o=r-1-e.padInfo.left,l=s?1:2,u=s?2:3,d=s?3:1;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 pads = ivec2(${i}, ${o});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int batch = coords[0];
2022-04-01 15:13:32 +02:00
int d1 = coords[${d}];
2022-02-10 18:27:21 +01:00
2022-02-17 14:15:57 +01:00
ivec2 dyCorner = ivec2(coords[${l}], coords[${u}]) - pads;
2022-02-10 18:27:21 +01:00
int dyRCorner = dyCorner.x;
int dyCCorner = dyCorner.y;
// Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
for (int wR = 0; wR < ${t}; wR++) {
2022-04-01 15:13:32 +02:00
float dyR = float(dyRCorner + wR) / ${n}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 || fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
int wRPerm = ${t} - 1 - wR;
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${r}; wC++) {
float dyC = float(dyCCorner + wC) / ${a}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
2022-04-01 15:13:32 +02:00
int wCPerm = ${r} - 1 - wC;
2022-02-10 18:27:21 +01:00
for (int d2 = 0; d2 < ${e.outChannels}; d2++) {
2022-04-01 15:13:32 +02:00
if (${s}) {
2022-02-10 18:27:21 +01:00
float xValue = getDy(batch, idyR, idyC, d2);
float wValue = getW(wRPerm, wCPerm, d1, d2);
dotProd += xValue * wValue;
} else {
float xValue = getDy(batch, d2, idyR, idyC);
float wValue = getW(wRPerm, wCPerm, d1, d2);
dotProd += xValue * wValue;
}
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},Tne=class{constructor(e){this.variableNames=["x","dy"],this.outputShape=e.filterShape;let t=e.strideDepth,r=e.strideHeight,n=e.strideWidth,a=e.padInfo.front,s=e.padInfo.top,i=e.padInfo.left;this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec5 coords = getOutputCoords();
int wF = coords.x;
int wR = coords.y;
int wC = coords.z;
int d1 = coords.w;
int d2 = coords.u;
float dotProd = 0.0;
for (int b = 0; b < ${e.batchSize}; b++) {
for (int yF = 0; yF < ${e.outDepth}; yF++) {
2022-04-01 15:13:32 +02:00
int xF = wF + yF * ${t} - ${a};
2022-02-10 18:27:21 +01:00
if (xF < 0 || xF >= ${e.inDepth}) {
continue;
}
for (int yR = 0; yR < ${e.outHeight}; yR++) {
2022-04-01 15:13:32 +02:00
int xR = wR + yR * ${r} - ${s};
2022-02-10 18:27:21 +01:00
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
for (int yC = 0; yC < ${e.outWidth}; yC++) {
2022-04-01 15:13:32 +02:00
int xC = wC + yC * ${n} - ${i};
2022-02-10 18:27:21 +01:00
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
float dyValue = getDy(b, yF, yR, yC, d2);
float xValue = getX(b, xF, xR, xC, d1);
dotProd += (xValue * dyValue);
}
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},Nne=class{constructor(e){this.variableNames=["dy","W"],this.outputShape=e.inShape;let t=e.filterDepth,r=e.filterHeight,n=e.filterWidth,a=e.strideDepth,s=e.strideHeight,i=e.strideWidth,o=t-1-e.padInfo.front,l=r-1-e.padInfo.top,u=n-1-e.padInfo.left;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec3 pads = ivec3(${o}, ${l}, ${u});
2022-02-10 18:27:21 +01:00
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int d1 = coords.u;
ivec3 dyCorner = ivec3(coords.y, coords.z, coords.w) - pads;
int dyFCorner = dyCorner.x;
int dyRCorner = dyCorner.y;
int dyCCorner = dyCorner.z;
float dotProd = 0.0;
for (int wF = 0; wF < ${t}; wF++) {
2022-04-01 15:13:32 +02:00
float dyF = float(dyFCorner + wF) / ${a}.0;
2022-02-10 18:27:21 +01:00
if (dyF < 0.0 || dyF >= ${e.outDepth}.0 || fract(dyF) > 0.0) {
continue;
}
int idyF = int(dyF);
int wFPerm = ${t} - 1 - wF;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${r}; wR++) {
float dyR = float(dyRCorner + wR) / ${s}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 ||
fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
2022-04-01 15:13:32 +02:00
int wRPerm = ${r} - 1 - wR;
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${n}; wC++) {
float dyC = float(dyCCorner + wC) / ${i}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
2022-04-01 15:13:32 +02:00
int wCPerm = ${n} - 1 - wC;
2022-02-10 18:27:21 +01:00
for (int d2 = 0; d2 < ${e.outChannels}; d2++) {
float xValue = getDy(batch, idyF, idyR, idyC, d2);
float wValue = getW(wFPerm, wRPerm, wCPerm, d1, d2);
dotProd += xValue * wValue;
}
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}};function Cne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,dy:s}=t,{strides:i,pad:o,dataFormat:l,dimRoundingMode:u,filterShape:d}=n,h=N.convertConv2DDataFormat(l),p=N.computeConv2DInfo(a.shape,d,i,1,o,u,!1,h),c=new Ine(p);return r.runWebGLProgram(c,[a,s],"float32")}var Ene={kernelName:Xf,backendName:"webgl",kernelFunc:Cne};function Rne(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,filter:s}=t,{inputShape:i,strides:o,pad:l,dataFormat:u,dimRoundingMode:d}=n,h=N.convertConv2DDataFormat(u),p=N.computeConv2DInfo(i,s.shape,o,1,l,d,!1,h),c=new Sne(p);return r.runWebGLProgram(c,[a,s],"float32")}var Mne={kernelName:ei,backendName:"webgl",kernelFunc:Rne};function Fne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dilations:l}=n,u=N.computeConv3DInfo(a.shape,s.shape,i,l,o),d=new bne(u);return r.runWebGLProgram(d,[a,s],"float32")}var $ne={kernelName:Yp,backendName:"webgl",kernelFunc:Fne};function Pne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,dy:s}=t,{strides:i,pad:o,filterShape:l}=n,u=N.computeConv3DInfo(a.shape,l,i,1,o),d=new Tne(u);return r.runWebGLProgram(d,[a,s],"float32")}var _ne={kernelName:Zf,backendName:"webgl",kernelFunc:Pne};function zne(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,filter:s}=t,{pad:i,strides:o,inputShape:l}=n,u=N.computeConv3DInfo(l,s.shape,o,1,i),d=new Nne(u);return r.runWebGLProgram(d,[a,s],"float32")}var One={kernelName:Yf,backendName:"webgl",kernelFunc:zne},Dne=Td+`
2022-02-10 18:27:21 +01:00
return cos(x);
2022-04-14 17:47:08 +02:00
`,Lne=it({opSnippet:Dne}),Bne={kernelName:ti,backendName:"webgl",kernelFunc:Lne},Wne=`
2022-02-10 18:27:21 +01:00
float e2x = exp(-x);
return (e2x + 1.0 / e2x) / 2.0;
2022-04-14 17:47:08 +02:00
`,Vne=it({opSnippet:Wne}),Une={kernelName:ri,backendName:"webgl",kernelFunc:Vne},Gne=class{constructor(e,t,r,n,a){this.variableNames=["Image","Boxes","BoxInd"],this.outputShape=[];let[s,i,o,l]=e,[u]=t,[d,h]=r;this.outputShape=[u,d,h,l];let p=n==="bilinear"?1:0,[c,f]=[`${i-1}.0`,`${o-1}.0`],[m,g,y]=d>1?[`${(i-1)/(d-1)}`,"(y2-y1) * height_ratio",`y1*${c} + float(y)*(height_scale)`]:["0.0","0.0",`0.5 * (y1+y2) * ${c}`],[A,x,b]=h>1?[`${(o-1)/(h-1)}`,"(x2-x1) * width_ratio",`x1*${f} + float(x)*(width_scale)`]:["0.0","0.0",`0.5 * (x1+x2) * ${f}`];this.userCode=`
2022-02-10 18:27:21 +01:00
const float height_ratio = float(${m});
2022-04-01 15:13:32 +02:00
const float width_ratio = float(${A});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int y = coords[1];
int x = coords[2];
int d = coords[3];
// get box vals
float y1 = getBoxes(b,0);
float x1 = getBoxes(b,1);
float y2 = getBoxes(b,2);
float x2 = getBoxes(b,3);
// get image in batch index
int bInd = round(getBoxInd(b));
2022-04-01 15:13:32 +02:00
if(bInd < 0 || bInd >= ${s}) {
2022-02-10 18:27:21 +01:00
return;
}
float height_scale = ${g};
2022-04-01 15:13:32 +02:00
float width_scale = ${x};
2022-02-10 18:27:21 +01:00
float in_y = ${y};
2022-04-01 15:13:32 +02:00
if( in_y < 0.0 || in_y > ${c} ) {
setOutput(float(${a}));
2022-02-10 18:27:21 +01:00
return;
}
float in_x = ${b};
if( in_x < 0.0 || in_x > ${f} ) {
2022-04-01 15:13:32 +02:00
setOutput(float(${a}));
2022-02-10 18:27:21 +01:00
return;
}
vec2 sourceFracIndexCR = vec2(in_x,in_y);
2022-04-01 15:13:32 +02:00
if(${p} == 1) {
2022-02-10 18:27:21 +01:00
// Compute the four integer indices.
ivec2 sourceFloorCR = ivec2(sourceFracIndexCR);
ivec2 sourceCeilCR = ivec2(ceil(sourceFracIndexCR));
float topLeft = getImage(b, sourceFloorCR.y, sourceFloorCR.x, d);
float bottomLeft = getImage(b, sourceCeilCR.y, sourceFloorCR.x, d);
float topRight = getImage(b, sourceFloorCR.y, sourceCeilCR.x, d);
float bottomRight = getImage(b, sourceCeilCR.y, sourceCeilCR.x, d);
vec2 fracCR = sourceFracIndexCR - vec2(sourceFloorCR);
float top = topLeft + (topRight - topLeft) * fracCR.x;
float bottom = bottomLeft + (bottomRight - bottomLeft) * fracCR.x;
float newValue = top + (bottom - top) * fracCR.y;
setOutput(newValue);
} else {
// Compute the coordinators of nearest neighbor point.
ivec2 sourceNearestCR = ivec2(floor(
sourceFracIndexCR + vec2(0.5,0.5)));
float newValue = getImage(b, sourceNearestCR.y, sourceNearestCR.x, d);
setOutput(newValue);
}
}
2022-04-14 17:47:08 +02:00
`}},jne=e=>{let{inputs:t,backend:r,attrs:n}=e,{image:a,boxes:s,boxInd:i}=t,{cropSize:o,method:l,extrapolationValue:u}=n,d=new Gne(a.shape,s.shape,o,l,u);return r.runWebGLProgram(d,[a,s,i],"float32")},Hne={kernelName:Uo,backendName:"webgl",kernelFunc:jne},Uv=class{constructor(e,t,r){this.variableNames=["x"],this.customUniforms=[{name:"index",type:"float"}],this.outputShape=e;let n=e.length,a=t?"1.0":`getX(${Gv(n,"coords")})`,s=e[e.length-1],i="",o="";t?(i=r?`end != ${s-1}`:"end != 0",o=r?"end + 1":"end - 1"):(i=r?`end + pow2 < ${s}`:"end >= pow2",o=r?"end + pow2":"end - pow2"),this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${gt(n)} coords = getOutputCoords();
2022-04-14 17:47:08 +02:00
int end = ${jv(n,"coords")};
2022-04-01 15:13:32 +02:00
float val = ${a};
2022-02-10 18:27:21 +01:00
int pow2 = int(pow(2.0, index));
2022-04-01 15:13:32 +02:00
if (${i}) {
int idx = ${o};
2022-04-14 17:47:08 +02:00
${jv(n,"coords")} = idx;
val *= getX(${Gv(n,"coords")});
2022-02-10 18:27:21 +01:00
}
setOutput(val);
}
2022-04-14 17:47:08 +02:00
`}};function Gv(e,t){if(e===1)return`${t}`;if(e===2)return`${t}.x, ${t}.y`;if(e===3)return`${t}.x, ${t}.y, ${t}.z`;if(e===4)return`${t}.x, ${t}.y, ${t}.z, ${t}.w`;throw Error(`Cumulative product for rank ${e} is not yet supported`)}function jv(e,t){if(e===1)return`${t}`;if(e===2)return`${t}.y`;if(e===3)return`${t}.z`;if(e===4)return`${t}.w`;throw Error(`Cumulative product for rank ${e} is not yet supported`)}function qne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,exclusive:i,reverse:o}=n,l=a.shape.length,u=N.getAxesPermutation([s],l),d=a;u!=null&&(d=vr({inputs:{x:a},backend:r,attrs:{perm:u}}));let h=N.getInnerMostAxes(1,l)[0];if(h!==l-1)throw new Error(`WebGL cumprod shader expects an inner-most axis=${a.shape.length-1} but got axis=${s}`);let p=d.shape[h],c=an({inputs:{x:d},backend:r});for(let f=0;f<=Math.ceil(Math.log2(p))-1;f++){let m=new Uv(d.shape,!1,o),g=[[f]],y=c;c=r.runWebGLProgram(m,[c],c.dtype,g),r.disposeIntermediateTensorInfo(y)}if(i){let f=new Uv(d.shape,i,o),m=c;c=r.runWebGLProgram(f,[c],c.dtype),r.disposeIntermediateTensorInfo(m)}if(u!=null){let f=N.getUndoAxesPermutation(u),m=vr({inputs:{x:c},backend:r,attrs:{perm:f}});return r.disposeIntermediateTensorInfo(c),r.disposeIntermediateTensorInfo(d),m}return c}var Kne={kernelName:Gu,backendName:"webgl",kernelFunc:qne},Hv=class{constructor(e,t,r){this.variableNames=["x"],this.customUniforms=[{name:"index",type:"float"}],this.outputShape=e;let n=e.length,a=t?"0.0":`getX(${qv(n,"coords")})`,s=e[e.length-1],i="",o="";t?(i=r?`end != ${s-1}`:"end != 0",o=r?"end + 1":"end - 1"):(i=r?`end + pow2 < ${s}`:"end >= pow2",o=r?"end + pow2":"end - pow2"),this.userCode=`
2022-03-16 16:19:56 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${gt(n)} coords = getOutputCoords();
2022-04-14 17:47:08 +02:00
int end = ${Kv(n,"coords")};
2022-04-01 15:13:32 +02:00
float val = ${a};
2022-03-16 16:19:56 +01:00
int pow2 = int(pow(2.0, index));
2022-04-01 15:13:32 +02:00
if (${i}) {
int idx = ${o};
2022-04-14 17:47:08 +02:00
${Kv(n,"coords")} = idx;
val += getX(${qv(n,"coords")});
2022-03-16 16:19:56 +01:00
}
setOutput(val);
}
2022-04-14 17:47:08 +02:00
`}};function qv(e,t){if(e===1)return`${t}`;if(e===2)return`${t}.x, ${t}.y`;if(e===3)return`${t}.x, ${t}.y, ${t}.z`;if(e===4)return`${t}.x, ${t}.y, ${t}.z, ${t}.w`;throw Error(`Cumulative sum for rank ${e} is not yet supported`)}function Kv(e,t){if(e===1)return`${t}`;if(e===2)return`${t}.y`;if(e===3)return`${t}.z`;if(e===4)return`${t}.w`;throw Error(`Cumulative sum for rank ${e} is not yet supported`)}function Xne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,exclusive:i,reverse:o}=n,l=a.shape.length,u=N.getAxesPermutation([s],l),d=a;u!=null&&(d=vr({inputs:{x:a},backend:r,attrs:{perm:u}}));let h=N.getInnerMostAxes(1,l)[0];if(h!==l-1)throw new Error(`WebGL cumsum shader expects an inner-most axis=${a.shape.length-1} but got axis=${s}`);let p=d.shape[h],c=an({inputs:{x:d},backend:r});for(let f=0;f<=Math.ceil(Math.log2(p))-1;f++){let m=new Hv(d.shape,!1,o),g=[[f]],y=c;c=r.runWebGLProgram(m,[c],c.dtype,g),r.disposeIntermediateTensorInfo(y)}if(i){let f=new Hv(d.shape,i,o),m=c;c=r.runWebGLProgram(f,[c],c.dtype),r.disposeIntermediateTensorInfo(m)}if(u!=null){let f=N.getUndoAxesPermutation(u),m=vr({inputs:{x:c},backend:r,attrs:{perm:f}});return r.disposeIntermediateTensorInfo(c),r.disposeIntermediateTensorInfo(d),m}return c}var Zne={kernelName:Vo,backendName:"webgl",kernelFunc:Xne};function Yne(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,weights:s}=t,{size:i,binaryOutput:o}=n;if(a.shape.length===1){let l=r.readSync(a.dataId),u=r.readSync(s.dataId),d=US(l,u,s.dtype,s.shape,i);return r.makeTensorInfo([i],s.dtype,d)}else if(a.shape.length===2){let l=r.bufferSync(a),u=r.bufferSync(s),d=dee(l,u,i,o);return r.makeTensorInfo(d.shape,s.dtype,d.values)}throw new Error(`Error in denseBincount: input must be at most rank 2, but got rank${a.shape.length}.`)}var Jne={kernelName:Jf,backendName:"webgl",kernelFunc:Yne},Qne=class{constructor(e,t,r){this.variableNames=["x"],this.outputShape=[],this.outputShape=e,this.blockSize=t,this.dataFormat=r,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int h = ${this.getHeightCoordString()};
int w = ${this.getWidthCoordString()};
int d = ${this.getDepthCoordString()};
int in_h = h / ${t};
int offset_h = imod(h, ${t});
int in_w = w / ${t};
int offset_w = imod(w, ${t});
int offset_d = (offset_h * ${t} + offset_w) *
${this.getOutputDepthSize()};
int in_d = d + offset_d;
float result = ${this.getInputSamplingString()};
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}getHeightCoordString(){return this.dataFormat==="NHWC"?"coords[1]":"coords[2]"}getWidthCoordString(){return this.dataFormat==="NHWC"?"coords[2]":"coords[3]"}getDepthCoordString(){return this.dataFormat==="NHWC"?"coords[3]":"coords[1]"}getOutputDepthSize(){return this.dataFormat==="NHWC"?this.outputShape[3]:this.outputShape[1]}getInputSamplingString(){return this.dataFormat==="NHWC"?"getX(b, in_h, in_w, in_d)":"getX(b, in_d, in_h, in_w)"}};function eae(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockSize:s,dataFormat:i}=n,o=a.shape[0],l=i==="NHWC"?a.shape[1]:a.shape[2],u=i==="NHWC"?a.shape[2]:a.shape[3],d=i==="NHWC"?a.shape[3]:a.shape[1],h=l*s,p=u*s,c=d/(s*s),f=i==="NHWC"?[o,h,p,c]:[o,c,h,p],m=new Qne(f,s,i);return r.runWebGLProgram(m,[a],a.dtype)}var tae={kernelName:Go,backendName:"webgl",kernelFunc:eae},p8=class{constructor(e,t=!1,r=null,n=!1,a=!1){this.variableNames=["x","W"],this.customUniforms=[{name:"pads",type:"ivec2"},{name:"strides",type:"ivec2"},{name:"dilations",type:"ivec2"},{name:"inDims",type:"ivec2"}],this.outputShape=e.outShape,this.enableShapeUniforms=ln(this.outputShape.length);let s=e.filterHeight,i=e.filterWidth,o=e.outChannels/e.inChannels,l="",u="";r&&(n?l=`float activation(float a) {
2022-02-10 18:27:21 +01:00
float b = getPreluActivationWeightsAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
}`:a?l=`float activation(float a) {
2022-02-10 18:27:21 +01:00
float b = getLeakyreluAlphaAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
}`:l=`
float activation(float x) {
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,u="result = activation(result);");let d=t?"result += getBiasAtOutCoords();":"";t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),a&&this.variableNames.push("leakyreluAlpha"),this.userCode=`
2022-02-10 18:27:21 +01:00
${l}
void main() {
ivec4 coords = getOutputCoords();
int batch = coords.x;
ivec2 xRCCorner = coords.yz * strides - pads;
int d2 = coords.w;
2022-04-01 15:13:32 +02:00
int d1 = d2 / ${o};
int q = d2 - d1 * ${o};
2022-02-10 18:27:21 +01:00
int xRCorner = xRCCorner.x;
int xCCorner = xRCCorner.y;
// Convolve x(?, ?, d1) with w(:, :, d1, q) to get y(yR, yC, d2).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
// TO DO(dsmilkov): Flatten the two for loops and vec4 the operations.
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${s}; wR++) {
2022-02-10 18:27:21 +01:00
int xR = xRCorner + wR * dilations[0];
if (xR < 0 || xR >= inDims[0]) {
continue;
}
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${i}; wC++) {
2022-02-10 18:27:21 +01:00
int xC = xCCorner + wC * dilations[1];
if (xC < 0 || xC >= inDims[1]) {
continue;
}
float xVal = getX(batch, xR, xC, d1);
float wVal = getW(wR, wC, d1, q);
dotProd += xVal * wVal;
}
}
float result = dotProd;
2022-04-01 15:13:32 +02:00
${d}
2022-02-17 14:15:57 +01:00
${u}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},h8=class{constructor(e,t=!1,r=null,n=!1,a=!1){this.variableNames=["x","W"],this.packedInputs=!0,this.packedOutput=!0,this.customUniforms=[{name:"pads",type:"ivec2"},{name:"strides",type:"ivec2"},{name:"dilations",type:"ivec2"},{name:"inDims",type:"ivec2"}],this.outputShape=e.outShape,this.enableShapeUniforms=ln(this.outputShape.length);let s=e.outChannels/e.inChannels,i=e.padInfo.left,o=e.strideWidth,l=e.dilationWidth,u=e.filterHeight,d=e.filterWidth,h=d,p=`
2022-02-10 18:27:21 +01:00
int xR; int xC; int xCOffset;
2022-04-01 15:13:32 +02:00
vec4 wTexel; vec4 previous; vec4 final;`;for(let g=0;g<d;g++)p+=`
2022-02-10 18:27:21 +01:00
vec4 xTexelC${g*2};
int xTexelC${g*2}Ready;
vec4 xTexelC${g*2+1};
int xTexelC${g*2+1}Ready;
2022-04-01 15:13:32 +02:00
vec4 xC${g};`;p+=`
2022-02-17 14:15:57 +01:00
for (int r = 0; r < ${u}; r++) {
2022-04-01 15:13:32 +02:00
`;for(let g=0;g<d;g++)p+=`
2022-02-10 18:27:21 +01:00
xTexelC${g*2} = vec4(0.0);
xTexelC${g*2}Ready = 0;
xTexelC${g*2+1} = vec4(0.0);
xTexelC${g*2+1}Ready = 0;
2022-04-01 15:13:32 +02:00
xC${g} = vec4(0.0);`;p+=`
2022-02-10 18:27:21 +01:00
xR = xRCorner + r * dilations[0];
if (xR >=0 && xR < inDims[0]) {
2022-04-01 15:13:32 +02:00
`;for(let g=0;g<(h+1)/2;g++){let y=g*2;if(p+=`
2022-02-10 18:27:21 +01:00
xC = xCCorner + ${y*l};
2022-04-01 15:13:32 +02:00
`,o===1){if(y<d&&(i%2===1?(p+=`
2022-02-10 18:27:21 +01:00
xCOffset = xC + 1;
if (xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y}Ready == 0) {
xTexelC${y} = getX(batch, xR, xCOffset, d1);
// Need to manually clear unused channels in case
// we're reading from recycled texture.
if (xCOffset + 1 >= inDims[1]) {
xTexelC${y}.zw = vec2(0.0);
}
xTexelC${y}Ready = 1;
}
2022-04-01 15:13:32 +02:00
`,l===1&&y>0?p+=`
2022-02-10 18:27:21 +01:00
xC${y} = vec4(xTexelC${y-2}.zw, xTexelC${y}.xy);
2022-04-01 15:13:32 +02:00
`:p+=`
2022-02-10 18:27:21 +01:00
xCOffset = xC + 1 - 2;
if (xCOffset >= 0 && xCOffset < inDims[1]) {
previous = getX(batch, xR, xCOffset, d1);
// Need to manually clear unused channels in case
// we're reading from recycled texture.
if (xCOffset + 1 >= inDims[1]) {
previous.zw = vec2(0.0);
}
xC${y} = vec4(previous.zw, xTexelC${y}.xy);
} else {
xC${y} = vec4(0.0, 0.0, xTexelC${y}.xy);
}
2022-04-01 15:13:32 +02:00
`):p+=`
2022-02-10 18:27:21 +01:00
if (xC >= 0 && xC < inDims[1] && xTexelC${y}Ready == 0) {
xTexelC${y} = getX(batch, xR, xC, d1);
if (xC + 1 >= inDims[1]) {
xTexelC${y}.zw = vec2(0.0);
}
xTexelC${y}Ready = 1;
}
xC${y} = xTexelC${y};
2022-04-11 17:45:24 +02:00
`,y+1<d)){let A=i%2===0?w.nearestLargerEven(l):l;l%2===0&&i%2===1||l%2!==0&&i%2!==1?(p+=`
2022-04-01 15:13:32 +02:00
xCOffset = xC + imod(pads[1], 2) + ${A};
2022-02-10 18:27:21 +01:00
if (xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y+1}Ready == 0) {
xTexelC${y+1} = getX(batch, xR, xCOffset, d1);
// Need to manually clear unused channels in case
// we're reading from recycled texture.
if (xCOffset + 1 >= inDims[1]) {
xTexelC${y+1}.zw = vec2(0.0);
}
xTexelC${y+1}Ready = 1;
}
2022-04-01 15:13:32 +02:00
`,l>1&&(p+=`
2022-02-10 18:27:21 +01:00
xCOffset -= 2;
if (xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y}Ready == 0) {
xTexelC${y} = getX(batch, xR, xCOffset, d1);
xTexelC${y}Ready = 1;
}
2022-04-01 15:13:32 +02:00
`),p+=`
2022-02-10 18:27:21 +01:00
xC${y+1} = vec4(xTexelC${y}.zw, xTexelC${y+1}.xy);
2022-04-01 15:13:32 +02:00
`):A===1?p+=`
2022-02-10 18:27:21 +01:00
xC${y+1} = xTexelC${y};
2022-04-01 15:13:32 +02:00
`:p+=`
xCOffset = xC + ${A};
2022-02-10 18:27:21 +01:00
if (xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y+1}Ready == 0) {
xTexelC${y+1} = getX(batch, xR, xCOffset, d1);
if (xCOffset + 1 >= inDims[1]) {
xTexelC${y+1}.zw = vec2(0.0);
}
xTexelC${y+1}Ready = 1;
}
xC${y+1} = xTexelC${y+1};
2022-04-01 15:13:32 +02:00
`}}else y<d&&(i%2===1?(p+=`
2022-02-10 18:27:21 +01:00
xCOffset = xC + 1 - strides[1];
if(xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y}Ready == 0) {
xTexelC${y} = getX(batch, xR, xCOffset, d1);
// Need to manually clear unused channels in case
// we're reading from recycled texture.
if (xCOffset + 1 >= inDims[1]) {
xTexelC${y}.zw = vec2(0.0);
}
xTexelC${y}Ready = 1;
}
if(xC + 1 >= 0 && xC + 1 < inDims[1] && xTexelC${y+1}Ready == 0) {
xTexelC${y+1} = getX(batch, xR, xC + 1, d1);
// Need to manually clear unused channels in case
// we're reading from recycled texture.
if (xC + 2 >= inDims[1]) {
xTexelC${y+1}.zw = vec2(0.0);
}
xTexelC${y+1}Ready = 1;
}
xC${y} = vec4(xTexelC${y}.zw, xTexelC${y+1}.zw);
2022-04-01 15:13:32 +02:00
`,y+1<d&&(p+=`
2022-02-10 18:27:21 +01:00
final = vec4(0.0);
xCOffset = xC + 1 + strides[1];
if(xCOffset >= 0 && xCOffset < inDims[1]) {
final = getX(batch, xR, xCOffset, d1);
}
xC${y+1} = vec4(xTexelC${y+1}.xy, final.xy);
2022-04-01 15:13:32 +02:00
`)):(p+=`
2022-02-10 18:27:21 +01:00
if(xC >= 0 && xC < inDims[1] && xTexelC${y}Ready == 0) {
xTexelC${y} = getX(batch, xR, xC, d1);
if (xC + 1 >= inDims[1]) {
xTexelC${y}.zw = vec2(0.0);
}
xTexelC${y}Ready = 1;
}
xCOffset = xC + strides[1];
if(xCOffset >= 0 && xCOffset < inDims[1] && xTexelC${y+1}Ready == 0) {
xTexelC${y+1} = getX(batch, xR, xCOffset, d1);
if (xCOffset + 1 >= inDims[1]) {
xTexelC${y+1}.zw = vec2(0.);
}
xTexelC${y+1}Ready = 1;
}
xC${y} = vec4(
xTexelC${y}.xy, xTexelC${y+1}.xy);
2022-04-01 15:13:32 +02:00
`,y+1<d&&(p+=`
2022-02-10 18:27:21 +01:00
xC${y+1} = vec4(xTexelC${y}.zw, xTexelC${y+1}.zw);
2022-04-01 15:13:32 +02:00
`)));y<d&&(p+=`
2022-02-10 18:27:21 +01:00
wTexel = getW(r, ${y}, d1, q);
dotProd += xC${y} * vec4(wTexel.xz, wTexel.xz);
2022-04-01 15:13:32 +02:00
`,y+1<d&&(p+=`
2022-02-10 18:27:21 +01:00
wTexel = getW(r, ${y+1}, d1, q);
dotProd += xC${y+1} * vec4(wTexel.xz, wTexel.xz);
2022-04-01 15:13:32 +02:00
`))}p+=`
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,p+=`
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let c="",f="";r&&(n?c=`vec4 activation(vec4 a) {
2022-02-10 18:27:21 +01:00
vec4 b = getPreluActivationWeightsAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
}`:a?c=`vec4 activation(vec4 a) {
2022-02-10 18:27:21 +01:00
vec4 b = getLeakyreluAlphaAtOutCoords();
2022-04-01 15:13:32 +02:00
${r}
}`:c=`vec4 activation(vec4 x) {
${r}
}`,f="result = activation(result);");let m=t?"result += getBiasAtOutCoords();":"";t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),a&&this.variableNames.push("leakyreluAlpha"),this.userCode=`
${c}
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int batch = coords.x;
ivec2 xRCCorner = coords.yz * strides - pads;
int d2 = coords.w;
2022-04-01 15:13:32 +02:00
int d1 = d2 / ${s};
int q = d2 - d1 * ${s};
2022-02-10 18:27:21 +01:00
int xRCorner = xRCCorner.x;
int xCCorner = xRCCorner.y;
//intialize dotProd with a small epsilon seems to reduce GPU accuracy loss.
vec4 dotProd = vec4(0.000000000000001);
2022-04-01 15:13:32 +02:00
${p}
2022-02-10 18:27:21 +01:00
vec4 result = dotProd - vec4(0.000000000000001);
${m}
${f}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function rae(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dilations:l,dimRoundingMode:u}=n,d=l;d==null&&(d=[1,1]),w.assert(N.eitherStridesOrDilationsAreOne(i,d),()=>`Error in depthwiseConv2d: Either strides or dilations must be 1. Got strides ${i} and dilations '${d}'`);let h=N.computeConv2DInfo(a.shape,s.shape,i,d,o,u,!0),p;Y().getBool("WEBGL_PACK_DEPTHWISECONV")&&h.strideWidth<=2&&h.outChannels/h.inChannels===1?p=new h8(h):p=new p8(h);let c=[[h.padInfo.top,h.padInfo.left],[h.strideHeight,h.strideWidth],[h.dilationHeight,h.dilationWidth],[h.inHeight,h.inWidth]];return r.runWebGLProgram(p,[a,s],"float32",c)}var nae={kernelName:ni,backendName:"webgl",kernelFunc:rae},aae=class{constructor(e){this.variableNames=["x","dy"],this.outputShape=e.filterShape;let t=e.strideHeight,r=e.strideWidth,n=e.padInfo.top,a=e.padInfo.left,s=e.outChannels/e.inChannels;this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int wR = coords.x;
int wC = coords.y;
int d1 = coords.z;
int dm = coords.w;
2022-04-01 15:13:32 +02:00
int d2 = d1 * ${s} + dm;
2022-02-10 18:27:21 +01:00
float dotProd = 0.0;
// TO DO: Vec4 over the batch size
for (int b = 0; b < ${e.batchSize}; b++) {
for (int yR = 0; yR < ${e.outHeight}; yR++) {
2022-04-01 15:13:32 +02:00
int xR = wR + yR * ${t} - ${n};
2022-02-10 18:27:21 +01:00
if (xR < 0 || xR >= ${e.inHeight}) {
continue;
}
for (int yC = 0; yC < ${e.outWidth}; yC++) {
2022-04-01 15:13:32 +02:00
int xC = wC + yC * ${r} - ${a};
2022-02-10 18:27:21 +01:00
if (xC < 0 || xC >= ${e.inWidth}) {
continue;
}
float dyValue = getDy(b, yR, yC, d2);
float xValue = getX(b, xR, xC, d1);
dotProd += (xValue * dyValue);
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},sae=class{constructor(e){this.variableNames=["dy","W"],this.outputShape=e.inShape;let t=e.filterHeight,r=e.filterWidth,n=e.strideHeight,a=e.strideWidth,s=t-1-e.padInfo.top,i=r-1-e.padInfo.left,o=e.outChannels/e.inChannels;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 pads = ivec2(${s}, ${i});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int batch = coords[0];
int d1 = coords[3];
ivec2 dyCorner = coords.yz - pads;
int dyRCorner = dyCorner.x;
int dyCCorner = dyCorner.y;
float dotProd = 0.0;
for (int wR = 0; wR < ${t}; wR++) {
2022-04-01 15:13:32 +02:00
float dyR = float(dyRCorner + wR) / ${n}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 || fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
int wRPerm = ${t} - 1 - wR;
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${r}; wC++) {
float dyC = float(dyCCorner + wC) / ${a}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
2022-04-01 15:13:32 +02:00
int wCPerm = ${r} - 1 - wC;
2022-02-10 18:27:21 +01:00
// TO DO: Vec4 over the channelMul
2022-04-01 15:13:32 +02:00
for (int dm = 0; dm < ${o}; dm++) {
int d2 = d1 * ${o} + dm;
2022-02-10 18:27:21 +01:00
float xValue = getDy(batch, idyR, idyC, d2);
float wValue = getW(wRPerm, wCPerm, d1, dm);
dotProd += xValue * wValue;
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}};
/**
 * Kernel function computing the filter gradient of a depthwise convolution.
 * Builds the conv info from x.shape and the filterShape attribute, then runs
 * program aae on [x, dy] with a float32 output.
 *
 * @param e Kernel arguments: {inputs: {x, dy}, backend, attrs}.
 * @returns The result of backend.runWebGLProgram.
 */
function iae(e) {
  const { inputs, backend, attrs } = e;
  const { x, dy } = inputs;
  const { strides, dilations, pad, dimRoundingMode, filterShape } = attrs;
  const convInfo = N.computeConv2DInfo(x.shape, filterShape, strides, dilations, pad, dimRoundingMode, true);
  const program = new aae(convInfo);
  return backend.runWebGLProgram(program, [x, dy], "float32");
}
// Kernel configuration binding iae to the webgl backend.
var oae = { kernelName: Qf, backendName: "webgl", kernelFunc: iae };
/**
 * Kernel function computing the input gradient of a depthwise convolution.
 * Builds the conv info from the inputShape attribute and filter.shape, then
 * runs program sae on [dy, filter] with a float32 output.
 *
 * @param e Kernel arguments: {inputs: {dy, filter}, backend, attrs}.
 * @returns The result of backend.runWebGLProgram.
 */
function lae(e) {
  const { inputs, backend, attrs } = e;
  const { dy, filter } = inputs;
  const { strides, dilations, pad, dimRoundingMode, inputShape } = attrs;
  const convInfo = N.computeConv2DInfo(inputShape, filter.shape, strides, dilations, pad, dimRoundingMode, true);
  const program = new sae(convInfo);
  return backend.runWebGLProgram(program, [dy, filter], "float32");
}
// Kernel configuration binding lae to the webgl backend.
var uae = { kernelName: em, backendName: "webgl", kernelFunc: lae },
  // Shader program producing an [e, e] output that holds X on the main
  // diagonal and 0.0 elsewhere.
  dae = class {
    constructor(e) {
      this.variableNames = ["X"], this.outputShape = [e, e], this.userCode = `
2022-02-10 18:27:21 +01:00
void main() {
ivec2 coords = getOutputCoords();
float val = coords[0] == coords[1] ? getX(coords[0]) : 0.0;
setOutput(val);
}
2022-04-14 17:47:08 +02:00
`}};
/**
 * Kernel function that places the elements of x on the diagonal of a tensor
 * whose shape is x.shape repeated twice.
 * x is flattened, program dae builds a [size, size] result, and that result
 * is reshaped to the final shape. Both intermediates are disposed.
 *
 * @param e Kernel arguments: {inputs: {x}, backend}.
 * @returns The reshaped tensor info.
 */
function pae(e) {
  const { inputs, backend } = e;
  const { x } = inputs;
  const resultShape = [...x.shape, ...x.shape];
  const elementCount = w.sizeFromShape(x.shape);
  const flattened = ve({ inputs: { x }, backend, attrs: { shape: [elementCount] } });
  const program = new dae(elementCount);
  const squareDiag = backend.runWebGLProgram(program, [flattened], flattened.dtype);
  const result = ve({ inputs: { x: squareDiag }, backend, attrs: { shape: resultShape } });
  backend.disposeIntermediateTensorInfo(flattened);
  backend.disposeIntermediateTensorInfo(squareDiag);
  return result;
}
// Kernel configuration binding pae to the webgl backend.
var hae = { kernelName: tm, backendName: "webgl", kernelFunc: pae },
  // Shader program with inputs x and W: for each output position it takes
  // the maximum of x + W over the dilated filter window, starting from
  // -3.4e38 and ignoring positions outside the input.
  cae = class {
    constructor(e) {
      this.variableNames = ["x", "W"], this.outputShape = e.outShape;
      let { inHeight: t, inWidth: r, padInfo: n, strideHeight: a, strideWidth: s, filterHeight: i, filterWidth: o, dilationHeight: l, dilationWidth: u } = e, { top: d, left: h } = n;
      this.userCode = `
2022-04-01 15:13:32 +02:00
const ivec2 strides = ivec2(${a}, ${s});
const ivec2 pads = ivec2(${d}, ${h});
2022-02-10 18:27:21 +01:00
const float neg_infinity = -3.4e38;
void main() {
ivec4 coords = getOutputCoords();
int batch = coords.x;
int d1 = coords.w;
ivec2 outTopLeftCorner =
coords.yz * strides - pads;
int hBeg = outTopLeftCorner.x;
int wBeg = outTopLeftCorner.y;
float curVal = neg_infinity;
2022-04-01 15:13:32 +02:00
for (int h = 0; h < ${i}; h++) {
2022-02-10 18:27:21 +01:00
int hIn = hBeg + h * ${l};
if (hIn >= 0 && hIn < ${t}) {
2022-04-01 15:13:32 +02:00
for (int w = 0; w < ${o}; w++) {
2022-02-17 14:15:57 +01:00
int wIn = wBeg + w * ${u};
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
if (wIn >= 0 && wIn < ${r}) {
2022-02-10 18:27:21 +01:00
float xVal = getX(batch, hIn, wIn, d1);
float wVal = getW(h, w, d1);
float val = xVal + wVal;
if (val > curVal) {
curVal = val;
}
}
}
}
}
float result = curVal;
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}};function fae(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dilations:l}=n,u=N.computeDilation2DInfo(a.shape,s.shape,i,o,"NHWC",l),d,h=new cae(u);d=r.runWebGLProgram(h,[a,s],"float32");let p=ve({inputs:{x:d},backend:r,attrs:{shape:u.outShape}});return r.disposeIntermediateTensorInfo(d),p}var mae={kernelName:Jp,backendName:"webgl",kernelFunc:fae};function gae(e){let{inputs:t,backend:r,attrs:n}=e,{equation:a}=n,s=t,{allDims:i,summedDims:o,idDims:l}=N.decodeEinsumEquation(a,s.length);N.checkEinsumDimSizes(i.length,l,s);let{path:u,steps:d}=N.getEinsumComputePath(o,l),h=d.length,p=null,c=i.length,f=[];for(let m=0;m<h;++m){for(let g of d[m]){let{permutationIndices:y,expandDims:A}=N.getEinsumPermutation(c,l[g]),x;N.isIdentityPermutation(y)?x=s[g]:(x=vr({inputs:{x:s[g]},backend:r,attrs:{perm:y}}),f.push(x));let b=x.shape.slice();for(let v=0;v<A.length;++v)b.splice(A[v],0,1);w.arraysEqual(x.shape,b)||(x=ve({inputs:{x},backend:r,attrs:{shape:b}}),f.push(x)),p===null?p=x:(p=mb({inputs:{a:x,b:p},backend:r}),f.push(p))}m<h-1&&(u[m]>=0&&(p=b0({inputs:{x:p},backend:r,attrs:{axis:u[m]-(i.length-c),keepDims:!1}}),f.push(p)),c--)}for(let m of f)m!==p&&r.disposeIntermediateTensorInfo(m);return p}var yae={kernelName:Qp,backendName:"webgl",kernelFunc:gae},Aae="return (x >= 0.0) ? x : (exp(x) - 1.0);",xae=`
2022-02-10 18:27:21 +01:00
vec4 result;
result.r = (x.r >= 0.0) ? x.r : (exp(x.r) - 1.0);
result.g = (x.g >= 0.0) ? x.g : (exp(x.g) - 1.0);
result.b = (x.b >= 0.0) ? x.b : (exp(x.b) - 1.0);
result.a = (x.a >= 0.0) ? x.a : (exp(x.a) - 1.0);
return result;
2022-04-14 17:47:08 +02:00
`,
// Unary kernel built from the unpacked (Aae) and packed (xae) snippets:
// x for x >= 0, exp(x) - 1 otherwise.
bae=it({opSnippet:Aae,packedOpSnippet:xae}),
// Kernel configuration binding bae to the webgl backend.
vae={kernelName:si,backendName:"webgl",kernelFunc:bae},
// Unpacked gradient snippet: a is the incoming gradient, b the forward
// output y. For y >= 0 the forward function is the identity, so the gradient
// passes through unchanged; for y < 0 the derivative is exp(x) = y + 1.
// The threshold is 0.0 so that this snippet agrees with the packed snippet
// kae, which tests greaterThanEqual(b, vec4(0.)). A threshold of 1.0 would
// wrongly scale the gradient by (y + 1) for outputs in [0, 1).
wae="return (b >= 0.0) ? a : a * (b + 1.0);",
// Packed (vec4) form of the same gradient.
kae=`
2022-02-10 18:27:21 +01:00
vec4 bGTEZero = vec4(greaterThanEqual(b, vec4(0.)));
return (bGTEZero * a) + ((vec4(1.0) - bGTEZero) * (a * (b + vec4(1.0))));
2022-04-14 17:47:08 +02:00
`,
/**
 * Kernel function for the gradient step that combines dy and y.
 * When the WEBGL_PACK_BINARY_OPERATIONS flag is set it runs program Dh with
 * snippet kae, otherwise program Mu with snippet wae. The output dtype is
 * dy.dtype.
 *
 * @param e Kernel arguments: {inputs: {dy, y}, backend}.
 * @returns The result of backend.runWebGLProgram.
 */
Iae = (e) => {
  const { inputs, backend } = e;
  const { dy, y } = inputs;
  const usePackedBinary = Y().getBool("WEBGL_PACK_BINARY_OPERATIONS");
  const program = usePackedBinary
    ? new Dh(kae, dy.shape, y.shape)
    : new Mu(wae, dy.shape, y.shape);
  return backend.runWebGLProgram(program, [dy, y], dy.dtype);
},
// Kernel configuration binding Iae to the webgl backend.
Sae = { kernelName: rm, backendName: "webgl", kernelFunc: Iae },
// Packed (vec4) snippet returning equal(a, b) as a vec4.
Tae = `
2022-02-10 18:27:21 +01:00
return vec4(equal(a, b));
2022-04-14 17:47:08 +02:00
`,Nae="return float(a == b);",Cae=wr({opSnippet:Nae,packedOpSnippet:Tae,dtype:"bool",cpuKernelImpl:cee}),Eae={kernelName:jo,backendName:"webgl",kernelFunc:Cae},Rae=`
2022-02-10 18:27:21 +01:00
// Error function is calculated approximately with elementary function.
// See "Handbook of Mathematical Functions with Formulas,
// Graphs, and Mathematical Tables", Abramowitz and Stegun.
2022-04-01 15:13:32 +02:00
float p = ${N.ERF_P};
float a1 = ${N.ERF_A1};
float a2 = ${N.ERF_A2};
float a3 = ${N.ERF_A3};
float a4 = ${N.ERF_A4};
float a5 = ${N.ERF_A5};
2022-02-10 18:27:21 +01:00
float sign = sign(x);
x = abs(x);
float t = 1.0 / (1.0 + p * x);
return sign * (1.0 - (((((a5*t + a4)*t) + a3)*t + a2)*t + a1)*t*exp(-x*x));
2022-04-14 17:47:08 +02:00
`,Mae=it({opSnippet:Rae}),Fae={kernelName:ju,backendName:"webgl",kernelFunc:Mae},$ae=Td+`
2022-02-10 18:27:21 +01:00
return exp(x);
2022-04-14 17:47:08 +02:00
`,Pae=`
2022-02-10 18:27:21 +01:00
vec4 result = exp(x);
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,c8=it({opSnippet:$ae,packedOpSnippet:Pae,cpuKernelImpl:fee,dtype:"float32"}),_ae={kernelName:ii,backendName:"webgl",kernelFunc:c8};function Jy(e){let{inputs:t,attrs:r,backend:n}=e,{dim:a}=r,{input:s}=t,i=s.shape.length,o=s.shape.slice(),l=a;return a<0&&(w.assert(-(i+1)<=a,()=>`Axis must be in the interval [${-(i+1)}, ${i}]`),l=i+a+1),o.splice(l,0,1),ve({inputs:{x:s},backend:n,attrs:{shape:o}})}var zae={kernelName:Ho,backendName:"webgl",kernelFunc:Jy},Xv="return exp(x) - 1.0;",Oae=it({opSnippet:Xv,packedOpSnippet:Xv,cpuKernelImpl:mee}),Dae={kernelName:qo,backendName:"webgl",kernelFunc:Oae},Zv=class{constructor(e,t,r){this.variableNames=["real","imag"];let n=t[1];this.outputShape=t;let a=r?`2.0 * ${Math.PI}`:`-2.0 * ${Math.PI}`,s=r?`${n}.0`:"1.0",i;if(e==="real")i="return real * expR - imag * expI;";else if(e==="imag")i="return real * expI + imag * expR;";else throw new Error(`FFT component must be either "real" or "imag", got ${e}.`);this.userCode=`
2022-04-01 15:13:32 +02:00
const float exponentMultiplier = ${a};
2022-02-10 18:27:21 +01:00
float unaryOpComplex(float real, float expR, float imag, float expI) {
2022-04-01 15:13:32 +02:00
${i}
2022-02-10 18:27:21 +01:00
}
float mulMatDFT(int batch, int index) {
2022-04-01 15:13:32 +02:00
float indexRatio = float(index) / float(${n});
2022-02-10 18:27:21 +01:00
float exponentMultiplierTimesIndexRatio =
exponentMultiplier * indexRatio;
float result = 0.0;
2022-04-01 15:13:32 +02:00
for (int i = 0; i < ${n}; i++) {
2022-02-10 18:27:21 +01:00
// x = (-2|2 * PI / N) * index * i;
float x = exponentMultiplierTimesIndexRatio * float(i);
float expR = cos(x);
float expI = sin(x);
float real = getReal(batch, i);
float imag = getImag(batch, i);
result +=
2022-04-01 15:13:32 +02:00
unaryOpComplex(real, expR, imag, expI) / ${s};
2022-02-10 18:27:21 +01:00
}
return result;
}
void main() {
ivec2 coords = getOutputCoords();
setOutput(mulMatDFT(coords[0], coords[1]));
}
2022-04-14 17:47:08 +02:00
`}};function f8(e,t,r){let n=r.texData.get(e.dataId),a=w.sizeFromShape(e.shape),s=e.shape[e.shape.length-1],i=a/s,o=ve({inputs:{x:e},backend:r,attrs:{shape:[i,s]}}),l=o.shape,u=new Zv("real",l,t),d=new Zv("imag",l,t),h=[{dataId:n.complexTensorInfos.real.dataId,dtype:n.complexTensorInfos.real.dtype,shape:l},{dataId:n.complexTensorInfos.imag.dataId,dtype:n.complexTensorInfos.imag.dtype,shape:l}],p=r.runWebGLProgram(u,h,"float32"),c=r.runWebGLProgram(d,h,"float32"),f=Vi({inputs:{real:p,imag:c},backend:r});r.disposeIntermediateTensorInfo(p),r.disposeIntermediateTensorInfo(c);let m=ve({inputs:{x:f},backend:r,attrs:{shape:e.shape}});return r.disposeIntermediateTensorInfo(o),r.disposeIntermediateTensorInfo(f),m}function Lae(e){let{inputs:t,backend:r}=e,{input:n}=t;return f8(n,!1,r)}var Bae={kernelName:nm,backendName:"webgl",kernelFunc:Lae},Wae=class{constructor(e,t){this.outputShape=[],this.customUniforms=[{name:"value",type:"float"}],this.variableNames=["x"],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
// Input can be obtained from uniform value.
setOutput(value);
}
2022-04-14 17:47:08 +02:00
`}};
/**
 * Kernel function creating a tensor of the given shape filled with value.
 * The dtype attribute is used when truthy, otherwise it is inferred from
 * value. String tensors are filled on the CPU; every other dtype runs
 * program Wae with value passed as its custom value.
 *
 * @param e Kernel arguments: {backend, attrs: {shape, value, dtype}}.
 * @returns The filled tensor info.
 */
function Bh(e) {
  const { backend, attrs } = e;
  const { shape, value } = attrs;
  const dtype = attrs.dtype || w.inferDtype(value);
  if (dtype === "string") {
    const filled = w.getArrayFromDType(dtype, w.sizeFromShape(shape));
    filled.fill(value);
    return backend.makeTensorInfo(shape, dtype, filled);
  }
  const program = new Wae(shape, value);
  const customValues = [[value]];
  return backend.runWebGLProgram(program, [], dtype, customValues);
}
// Kernel configuration binding Bh to the webgl backend.
var Vae = { kernelName: Hu, backendName: "webgl", kernelFunc: Bh },
  // Shader program mirroring Image along its third dimension: output
  // coordinate x reads from e[2] - x - 1.
  Uae = class {
    constructor(e) {
      this.variableNames = ["Image"], this.outputShape = [];
      let t = e[2];
      this.outputShape = e, this.userCode = `
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int x = coords[2];
int coordX = ${t} - x - 1;
float outputValue;
if(coordX >= 0 && coordX < ${t}) {
outputValue = getImage(coords[0], coords[1], coordX, coords[3]);
} else {
outputValue = getImage(coords[0], coords[1], coords[2], coords[3]);
}
setOutput(outputValue);
}
2022-04-14 17:47:08 +02:00
`}},Gae={kernelName:Ko,backendName:"webgl",kernelFunc:({inputs:e,backend:t})=>{let{image:r}=e,n=t,a=new Uae(r.shape);return n.runWebGLProgram(a,[r],r.dtype)}},Yv="return floor(x);",jae=it({opSnippet:Yv,packedOpSnippet:Yv,cpuKernelImpl:gee}),Hae={kernelName:oi,backendName:"webgl",kernelFunc:jae},qae=`
2022-02-10 18:27:21 +01:00
float s = sign(a) * sign(b);
int ia = round(a);
int ib = round(b);
if (ib != 0) {
// Windows (D3D) wants guaranteed non-zero int division at compile-time.
return float(idiv(ia, ib, s));
} else {
return NAN;
}
2022-04-14 17:47:08 +02:00
`,Kae=`
2022-02-10 18:27:21 +01:00
ivec4 ia = round(a);
ivec4 ib = round(b);
bvec4 cond = notEqual(ib, ivec4(0));
ivec4 result = ivec4(0);
vec4 s = sign(a) * sign(b);
// Windows (D3D) wants guaranteed non-zero int division at compile-time.
if (cond[0]) {
result[0] = idiv(ia[0], ib[0], s[0]);
}
if (cond[1]) {
result[1] = idiv(ia[1], ib[1], s[1]);
}
if (cond[2]) {
result[2] = idiv(ia[2], ib[2], s[2]);
}
if (cond[3]) {
result[3] = idiv(ia[3], ib[3], s[3]);
}
return vec4(result);
2022-04-14 17:47:08 +02:00
`,Xae=wr({opSnippet:qae,packedOpSnippet:Kae,dtype:"int32"}),Zae={kernelName:li,backendName:"webgl",kernelFunc:Xae},Yae=class{constructor(e){this.variableNames=["A"];let t=Gr(),[r,n]=e;this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec3 coords = getOutputCoords();
int texR = coords[0];
int texC = coords[1];
int depth = coords[2];
2022-04-01 15:13:32 +02:00
vec2 uv = (vec2(texC, texR) + halfCR) / vec2(${n}.0, ${r}.0);
2022-02-10 18:27:21 +01:00
vec4 values = ${t.texture2D}(A, uv);
float value;
if (depth == 0) {
value = values.r;
} else if (depth == 1) {
value = values.g;
} else if (depth == 2) {
value = values.b;
} else if (depth == 3) {
value = values.a;
}
setOutput(floor(value * 255.0 + 0.5));
}
2022-04-14 17:47:08 +02:00
`}},Jae=class{constructor(e){this.variableNames=["A"],this.packedInputs=!1,this.packedOutput=!0;let t=Gr(),[r,n]=e;this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec3 coords = getOutputCoords();
int texR = coords[0];
int texC = coords[1];
int depth = coords[2];
vec4 result = vec4(0.);
for(int row=0; row<=1; row++) {
for(int col=0; col<=1; col++) {
texC = coords[1] + row;
depth = coords[2] + col;
vec2 uv = (vec2(texC, texR) + halfCR) /
2022-04-01 15:13:32 +02:00
vec2(${n}.0, ${r}.0);
2022-02-10 18:27:21 +01:00
vec4 values = ${t.texture2D}(A, uv);
float value;
if (depth == 0) {
value = values.r;
} else if (depth == 1) {
value = values.g;
} else if (depth == 2) {
value = values.b;
} else if (depth == 3) {
value = values.a;
}
result[row * 2 + col] = floor(value * 255.0 + 0.5);
}
}
${t.output} = result;
}
2022-04-14 17:47:08 +02:00
`}},/* Kernel configuration binding ese to the webgl backend. */Qae={kernelName:Pp,backendName:"webgl",kernelFunc:ese},/* Lazily created 2D canvas context, reused across calls of ese. */ou;/**
 * Kernel function turning a pixel source into an int32 tensor of shape
 * [height, width, numChannels].
 * Video and image elements are first drawn onto the shared canvas (created on
 * first use), which then replaces them as the upload source. The pixels are
 * uploaded into a temporary [height, width] int32 tensor whose texData usage
 * is set to 2 (presumably the pixel-texture usage value; confirm), and program
 * Jae (flag WEBGL_PACK set) or Yae reads them back out per channel.
 * @param e Kernel arguments: {inputs: {pixels}, backend, attrs: {numChannels}}.
 * @returns The int32 result; the temporary upload tensor is disposed.
 */function ese(e){let{inputs:t,backend:r,attrs:n}=e,{pixels:a}=t,{numChannels:s}=n,i=typeof HTMLVideoElement!="undefined"&&a instanceof HTMLVideoElement,o=typeof HTMLImageElement!="undefined"&&a instanceof HTMLImageElement,[l,u]=i?[a.videoWidth,a.videoHeight]:[a.width,a.height],d=[u,l],h=[u,l,s];(o||i)&&(ou==null&&(ou=document.createElement("canvas").getContext("2d")),ou.canvas.width=l,ou.canvas.height=u,ou.drawImage(a,0,0,l,u),a=ou.canvas);let p=r.makeTensorInfo(d,"int32");r.texData.get(p.dataId).usage=2,r.gpgpu.uploadPixelDataToTexture(r.getTexture(p.dataId),a);let c=Y().getBool("WEBGL_PACK")?new Jae(h):new Yae(h),f=r.runWebGLProgram(c,[p],"int32");return r.disposeData(p.dataId),f}/**
 * Kernel function for a 2D convolution with optional bias and activation.
 * Three strategies, tried in this order:
 *  1. u8 when the filter is 1x1 with unit strides and dilations and the
 *     padding type is SAME or VALID;
 *  2. d8 when the WEBGL_CONV_IM2COL flag is set and the batch size is 1;
 *  3. program l8 otherwise, with bias, prelu weights and a scalar
 *     leakyrelu alpha tensor appended to the inputs when applicable.
 * The chosen result is reshaped to convInfo.outShape; the pre-reshape result
 * and the temporary alpha tensor are disposed.
 * @param e Kernel arguments: {inputs: {x, filter, bias, preluActivationWeights}, backend, attrs}.
 * @returns The reshaped tensor info.
 */function tse(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s,bias:i,preluActivationWeights:o}=t,{strides:l,pad:u,dataFormat:d,dilations:h,dimRoundingMode:p,activation:c,leakyreluAlpha:f}=n,m=N.convertConv2DDataFormat(d),g=N.computeConv2DInfo(a.shape,s.shape,l,h,u,p,!1,m),y,A=[];if(g.filterHeight===1&&g.filterWidth===1&&g.dilationHeight===1&&g.dilationWidth===1&&g.strideHeight===1&&g.strideWidth===1&&(g.padInfo.type==="SAME"||g.padInfo.type==="VALID"))y=u8({x:a,filter:s,convInfo:g,backend:r,bias:i,activation:c,preluActivationWeights:o,leakyreluAlpha:f});else if(Y().getBool("WEBGL_CONV_IM2COL")&&a.shape[0]===1)y=d8({x:a,filter:s,convInfo:g,backend:r,bias:i,activation:c,preluActivationWeights:o,leakyreluAlpha:f});else{let b=i!=null,v=o!=null,S=c==="leakyrelu",T=c?A0(c,!1):null,E=new l8(g,b,T,v,S),R=[a,s];if(i&&R.push(i),o&&R.push(o),S){let _=r.makeTensorInfo([],"float32",w.createScalarValue(f,"float32"));R.push(_),A.push(_)}y=r.runWebGLProgram(E,R,"float32")}let x=ve({inputs:{x:y},backend:r,attrs:{shape:g.outShape}});return A.push(y),A.forEach(b=>r.disposeIntermediateTensorInfo(b)),x}/* Kernel configuration binding tse to the webgl backend. */var rse={kernelName:Fs,backendName:"webgl",kernelFunc:tse};/**
 * Kernel function for a depthwise 2D convolution with optional bias and
 * activation. A null/undefined dilations becomes [1, 1]. Program h8 is used
 * when the WEBGL_PACK_DEPTHWISECONV flag is set, the stride width is at most 2
 * and outChannels / inChannels is exactly 1; otherwise program p8 is used.
 * Bias, prelu weights and a temporary scalar leakyrelu alpha tensor are
 * appended to the program inputs when applicable; the alpha tensor is
 * disposed before returning.
 * @param e Kernel arguments: {inputs: {x, filter, bias, preluActivationWeights}, backend, attrs}.
 * @returns The float32 program result.
 */function 
nse(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s,bias:i,preluActivationWeights:o}=t,{strides:l,pad:u,dilations:d,dimRoundingMode:h,activation:p,leakyreluAlpha:c}=n,f=[],m=d;m==null&&(m=[1,1]),w.assert(N.eitherStridesOrDilationsAreOne(l,m),()=>`Error in depthwiseConv2d: Either strides or dilations must be 1. Got strides ${l} and dilations '${m}'`);let g=N.computeConv2DInfo(a.shape,s.shape,l,m,u,h,!0),y=Y().getBool("WEBGL_PACK_DEPTHWISECONV")&&g.strideWidth<=2&&g.outChannels/g.inChannels===1,A=p?A0(p,y):null,x=[a,s],b=i!=null,v=o!=null,S=p==="leakyrelu";if(b&&x.push(i),v&&x.push(o),S){let _=r.makeTensorInfo([],"float32",w.createScalarValue(c,"float32"));x.push(_),f.push(_)}let T;y?T=new h8(g,b,A,v,S):T=new p8(g,b,A,v,S);let E=[[g.padInfo.top,g.padInfo.left],[g.strideHeight,g.strideWidth],[g.dilationHeight,g.dilationWidth],[g.inHeight,g.inWidth]],R=r.runWebGLProgram(T,x,"float32",E);return f.forEach(_=>r.disposeIntermediateTensorInfo(_)),R}/* Kernel configuration binding nse to the webgl backend. */var ase={kernelName:$s,backendName:"webgl",kernelFunc:nse},/* Shader program with inputs x and indices: for each output row it accumulates a flattened index from sliceDim index components weighted by strides, then reads x at that flattened index. */sse=class{constructor(e,t,r){this.sliceDim=e,this.strides=t,this.variableNames=["x","indices"],this.outputShape=r;let n=gt(t.length),a=gt(r.length),s=this.sliceDim>1?"strides[j]":"strides";this.userCode=`
2022-04-01 15:13:32 +02:00
${n} strides = ${n}(${this.strides});
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${a} coords = getOutputCoords();
2022-02-10 18:27:21 +01:00
int flattenIndex = 0;
for (int j = 0; j < ${this.sliceDim}; j++) {
int index = round(getIndices(coords[0], j));
2022-04-01 15:13:32 +02:00
flattenIndex += index * ${s};
2022-02-10 18:27:21 +01:00
}
setOutput(getX(flattenIndex, coords[1]));
}
2022-04-14 17:47:08 +02:00
`}};
/**
 * Kernel function gathering slices of params addressed by the index tuples
 * stored in the last dimension of indices.
 *
 * indices is viewed as [numSlices, sliceRank] and params as
 * [paramsSize / sliceSize, sliceSize]. When the backend prefers the CPU for
 * these inputs, or params holds strings, the gather is done by the CPU
 * implementation yee; otherwise program sse runs on the two reshaped views
 * and its result is reshaped to the final shape.
 *
 * Both reshaped views are disposed on every return path. The CPU path never
 * reads them, and leaving them undisposed there would keep them alive after
 * the kernel returns.
 *
 * @param e Kernel arguments: {inputs: {params, indices}, backend}.
 * @returns Tensor info of shape resultShape with the dtype of params.
 */
function ise(e) {
  const { inputs, backend } = e;
  const { params, indices } = inputs;
  const indicesShape = indices.shape;
  const sliceRank = indicesShape[indicesShape.length - 1];
  const paramsSize = w.sizeFromShape(params.shape);
  const [resultShape, numSlices, sliceSize, strides] = N.prepareAndValidate(params, indices);
  const flatIndices = ve({ inputs: { x: indices }, backend, attrs: { shape: [numSlices, sliceRank] } });
  const flatParams = ve({ inputs: { x: params }, backend, attrs: { shape: [paramsSize / sliceSize, sliceSize] } });
  if (backend.shouldExecuteOnCPU([params, indices]) || params.dtype === "string") {
    const indicesData = backend.readSync(indices.dataId);
    const paramsBuffer = backend.bufferSync(params);
    const cpuResult = yee(indicesData, paramsBuffer, params.dtype, numSlices, sliceRank, sliceSize, strides, params.shape, paramsSize);
    // Release the reshaped views here as well, matching the GPU path below.
    backend.disposeIntermediateTensorInfo(flatIndices);
    backend.disposeIntermediateTensorInfo(flatParams);
    return backend.makeTensorInfo(resultShape, params.dtype, cpuResult.values);
  }
  const program = new sse(sliceRank, strides, [numSlices, sliceSize]);
  const gathered = backend.runWebGLProgram(program, [flatParams, flatIndices], flatParams.dtype);
  const result = ve({ inputs: { x: gathered }, backend, attrs: { shape: resultShape } });
  backend.disposeIntermediateTensorInfo(flatIndices);
  backend.disposeIntermediateTensorInfo(flatParams);
  backend.disposeIntermediateTensorInfo(gathered);
  return result;
}
// Kernel configuration binding ise to the webgl backend.
var ose = { kernelName: Zo, backendName: "webgl", kernelFunc: ise },
  // Shader program with inputs A and indices: reads the index for the
  // current output position and outputs A at that index along its third
  // dimension, multiplied by 0.0 when the index is outside [0, e[2]).
  lse = class {
    constructor(e, t) {
      this.variableNames = ["A", "indices"], this.outputShape = t, this.rank = t.length;
      let r = gt(this.rank), n = use(e, 2);
      this.userCode = `
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${r} resRC = getOutputCoords();
2022-02-10 18:27:21 +01:00
int index = int(getIndices(resRC.x, resRC.z));
float inBounds = (index >= 0) && (index < ${e[2]}) ? 1.0 : 0.0;
2022-04-01 15:13:32 +02:00
setOutput(inBounds * getA(${n}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}};function use(e,t){let r=["resRC.x","resRC.y","resRC.z","resRC.w"],n=[];for(let a=0;a<e.length;a++)a===2?n.push("index"):n.push(`${r[a]}`);return n.join()}function m8(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,indices:s}=t,{axis:i,batchDims:o}=n,l=w.parseAxisParam(i,a.shape)[0];if(Y().get("DEBUG")){let A=r.readSync(s.dataId),x=a.shape[l];for(let b=0;b<A.length;++b){let v=A[b];w.assert(v<=x-1&&v>=0,()=>`GatherV2: the index value ${v} is not in [0, ${x-1}]`)}}let u=N.segment_util.collectGatherOpShapeInfo(a,s,l,o),d=w.sizeFromShape(s.shape),h=[],p=ve({inputs:{x:a},backend:r,attrs:{shape:[u.batchSize,u.outerSize,u.dimSize,u.sliceSize]}}),c=ve({inputs:{x:s},backend:r,attrs:{shape:[u.batchSize,d/u.batchSize]}});h.push(p),h.push(c);let f=[u.batchSize,u.outerSize,d/u.batchSize,u.sliceSize];if(r.shouldExecuteOnCPU([a,s])||a.dtype==="string"){let A=r.bufferSync(c),x=r.bufferSync(p),b=Aee(x,A,f);return h.forEach(v=>r.disposeIntermediateTensorInfo(v)),r.makeTensorInfo(u.outputShape,b.dtype,b.values)}let m=new lse(p.shape,f),g=r.runWebGLProgram(m,[p,c],p.dtype);h.push(g);let y=ve({inputs:{x:g},backend:r,attrs:{shape:u.outputShape}});return h.forEach(A=>r.disposeIntermediateTensorInfo(A)),y}var dse={kernelName:Xo,backendName:"webgl",kernelFunc:m8},pse="return float(a > b);",hse=`
2022-02-10 18:27:21 +01:00
return vec4(greaterThan(a, b));
2022-04-14 17:47:08 +02:00
`,cse=wr({opSnippet:pse,packedOpSnippet:hse,cpuKernelImpl:xee,dtype:"bool"}),fse={kernelName:Yo,backendName:"webgl",kernelFunc:cse},mse="return float(a >= b);",gse=`
2022-02-10 18:27:21 +01:00
return vec4(greaterThanEqual(a, b));
2022-04-14 17:47:08 +02:00
`,
// Binary kernel built by wr from the a >= b snippets, with bee as the CPU
// implementation and output dtype bool.
yse = wr({ opSnippet: mse, packedOpSnippet: gse, dtype: "bool", cpuKernelImpl: bee }),
// Kernel configuration binding yse to the webgl backend.
Ase = { kernelName: di, backendName: "webgl", kernelFunc: yse };
/**
 * Kernel function for the inverse Fourier transform: delegates to f8 with
 * the inverse flag set to true.
 *
 * @param e Kernel arguments: {inputs: {input}, backend}.
 * @returns The result of f8.
 */
function xse(e) {
  const { inputs, backend } = e;
  const complexInput = inputs.input;
  return f8(complexInput, true, backend);
}
// Kernel configuration binding xse to the webgl backend.
var bse = { kernelName: am, backendName: "webgl", kernelFunc: xse },
  // Unary snippet and kernel: 1.0 where x is neither NaN nor infinite.
  vse = "return float(!isnan(x) && !isinf(x));",
  wse = it({ opSnippet: vse, dtype: "bool" }),
  kse = { kernelName: qu, backendName: "webgl", kernelFunc: wse },
  // Unary snippet and kernel: 1.0 where x is infinite.
  Ise = "return float(isinf(x));",
  Sse = it({ opSnippet: Ise, dtype: "bool" }),
  Tse = { kernelName: Ku, backendName: "webgl", kernelFunc: Sse },
  // Unary snippet and kernel: 1.0 where x is NaN.
  Nse = "return float(isnan(x));",
  Cse = it({ opSnippet: Nse, dtype: "bool" }),
  Ese = { kernelName: Xu, backendName: "webgl", kernelFunc: Cse },
  // Unpacked GLSL snippet for a < b, returned as a float.
  Rse = "return float(a < b);",
  // Packed (vec4) form of the same comparison.
  Mse = `
2022-02-10 18:27:21 +01:00
return vec4(lessThan(a, b));
2022-04-14 17:47:08 +02:00
`,Fse=wr({opSnippet:Rse,packedOpSnippet:Mse,cpuKernelImpl:vee,dtype:"bool"}),$se={kernelName:Jo,backendName:"webgl",kernelFunc:Fse},Pse="return float(a <= b);",_se=`
2022-02-10 18:27:21 +01:00
return vec4(lessThanEqual(a, b));
2022-04-14 17:47:08 +02:00
`,
// Binary kernel built by wr from the a <= b snippets, with wee as the CPU
// implementation and output dtype bool.
zse = wr({ opSnippet: Pse, packedOpSnippet: _se, cpuKernelImpl: wee, dtype: "bool" }),
// Kernel configuration binding zse to the webgl backend.
Ose = { kernelName: Qo, backendName: "webgl", kernelFunc: zse };
/**
 * Kernel function producing a 1-D float32 tensor from the values returned by
 * the helper kee(start, stop, num). No shader is involved.
 *
 * @param e Kernel arguments: {backend, attrs: {start, stop, num}}.
 * @returns Tensor info of shape [values.length].
 */
function Dse(e) {
  const { backend, attrs } = e;
  const { start, stop, num } = attrs;
  const values = kee(start, stop, num);
  return backend.makeTensorInfo([values.length], "float32", values);
}
// Kernel configuration binding Dse to the webgl backend.
var Lse = { kernelName: sm, backendName: "webgl", kernelFunc: Dse },
  // Unpacked log snippet: the shared prefix Td followed by a body returning
  // 0./0. for negative x and log(x) otherwise.
  Bse = Td + `
2022-02-10 18:27:21 +01:00
return x < 0.0 ? 0./0. : log(x);
2022-04-14 17:47:08 +02:00
`,Wse=`
2022-02-10 18:27:21 +01:00
vec4 result = log(x);
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : (x.r < 0.0 ? 0./0. : result.r);
result.g = isNaN.g ? x.g : (x.g < 0.0 ? 0./0. : result.g);
result.b = isNaN.b ? x.b : (x.b < 0.0 ? 0./0. : result.b);
result.a = isNaN.a ? x.a : (x.a < 0.0 ? 0./0. : result.a);
return result;
2022-04-14 17:47:08 +02:00
`,Vse=it({opSnippet:Bse,packedOpSnippet:Wse,cpuKernelImpl:Iee}),Use={kernelName:ci,backendName:"webgl",kernelFunc:Vse},Gse=Td+`
2022-02-10 18:27:21 +01:00
return log(1.0 + x);
2022-04-14 17:47:08 +02:00
`,jse=it({opSnippet:Gse}),Hse={kernelName:Zu,backendName:"webgl",kernelFunc:jse},qse="return float(a >= 1.0 && b >= 1.0);",Kse=`
2022-02-10 18:27:21 +01:00
return vec4(
vec4(greaterThanEqual(a, vec4(1.0))) *
vec4(greaterThanEqual(b, vec4(1.0))));
2022-04-14 17:47:08 +02:00
`,Xse=wr({opSnippet:qse,packedOpSnippet:Kse,dtype:"bool"}),Zse={kernelName:el,backendName:"webgl",kernelFunc:Xse},Yse="return float(!(x >= 1.0));",Jse=it({opSnippet:Yse}),Qse={kernelName:Yu,backendName:"webgl",kernelFunc:Jse},eie="return float(a >= 1.0 || b >= 1.0);",tie=`
2022-02-10 18:27:21 +01:00
return min(
vec4(greaterThanEqual(a, vec4(1.0))) +
vec4(greaterThanEqual(b, vec4(1.0))),
vec4(1.0));
2022-04-14 17:47:08 +02:00
`,/* Binary logical-or kernel built by wr, output dtype bool. */rie=wr({opSnippet:eie,packedOpSnippet:tie,dtype:"bool"}),/* Kernel configuration binding rie to the webgl backend. */nie={kernelName:th,backendName:"webgl",kernelFunc:rie},/**
 * Shader program normalising x across its fourth dimension.
 * For every element it sums the squares of the neighbours within radius t
 * (clamped to the valid channel range 0..e[3]-1) and multiplies x by
 * (r + n * sum) raised to the power -a. The power is specialised to
 * inversesqrt for a === 0.5 and to a reciprocal for a === 1.
 * Constructor arguments: e output shape, t radius, r bias term, n scale
 * applied to the sum, a exponent.
 * NOTE(review): the general-exponent expression string itself ends with a
 * semicolon, so the generated assignment ends with two semicolons.
 */aie=class{constructor(e,t,r,n,a){this.variableNames=["x"],this.outputShape=[];let s=t,i=e[3]-1;this.outputShape=e;let o,l=`float(${r}) + float(${n}) * sum`;a===.5?o=`inversesqrt(${l})`:a===1?o=`1.0/(${l})`:o=`exp(log(${l}) * float(-${a}));`,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int r = coords[1];
int c = coords[2];
int d = coords[3];
float x = getX(b, r, c, d);
float sum = 0.0;
2022-04-01 15:13:32 +02:00
for (int j = -${s}; j <= ${s}; j++) {
2022-02-10 18:27:21 +01:00
int idx = d + j;
2022-04-01 15:13:32 +02:00
if (idx >= 0 && idx <= ${i}) {
2022-02-10 18:27:21 +01:00
float z = getX(b, r, c, idx);
sum += z * z;
}
}
2022-04-01 15:13:32 +02:00
float val = x * ${o};
2022-02-10 18:27:21 +01:00
setOutput(val);
}
2022-04-14 17:47:08 +02:00
`}},/**
 * Variant of the normalisation program with packedInputs and packedOutput set
 * to true: each invocation produces a vec4 and keeps a two-entry cache of the
 * previous channel values while sliding over the radius window.
 * Constructor arguments and the exponent specialisation (inversesqrt for
 * a === 0.5, reciprocal for a === 1, exp/log otherwise) are the same as in
 * the unpacked program.
 * NOTE(review): the general-exponent expression string itself ends with a
 * semicolon, so the generated assignment ends with two semicolons.
 */sie=class{constructor(e,t,r,n,a){this.variableNames=["x"],this.outputShape=[],this.packedInputs=!0,this.packedOutput=!0;let s=t,i=e[3]-1;this.outputShape=e;let o,l=`float(${r}) + float(${n}) * sum`;a===.5?o=`inversesqrt(${l})`:a===1?o=`1.0/(${l})`:o=`exp(log(${l}) * float(-${a}));`,this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords.x;
int r = coords.y;
int c = coords.z;
int d = coords.w;
bool hasNextCol = d < ${this.outputShape[3]};
bool hasNextRow = c < ${this.outputShape[2]};
vec4 sum = vec4(0.);
vec4 xFragAtOutputCoords = getX(b, r, c, d);
vec4 xAtOutputCoords = vec4(
getChannel(xFragAtOutputCoords, vec2(c, d)),
hasNextCol ?
getChannel(xFragAtOutputCoords, vec2(c, d + 1)) : 0.0,
hasNextRow ?
getChannel(xFragAtOutputCoords , vec2(c + 1, d)) : 0.0,
(hasNextRow && hasNextCol) ?
getChannel(xFragAtOutputCoords, vec2(c + 1, d + 1)) : 0.0
);
2022-04-01 15:13:32 +02:00
int firstChannel = d - ${s};
2022-02-10 18:27:21 +01:00
vec2 cache = vec2(0.);
if(firstChannel >= 0){
vec4 firstChannelFrag = getX(b, r, c, firstChannel);
cache.x = getChannel(firstChannelFrag, vec2(c, firstChannel));
if(hasNextRow){
cache.y = getChannel(firstChannelFrag, vec2(c + 1, firstChannel));
}
}
ivec2 depth = ivec2(d, d + 1);
2022-04-01 15:13:32 +02:00
for (int j = - ${s}; j <= ${s}; j++) {
2022-02-10 18:27:21 +01:00
ivec2 idx = depth + j;
bvec2 aboveLowerBound = greaterThanEqual(idx, ivec2(0));
2022-04-01 15:13:32 +02:00
bvec2 belowUpperBound = lessThanEqual(idx, ivec2(${i}));
2022-02-10 18:27:21 +01:00
bool depthInRange = aboveLowerBound.x && belowUpperBound.x;
bool depthPlusOneInRange = aboveLowerBound.y && belowUpperBound.y;
if(depthInRange || depthPlusOneInRange){
vec4 z = vec4(0.);
vec4 xFragAtCurrentDepth;
z.xz = cache.xy;
if(depthPlusOneInRange && hasNextCol){
xFragAtCurrentDepth = idx.y != d ?
getX(b, r, c, idx.y) : xFragAtOutputCoords;
z.y = getChannel(xFragAtCurrentDepth, vec2(c, idx.y));
if(hasNextRow){
z.w = getChannel(xFragAtCurrentDepth, vec2(c + 1, idx.y));
}
}
cache.xy = z.yw;
sum += z * z;
}
}
2022-04-01 15:13:32 +02:00
vec4 result = xAtOutputCoords * ${o};
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},
/**
 * Kernel function for the cross-channel normalisation of x.
 * Runs program sie when the WEBGL_PACK_NORMALIZATION flag is set and program
 * aie otherwise, both constructed from x.shape and the depthRadius, bias,
 * alpha and beta attributes. The output dtype is x.dtype.
 *
 * @param e Kernel arguments: {inputs: {x}, backend, attrs}.
 * @returns The result of backend.runWebGLProgram.
 */
iie = (e) => {
  const { inputs, backend, attrs } = e;
  const { x } = inputs;
  const { depthRadius, bias, alpha, beta } = attrs;
  const usePacked = Y().getBool("WEBGL_PACK_NORMALIZATION");
  const program = usePacked
    ? new sie(x.shape, depthRadius, bias, alpha, beta)
    : new aie(x.shape, depthRadius, bias, alpha, beta);
  return backend.runWebGLProgram(program, [x], x.dtype);
},
// Kernel configuration binding iie to the webgl backend.
oie = { kernelName: rh, backendName: "webgl", kernelFunc: iie },
// Shader program for the gradient of the normalisation: inputs are
// inputImage, outputImage and dy; the constructor stores the depth
// (e[3]), radius, bias, alpha and beta on the instance.
lie = class {
  constructor(e, t, r, n, a) {
    this.variableNames = ["inputImage", "outputImage", "dy"], this.outputShape = [], this.outputShape = e, this.depth = e[3], this.depthRadius = t, this.bias = r, this.alpha = n, this.beta = a, this.userCode = `
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int r = coords[1];
int c = coords[2];
float result = 0.0;
for (int d = 0; d < ${this.depth}; ++d) {
int depthBegin = int(max(0.0, float(d - ${t})));
int depthEnd = int(min(float(${this.depth}),
float(d + ${t} + 1)));
const int MIN_DEPTH_BEGIN = 0;
const int MAX_DEPTH_END = ${this.depth};
float norm = 0.0;
for (int k = MIN_DEPTH_BEGIN; k < MAX_DEPTH_END; ++k) {
if (k < depthBegin){
continue;
}
else if (k >= depthBegin && k < depthEnd) {
norm += getInputImage(b, r, c, k) * getInputImage(b, r, c, k);
}
else {
break;
}
}
2022-04-01 15:13:32 +02:00
norm = float(${n}) * norm + float(${r});
2022-02-10 18:27:21 +01:00
for(int k = MIN_DEPTH_BEGIN; k < MAX_DEPTH_END; ++k){
if (k < depthBegin){
continue;
}
else if (k >= depthBegin && k < depthEnd){
2022-04-01 15:13:32 +02:00
float dyi = -2.0 * float(${n})
* float(${a})
2022-02-10 18:27:21 +01:00
* getInputImage(b ,r ,c, k) * getOutputImage(b, r, c, d)
/ norm;
if (k == d) {
2022-04-01 15:13:32 +02:00
dyi += pow(norm, -1.0 * ${a});
2022-02-10 18:27:21 +01:00
}
if (k == coords[3]) {
dyi *= getDy(b, r, c, d);
result += dyi;
}
}
else {
break;
}
}
}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},uie=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a,y:s,dy:i}=t,{depthRadius:o,bias:l,alpha:u,beta:d}=n,h=new lie(a.shape,o,l,u,d);return r.runWebGLProgram(h,[a,s,i],a.dtype)},die={kernelName:im,backendName:"webgl",kernelFunc:uie};function pie(e,t,r,n){let a=w.sizeFromShape(t),s=w.sizeFromShape(e.shape)/a,i=ve({inputs:{x:e},attrs:{shape:[s,a]},backend:n}),o=_l(i,e.dtype,"max",n),l=ve({inputs:{x:o},attrs:{shape:r},backend:n});return n.disposeIntermediateTensorInfo(i),n.disposeIntermediateTensorInfo(o),l}function g8(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{reductionIndices:s,keepDims:i}=n,o=a.shape.length,l=w.parseAxisParam(s,a.shape),u=l,d=N.getAxesPermutation(u,o),h=d!=null,p=r.shouldExecuteOnCPU([a]),c=a;if(h){if(p){let A=r.texData.get(c.dataId).values,x=new Array(o);for(let S=0;S<x.length;S++)x[S]=a.shape[d[S]];let b=fb(A,a.shape,a.dtype,d,x);c=r.makeTensorInfo(x,a.dtype);let v=r.texData.get(c.dataId);v.values=b}else c=x0(a,d,r);u=N.getInnerMostAxes(u.length,o)}N.assertAxesAreInnerMostDims("max",u,o);let[f,m]=N.computeOutAndReduceShapes(c.shape,u),g=f;i&&(g=N.expandShapeToKeepDim(f,l));let y;if(p){let A=r.texData.get(c.dataId).values,x=See(A,w.sizeFromShape(m),g,a.dtype);y=r.makeTensorInfo(g,a.dtype);let b=r.texData.get(y.dataId);b.values=x}else y=pie(c,m,g,r);return h&&r.disposeIntermediateTensorInfo(c),y}var hie={kernelName:fi,backendName:"webgl",kernelFunc:g8},cie=ZS+`
2022-02-10 18:27:21 +01:00
return max(a, b);
2022-04-14 17:47:08 +02:00
`,fie=`
2022-02-10 18:27:21 +01:00
vec4 result = vec4(max(a, b));
vec4 isNaN = min(vec4(isnan(a)) + vec4(isnan(b)), vec4(1.0));
2022-04-14 17:47:08 +02:00
`+y0+`
2022-02-10 18:27:21 +01:00
return result;
2022-04-14 17:47:08 +02:00
`,mie=wr({opSnippet:cie,packedOpSnippet:fie,cpuKernelImpl:Tee}),gie={kernelName:mi,backendName:"webgl",kernelFunc:mie};function yie(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t;vd(a,"maxPool");let{filterSize:s,strides:i,pad:o,dimRoundingMode:l}=n,u=1;w.assert(N.eitherStridesOrDilationsAreOne(i,u),()=>`Error in maxPool: Either strides or dilations must be 1. Got strides ${i} and dilations '${u}'`);let d=N.computePool2DInfo(a.shape,s,i,u,o,l);if(d.filterWidth===1&&d.filterHeight===1&&w.arraysEqual(d.inShape,d.outShape))return an({inputs:{x:a},backend:r});let h=new Hp(d,"max",!1);return r.runWebGLProgram(h,[a],a.dtype)}var Aie={kernelName:gi,backendName:"webgl",kernelFunc:yie};function xie(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{filterSize:s,strides:i,pad:o,dataFormat:l,dimRoundingMode:u}=n,d=[1,1,1],h=N.computePool3DInfo(a.shape,s,i,d,o,u,l),p=new gb(h,"max",!1);return r.runWebGLProgram(p,[a],a.dtype)}var bie={kernelName:nh,backendName:"webgl",kernelFunc:xie},vie=class{constructor(e){this.variableNames=["dy","maxPos"],this.outputShape=e.inShape;let t=e.strideHeight,r=e.strideWidth,n=e.dilationHeight,a=e.effectiveFilterHeight,s=e.effectiveFilterWidth,i=a-1-e.padInfo.top,o=s-1-e.padInfo.left,l=a*s-1;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec2 pads = ivec2(${i}, ${o});
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
ivec2 dyRCCorner = coords.yz - pads;
int dyRCorner = dyRCCorner.x;
int dyCCorner = dyRCCorner.y;
// Convolve dy(?, ?, d) with pos mask(:, :, d) to get dx(xR, xC, d).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wR = 0; wR < ${a};
wR += ${n}) {
2022-02-10 18:27:21 +01:00
float dyR = float(dyRCorner + wR) / ${t}.0;
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 || fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
2022-04-01 15:13:32 +02:00
for (int wC = 0; wC < ${s}; wC++) {
float dyC = float(dyCCorner + wC) / ${r}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
float dyValue = getDy(b, idyR, idyC, d);
int maxPosValue = ${l} - int(getMaxPos(b, idyR, idyC, d));
// Get the current value, check it against the value from the
// position matrix.
2022-04-01 15:13:32 +02:00
int curPosValue = wR * ${s} + wC;
2022-02-10 18:27:21 +01:00
float mask = float(maxPosValue == curPosValue ? 1.0 : 0.0);
dotProd += dyValue * mask;
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}},wie=class{constructor(e){this.variableNames=["dy","maxPos"],this.outputShape=e.inShape;let t=e.strideDepth,r=e.strideHeight,n=e.strideWidth,a=e.dilationDepth,s=e.dilationHeight,i=e.dilationWidth,o=e.effectiveFilterDepth,l=e.effectiveFilterHeight,u=e.effectiveFilterWidth,d=o-1-e.padInfo.front,h=l-1-e.padInfo.top,p=u-1-e.padInfo.left,c=o*l*u-1;this.userCode=`
2022-04-01 15:13:32 +02:00
const ivec3 pads = ivec3(${d}, ${h}, ${p});
2022-02-10 18:27:21 +01:00
void main() {
ivec5 coords = getOutputCoords();
int batch = coords.x;
int ch = coords.u;
ivec3 dyCorner = ivec3(coords.y, coords.z, coords.w) - pads;
int dyDCorner = dyCorner.x;
int dyRCorner = dyCorner.y;
int dyCCorner = dyCorner.z;
// Convolve dy(?, ?, ?, ch) with pos mask(:, :, :, d) to get
// dx(xD, xR, xC, ch).
// ? = to be determined. : = across all values in that axis.
float dotProd = 0.0;
2022-04-01 15:13:32 +02:00
for (int wD = 0; wD < ${o};
wD += ${a}) {
2022-02-10 18:27:21 +01:00
float dyD = float(dyDCorner + wD) / ${t}.0;
if (dyD < 0.0 || dyD >= ${e.outDepth}.0 || fract(dyD) > 0.0) {
continue;
}
int idyD = int(dyD);
for (int wR = 0; wR < ${l};
2022-04-01 15:13:32 +02:00
wR += ${s}) {
float dyR = float(dyRCorner + wR) / ${r}.0;
2022-02-10 18:27:21 +01:00
if (dyR < 0.0 || dyR >= ${e.outHeight}.0 ||
fract(dyR) > 0.0) {
continue;
}
int idyR = int(dyR);
2022-02-17 14:15:57 +01:00
for (int wC = 0; wC < ${u};
2022-04-01 15:13:32 +02:00
wC += ${i}) {
float dyC = float(dyCCorner + wC) / ${n}.0;
2022-02-10 18:27:21 +01:00
if (dyC < 0.0 || dyC >= ${e.outWidth}.0 ||
fract(dyC) > 0.0) {
continue;
}
int idyC = int(dyC);
float dyValue = getDy(batch, idyD, idyR, idyC, ch);
2022-04-01 15:13:32 +02:00
int maxPosValue = ${c} -
2022-02-10 18:27:21 +01:00
int(getMaxPos(batch, idyD, idyR, idyC, ch));
// Get the current value, check it against the value from the
// position matrix.
int curPosValue =
2022-02-17 14:15:57 +01:00
wD * ${l} * ${u} +
wR * ${u} + wC;
2022-02-10 18:27:21 +01:00
float mask = float(maxPosValue == curPosValue ? 1.0 : 0.0);
dotProd += dyValue * mask;
}
}
}
setOutput(dotProd);
}
2022-04-14 17:47:08 +02:00
`}};function kie(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,input:s}=t,i=s,{filterSize:o,strides:l,pad:u,dimRoundingMode:d}=n,h=[1,1,1],p=N.computePool3DInfo(i.shape,o,l,h,u,d),c=new gb(p,"max",!0),f=r.runWebGLProgram(c,[i],i.dtype),m=new wie(p),g=r.runWebGLProgram(m,[a,f],i.dtype);return r.disposeIntermediateTensorInfo(f),g}var Iie={kernelName:lm,backendName:"webgl",kernelFunc:kie};function Sie(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,input:s,output:i}=t,o=s;vd([s,i],"maxPoolGrad");let{filterSize:l,strides:u,pad:d,dimRoundingMode:h}=n,p=N.computePool2DInfo(o.shape,l,u,1,d,h),c=!0,f=new Hp(p,"max",c),m=r.runWebGLProgram(f,[o],o.dtype),g=new vie(p),y=r.runWebGLProgram(g,[a,m],o.dtype);return r.disposeIntermediateTensorInfo(m),y}var Tie={kernelName:om,backendName:"webgl",kernelFunc:Sie};function Nie(e,t,r,n){let a=new Hp(r,"max",!1),s=n.runWebGLProgram(a,[e],"float32");a=new Hp(r,"max",!0,!0,t);let i=n.runWebGLProgram(a,[e],"float32");return[s,i]}var Cie={kernelName:um,backendName:"webgl",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{x:n}=e,{filterSize:a,strides:s,pad:i,includeBatchInIndex:o}=t,l=r;w.assert(n.shape.length===4,()=>`Error in maxPool: input must be rank 4 but got rank ${n.shape.length}.`);let u=[1,1];w.assert(N.eitherStridesOrDilationsAreOne(s,u),()=>`Error in maxPool: Either strides or dilations must be 1. 
Got strides ${s} and dilations '${u}'`);let d=N.computePool2DInfo(n.shape,a,s,u,i),[h,p]=Nie(n,o,d,l);return[h,p]}};function Eie(e,t,r,n){let a=w.sizeFromShape(t),s=w.sizeFromShape(e.shape)/a,i=ve({inputs:{x:e},attrs:{shape:[s,a]},backend:n}),o=_l(i,"float32","mean",n),l=ve({inputs:{x:o},attrs:{shape:r},backend:n});return n.disposeIntermediateTensorInfo(i),n.disposeIntermediateTensorInfo(o),l}var Rie={kernelName:yi,backendName:"webgl",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{x:n}=e,{keepDims:a,axis:s}=t,i=r,o=n.shape.length,l=w.parseAxisParam(s,n.shape),u=l,d=N.getAxesPermutation(u,o),h=d!=null,p=i.shouldExecuteOnCPU([n]),c=[],f=n;if(h){if(p){let x=i.texData.get(f.dataId).values,b=new Array(o);for(let T=0;T<b.length;T++)b[T]=n.shape[d[T]];let v=fb(x,n.shape,n.dtype,d,b);f=i.makeTensorInfo(b,n.dtype);let S=i.texData.get(f.dataId);S.values=v}else f=x0(n,d,i);c.push(f),u=N.getInnerMostAxes(u.length,o)}N.assertAxesAreInnerMostDims("sum",u,o);let[m,g]=N.computeOutAndReduceShapes(f.shape,u),y=m;a&&(y=N.expandShapeToKeepDim(m,l));let A=Eie(f,g,y,i);for(let x of c)i.disposeIntermediateTensorInfo(x);return A}};function Mie(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n,o=a.shape.length,l=w.parseAxisParam(s,a.shape),u=l,d=N.getAxesPermutation(u,o),h=a;d!=null&&(h=vr({inputs:{x:a},backend:r,attrs:{perm:d}}),u=N.getInnerMostAxes(u.length,a.shape.length)),N.assertAxesAreInnerMostDims("min",u,o);let[p,c]=N.computeOutAndReduceShapes(h.shape,u),f=w.sizeFromShape(c),m=ve({inputs:{x:h},backend:r,attrs:{shape:[-1,f]}}),g=_l(m,m.dtype,"min",r),y;if(i){let A=N.expandShapeToKeepDim(p,l);y=ve({inputs:{x:g},backend:r,attrs:{shape:A}})}else y=ve({inputs:{x:g},backend:r,attrs:{shape:p}});return r.disposeIntermediateTensorInfo(m),r.disposeIntermediateTensorInfo(g),d!=null&&r.disposeIntermediateTensorInfo(h),y}var Fie={kernelName:Ai,backendName:"webgl",kernelFunc:Mie},$ie=ZS+`
2022-02-10 18:27:21 +01:00
return min(a, b);
2022-04-14 17:47:08 +02:00
`,Pie=`
2022-02-10 18:27:21 +01:00
vec4 result = vec4(min(a, b));
vec4 isNaN = min(vec4(isnan(a)) + vec4(isnan(b)), vec4(1.0));
2022-04-14 17:47:08 +02:00
`+y0+`
2022-02-10 18:27:21 +01:00
return result;
2022-04-14 17:47:08 +02:00
`,_ie=wr({opSnippet:$ie,packedOpSnippet:Pie,cpuKernelImpl:Nee}),zie={kernelName:xi,backendName:"webgl",kernelFunc:_ie},Oie=class{constructor(e,t,r){this.variableNames=["x"],this.outputShape=t.map((u,d)=>u[0]+e[d]+u[1]);let n=e.length,a=gt(n),s=t.map(u=>u[0]).join(","),i=t.map((u,d)=>u[0]+e[d]).join(","),o=["coords[0]","coords[1]","coords[2]","coords[3]"].slice(0,n),l=r==="reflect"?0:1;if(n===1){this.userCode=`
2022-04-01 15:13:32 +02:00
int start = ${s};
int end = ${i};
2022-02-10 18:27:21 +01:00
void main() {
int outC = getOutputCoords();
if (outC < start) {
outC = start * 2 - outC - ${l};
} else if(outC >= end) {
outC = (end - 1) * 2 - outC + ${l};
}
setOutput(getX(outC - start));
}
`;return}this.userCode=`
2022-04-01 15:13:32 +02:00
${a} start = ${a}(${s});
${a} end = ${a}(${i});
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${a} outC = getOutputCoords();
for (int i = 0; i < ${n}; i++) {
2022-02-10 18:27:21 +01:00
if (outC[i] < start[i]) {
outC[i] = start[i] * 2 - outC[i] - ${l};
} else if(outC[i] >= end[i]) {
outC[i] = (end[i] - 1) * 2 - outC[i] + ${l};
}
}
2022-04-01 15:13:32 +02:00
${a} coords = outC - start;
setOutput(getX(${o}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},Die=class{constructor(e,t,r){this.variableNames=["x"],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=t.map((c,f)=>c[0]+e[f]+c[1]);let n=e.length,a=gt(n),s=t.map(c=>c[0]).join(","),i=t.map((c,f)=>c[0]+e[f]).join(","),o=Lr("rc",n),l=Lr("source",n),u=`${o[n-1]} < ${this.outputShape[n-1]}`,d=n===1?"source":`vec2(${l.slice(-2).join()})`,h=r==="reflect"?0:1,p="";if(n===1){let c=`
2022-04-01 15:13:32 +02:00
${a} source = rc;
2022-02-10 18:27:21 +01:00
if (source < start) {
2022-04-01 15:13:32 +02:00
source = start * 2 - source - ${h};
2022-02-10 18:27:21 +01:00
} else if (source >= end) {
2022-04-01 15:13:32 +02:00
source = (end - 1) * 2 - source + ${h};
2022-02-10 18:27:21 +01:00
}
source -= start;
2022-04-01 15:13:32 +02:00
`;p=`
${a} rc = outputLoc;
${c}
result[0] = getChannel(getX(${l.join()}), ${d});
${o[n-1]} += 1;
2022-02-17 14:15:57 +01:00
if(${u}) {
2022-04-01 15:13:32 +02:00
${c}
result[1] = getChannel(getX(${l.join()}), ${d});
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`}else{let c=`
${a} source = rc;
${a} lt = ${a}(lessThan(source, start));
${a} gte = ${a}(greaterThanEqual(source, end));
${a} orig = 1 - (lt + gte);
2022-02-10 18:27:21 +01:00
source = orig * source +
2022-04-01 15:13:32 +02:00
lt * (start * 2 - source - ${h}) +
gte * ((end - 1) * 2 - source + ${h});
2022-02-10 18:27:21 +01:00
source -= start;
2022-04-01 15:13:32 +02:00
`;p=`
${a} rc = outputLoc;
${c}
result[0] = getChannel(getX(${l.join()}), ${d});
${o[n-1]} += 1;
2022-02-17 14:15:57 +01:00
if(${u}) {
2022-04-01 15:13:32 +02:00
${c}
result[1] = getChannel(getX(${l.join()}), ${d});
2022-02-10 18:27:21 +01:00
}
rc = outputLoc;
2022-04-01 15:13:32 +02:00
${o[n-2]} += 1;
if(${o[n-2]} < ${this.outputShape[n-2]}) {
${c}
result[2] = getChannel(getX(${l.join()}), ${d});
${o[n-1]} += 1;
2022-02-17 14:15:57 +01:00
if(${u}) {
2022-04-01 15:13:32 +02:00
${c}
result[3] = getChannel(getX(${l.join()}), ${d});
2022-02-10 18:27:21 +01:00
}
}
`}this.userCode=`
2022-04-01 15:13:32 +02:00
const ${a} start = ${a}(${s});
const ${a} end = ${a}(${i});
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${a} outputLoc = getOutputCoords();
2022-02-10 18:27:21 +01:00
vec4 result = vec4(0.);
2022-04-01 15:13:32 +02:00
${p}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},Lie=({inputs:e,backend:t,attrs:r})=>{let{x:n}=e,{paddings:a,mode:s}=r,i=Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")?new Die(n.shape,a,s):new Oie(n.shape,a,s);return t.runWebGLProgram(i,[n],n.dtype)},Bie={kernelName:bi,backendName:"webgl",kernelFunc:Lie},Wie=`if (b == 0.0) return NAN;
return mod(a, b);`,Vie=`
2022-02-10 18:27:21 +01:00
vec4 result = mod(a, b);
vec4 isNaN = vec4(equal(b, vec4(0.0)));
2022-04-14 17:47:08 +02:00
`+y0+`
2022-02-10 18:27:21 +01:00
return result;
2022-04-14 17:47:08 +02:00
`,Uie=wr({opSnippet:Wie,packedOpSnippet:Vie}),Gie={kernelName:Ju,backendName:"webgl",kernelFunc:Uie},jie=class{constructor(e,t,r){this.variableNames=["probs"],this.customUniforms=[{name:"seed",type:"float"}],this.outputShape=[e,r],this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
float r = random(seed);
float cdf = 0.0;
for (int i = 0; i < ${t-1}; i++) {
cdf += getProbs(batch, i);
if (r < cdf) {
setOutput(float(i));
return;
}
}
// If no other event happened, last event happened.
setOutput(float(${t-1}));
}
2022-04-14 17:47:08 +02:00
`}},Hie=`
2022-02-10 18:27:21 +01:00
if (a == b) {
return 1.0;
};
2022-04-14 17:47:08 +02:00
return a / b;`,qie=`
2022-02-10 18:27:21 +01:00
// vec4 one = vec4(equal(a, b));
// return one + (vec4(1.0) - one) * a / b;
vec4 result = a / b;
if(a.x == b.x) {
result.x = 1.;
}
if(a.y == b.y) {
result.y = 1.;
}
if(a.z == b.z) {
result.z = 1.;
}
if(a.w == b.w) {
result.w = 1.;
}
return result;
2022-04-14 17:47:08 +02:00
`,y8=wr({opSnippet:Hie,packedOpSnippet:qie,checkOutOfBounds:!0}),Kie={kernelName:ai,backendName:"webgl",kernelFunc:y8},Jv="return a - b;",A8=wr({opSnippet:Jv,packedOpSnippet:Jv,supportsComplex:!0,cpuKernelImpl:Uee}),Xie={kernelName:_i,backendName:"webgl",kernelFunc:A8};function x8(e){let{inputs:t,backend:r,attrs:n}=e,{logits:a}=t,{dim:s}=n,i=w.parseAxisParam([s],a.shape),o=g8({inputs:{x:a},backend:r,attrs:{reductionIndices:i,keepDims:!1}}),l=N.expandShapeToKeepDim(o.shape,i),u=ve({inputs:{x:o},backend:r,attrs:{shape:l}}),d=A8({inputs:{a,b:u},backend:r}),h=c8({inputs:{x:d},backend:r}),p=b0({inputs:{x:h},backend:r,attrs:{axis:i,keepDims:!1}}),c=ve({inputs:{x:p},backend:r,attrs:{shape:l}}),f=y8({inputs:{a:h,b:c},backend:r});return r.disposeIntermediateTensorInfo(o),r.disposeIntermediateTensorInfo(u),r.disposeIntermediateTensorInfo(d),r.disposeIntermediateTensorInfo(h),r.disposeIntermediateTensorInfo(p),r.disposeIntermediateTensorInfo(c),f}var Zie={kernelName:$i,backendName:"webgl",kernelFunc:x8};function Yie(e){let{inputs:t,backend:r,attrs:n}=e,{logits:a}=t,{numSamples:s,seed:i,normalized:o}=n,l=o?a:x8({inputs:{logits:a},backend:r,attrs:{dim:a.shape.length-1}}),u=l.shape[0],d=l.shape[1],h=new jie(u,d,s),p=[[i]],c=r.runWebGLProgram(h,[l],"int32",p);return o||r.disposeIntermediateTensorInfo(l),c}var Jie={kernelName:dm,backendName:"webgl",kernelFunc:Yie},Qie=Xn+`
2022-02-10 18:27:21 +01:00
return -x;
2022-04-14 17:47:08 +02:00
`,eoe=`
2022-02-10 18:27:21 +01:00
vec4 result = -x;
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`;function toe(e){let{inputs:t,backend:r}=e,{x:n}=t;if(r.shouldExecuteOnCPU([n])){let s=r.texData.get(n.dataId),[i,o]=Eee(s.values,n.shape,n.dtype);return r.makeTensorInfo(o,n.dtype,i)}let a;return Y().getBool("WEBGL_PACK_UNARY_OPERATIONS")?a=new vo(n.shape,eoe):a=new Ka(n.shape,Qie),r.runWebGLProgram(a,[n],n.dtype)}var roe={kernelName:tl,backendName:"webgl",kernelFunc:toe},noe=qn.nonMaxSuppressionV3Impl;function aoe(e){N.warn("tf.nonMaxSuppression() in webgl locks the UI thread. Call tf.nonMaxSuppressionAsync() instead");let{inputs:t,backend:r,attrs:n}=e,{boxes:a,scores:s}=t,{maxOutputSize:i,iouThreshold:o,scoreThreshold:l}=n,u=r.readSync(a.dataId),d=r.readSync(s.dataId),{selectedIndices:h}=noe(u,d,i,o,l);return r.makeTensorInfo([h.length],"int32",new Int32Array(h))}var soe={kernelName:nl,backendName:"webgl",kernelFunc:aoe},ioe=qn.nonMaxSuppressionV4Impl;function ooe(e){N.warn("tf.nonMaxSuppression() in webgl locks the UI thread. Call tf.nonMaxSuppressionAsync() instead");let{inputs:t,backend:r,attrs:n}=e,{boxes:a,scores:s}=t,{maxOutputSize:i,iouThreshold:o,scoreThreshold:l,padToMaxOutputSize:u}=n,d=r.readSync(a.dataId),h=r.readSync(s.dataId),{selectedIndices:p,validOutputs:c}=ioe(d,h,i,o,l,u);return[r.makeTensorInfo([p.length],"int32",new Int32Array(p)),r.makeTensorInfo([],"int32",new Int32Array([c]))]}var loe={kernelName:Qu,backendName:"webgl",kernelFunc:ooe},uoe=qn.nonMaxSuppressionV5Impl;function doe(e){N.warn("tf.nonMaxSuppression() in webgl locks the UI thread. 
Call tf.nonMaxSuppressionAsync() instead");let{inputs:t,backend:r,attrs:n}=e,{boxes:a,scores:s}=t,{maxOutputSize:i,iouThreshold:o,scoreThreshold:l,softNmsSigma:u}=n,d=r.readSync(a.dataId),h=r.readSync(s.dataId),p=i,c=o,f=l,m=u,{selectedIndices:g,selectedScores:y}=uoe(d,h,p,c,f,m);return[r.makeTensorInfo([g.length],"int32",new Int32Array(g)),r.makeTensorInfo([y.length],"float32",new Float32Array(y))]}var poe={kernelName:al,backendName:"webgl",kernelFunc:doe},hoe=class{constructor(e,t,r,n){this.variableNames=["indices"],this.outputShape=[e,t],this.userCode=`
2022-02-10 18:27:21 +01:00
void main() {
ivec2 coords = getOutputCoords();
int index = round(getIndices(coords.x));
2022-04-01 15:13:32 +02:00
setOutput(mix(float(${n}), float(${r}),
2022-02-10 18:27:21 +01:00
float(index == coords.y)));
}
2022-04-14 17:47:08 +02:00
`}},coe=e=>{let{inputs:t,backend:r,attrs:n}=e,{indices:a}=t,{depth:s,onValue:i,offValue:o}=n,l=w.sizeFromShape(a.shape),u=new hoe(l,s,i,o),d=ve({inputs:{x:a},backend:r,attrs:{shape:[l]}}),h=r.runWebGLProgram(u,[d],a.dtype);r.disposeIntermediateTensorInfo(d);let p=[...a.shape,s],c=ve({inputs:{x:h},backend:r,attrs:{shape:p}});return r.disposeIntermediateTensorInfo(h),c},foe={kernelName:il,backendName:"webgl",kernelFunc:coe};function Df(e){let{inputs:t,backend:r}=e,{x:n}=t;if(n.dtype==="complex64"){let a=Lh({inputs:{input:n},backend:r}),s=Df({inputs:{x:a},backend:r}),i=v0({inputs:{input:n},backend:r}),o=Df({inputs:{x:i},backend:r}),l=Vi({inputs:{real:s,imag:o},backend:r});return r.disposeIntermediateTensorInfo(a),r.disposeIntermediateTensorInfo(s),r.disposeIntermediateTensorInfo(i),r.disposeIntermediateTensorInfo(o),l}else return Bh({attrs:{shape:n.shape,dtype:n.dtype,value:n.dtype==="string"?"":0},backend:r})}var moe={kernelName:kl,backendName:"webgl",kernelFunc:Df};function b8(e){let{inputs:t,backend:r}=e,{x:n}=t;if(n.dtype==="string")throw new Error("onesLike is not supported under string dtype");if(n.dtype==="complex64"){let a=Lh({inputs:{input:n},backend:r}),s=b8({inputs:{x:a},backend:r}),i=v0({inputs:{input:n},backend:r}),o=Df({inputs:{x:i},backend:r}),l=Vi({inputs:{real:s,imag:o},backend:r});return r.disposeIntermediateTensorInfo(a),r.disposeIntermediateTensorInfo(s),r.disposeIntermediateTensorInfo(i),r.disposeIntermediateTensorInfo(o),l}else return Bh({attrs:{shape:n.shape,dtype:n.dtype,value:1},backend:r})}var goe={kernelName:sl,backendName:"webgl",kernelFunc:b8};function yoe(e){let{inputs:t,backend:r,attrs:n}=e,{axis:a}=n;if(t.length===1)return Jy({inputs:{input:t[0]},backend:r,attrs:{dim:a}});let s=t[0].shape,i=t[0].dtype;t.forEach(d=>{w.assertShapesMatch(s,d.shape,"All tensors passed to stack must have matching shapes"),w.assert(i===d.dtype,()=>"All tensors passed to stack must have matching dtypes")});let o=[],l=t.map(d=>{let 
h=Jy({inputs:{input:d},backend:r,attrs:{dim:a}});return o.push(h),h}),u=o8({inputs:l,backend:r,attrs:{axis:a}});return o.forEach(d=>r.disposeIntermediateTensorInfo(d)),u}var Aoe={kernelName:ol,backendName:"webgl",kernelFunc:yoe},xoe=class{constructor(e,t,r){this.variableNames=["x"],this.customUniforms=[{name:"value",type:"float"}],this.outputShape=t.map((l,u)=>l[0]+e[u]+l[1]);let n=e.length,a=gt(n),s=t.map(l=>l[0]).join(","),i=t.map((l,u)=>l[0]+e[u]).join(","),o=["coords[0]","coords[1]","coords[2]","coords[3]"].slice(0,n);if(n===1){this.userCode=`
2022-04-01 15:13:32 +02:00
int start = ${s};
int end = ${i};
2022-02-10 18:27:21 +01:00
void main() {
int outC = getOutputCoords();
if (outC < start || outC >= end) {
setOutput(value);
} else {
setOutput(getX(outC - start));
}
}
`;return}this.userCode=`
2022-04-01 15:13:32 +02:00
${a} start = ${a}(${s});
${a} end = ${a}(${i});
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${a} outC = getOutputCoords();
2022-02-10 18:27:21 +01:00
if (any(lessThan(outC, start)) || any(greaterThanEqual(outC, end))) {
setOutput(value);
} else {
2022-04-01 15:13:32 +02:00
${a} coords = outC - start;
setOutput(getX(${o}));
2022-02-10 18:27:21 +01:00
}
}
2022-04-14 17:47:08 +02:00
`}},boe=class{constructor(e,t,r){this.variableNames=["x"],this.packedInputs=!0,this.packedOutput=!0,this.customUniforms=[{name:"value",type:"float"}],this.outputShape=t.map((f,m)=>f[0]+e[m]+f[1]);let n=e.length,a=gt(n),s=t.map(f=>f[0]).join(","),i=t.map((f,m)=>f[0]+e[m]).join(","),o=Lr("rc",n),l=Lr("source",n),u=`${o[n-1]} < ${this.outputShape[n-1]}`,d=n===1?"source":`vec2(${l.slice(-2).join()})`,h=[`${a} rc = outputLoc;`,`${o[n-1]} += 1;
2022-02-17 14:15:57 +01:00
if(${u}) {
2022-04-01 15:13:32 +02:00
`,n===1?"":`}
2022-02-10 18:27:21 +01:00
rc = outputLoc;
2022-04-01 15:13:32 +02:00
${o[n-2]} += 1;
if(${o[n-2]} < ${this.outputShape[n-2]}) {`,n===1?"":` ${o[n-1]} += 1;
if(${u}) {`],p=n===1?"rc < start || rc >= end":"any(lessThan(rc, start)) || any(greaterThanEqual(rc, end))",c="";for(let f=0,m=n===1?2:4;f<m;f++)c+=`
${h[f]}
if (${p}) {
2022-02-10 18:27:21 +01:00
result[${f}] = float(value);
} else {
2022-04-01 15:13:32 +02:00
${a} source = rc - start;
result[${f}] = getChannel(getX(${l.join()}), ${d});
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;c+=n===1?"} ":"}}",this.userCode=`
const ${a} start = ${a}(${s});
const ${a} end = ${a}(${i});
2022-02-10 18:27:21 +01:00
void main() {
2022-04-01 15:13:32 +02:00
${a} outputLoc = getOutputCoords();
2022-02-10 18:27:21 +01:00
vec4 result = vec4(0.);
2022-04-01 15:13:32 +02:00
${c}
2022-02-10 18:27:21 +01:00
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`}},v8=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{paddings:s,constantValue:i}=n;if(w.sizeFromShape(a.shape)===0){let u=s.map((d,h)=>d[0]+a.shape[h]+d[1]);return Bh({backend:r,attrs:{shape:u,value:i,dtype:a.dtype}})}let o=Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")?new boe(a.shape,s,i):new xoe(a.shape,s,i),l=[[i]];return r.runWebGLProgram(o,[a],a.dtype,l)},voe={kernelName:wi,backendName:"webgl",kernelFunc:v8},woe=`
2022-02-10 18:27:21 +01:00
if(a < 0.0 && floor(b) < b){
return NAN;
}
if (b == 0.0) {
return 1.0;
}
return (round(mod(b, 2.0)) != 1) ?
pow(abs(a), b) : sign(a) * pow(abs(a), b);
2022-04-14 17:47:08 +02:00
`,koe=`
2022-02-10 18:27:21 +01:00
// isModRound1 has 1 for components with round(mod(b, 2.0)) == 1, 0 otherwise.
vec4 isModRound1 = vec4(equal(round(mod(b, 2.0)), ivec4(1)));
vec4 multiplier = sign(a) * isModRound1 + (vec4(1.0) - isModRound1);
vec4 result = multiplier * pow(abs(a), b);
// Ensure that a^0 = 1, including 0^0 = 1 as this correspond to TF and JS
bvec4 isExpZero = equal(b, vec4(0.0));
result.r = isExpZero.r ? 1.0 : result.r;
result.g = isExpZero.g ? 1.0 : result.g;
result.b = isExpZero.b ? 1.0 : result.b;
result.a = isExpZero.a ? 1.0 : result.a;
vec4 isNaN = vec4(lessThan(a, vec4(0.0))) * vec4(lessThan(floor(b), b));
2022-04-14 17:47:08 +02:00
`+y0+`
2022-02-10 18:27:21 +01:00
return result;
2022-04-14 17:47:08 +02:00
`,Ioe=wr({opSnippet:woe,packedOpSnippet:koe}),Soe={kernelName:ki,backendName:"webgl",kernelFunc:Ioe};function Toe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n,o=a.shape.length,l=[],u=w.parseAxisParam(s,a.shape),d=u,h=N.getAxesPermutation(d,o),p=a;h!=null&&(p=vr({inputs:{x:a},backend:r,attrs:{perm:h}}),d=N.getInnerMostAxes(d.length,o),l.push(p)),N.assertAxesAreInnerMostDims("prod",d,o);let c;if(r.shouldExecuteOnCPU([p])){let f=r.texData.get(p.dataId).values,{outVals:m,outShape:g,outDtype:y}=Mee(p.shape,p.dtype,f,d);c=r.makeTensorInfo(g,y,m)}else{let[f,m]=N.computeOutAndReduceShapes(p.shape,d),g=w.sizeFromShape(m),y=ve({inputs:{x:p},backend:r,attrs:{shape:[-1,g]}}),A=ch(a.dtype),x=_l(y,A,"prod",r);c=ve({inputs:{x},backend:r,attrs:{shape:f}}),l.push(y),l.push(x)}if(i){l.push(c);let f=N.expandShapeToKeepDim(c.shape,u);c=ve({inputs:{x:c},backend:r,attrs:{shape:f}})}return l.forEach(f=>r.disposeIntermediateTensorInfo(f)),c}var Noe={kernelName:ll,backendName:"webgl",kernelFunc:Toe},w8=e=>{let{backend:t,attrs:r}=e,{start:n,stop:a,step:s,dtype:i}=r,o=Fee(n,a,s,i);return t.makeTensorInfo([o.length],i,o)},Coe={kernelName:ed,backendName:"webgl",kernelFunc:w8},Eoe="return 1.0 / x;",Roe=it({opSnippet:Eoe}),Moe={kernelName:td,backendName:"webgl",kernelFunc:Roe},Foe=Xn+`
2022-02-10 18:27:21 +01:00
return (x < 0.0) ? 0.0 : x;
2022-04-14 17:47:08 +02:00
`,$oe=`
2022-02-10 18:27:21 +01:00
vec4 result = x * vec4(greaterThanEqual(x, vec4(0.0)));
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,Poe=it({opSnippet:Foe,packedOpSnippet:$oe}),_oe={kernelName:Si,backendName:"webgl",kernelFunc:Poe},zoe=Xn+`
2022-02-10 18:27:21 +01:00
return (x < 0.0) ? 0.0 : min(6.0, x);
2022-04-14 17:47:08 +02:00
`,Ooe=`
2022-02-10 18:27:21 +01:00
vec4 result = min(x, vec4(6.)) * vec4(greaterThanEqual(x, vec4(0.0)));
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,Doe=it({opSnippet:zoe,packedOpSnippet:Ooe}),Loe={kernelName:Ni,backendName:"webgl",kernelFunc:Doe},Boe=class{constructor(e,t,r,n,a){this.variableNames=["A"],this.outputShape=[];let[s,i,o,l]=e;this.outputShape=[s,t,r,l];let u=[n&&t>1?i-1:i,n&&r>1?o-1:o],d=[n&&t>1?t-1:t,n&&r>1?r-1:r],h;a?h="(vec2(yRC) + vec2(0.5)) * effectiveInputOverOutputRatioRC - vec2(0.5)":h="vec2(yRC) * effectiveInputOverOutputRatioRC",this.userCode=`
2022-02-10 18:27:21 +01:00
const vec2 effectiveInputOverOutputRatioRC = vec2(
2022-04-01 15:13:32 +02:00
${u[0]/d[0]},
${u[1]/d[1]});
const vec2 inputShapeRC = vec2(${i}.0, ${o}.0);
2022-02-10 18:27:21 +01:00
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
ivec2 yRC = coords.yz;
// Fractional source index.
2022-04-01 15:13:32 +02:00
vec2 sourceFracIndexRC = ${h};
2022-02-10 18:27:21 +01:00
// Compute the four integer indices.
ivec2 sourceFloorRC = ivec2(max(sourceFracIndexRC, vec2(0.0)));
ivec2 sourceCeilRC = ivec2(
min(inputShapeRC - 1.0, ceil(sourceFracIndexRC)));
float topLeft = getA(b, sourceFloorRC.x, sourceFloorRC.y, d);
float bottomLeft = getA(b, sourceCeilRC.x, sourceFloorRC.y, d);
float topRight = getA(b, sourceFloorRC.x, sourceCeilRC.y, d);
float bottomRight = getA(b, sourceCeilRC.x, sourceCeilRC.y, d);
vec2 fracRC = sourceFracIndexRC - vec2(sourceFloorRC);
float top = topLeft + (topRight - topLeft) * fracRC.y;
float bottom = bottomLeft + (bottomRight - bottomLeft) * fracRC.y;
float newValue = top + (bottom - top) * fracRC.x;
setOutput(newValue);
}
2022-04-14 17:47:08 +02:00
`}},
/**
 * Packed-input / packed-output variant of the bilinear-resize shader program
 * over input "A".
 *   e - input shape [s, i, o, l]; t, r - output height / width;
 *   n - when truthy, sizes greater than 1 are reduced by one before the ratio
 *       is taken; a - selects the half-pixel source-index expression.
 * The output shape is [s, t, r, l]. The single-letter locals are kept because
 * the GLSL template that follows interpolates u, d, i, o, l, r and h.
 */
Woe = class {
  constructor(e, t, r, n, a) {
    this.variableNames = ["A"];
    this.packedInputs = true;
    this.packedOutput = true;
    this.outputShape = [];
    const [s, i, o, l] = e;
    this.outputShape = [s, t, r, l];
    const u = [n && t > 1 ? i - 1 : i, n && r > 1 ? o - 1 : o];
    const d = [n && t > 1 ? t - 1 : t, n && r > 1 ? r - 1 : r];
    let h;
    if (a) {
      h = "(vec3(yRC) + vec3(0.5)) * effectiveInputOverOutputRatioRC - vec3(0.5)";
    } else {
      h = "vec3(yRC) * effectiveInputOverOutputRatioRC";
    }
    this.userCode = `
2022-02-10 18:27:21 +01:00
const vec3 effectiveInputOverOutputRatioRC = vec3(
2022-04-01 15:13:32 +02:00
${u[0]/d[0]},
${u[1]/d[1]},
${u[1]/d[1]});
const vec3 inputShapeRC = vec3(${i}.0, ${o}.0,
${o}.0);
2022-02-10 18:27:21 +01:00
float getAValue(int b, int r, int c, int d) {
return getChannel(getA(b, r, c, d), vec2(c, d));
}
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
// Calculate values for next column in yRC.z.
ivec3 yRC = coords.yzz + ivec3(0, 0, 1);
// Fractional source index.
2022-04-01 15:13:32 +02:00
vec3 sourceFracIndexRC = ${h};
2022-02-10 18:27:21 +01:00
// Compute the four integer indices.
ivec3 sourceFloorRC = ivec3(max(sourceFracIndexRC, vec3(0.0)));
ivec3 sourceCeilRC = ivec3(
min(inputShapeRC - 1.0, ceil(sourceFracIndexRC)));
// Should we calculate next column and row elements in 2x2 packed cell.
bool hasNextCol = d < ${l-1};
2022-04-01 15:13:32 +02:00
bool hasNextRow = coords.z < ${r-1};
2022-02-10 18:27:21 +01:00
// In parallel, construct four corners for all four components in
// packed 2x2 cell.
vec4 topLeft = vec4(
getAValue(b, sourceFloorRC.x, sourceFloorRC.y, d),
hasNextCol ? getAValue(b, sourceFloorRC.x, sourceFloorRC.y, d + 1)
: 0.0,
hasNextRow ? getAValue(b, sourceFloorRC.x, sourceFloorRC.z, d)
: 0.0,
(hasNextRow && hasNextCol) ?
getAValue(b, sourceFloorRC.x, sourceFloorRC.z, d + 1) : 0.0);
vec4 bottomLeft = vec4(
getAValue(b, sourceCeilRC.x, sourceFloorRC.y, d),
hasNextCol ? getAValue(b, sourceCeilRC.x, sourceFloorRC.y, d + 1)
: 0.0,
hasNextRow ? getAValue(b, sourceCeilRC.x, sourceFloorRC.z, d)
: 0.0,
(hasNextRow && hasNextCol) ?
getAValue(b, sourceCeilRC.x, sourceFloorRC.z, d + 1) : 0.0);
vec4 topRight = vec4(
getAValue(b, sourceFloorRC.x, sourceCeilRC.y, d),
hasNextCol ? getAValue(b, sourceFloorRC.x, sourceCeilRC.y, d + 1)
: 0.0,
hasNextRow ? getAValue(b, sourceFloorRC.x, sourceCeilRC.z, d)
: 0.0,
(hasNextRow && hasNextCol) ?
getAValue(b, sourceFloorRC.x, sourceCeilRC.z, d + 1) : 0.0);
vec4 bottomRight = vec4(
getAValue(b, sourceCeilRC.x, sourceCeilRC.y, d),
hasNextCol ? getAValue(b, sourceCeilRC.x, sourceCeilRC.y, d + 1)
: 0.0,
hasNextRow ? getAValue(b, sourceCeilRC.x, sourceCeilRC.z, d)
: 0.0,
(hasNextRow && hasNextCol) ?
getAValue(b, sourceCeilRC.x, sourceCeilRC.z, d + 1) : 0.0);
vec3 fracRC = sourceFracIndexRC - vec3(sourceFloorRC);
vec4 top = mix(topLeft, topRight, fracRC.yyzz);
vec4 bottom = mix(bottomLeft, bottomRight, fracRC.yyzz);
vec4 newValue = mix(top, bottom, fracRC.x);
setOutput(newValue);
}
2022-04-14 17:47:08 +02:00
`}};function Voe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a}=t,{alignCorners:s,halfPixelCenters:i,size:o}=n,[l,u]=o,d=Y().getBool("WEBGL_PACK_IMAGE_OPERATIONS")?new Woe(a.shape,l,u,s,i):new Boe(a.shape,l,u,s,i);return r.runWebGLProgram(d,[a],"float32")}var Uoe={kernelName:Ti,backendName:"webgl",kernelFunc:Voe},Goe=class{constructor(e,t,r){this.variableNames=["dy"],this.outputShape=[],this.outputShape=t;let[,n,a]=t,[,s,i]=e,o=[r&&s>1?n-1:n,r&&i>1?a-1:a],l=[r&&s>1?s-1:s,r&&i>1?i-1:i],u=o[0]/l[0],d=o[1]/l[1],h=1/u,p=1/d,c=Math.ceil(h)*2+2,f=Math.ceil(p)*2+2;this.userCode=`
2022-02-10 18:27:21 +01:00
// Gradient of a bilinear resize with respect to its input image.
// Each output texel (b, r, c, d) scans a window of dy and accumulates every
// dy texel whose four interpolation corners include (r, c), weighted by the
// matching row / column lerp factors.
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
int r = coords[1];
int c = coords[2];
float accumulator = 0.0;
2022-02-17 14:15:57 +01:00
// heightScale / widthScale turn a dy row / column into a fractional dx
// row / column (see dxR and dxC below); the inv* constants are reciprocals.
const float heightScale = float(${u});
2022-04-01 15:13:32 +02:00
const float widthScale = float(${d});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
const float invHeightScale = float(${h});
const float invWidthScale = float(${p});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
// Number of dy rows / columns inspected per output texel.
const int winHeight = int(${c});
2022-02-10 18:27:21 +01:00
const int winWidth = int(${f});
// Compute bounds for where in dy we will look
float startRLerp = floor(float(r) * invHeightScale);
int startDyR = int(startRLerp - float(winHeight / 2));
float startCLerp = floor(float(c) * invWidthScale);
int startDyC = int(startCLerp - float(winWidth / 2));
// Loop over dy
for (int dyROffset = 0; dyROffset < winHeight; dyROffset++) {
int dyR = dyROffset + startDyR;
// Guard against the window exceeding the bounds of dy
2022-04-01 15:13:32 +02:00
if (dyR < 0 || dyR >= ${s}) {
2022-02-10 18:27:21 +01:00
continue;
}
for (int dyCOffset = 0; dyCOffset < winWidth; dyCOffset++) {
int dyC = dyCOffset + startDyC;
// Guard against the window exceeding the bounds of dy
2022-04-01 15:13:32 +02:00
if (dyC < 0 || dyC >= ${i}) {
2022-02-10 18:27:21 +01:00
continue;
}
// Row the forward pass sampled for this dy row, split into the two
// neighbouring dx rows and the lerp weight between them.
float dxR = float(dyR) * heightScale;
int topDxRIndex = int(floor(dxR));
2022-04-01 15:13:32 +02:00
int bottomDxRIndex = int(min(ceil(dxR), ${n-1}.0));
2022-02-10 18:27:21 +01:00
float dxRLerp = dxR - float(topDxRIndex);
float inverseDxRLerp = 1.0 - dxRLerp;
// Same decomposition for the column.
float dxC = float(dyC) * widthScale;
int leftDxCIndex = int(floor(dxC));
2022-04-01 15:13:32 +02:00
int rightDxCIndex = int(min(ceil(dxC), ${a-1}.0));
2022-02-10 18:27:21 +01:00
float dxCLerp = dxC - float(leftDxCIndex);
float inverseDxCLerp = 1.0 - dxCLerp;
// The four tests are independent (not else-if): when floor and ceil
// coincide, the same texel is both corners and receives both weights.
if (r == topDxRIndex && c == leftDxCIndex) {
// topLeft
accumulator +=
getDy(b, dyR, dyC, d) * inverseDxRLerp * inverseDxCLerp;
}
if (r == topDxRIndex && c == rightDxCIndex) {
// topRight
accumulator += getDy(b, dyR, dyC, d) * inverseDxRLerp * dxCLerp;
}
if (r == bottomDxRIndex && c == leftDxCIndex) {
// bottomLeft
accumulator += getDy(b, dyR, dyC, d) * dxRLerp * inverseDxCLerp;
}
if (r == bottomDxRIndex && c == rightDxCIndex) {
// bottomRight
accumulator += getDy(b, dyR, dyC, d) * dxRLerp * dxCLerp;
}
}
}
// End loop over dy
setOutput(accumulator);
}
2022-04-14 17:47:08 +02:00
`}};function joe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a,dy:s}=t,{alignCorners:i}=n,o=new Goe(s.shape,a.shape,i);return r.runWebGLProgram(o,[s],s.dtype)}var Hoe={kernelName:hm,backendName:"webgl",kernelFunc:joe},qoe=class{constructor(e,t,r,n,a){this.variableNames=["A"],this.outputShape=[];let[s,i,o,l]=e;this.outputShape=[s,t,r,l];let u=[n&&t>1?i-1:i,n&&r>1?o-1:o],d=[n&&t>1?t-1:t,n&&r>1?r-1:r],h=n?"0.5":"0.0",p;a?p="max((vec2(yRC) + vec2(0.5)) * effectiveInputOverOutputRatioRC, vec2(0.0))":p="vec2(yRC) * effectiveInputOverOutputRatioRC",this.userCode=`
2022-02-10 18:27:21 +01:00
// Per-axis (row, col) ratio of input extent to output extent; both extents
// are reduced by one when align-corners is set and the output is larger
// than one texel on that axis.
const vec2 effectiveInputOverOutputRatioRC = vec2(
2022-04-01 15:13:32 +02:00
${u[0]/d[0]},
${u[1]/d[1]});
// Input height and width as floats, used to clamp the source index.
const vec2 inputShapeRC = vec2(${i}.0, ${o}.0);
2022-02-10 18:27:21 +01:00
// Nearest-neighbour resize: each output texel copies the single input texel
// nearest to its scaled source position.
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
ivec2 yRC = coords.yz;
// Fractional source index.
// (The injected expression adds a 0.5 offset first when half-pixel centers
// are requested.)
2022-04-01 15:13:32 +02:00
vec2 sourceFracIndexRC = ${p};
2022-02-10 18:27:21 +01:00
// Compute the coordinators of nearest neighbor point.
// The injected offset is 0.5 (round to nearest) with align-corners and 0.0
// (plain floor) otherwise; the result is clamped to the last row / column.
ivec2 sourceNearestRC = ivec2(
2022-04-01 15:13:32 +02:00
min(inputShapeRC - 1.0, floor(sourceFracIndexRC + ${h})));
2022-02-10 18:27:21 +01:00
float newValue = getA(b, sourceNearestRC.x, sourceNearestRC.y, d);
setOutput(newValue);
}
2022-04-14 17:47:08 +02:00
`}},Koe=class{constructor(e,t,r,n,a){this.variableNames=["A"],this.packedInputs=!0,this.packedOutput=!0,this.outputShape=[];let[s,i,o,l]=e;this.outputShape=[s,t,r,l];let u=[n&&t>1?i-1:i,n&&r>1?o-1:o],d=[n&&t>1?t-1:t,n&&r>1?r-1:r],h=n?"0.5":"0.0",p;a?p="max((vec3(yRC) + vec3(0.5)) * effectiveInputOverOutputRatioRC, vec3(0.0))":p="vec3(yRC) * effectiveInputOverOutputRatioRC",this.userCode=`
2022-02-10 18:27:21 +01:00
// (row, col, col) ratio of input extent to output extent. The column ratio
// is repeated so that .y and .z can scale two adjacent output columns.
const vec3 effectiveInputOverOutputRatioRC = vec3(
2022-04-01 15:13:32 +02:00
${u[0]/d[0]},
${u[1]/d[1]},
${u[1]/d[1]});
// Input (height, width, width) as floats, used to clamp the source index.
const vec3 inputShapeRC = vec3(${i}.0, ${o}.0,
${o}.0);
2022-02-10 18:27:21 +01:00
// Reads one scalar from the packed input A: fetches the packed texel at
// (b, r, c, d) and selects the channel that corresponds to (c, d).
float getAValue(int b, int r, int c, int d) {
return getChannel(getA(b, r, c, d), vec2(c, d));
}
// Packed nearest-neighbour resize: one invocation fills a whole packed
// output texel (four values) instead of a single scalar.
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
// Calculate values for next column in yRC.z.
ivec3 yRC = coords.yzz + ivec3(0, 0, 1);
// Fractional source index.
2022-04-01 15:13:32 +02:00
vec3 sourceFracIndexRC = ${p};
2022-02-10 18:27:21 +01:00
// Compute the coordinators of nearest neighbor point.
ivec3 sourceNearestRC = ivec3(
2022-04-01 15:13:32 +02:00
min(inputShapeRC - 1.0, floor(sourceFracIndexRC + ${h})));
2022-02-10 18:27:21 +01:00
// Should we calculate next column and row elements in 2x2 packed cell.
// NOTE: the names follow the packed cell, not the image: hasNextCol tests
// the channel index d against the channel count, and hasNextRow tests the
// image column coords.z against the output width.
bool hasNextCol = d < ${l-1};
2022-04-01 15:13:32 +02:00
bool hasNextRow = coords.z < ${r-1};
2022-02-10 18:27:21 +01:00
// Components: (col, d), (col, d + 1), (col + 1, d), (col + 1, d + 1);
// positions outside the output are written as 0.0.
vec4 newValue = vec4(
getAValue(b, sourceNearestRC.x, sourceNearestRC.y, d),
hasNextCol ? getAValue(b, sourceNearestRC.x, sourceNearestRC.y, d + 1)
: 0.0,
hasNextRow ? getAValue(b, sourceNearestRC.x, sourceNearestRC.z, d)
: 0.0,
(hasNextRow && hasNextCol) ?
getAValue(b, sourceNearestRC.x, sourceNearestRC.z, d + 1) : 0.0);
setOutput(newValue);
}
2022-04-14 17:47:08 +02:00
`}};function Xoe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a}=t,{alignCorners:s,halfPixelCenters:i,size:o}=n,[l,u]=o,d=Y().getBool("WEBGL_PACK_IMAGE_OPERATIONS")?new Koe(a.shape,l,u,s,i):new qoe(a.shape,l,u,s,i);return r.runWebGLProgram(d,[a],a.dtype)}var Zoe={kernelName:rd,backendName:"webgl",kernelFunc:Xoe},Yoe=class{constructor(e,t,r){this.variableNames=["dy"],this.outputShape=[],this.outputShape=t;let[,n,a]=t,[,s,i]=e,o=[r&&s>1?n-1:n,r&&i>1?a-1:a],l=[r&&s>1?s-1:s,r&&i>1?i-1:i],u=o[0]/l[0],d=o[1]/l[1],h=1/u,p=1/d,c=Math.ceil(h)*2+2,f=Math.ceil(p)*2+2;this.userCode=`
2022-02-10 18:27:21 +01:00
// Gradient of a nearest-neighbour resize with respect to its input image.
// Each output texel (b, r, c, d) scans a window of dy and sums every dy
// texel whose nearest source texel is (r, c).
void main() {
ivec4 coords = getOutputCoords();
int b = coords[0];
int d = coords[3];
int r = coords[1];
int c = coords[2];
float accumulator = 0.0;
2022-02-17 14:15:57 +01:00
// NOTE: heightScale and widthScale are declared but not read in this
// shader; only their reciprocals are used to place the window.
const float heightScale = float(${u});
2022-04-01 15:13:32 +02:00
const float widthScale = float(${d});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
const float invHeightScale = float(${h});
const float invWidthScale = float(${p});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
// Number of dy rows / columns inspected per output texel.
const int winHeight = int(${c});
2022-02-10 18:27:21 +01:00
const int winWidth = int(${f});
// Compute bounds for where in dy we will look
float startRLerp = floor(float(r) * invHeightScale);
int startDyR = int(floor(startRLerp - float(winHeight / 2)));
float startCLerp = floor(float(c) * invWidthScale);
int startDyC = int(floor(startCLerp - float(winWidth / 2)));
// Loop over dy
for (int dyROffset = 0; dyROffset < winHeight; dyROffset++) {
int dyR = dyROffset + startDyR;
// Guard against the window exceeding the bounds of dy
2022-04-01 15:13:32 +02:00
if (dyR < 0 || dyR >= ${s}) {
2022-02-10 18:27:21 +01:00
continue;
}
for (int dyCOffset = 0; dyCOffset < winWidth; dyCOffset++) {
int dyC = dyCOffset + startDyC;
// Guard against the window exceeding the bounds of dy
2022-04-01 15:13:32 +02:00
if (dyC < 0 || dyC >= ${i}) {
2022-02-10 18:27:21 +01:00
continue;
}
// Fractional source row / column for this dy texel:
// effective input extent * (dy index / effective dy extent).
float sourceFracRow =
2022-04-01 15:13:32 +02:00
float(${o[0]}) *
2022-02-10 18:27:21 +01:00
(float(dyR) / float(${l[0]}));
float sourceFracCol =
2022-04-01 15:13:32 +02:00
float(${o[1]}) *
2022-02-10 18:27:21 +01:00
(float(dyC) / float(${l[1]}));
// The injected boolean is the align-corners flag: round when set,
// floor otherwise; the result is clamped to the last input row / column.
int sourceNearestRow = int(min(
2022-04-01 15:13:32 +02:00
float(int(${n}) - 1),
${r} ? float(round(sourceFracRow)) :
2022-02-10 18:27:21 +01:00
float(floor(sourceFracRow))));
int sourceNearestCol = int(min(
2022-04-01 15:13:32 +02:00
float(int(${a}) - 1),
${r} ? float(round(sourceFracCol)) :
2022-02-10 18:27:21 +01:00
float(floor(sourceFracCol))));
if (r == sourceNearestRow && c == sourceNearestCol) {
accumulator += getDy(b, dyR, dyC, d);
}
}
}
// End loop over dy
setOutput(accumulator);
}
2022-04-14 17:47:08 +02:00
`}};function Joe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a,dy:s}=t,{alignCorners:i}=n,o=new Yoe(s.shape,a.shape,i);return r.runWebGLProgram(o,[s],s.dtype)}var Qoe={kernelName:pm,backendName:"webgl",kernelFunc:Joe},ele=class{constructor(e,t){this.variableNames=["x"];let r=e.length;if(r>4)throw new Error(`WebGL backend: Reverse of rank-${r} tensor is not yet supported`);if(this.outputShape=e,r===1){this.userCode=`
2022-02-10 18:27:21 +01:00
// Rank-1 reverse: output element coord reads input element (size - coord - 1).
void main() {
int coord = getOutputCoords();
setOutput(getX(${e[0]} - coord - 1));
}
2022-04-01 15:13:32 +02:00
`;return}let n=i=>t.indexOf(i)!==-1&&e[i]!==1?`${e[i]} - coords[${i}] - 1`:`coords[${i}]`,a=e.map((i,o)=>n(o)).join(","),s=gt(r);this.userCode=`
2022-02-10 18:27:21 +01:00
// Rank-2..4 reverse: the injected argument list mirrors the coordinate
// (size - coords[i] - 1) on every reversed axis whose size is not 1 and
// passes the other coordinates through unchanged.
void main() {
2022-04-01 15:13:32 +02:00
${s} coords = getOutputCoords();
setOutput(getX(${a}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}},tle=class{constructor(e,t){this.variableNames=["x"],this.packedInputs=!0,this.packedOutput=!0;let r=e.length;if(r>4)throw new Error(`WebGL backend: Reverse of rank-${r} tensor is not yet supported`);this.outputShape=e;let n=Lr("rc",r),a=`${n[r-1]} + 1 < ${this.outputShape[r-1]}`,s=`${n[r-2]} + 1 < ${this.outputShape[r-2]}`,i=gt(r);r===1?this.userCode=`
2022-02-10 18:27:21 +01:00
// Packed rank-1 reverse: fills the r and g channels of the packed output
// texel with the mirrored elements for rc and rc + 1.
void main(){
int rc = getOutputCoords();
vec4 result = vec4(0.);
result.r = getChannel(getX(${e[0]} - rc - 1),
${e[0]} - rc - 1);
2022-04-01 15:13:32 +02:00
// Only read the second element when rc + 1 is still inside the output.
if(${a}){
2022-02-10 18:27:21 +01:00
result.g = getChannel(getX(${e[0]} - (rc + 1) - 1),
${e[0]} - (rc + 1) - 1);
}
setOutput(result);
}
`:this.userCode=`
// Packed rank-2..4 reverse: fills the four channels of the packed output
// texel. r is the element at rc, g advances the last axis by one, b advances
// the second-to-last axis by one, and a advances both.
void main() {
2022-04-01 15:13:32 +02:00
${i} rc = getOutputCoords();
2022-02-10 18:27:21 +01:00
vec4 result = vec4(0.);
2022-04-01 15:13:32 +02:00
result.r = ${o(n.slice())};
// Guard: last-axis coordinate + 1 is still inside the output.
if(${a}){
result.g = ${l(n.slice())};
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
// Guard: second-to-last-axis coordinate + 1 is still inside the output.
if(${s}) {
result.b = ${u(n.slice())};
if(${a}) {
result.a = ${d(n.slice())};
2022-02-10 18:27:21 +01:00
}
}
setOutput(result);
}
2022-04-14 17:47:08 +02:00
`;function o(c){return h(c)}function l(c){return c[r-1]="("+c[r-1]+" + 1)",h(c)}function u(c){return c[r-2]="("+c[r-2]+" + 1)",h(c)}function d(c){return c[r-1]="("+c[r-1]+" + 1)",c[r-2]="("+c[r-2]+" + 1)",h(c)}function h(c){let f=e.map((y,A)=>p(A,c)),m=f.join(","),g=f.slice(-2).join(",");return`getChannel(getX(${m}), vec2(${g}))`}function p(c,f){return t.indexOf(c)!==-1&&e[c]!==1?`${e[c]} - ${f[c]} - 1`:`${f[c]}`}}};function rle(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{dims:s}=n,i=a.shape.length,o=w.parseAxisParam(s,a.shape);if(i===0)return an({inputs:{x:a},backend:r});let l=Y().getBool("WEBGL_PACK_ARRAY_OPERATIONS")?new tle(a.shape,o):new ele(a.shape,o);return r.runWebGLProgram(l,[a],a.dtype)}var nle={kernelName:dl,backendName:"webgl",kernelFunc:rle},ale=class{constructor(e,t){this.variableNames=["Image"],this.outputShape=[],this.customUniforms=[{name:"params",type:"vec4"}];let r=e[1],n=e[2];this.outputShape=e;let a="";typeof t=="number"?a=`float outputValue = ${t.toFixed(2)};`:a=`
2022-02-10 18:27:21 +01:00
vec3 fill = vec3(${t.join(",")});
float outputValue = fill[coords[3]];`,this.userCode=`
// Image rotation about a centre point. The params uniform holds
// (params[0], params[1]) = centre subtracted from x and y, params[2] = sine
// and params[3] = cosine of the rotation angle (as supplied by the kernel
// that runs this program).
void main() {
ivec4 coords = getOutputCoords();
int x = coords[2];
int y = coords[1];
// Rotate the output position around the centre to find the source position.
float coordXFloat = (float(x) - params[0]) * params[3] -
(float(y) - params[1]) * params[2];
float coordYFloat = (float(x) - params[0]) * params[2] +
(float(y) - params[1]) * params[3];
int coordX = int(round(coordXFloat + params[0]));
int coordY = int(round(coordYFloat + params[1]));
2022-04-01 15:13:32 +02:00
// The injected snippet declares outputValue and initialises it to the
// fill value; it is overwritten only when the source lies inside the image.
${a}
if(coordX >= 0 && coordX < ${n} && coordY >= 0 && coordY < ${r}) {
2022-02-10 18:27:21 +01:00
outputValue = getImage(coords[0], coordY, coordX, coords[3]);
}
setOutput(outputValue);
}
2022-04-14 17:47:08 +02:00
`}},sle={kernelName:Il,backendName:"webgl",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{image:n}=e,{radians:a,fillValue:s,center:i}=t,o=r,l=new ale(n.shape,s),[u,d]=N.getImageCenter(i,n.shape[1],n.shape[2]),h=[[u,d,Math.sin(a),Math.cos(a)]];return o.runWebGLProgram(l,[n],n.dtype,h)}},ile=`
2022-02-10 18:27:21 +01:00
// OpenGL ES does not support round function.
// The algorithm is based on banker's rounding.
// Fractions below 0.5 round down, above 0.5 round up, and an exact 0.5 tie
// goes to whichever neighbour is even.
float base = floor(x);
if ((x - base) < 0.5) {
return floor(x);
} else if ((x - base) > 0.5) {
return ceil(x);
} else {
// Exact tie: keep base when it is even, otherwise step up to base + 1.
if (mod(base, 2.0) == 0.0) {
return base;
} else {
return base + 1.0;
}
}
2022-04-14 17:47:08 +02:00
`,ole=it({opSnippet:ile}),lle={kernelName:pl,backendName:"webgl",kernelFunc:ole},ule="return inversesqrt(x);",dle=it({opSnippet:ule,cpuKernelImpl:$ee}),ple={kernelName:Ci,backendName:"webgl",kernelFunc:dle},k8=class{constructor(e,t,r,n,a,s,i=!0){this.variableNames=["updates","indices","defaultValue"],this.outputShape=s;let o=gt(a.length),l=gt(s.length),u="";r===1?u="i":r===2&&(u="i, j");let d=`getIndices(${u})`,h="";n===1?h="i":n===2&&(h="i, coords[1]");let p=`getUpdates(${h})`,c=t>1?"strides[j]":"strides";this.userCode=`
2022-04-01 15:13:32 +02:00
${o} strides = ${o}(${a});
2022-02-10 18:27:21 +01:00
// Scatter: for the output row coords[0], sums every update whose flattened
// index equals that row; rows that receive no update take the default value.
void main() {
${l} coords = getOutputCoords();
float sum = 0.0;
bool found = false;
// Outer loop: one iteration per update.
for (int i = 0; i < ${e}; i++) {
int flattenedIndex = 0;
// Inner loop: combine the index components with their strides.
for (int j = 0; j < ${t}; j++) {
2022-04-01 15:13:32 +02:00
int index = round(${d});
flattenedIndex += index * ${c};
2022-02-10 18:27:21 +01:00
}
if (flattenedIndex == coords[0]) {
2022-04-01 15:13:32 +02:00
sum += ${p};
2022-02-10 18:27:21 +01:00
found = true;
}
}
// float(found) is 0.0 or 1.0, so mix() selects the default value or sum.
setOutput(mix(getDefaultValue(), sum, float(found)));
}
2022-04-14 17:47:08 +02:00
`}};function hle(e){let{inputs:t,backend:r,attrs:n}=e,{indices:a,updates:s}=t,{shape:i}=n,{sliceRank:o,numUpdates:l,sliceSize:u,strides:d,outputSize:h}=N.calculateShapes(s,a,i),p=[h/u,u];if(h===0)return r.makeTensorInfo(i,a.dtype);let c=ve({inputs:{x:a},backend:r,attrs:{shape:[l,o]}}),f=ve({inputs:{x:s},backend:r,attrs:{shape:[l,u]}}),m=r.makeTensorInfo([],"float32",new Float32Array([0])),g=new k8(l,o,c.shape.length,f.shape.length,d,p),y=r.runWebGLProgram(g,[f,c,m],f.dtype),A=ve({inputs:{x:y},backend:r,attrs:{shape:i}});return r.disposeIntermediateTensorInfo(c),r.disposeIntermediateTensorInfo(f),r.disposeIntermediateTensorInfo(y),r.disposeIntermediateTensorInfo(m),A}var cle={kernelName:hl,backendName:"webgl",kernelFunc:hle},fle=class{constructor(e,t,r){this.variableNames=["c","a","b"],this.outputShape=t;let n,a;if(r>4)throw Error(`Where for rank ${r} is not yet supported`);if(r===1)a="resRC",n="resRC";else{let i=["resRC.x","resRC.y","resRC.z","resRC.w"],o=[],l=[];for(let u=0;u<t.length;u++)l.push(`${i[u]}`),u<e&&o.push(`${i[u]}`);n=o.join(),a=l.join()}let s=gt(r);this.userCode=`
2022-02-10 18:27:21 +01:00
// Element-wise select: reads the condition c and outputs a where the
// condition is >= 1.0 and b otherwise. The condition is indexed with only
// its own leading coordinates, a and b with the full output coordinates.
void main() {
2022-04-01 15:13:32 +02:00
${s} resRC = getOutputCoords();
float cVal = getC(${n});
2022-02-10 18:27:21 +01:00
if (cVal >= 1.0) {
2022-04-01 15:13:32 +02:00
setOutput(getA(${a}));
2022-02-10 18:27:21 +01:00
} else {
2022-04-01 15:13:32 +02:00
setOutput(getB(${a}));
2022-02-10 18:27:21 +01:00
}
}
2022-04-14 17:47:08 +02:00
`}};function mle(e){let{inputs:t,backend:r}=e,{condition:n,t:a,e:s}=t,i=new fle(n.shape.length,a.shape,a.shape.length);return r.runWebGLProgram(i,[n,a,s],Cr(a.dtype,s.dtype))}var gle={kernelName:cl,backendName:"webgl",kernelFunc:mle},yle=`
2022-02-10 18:27:21 +01:00
// Stable and Attracting Fixed Point (0, 1) for Normalized Weights.
// see: https://arxiv.org/abs/1706.02515
// SELU: scale * x for x >= 0, scaleAlpha * (exp(x) - 1) for x < 0. Both
// constants are injected from the SELU_SCALEALPHA / SELU_SCALE values.
2022-04-01 15:13:32 +02:00
float scaleAlpha = ${N.SELU_SCALEALPHA};
float scale = ${N.SELU_SCALE};
2022-02-10 18:27:21 +01:00
return (x >= 0.0) ? scale * x : scaleAlpha * (exp(x) - 1.0);
2022-04-14 17:47:08 +02:00
`,Ale=it({opSnippet:yle}),xle={kernelName:nd,backendName:"webgl",kernelFunc:Ale},ble=Td+`
2022-02-10 18:27:21 +01:00
return 1.0 / (1.0 + exp(-1.0 * x));
2022-04-14 17:47:08 +02:00
`,vle=`
2022-02-10 18:27:21 +01:00
// Packed sigmoid: 1 / (1 + exp(-x)) on all four channels at once.
vec4 result = 1.0 / (1.0 + exp(-1.0 * x));
// Channels whose input is NaN are copied through from the input instead of
// using the computed value.
bvec4 isNaN = isnan(x);
result.r = isNaN.r ? x.r : result.r;
result.g = isNaN.g ? x.g : result.g;
result.b = isNaN.b ? x.b : result.b;
result.a = isNaN.a ? x.a : result.a;
return result;
2022-04-14 17:47:08 +02:00
`,wle=it({opSnippet:ble,packedOpSnippet:vle,cpuKernelImpl:Pee}),kle={kernelName:Ri,backendName:"webgl",kernelFunc:wle},Ile=`
2022-02-10 18:27:21 +01:00
if (isnan(x)) { return 0.0; }
return sign(x);
2022-04-14 17:47:08 +02:00
`,Sle=it({opSnippet:Ile}),Tle={kernelName:ad,backendName:"webgl",kernelFunc:Sle},Nle=Td+`
2022-02-10 18:27:21 +01:00
return sin(x);
2022-04-14 17:47:08 +02:00
`,Cle=it({opSnippet:Nle}),Ele={kernelName:Ei,backendName:"webgl",kernelFunc:Cle},Rle=`
2022-02-10 18:27:21 +01:00
// sinh(x) = (e^x - e^-x) / 2.
// NOTE: despite its name, e2x holds exp(x) (not exp(2x)); 1.0 / e2x is e^-x.
float e2x = exp(x);
return (e2x - 1.0 / e2x) / 2.0;
2022-04-14 17:47:08 +02:00
`,Mle=it({opSnippet:Rle}),Fle={kernelName:ml,backendName:"webgl",kernelFunc:Mle},$le=`
2022-02-10 18:27:21 +01:00
// Softplus log(exp(x) + 1) with shortcuts at both extremes.
// epsilon equals 2^-23; threshold = log(epsilon) + 2.0 is negative, so
// -threshold is the positive cut-off for large inputs.
float epsilon = 1.1920928955078125e-7;
float threshold = log(epsilon) + 2.0;
bool too_large = x > -threshold;
bool too_small = x < threshold;
float result;
float exp_x = exp(x);
if (too_large){
// Above the cut-off the function is approximated by x itself.
result = x;
}
else if (too_small){
// Below the cut-off the function is approximated by exp(x).
result = exp_x;
}
else{
result = log(exp_x + 1.0);
}
return result;
2022-04-14 17:47:08 +02:00
`,Ple=it({opSnippet:$le}),_le={kernelName:sd,backendName:"webgl",kernelFunc:Ple},zle=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockShape:s,paddings:i}=n;w.assert(a.shape.length<=4,()=>"spaceToBatchND for rank > 4 with a WebGL backend not implemented yet");let o=s.reduce((y,A)=>y*A),l=[[0,0]];l.push(...i);for(let y=1+s.length;y<a.shape.length;++y)l.push([0,0]);let u=[],d=v8({inputs:{x:a},backend:r,attrs:{paddings:l,constantValue:0}}),h=N.getReshaped(d.shape,s,o,!1),p=N.getPermuted(h.length,s.length,!1),c=N.getReshapedPermuted(d.shape,s,o,!1),f=ve({inputs:{x:d},backend:r,attrs:{shape:h}}),m=vr({inputs:{x:f},backend:r,attrs:{perm:p}}),g=ve({inputs:{x:m},backend:r,attrs:{shape:c}});return u.push(d),u.push(f),u.push(m),u.forEach(y=>r.disposeIntermediateTensorInfo(y)),g},Ole={kernelName:gl,backendName:"webgl",kernelFunc:zle};function Dle(e){let{inputs:t,backend:r}=e,{indices:n,values:a,denseShape:s,defaultValue:i}=t;if(s.shape.length!==1)throw new Error(`Dense shape must be a vector, saw:
2022-04-01 15:13:32 +02:00
${s.shape}`);if(n.shape.length!==2)throw new Error(`Indices must be a matrix, saw:
${n.shape}`);if(a.shape.length!==1)throw new Error(`Values must be a vector, saw:
${a.shape}`);if(i.shape.length!==0)throw new Error(`Default value must be a scalar, saw:
2022-04-14 17:47:08 +02:00
${i.shape}`);let o=r.readSync(n.dataId),l=r.readSync(a.dataId),u=r.readSync(s.dataId),d=r.readSync(i.dataId)[0],[h,p,c,f,m]=zee(o,n.shape,n.dtype,l,a.dtype,u,d);return[r.makeTensorInfo(p,n.dtype,h),r.makeTensorInfo([p[0]],a.dtype,c),r.makeTensorInfo([f.length],"bool",new Uint8Array(f.map(g=>Number(g)))),r.makeTensorInfo([m.length],n.dtype,new Int32Array(m))]}var Lle={kernelName:sh,backendName:"webgl",kernelFunc:Dle};function Ble(e){let{inputs:t,backend:r}=e,{inputIndices:n,inputShape:a,newShape:s}=t;if(n.shape.length!==2)throw new Error(`Input indices should be a matrix but received shape ${n.shape}`);if(a.shape.length!==1)throw new Error(`Input shape should be a vector but received shape ${a.shape}`);if(s.shape.length!==1)throw new Error(`Target shape should be a vector but received shape ${s.shape}`);let i=Array.from(r.readSync(a.dataId)),o=r.readSync(n.dataId),l=Array.from(r.readSync(s.dataId)),[u,d,h]=Oee(o,n.shape,n.dtype,i,l);return[r.makeTensorInfo(d,n.dtype,u),r.makeTensorInfo([h.length],s.dtype,new Int32Array(h))]}var Wle={kernelName:id,backendName:"webgl",kernelFunc:Ble};function Vle(e){let{inputs:t,backend:r}=e,{data:n,indices:a,segmentIds:s}=t;if(n.shape.length<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.shape.length!==1)throw new Error(`Indices should be a vector but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Segment ids should be a vector but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);let i=r.readSync(n.dataId),o=r.readSync(a.dataId),l=r.readSync(s.dataId),[u,d]=jS(i,n.shape,n.dtype,o,l,!0);return r.makeTensorInfo(d,n.dtype,u)}var Ule={kernelName:ih,backendName:"webgl",kernelFunc:Vle};function Gle(e){let{inputs:t,backend:r}=e,{data:n,indices:a,segmentIds:s}=t;if(n.shape.length<1)throw new Error("Data should be at least 1 dimensional but received scalar");if(a.shape.length!==1)throw new Error(`Indices should be a vector but received shape
2022-04-01 15:13:32 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Segment ids should be a vector but received shape
2022-04-14 17:47:08 +02:00
${s.shape}`);let i=r.readSync(n.dataId),o=r.readSync(a.dataId),l=r.readSync(s.dataId),[u,d]=jS(i,n.shape,n.dtype,o,l);return r.makeTensorInfo(d,n.dtype,u)}var jle={kernelName:oh,backendName:"webgl",kernelFunc:Gle};function Hle(e){let{inputs:t,backend:r,attrs:n}=e,{sparseIndices:a,sparseValues:s,defaultValue:i}=t,{outputShape:o}=n,{sliceRank:l,numUpdates:u,strides:d,outputSize:h}=N.calculateShapes(s,a,o),p=!1,c=new k8(u,l,a.shape.length,s.shape.length,d,[h,1],p),f=r.runWebGLProgram(c,[s,a,i],s.dtype),m=ve({inputs:{x:f},backend:r,attrs:{shape:o}});return r.disposeIntermediateTensorInfo(f),m}var qle={kernelName:lh,backendName:"webgl",kernelFunc:Hle};function Kle(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{numOrSizeSplits:s,axis:i}=n,o=w.parseAxisParam(i,a.shape)[0],l=N.prepareSplitSize(a,s,o),u=a.shape.length,d=new Array(u).fill(0),h=a.shape.slice();return l.map(p=>{let c=[...h];c[o]=p;let f=Nd({inputs:{x:a},backend:r,attrs:{begin:d,size:c}});return d[o]+=p,f})}var Xle={kernelName:yl,backendName:"webgl",kernelFunc:Kle},Qv="return sqrt(x);",Zle=it({opSnippet:Qv,packedOpSnippet:Qv,cpuKernelImpl:Dee}),Yle={kernelName:Mi,backendName:"webgl",kernelFunc:Zle},Jle="return x * x;",Qle=it({opSnippet:Jle}),eue={kernelName:od,backendName:"webgl",kernelFunc:Qle},ew="return (a - b) * (a - b);",tue=wr({opSnippet:ew,packedOpSnippet:ew}),rue={kernelName:Pi,backendName:"webgl",kernelFunc:tue};function nue({inputs:e,attrs:t,backend:r}){let{x:n}=e,a=Xn+`
2022-02-10 18:27:21 +01:00
return x > 0.0 ? 1.0 : float(${t.alpha});
2022-04-14 17:47:08 +02:00
`,s=new Ka(n.shape,a);return r.runWebGLProgram(s,[n],n.dtype)}var aue={kernelName:Di,backendName:"webgl",kernelFunc:nue},sue=class{constructor(e,t,r){this.variableNames=["x"],this.outputShape=r;let n=r.length,a=gt(r.length),s=gt(r.length),i="";if(n===1)i="coords * strides + begin";else{let o=0;i=r.map((l,u)=>(o++,r.length===1?`coords * strides[${u}] + begin[${u}]`:`coords[${o-1}] * strides[${u}] + begin[${u}]`)).join(",")}this.userCode=`
2022-04-01 15:13:32 +02:00
${a} begin = ${a}(${e});
${a} strides = ${a}(${t});
2022-02-10 18:27:21 +01:00
// Strided slice: each output coordinate reads the input element at
// coords * strides + begin (applied per axis by the injected expression).
void main() {
2022-04-01 15:13:32 +02:00
${s} coords = getOutputCoords();
setOutput(getX(${i}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}};function iue(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{begin:s,end:i,strides:o,beginMask:l,endMask:u,ellipsisMask:d,newAxisMask:h,shrinkAxisMask:p}=n,{finalShapeSparse:c,finalShape:f,isIdentity:m,sliceDim0:g,isSimpleSlice:y,begin:A,end:x,strides:b}=_t.sliceInfo(a.shape,s,i,o,l,u,d,h,p),v;if(m)v=ve({inputs:{x:a},backend:r,attrs:{shape:f}});else if(g||y){w.assert(a.shape.length>=1,()=>`Input must have rank at least 1, got: ${a.shape.length}`);let T=_t.computeOutShape(A,x,b),E=Nd({inputs:{x:a},backend:r,attrs:{begin:A,size:T}});v=ve({inputs:{x:E},backend:r,attrs:{shape:f}}),r.disposeIntermediateTensorInfo(E)}else if(r.shouldExecuteOnCPU([a])){let T=r.readSync(a.dataId),E=We(a.shape,a.dtype,T),R=Lee(c,E,b,A);v=r.makeTensorInfo(f,a.dtype,R.values)}else{let T=new sue(A,b,c);v=r.runWebGLProgram(T,[a],a.dtype)}let S=ve({inputs:{x:v},backend:r,attrs:{shape:f}});return r.disposeIntermediateTensorInfo(v),S}var oue={kernelName:Al,backendName:"webgl",kernelFunc:iue};function lue(e){let{inputs:t,backend:r,attrs:n}=e,{separator:a,nGramWidths:s,leftPad:i,rightPad:o,padWidth:l,preserveShortSequences:u}=n,{data:d,dataSplits:h}=t,p=r.readSync(d.dataId),c=r.readSync(h.dataId),[f,m]=Bee(p,c,a,s,i,o,l,u);return[r.makeTensorInfo([f.length],"string",f),r.makeTensorInfo(h.shape,"int32",m)]}var uue={kernelName:uh,backendName:"webgl",kernelFunc:lue};function due(e){let{inputs:t,backend:r,attrs:n}=e,{skipEmpty:a}=n,{input:s,delimiter:i}=t;if(s.dtype!=="string")throw new Error("Input must be of datatype string");if(s.shape.length!==1)throw new Error(`Input must be a vector, got shape: ${s.shape}`);if(i.shape.length!==0)throw new Error(`Delimiter must be a scalar, got shape: ${i.shape}`);let o=r.readSync(s.dataId),l=r.readSync(i.dataId)[0],[u,d,h]=Wee(o,l,a),p=d.length;return[r.makeTensorInfo([p,2],"int32",u),r.makeTensorInfo([p],"string",d),r.makeTensorInfo([2],"int32",new Int32Array(h))]}var pue={kernelName:cm,backendName:"webgl",kernelFunc:due};function 
hue(e){let{inputs:t,backend:r,attrs:n}=e,{numBuckets:a}=n,{input:s}=t;if(s.dtype!=="string")throw new Error("Input must be of datatype string");if(a<=0)throw new Error("Number of buckets must be at least 1");let i=r.readSync(s.dataId),o=Vee(i,a);return r.makeTensorInfo(s.shape,"int32",o)}var cue={kernelName:fm,backendName:"webgl",kernelFunc:hue},fue="return tan(x);",mue=it({opSnippet:fue}),gue={kernelName:xl,backendName:"webgl",kernelFunc:mue},yue=`
2022-02-10 18:27:21 +01:00
// tanh(x) computed as sign(x) * (1 - e^(-2|x|)) / (1 + e^(-2|x|)).
// The exponent is never positive, so e2x stays within (0, 1].
float e2x = exp(-2.0 * abs(x));
return sign(x) * (1.0 - e2x) / (1.0 + e2x);
2022-04-14 17:47:08 +02:00
`,Aue=it({opSnippet:yue}),xue={kernelName:zi,backendName:"webgl",kernelFunc:Aue},bue=class{constructor(e,t){this.variableNames=["A"];let r=new Array(e.length);for(let s=0;s<r.length;s++)r[s]=e[s]*t[s];this.outputShape=r,this.rank=r.length;let n=gt(this.rank),a=vue(e);this.userCode=`
2022-02-10 18:27:21 +01:00
// Tile: each output coordinate is wrapped back into the input by taking it
// modulo the input size on every axis (the injected imod(...) list).
void main() {
2022-04-01 15:13:32 +02:00
${n} resRC = getOutputCoords();
setOutput(getA(${a}));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}};function vue(e){let t=e.length;if(t>5)throw Error(`Tile for rank ${t} is not yet supported`);if(t===1)return`imod(resRC, ${e[0]})`;let r=["resRC.x","resRC.y","resRC.z","resRC.w","resRC.u"],n=[];for(let a=0;a<e.length;a++)n.push(`imod(${r[a]}, ${e[a]})`);return n.join()}function I8(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{reps:s}=n;if(a.dtype==="string"||a.shape.length>5){let o=r.readSync(a.dataId),l=a.dtype==="string"?o.map(h=>w.decodeString(h)):o,u=We(a.shape,a.dtype,l),d=Gee(u,s);return r.makeTensorInfo(d.shape,d.dtype,d.values)}let i=new bue(a.shape,s);return r.runWebGLProgram(i,[a],a.dtype)}var wue={kernelName:Qa,backendName:"webgl",kernelFunc:I8},kue=class{constructor(e){this.variableNames=["x","indices"],this.customUniforms=[{name:"n",type:"int"},{name:"firstPass",type:"int"},{name:"negativeInf",type:"float"},{name:"dir",type:"int"},{name:"inc",type:"int"}],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
// Compare-and-swap step of the top-k index sort. Works on indices into x
// (taken from the indices input, or the positions themselves on the first
// pass) and writes, for each position, the index that belongs there after
// comparing it with its partner at distance inc.
// Uniforms: n = valid length of x along the sorted axis, firstPass = 1 when
// no indices tensor exists yet, negativeInf = value used for padding,
// dir = half-size of the alternating-direction groups, inc = pair distance.
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
int elemIdx = coords[1];
// We compare elements pair-wise within a group of size 2 * inc.
// The comparing rule for each group alternates between ascending
// and descending. Within each group, we compare each pair at
// positions i and i+inc. To decide whether an element at position i
// is x0 or x1, we mod it by 2 * inc, if the result is smaller than
// inc, it is in the first half of the group, we denote it as x0,
// otherwise we denote it as x1.
// For example, as shown in the Bitonic top K paper referenced above,
// Figure5(a) shows that element[1] is in the
// second half of the group when group size is 2, but it is in the
// first half of the group when group size is 4.
bool isFirstInPair = imod(elemIdx, 2 * inc) < inc;
int i = isFirstInPair ? elemIdx : elemIdx - inc;
int i0 = firstPass == 1 ? i : int(getIndices(batch, i));
int i1 = firstPass == 1 ? i + inc : int(getIndices(batch, i + inc));
// Indices at or beyond n are padding and compare as negative infinity.
float x0 = i0 < n ? getX(batch, i0) : negativeInf;
float x1 = i1 < n ? getX(batch, i1) : negativeInf;
// Denotes which direction indices are in (ascending or descending).
bool reverse = imod(elemIdx, 2 * dir) >= dir;
// Equal values are ordered by index so the result is deterministic.
bool isGreater = x0 > x1 || (x0 == x1 && i1 > i0);
if (reverse == isGreater) { // Elements in opposite order of direction
int iTemp = i0;
i0 = i1;
i1 = iTemp;
}
if (isFirstInPair) {
setOutput(float(i0));
} else {
setOutput(float(i1));
}
}
2022-04-14 17:47:08 +02:00
`}},Iue=class{constructor(e){this.variableNames=["x","indices"],this.customUniforms=[{name:"n",type:"int"},{name:"firstPass",type:"int"},{name:"k",type:"int"}],this.outputShape=e,this.userCode=`
2022-02-10 18:27:21 +01:00
// Merge step of the top-k index sort: halves the sequence length by keeping,
// for each pair of positions k apart, the index of the larger value.
// Uniforms: n = valid length of x along the sorted axis, firstPass = 1 when
// no indices tensor exists yet, k = distance between the compared positions.
void main() {
// Takes max of indices (0, k), (1, k + 1), (2, k + 2) ...
ivec2 coords = getOutputCoords();
int batch = coords[0];
int elemIdx = coords[1];
// The output size is half of the previous size.
// If the previous sequence is | | | | _ _ _ _ | | | | _ _ _ _ (k=4),
// we only need to output the indices at positions |, the indices at
// positions _ can be thrown away, see Figure5(b) After Phase 2
// (Merge phase) in the Bitonic Top K paper referenced above.
// For example, the paper shows we only need to output the orange bars.
// The output sequence should look like this | | | | | | | |.
// Because the sequence is halved, to map the output index back
// to the previous sequence to find the corresponding value,
// we need to double the index. When we double the index,
// we basically interpolate a position, so 2i looks like
// | _ | _ | _ | _ | _ | _ | _. We move the | to the first k position
// of each 2k positions by - elemIdx % k. E.g. for output at
// index 4,5,6,7, we want to get the corresponding element at
// original index 8,9,10,11, for output at index 8,9,10,11,
// we want to get the corresponding element at original index
// 16,17,18,19, so on and so forth.
int i = elemIdx < k ? elemIdx : (elemIdx * 2 - imod(elemIdx, k));
int i0 = firstPass == 1 ? i : int(getIndices(batch, i));
int i1 = firstPass == 1 ? i + k : int(getIndices(batch, i + k));
float x0 = getX(batch, i0);
// A partner index at or beyond n falls back to x0, so i0 wins the compare.
float x1 = i1 < n ? getX(batch, i1) : x0;
setOutput(x0 >= x1 ? float(i0) : float(i1));
}
2022-04-14 17:47:08 +02:00
`}};
/** Disposes intermediate tensor info t on backend e; a null t is ignored. */
function po(e,t){t!==null&&e.disposeIntermediateTensorInfo(t)}
/** Returns the smallest power of two that is >= e (1 when e <= 1). */
function tw(e){let t=1;for(;t<e;)t*=2;return t}
/**
 * WebGL TopK kernel function.
 *
 * @param e Kernel arguments: inputs.x (tensor info), attrs.k, attrs.sorted and backend.
 * @returns A two-element array [values, indices] of tensor infos computed along
 *   the last axis of x.
 */
function Sue(e){
  let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{k:s,sorted:i}=n,o=Y().getNumber("TOPK_LAST_DIM_CPU_HANDOFF_SIZE_THRESHOLD"),l=Y().getNumber("TOPK_K_CPU_HANDOFF_THRESHOLD"),u=a.shape,d=u[u.length-1];
  // CPU-resident data, a last dimension below the size threshold, or k above
  // the k threshold: read the data back and use the CPU implementation.
  if(r.shouldExecuteOnCPU([a])||d<o||s>l){
    let R=r.readSync(a.dataId),[_,M]=jee(R,u,a.dtype,s,i);
    return[r.makeTensorInfo(_.shape,_.dtype,_.values),r.makeTensorInfo(M.shape,M.dtype,M.values)];
  }
  // k === 0: both outputs are empty. The shape is built on a copy because u
  // is the input tensor's own shape array and must not be modified.
  if(s===0){
    let emptyShape=u.slice();
    emptyShape[emptyShape.length-1]=0;
    return[r.makeTensorInfo(emptyShape,a.dtype,[]),r.makeTensorInfo(emptyShape,"int32",[])];
  }
  // A last dimension of one needs no sorting: values are x itself, indices are all 0.
  if(d===1)return[a,Bh({attrs:{shape:u,dtype:"int32",value:0},backend:r})];
  // Work on an unpacked 2-D view [batch, lastDim] of the input.
  let h=r.texData.get(a.dataId),p=h!==null&&h.isPacked,c=p?r.unpackTensor(a):a,f=w.sizeFromShape(u)/d,m=ve({inputs:{x:c},attrs:{shape:[f,d]},backend:r});
  p&&po(r,c);
  // g and y are k and lastDim rounded up to powers of two. A holds the current
  // indices tensor (null until the first shader pass has run).
  let g=tw(s),y=tw(d),A=null,x=()=>A===null?[m,m]:[m,A],
    // Runs one compare-and-swap pass (program kue) and releases the previous indices.
    b=(R,_,M)=>{let I=x(),z=new kue(M),O=[[d],[A===null?1:0],[Number.NEGATIVE_INFINITY],[R],[_]],j=A;A=r.runWebGLProgram(z,I,"int32",O),po(r,j)};
  // Phase 1: swap passes with group sizes growing up to g.
  for(let R=1;R<g;R*=2){let _=R*2;for(let M=R;M>=1;M/=2)b(_,M,[f,y])}
  // Phase 2: repeatedly halve the width with the merge program (Iue) and
  // re-run the swap passes until only g columns remain.
  for(let R=y;R>g;R/=2){let _=x(),M=new Iue([f,R/2]),I=[[d],[A===null?1:0],[g]],z=A;A=r.runWebGLProgram(M,_,"int32",I),po(r,z);let O=g/2,j=O*2;for(let X=O;X>=1;X/=2)b(j,X,A.shape)}
  // Keep the first k indices per row, gather the matching values, then
  // reshape both results to the input shape with the last axis replaced by k.
  let v=A;
  A=Nd({inputs:{x:A},backend:r,attrs:{begin:0,size:[f,s]}}),po(r,v);
  let S=m8({inputs:{x:m,indices:A},backend:r,attrs:{axis:1,batchDims:1}});
  po(r,m);
  let T=u.slice(0,-1);
  T.push(s),v=A,A=ve({inputs:{x:A},attrs:{shape:T},backend:r}),po(r,v);
  let E=S;
  return S=ve({inputs:{x:S},attrs:{shape:T},backend:r}),po(r,E),[S,A];
}
// Kernel registration entry binding Sue to the "webgl" backend, followed by
// the head of the shader-program class Nue (inputs "Image" and "Transforms").
var Tue={kernelName:bl,backendName:"webgl",kernelFunc:Sue},Nue=class{constructor(e,t,r,n,a,s){this.variableNames=["Image","Transforms"],this.outputShape=s;let i=r==="nearest"?1:2,o;switch(n){case"constant":o=1;break;case"reflect":o=2;break;case"wrap":o=3;break;case"nearest":o=4;break;default:o=1;break}this.userCode=`
2022-02-10 18:27:21 +01:00
float mapCoord(float outCoord, float len) {
float inCoord = outCoord;
2022-04-01 15:13:32 +02:00
if(${o} == 2) {
2022-02-10 18:27:21 +01:00
if (inCoord < 0.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
float sz2 = 2.0 * len;
if (inCoord < sz2) {
inCoord = sz2 * float(int(float(-inCoord / sz2))) +
inCoord;
}
inCoord = inCoord < -len ? inCoord + sz2 : -inCoord - 1.0;
}
} else if (inCoord > len - 1.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
float sz2 = 2.0 * len;
inCoord -= sz2 * float(int(float(inCoord / sz2)));
if (inCoord >= len) {
inCoord = sz2 - inCoord - 1.0;
}
}
}
return clamp(inCoord, 0.0, len - 1.0);
2022-04-01 15:13:32 +02:00
} else if (${o} == 3) {
2022-02-10 18:27:21 +01:00
if (inCoord < 0.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
float sz = len - 1.0;
inCoord += len * (float(int(float(-inCoord / sz))) + 1.0);
}
} else if (inCoord > len - 1.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
float sz = len - 1.0;
inCoord -= len * float(int(float(inCoord / sz)));
}
}
return clamp(inCoord, 0.0, len - 1.0);
2022-04-01 15:13:32 +02:00
} else if (${o} == 4) {
2022-02-10 18:27:21 +01:00
return clamp(outCoord, 0.0, len - 1.0);
} else {
return outCoord;
}
}
float readWithFillValue(int batch, int coordY, int coordX,
int channel) {
float outputValue;
if (0 <= coordY && coordY < ${e} && 0 <= coordX && coordX < ${t}) {
outputValue = getImage(batch, coordY, coordX, channel);
} else {
2022-04-01 15:13:32 +02:00
outputValue = float(${a});
2022-02-10 18:27:21 +01:00
}
return outputValue;
}
void main() {
ivec4 coords = getOutputCoords();
float outputValue;
int batch = coords[0];
int x = coords[2];
int y = coords[1];
int channel = coords[3];
float xf = float(x);
float yf = float(y);
float a1 = getTransforms(batch, 0);
float a2 = getTransforms(batch, 1);
float a3 = getTransforms(batch, 2);
float b1 = getTransforms(batch, 3);
float b2 = getTransforms(batch, 4);
float b3 = getTransforms(batch, 5);
float c1 = getTransforms(batch, 6);
float c2 = getTransforms(batch, 7);
float projection = c1 * xf + c2 * yf + 1.0;
if (projection == 0.0) {
2022-04-01 15:13:32 +02:00
outputValue = float(${a});
2022-02-10 18:27:21 +01:00
} else {
float inX = (a1 * xf + a2 * yf + a3) / projection;
float inY = (b1 * xf + b2 * yf + b3) / projection;
float mapX = mapCoord(inX, float(${t}));
float mapY = mapCoord(inY, float(${e}));
2022-04-01 15:13:32 +02:00
if (${i} == 1) {
2022-02-10 18:27:21 +01:00
int coordY = int(round(mapY));
int coordX = int(round(mapX));
outputValue = readWithFillValue(batch, coordY, coordX,
channel);
} else {
float yFloor = floor(mapY);
float xFloor = floor(mapX);
float yCeil = yFloor + 1.0;
float xCeil = xFloor + 1.0;
float valueYFloor = (xCeil - mapX) *
readWithFillValue(batch, int(yFloor), int(xFloor), channel) +
(mapX - xFloor) *
readWithFillValue(batch, int(yFloor), int(xCeil), channel);
float valueYCeil = (xCeil - mapX) *
readWithFillValue(batch, int(yCeil), int(xFloor), channel) +
(mapX - xFloor) *
readWithFillValue(batch, int(yCeil), int(xCeil), channel);
outputValue = (yCeil - mapY) * valueYFloor +
(mapY - yFloor) * valueYCeil;
}
}
setOutput(outputValue);
}
2022-04-14 17:47:08 +02:00
`}};function Cue(e){let{inputs:t,backend:r,attrs:n}=e,{image:a,transforms:s}=t,{interpolation:i,fillMode:o,fillValue:l,outputShape:u}=n,[d,h,p,c]=a.shape,[f,m]=u!=null?u:[h,p],g=[d,f,m,c],y=new Nue(h,p,i,o,l,g);return r.runWebGLProgram(y,[a,s],"float32")}var Eue={kernelName:vl,backendName:"webgl",kernelFunc:Cue};function Rue(e){let{inputs:t,attrs:r,backend:n}=e,{axis:a}=r,{x:s}=t;vd(s,"unique"),console.warn("WARNING: ","UI might be locked temporarily as data is being downloaded");let i=n.readSync(s.dataId),{outputValues:o,outputShape:l,indices:u}=Hee(i,a,s.shape,s.dtype);return[n.makeTensorInfo(l,s.dtype,o),n.makeTensorInfo([u.length],"int32",u)]}var Mue={kernelName:mm,backendName:"webgl",kernelFunc:Rue};function Fue(e){let{inputs:t,backend:r,attrs:n}=e,{value:a}=t,{axis:s}=n;s<0&&(s+=a.shape.length);let i=a,o=i.shape.length,l=a.shape[s],u=new Array(o-1),d=0;for(let m=0;m<o;m++)m!==s&&(u[d++]=i.shape[m]);let h=[],p=new Array(o).fill(0),c=i.shape.slice();c[s]=1;let f=new Array(l);for(let m=0;m<f.length;m++){p[s]=m;let g=Nd({inputs:{x:i},backend:r,attrs:{begin:p,size:c}}),y=ve({inputs:{x:g},backend:r,attrs:{shape:u}});f[m]=y,h.push(g)}return h.forEach(m=>r.disposeIntermediateTensorInfo(m)),f}var $ue={kernelName:wl,backendName:"webgl",kernelFunc:Fue},Pue=class{constructor(e,t){this.variableNames=["x","segmentIds"];let r=e.windowSize,n=e.batchSize,a=e.inSize,s=e.numSegments,i=s*Math.ceil(a/r);this.outputShape=[n,i];let o="0.0",l="sumValue",u=Math.floor(r/4)*4,d=r%4,h=`
2022-02-10 18:27:21 +01:00
sumValue += dot(values, segFilter);
2022-04-01 15:13:32 +02:00
`,p="";a%r>0&&(p=`
if (inIdx < 0 || inIdx >= ${a}) {
2022-02-10 18:27:21 +01:00
return initializationValue;
}
2022-04-01 15:13:32 +02:00
`);let c="";a%r>0&&(c=`
if (inIdx < 0 || inIdx >= ${a}) {
2022-02-10 18:27:21 +01:00
return -1.0;
}
`),this.userCode=`
2022-04-01 15:13:32 +02:00
const float initializationValue = ${o};
2022-02-10 18:27:21 +01:00
float getValue(int batch, int inIdx) {
2022-04-01 15:13:32 +02:00
${p}
2022-02-10 18:27:21 +01:00
return getX(batch, inIdx);
}
float getSegmentIdAtIndex(int inIdx) {
2022-04-01 15:13:32 +02:00
${c}
2022-02-10 18:27:21 +01:00
return getSegmentIds(inIdx);
}
void main() {
ivec2 coords = getOutputCoords();
int batch = coords[0];
int outIdx = coords[1];
int inOffset = int(floor(float(outIdx) / float(
2022-04-01 15:13:32 +02:00
${s})) * float(${r}));
int currentSeg = int(mod(float(outIdx), float(${s})));
2022-02-10 18:27:21 +01:00
float sumValue = 0.0;
2022-02-17 14:15:57 +01:00
for (int i = 0; i < ${u}; i += 4) {
2022-02-10 18:27:21 +01:00
int inIdx = inOffset + i;
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2),
getValue(batch, inIdx + 3)
);
vec4 segFilter = vec4(
int(getSegmentIdAtIndex(inIdx)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 1)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 2)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 3)) == currentSeg ? 1 : 0
);
2022-04-01 15:13:32 +02:00
${h}
2022-02-10 18:27:21 +01:00
}
2022-02-17 14:15:57 +01:00
int inIdx = inOffset + ${u};
2022-04-01 15:13:32 +02:00
if (${d===1}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, inIdx),
initializationValue,
initializationValue,
initializationValue
);
int inIdxSeg = int(getSegmentIdAtIndex(inIdx));
vec4 segFilter = vec4(
int(getSegmentIdAtIndex(inIdx)) == currentSeg ? 1 : 0,
0,
0,
0
);
2022-04-01 15:13:32 +02:00
${h}
} else if (${d===2}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
initializationValue,
initializationValue
);
vec4 segFilter = vec4(
int(getSegmentIdAtIndex(inIdx)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 1)) == currentSeg ? 1 : 0,
0,
0
);
2022-04-01 15:13:32 +02:00
${h}
} else if (${d===3}) {
2022-02-10 18:27:21 +01:00
vec4 values = vec4(
getValue(batch, inIdx),
getValue(batch, inIdx + 1),
getValue(batch, inIdx + 2),
initializationValue
);
vec4 segFilter = vec4(
int(getSegmentIdAtIndex(inIdx)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 1)) == currentSeg ? 1 : 0,
int(getSegmentIdAtIndex(inIdx + 2)) == currentSeg ? 1 : 0,
0
);
2022-04-01 15:13:32 +02:00
${h}
2022-02-10 18:27:21 +01:00
}
setOutput(${l});
}
2022-04-14 17:47:08 +02:00
`}};/**
 * WebGL kernel function that sums the values of `x` per segment id.
 *
 * Steps, as implemented below:
 *  1. If `N.getAxesPermutation([0], rank)` returns a permutation, transpose
 *     `x` with it and continue on the axis reported by `getInnerMostAxes`.
 *  2. Reshape to 2D `[-1, c]`, where `c` is the size of the reduced axis.
 *  3. `g` runs one `Pue` shader pass ("unsortedSegmentSum") with the window
 *     size chosen by `segOpComputeOptimalWindowSize`. If the result's second
 *     dimension is not yet `numSegments`, it builds segment ids for the
 *     partial results (`w8` with start/stop/step, repeated by `I8` with
 *     `reps`) and recurses on that output.
 *  4. Reshape to the final output shape and undo the transpose, if any.
 *
 * Every intermediate tensor is collected in `l` and disposed before returning.
 *
 * @param e `{inputs: {x, segmentIds}, backend, attrs: {numSegments}}`.
 * @returns Tensor info holding the per-segment sums.
 */function _ue(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,segmentIds:s}=t,{numSegments:i}=n,o=a.shape.length,l=[],u=0,d=N.getAxesPermutation([u],o),h=a;d!=null&&(h=vr({inputs:{x:a},backend:r,attrs:{perm:d}}),l.push(h),u=N.getInnerMostAxes(1,o)[0]);let p=N.segment_util.computeOutShape(h.shape,u,i),c=w.sizeFromShape([h.shape[u]]),f=ve({inputs:{x:h},backend:r,attrs:{shape:[-1,c]}});l.push(f);let m=ch(a.dtype),g=(b,v,S,T,E)=>{let R=b.shape[0],_=b.shape[1],M=N.segment_util.segOpComputeOptimalWindowSize(_,E),I={windowSize:M,inSize:_,batchSize:R,numSegments:E},z=new Pue(I,v),O=r.compileAndRun(z,[b,S],T);if(l.push(O),O.shape[1]===E)return O;let j=w8({backend:r,attrs:{start:0,stop:E,step:1,dtype:"float32"}}),X=I8({inputs:{x:j},backend:r,attrs:{reps:[_/M]}});return l.push(j),l.push(X),g(O,v,X,T,E)},y=g(f,"unsortedSegmentSum",s,m,i),A=ve({inputs:{x:y},backend:r,attrs:{shape:p}}),x=A;if(d!=null){l.push(A);let b=N.getUndoAxesPermutation(d);x=vr({inputs:{x},backend:r,attrs:{perm:b}})}return l.forEach(b=>r.disposeIntermediateTensorInfo(b)),x}/** Kernel registration record binding `_ue` to the "webgl" backend; `Oue` is the list of kernel records that the loop after it passes to `Gn` one at a time. */var zue={kernelName:dh,backendName:"webgl",kernelFunc:_ue},Oue=[Wte,Ute,Hte,Xte,Yte,ere,rre,are,lre,dre,cre,gre,xre,kre,Tre,Cre,Rre,Pre,zre,Dre,Vre,Xre,Yre,Qre,sne,one,pne,wte,fne,xne,kne,Ene,Mne,$ne,_ne,One,Bne,Une,Hne,Kne,Zne,Jne,tae,nae,oae,uae,hae,mae,yae,vae,Sae,Eae,Fae,_ae,zae,Dae,Bae,Vae,Gae,Hae,Zae,Qae,rse,ase,ose,dse,fse,Ase,vte,bse,yne,kse,Tse,Ese,Ite,$se,Ose,Lse,Use,Hse,Zse,Qse,nie,oie,die,hie,gie,Aie,bie,Iie,Tie,Cie,Rie,Fie,zie,Bie,Gie,Jie,Ete,roe,soe,loe,poe,tne,foe,goe,Aoe,voe,Soe,Tte,Noe,Coe,rne,Kie,Moe,_oe,Loe,Mte,Uoe,Hoe,Zoe,Qoe,nle,sle,lle,ple,cle,gle,xle,kle,Tle,Ele,Fle,qre,Zie,_le,Ole,Lle,Wle,Ule,jle,qle,Xle,Yle,eue,rue,aue,oue,uue,pue,cue,Xie,Dte,gue,xue,wue,Tue,Eue,Lte,Mue,$ue,zue,moe];for(let e of Oue)Gn(e);var 
/* Default values for the WEBGPU_* flags, registered on the object returned by Y(). Each flag takes a thunk producing its default. */za=Y();za.registerFlag("WEBGPU_DEFERRED_SUBMIT_BATCH_SIZE",()=>15);za.registerFlag("WEBGPU_CPU_FORWARD",()=>!0);za.registerFlag("WEBGPU_MATMUL_WORK_PER_THREAD",()=>4);za.registerFlag("WEBGPU_USE_NAIVE_CONV2D",()=>!1);za.registerFlag("WEBGPU_USE_NAIVE_CONV2D_TRANSPOSE",()=>!1);za.registerFlag("WEBGPU_CONV_SEPARATE_IM2COL_SHADER",()=>!1);za.registerFlag("WEBGPU_USE_LOW_POWER_GPU",()=>!1);za.registerFlag("WEBGPU_CPU_HANDOFF_SIZE_THRESHOLD",()=>1e3);za.registerFlag("WEBGPU_USE_PROFILE_TOOL",()=>!1);za.registerFlag("WEBGPU_USE_IMPORT",()=>!1);/* Shader body snippets for binary ops on operands `a` and `b` (the two complex-multiply snippets use areal/aimag/breal/bimag instead). Where two variants exist, the second returns vec4<f32>. `Wh` selects among these by numeric op type. */var Due="return a + b;",Lue="return areal * breal - aimag * bimag;",Bue="return areal * bimag + aimag * breal;",Wue="return a / b;",Vue="return a * b;",Uue="return (a - b) * (a - b);",Gue="return a - b;",jue="return f32(a == b);",Hue="return vec4<f32>(a == b);",que="return f32(a > b);",Kue="return vec4<f32>(a > b);",Xue="return f32(a >= b);",Zue="return vec4<f32>(a >= b);",Yue="return f32(a < b);",Jue="return vec4<f32>(a < b);",Que="return f32(a <= b);",ede="return vec4<f32>(a <= b);",tde="return f32(f32(a) >= 1.0 && f32(b) >= 1.0);",rde=`return (vec4<f32>(a >= vec4<f32>(1.0)) *
vec4<f32>(b >= vec4<f32>(1.0)));`,nde=`
2022-04-01 15:12:04 +02:00
if (isnan(a)) { return a; }
if (isnan(b)) { return b; }
2022-04-14 17:47:08 +02:00
`,S8=`
2022-04-01 15:12:04 +02:00
if (isNaN.r) {
resultTemp.r = uniforms.NAN;
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
if (isNaN.g) {
resultTemp.g = uniforms.NAN;
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
if (isNaN.b) {
resultTemp.b = uniforms.NAN;
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
if (isNaN.a) {
resultTemp.a = uniforms.NAN;
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`,ade=`
2022-04-01 15:12:04 +02:00
let s = sign(a) * sign(b);
let ia = i32(round(a));
let ib = i32(round(b));
return f32(idiv(ia, ib, s));
2022-04-14 17:47:08 +02:00
`,sde=`
2022-04-01 15:12:04 +02:00
let ia = vec4<i32>(round(a));
let ib = vec4<i32>(round(b));
let cond = ib != vec4<i32>(0);
var resultTemp = vec4<i32>(0);
let s = sign(a) * sign(b);
// Windows (D3D) wants guaranteed non-zero int division at compile-time.
if (cond[0]) {
resultTemp[0] = idiv(ia[0], ib[0], s[0]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
if (cond[1]) {
resultTemp[1] = idiv(ia[1], ib[1], s[1]);
}
if (cond[2]) {
resultTemp[2] = idiv(ia[2], ib[2], s[2]);
}
if (cond[3]) {
resultTemp[3] = idiv(ia[3], ib[3], s[3]);
}
return vec4<f32>(resultTemp);
2022-04-14 17:47:08 +02:00
`,ide="return f32(a != b);",ode="return vec4<f32>(a != b);",lde=`
2022-04-01 15:12:04 +02:00
if(a < 0.0 && floor(b) < b) {
return uniforms.NAN;
}
if (b == 0.0) {
return 1.0;
}
if (round(abs(b) % 2.0) != 1.0) {
return pow(abs(a), b);
}
return sign(a) * pow(abs(a), b);
2022-04-14 17:47:08 +02:00
`,ude=`
2022-04-01 15:12:04 +02:00
let isModRound1Bool = vec4<i32>(round(abs(b) % vec4<f32>(2.0))) == vec4<i32>(1);
let isModRound1 = vec4<f32>(isModRound1Bool);
let multiplier = sign(a) * isModRound1 + (vec4<f32>(1.0) - isModRound1);
var resultTemp = multiplier * pow(abs(a), b);
// Ensure that a^0 = 1, including 0^0 = 1 as this correspond to TF and JS
let isExpZero = b == vec4<f32>(0.0);
if (isExpZero.r) {
resultTemp.r = 1.0;
}
if (isExpZero.g) {
resultTemp.g = 1.0;
}
if (isExpZero.b) {
resultTemp.b = 1.0;
}
if (isExpZero.a) {
resultTemp.a = 1.0;
}
let isNaN = a < vec4<f32>(0.0) & floor(b) < b;
2022-04-14 17:47:08 +02:00
${S8}
2022-04-01 15:12:04 +02:00
return resultTemp;
2022-04-14 17:47:08 +02:00
`,dde="if (a < 0.0) { return b * a; } return a;",pde=`
2022-04-01 15:12:04 +02:00
let aLessThanZero = vec4<f32>(a < vec4<f32>(0.0));
return (aLessThanZero * (b * a)) + ((vec4<f32>(1.0) - aLessThanZero) * a);
2022-04-14 17:47:08 +02:00
`;function rw(e,t){let r=t?S8:nde;return t?`
2022-04-01 15:12:04 +02:00
var resultTemp = vec4<f32>(${e}(a, b));
let isNaN = isnanVec4(a) | isnanVec4(b);
2022-04-01 15:13:32 +02:00
`+r+`
2022-04-01 15:12:04 +02:00
return resultTemp;
2022-04-01 15:13:32 +02:00
`:r+`
2022-04-01 15:12:04 +02:00
return ${e}(a, b);
2022-04-14 17:47:08 +02:00
`}function Wh(e,t){switch(e){case 0:return Vue;case 1:return Due;case 2:return Gue;case 3:return Wue;case 4:return t?Hue:jue;case 5:return t?Kue:que;case 6:return t?Zue:Xue;case 7:return t?Jue:Yue;case 8:return t?ede:Que;case 9:return t?rde:tde;case 10:return t?ode:ide;case 11:return Uue;case 12:return t?sde:ade;case 14:return t?pde:dde;case 15:return rw("max",t);case 16:return rw("min",t);case 13:return t?ude:lde;case 17:return Lue;case 18:return Bue;default:throw new Error(`BinaryType ${e} is not implemented!`)}}var hde="return abs(a);",cde="return ceil(a);",fde="return cos(a);",mde=`
2022-04-01 15:12:04 +02:00
let e2x = exp(-a);
return (e2x + 1.0 / e2x) / 2.0;
2022-04-14 17:47:08 +02:00
`,gde="return exp(a) - 1.0;",yde="if (a >= 0.0) { return a; } return (exp(a) - 1.0);",Ade=`
2022-04-01 15:12:04 +02:00
var resFloat = exp(a) - vec4<f32>(1.0);
if (a.r >= 0.0) {
resFloat.r = a.r;
}
if (a.g >= 0.0) {
resFloat.g = a.g;
}
if (a.b >= 0.0) {
resFloat.b = a.b;
}
if (a.a >= 0.0) {
resFloat.a = a.a;
}
return resFloat;
2022-04-14 17:47:08 +02:00
`,xde="return exp(a);",bde="return floor(a);",vde="return a;",wde=`if (a < 0.0) { return 1.0/0.0; }
return log(a);`,kde="return f32(!(a >= 1.0));",Ide="return -a;",Sde="if (a < 0.0) { return uniforms.alpha * a; } return a;",Tde=`
2022-04-05 18:25:41 +02:00
let aLessThanZero = vec4<f32>(a < vec4<f32>(0.0));
return (aLessThanZero * (uniforms.alpha * a)) + ((vec4<f32>(1.0) - aLessThanZero) * a);
2022-04-14 17:47:08 +02:00
`,Nde="if(a < 0.0) { return 0.0; } return a;",Cde="return clamp(a, 0.0, 6.0);",Ede="return clamp(a, vec4<f32>(0.0, 0.0, 0.0, 0.0), vec4<f32>(6.0, 6.0, 6.0, 6.0));",Rde=`
2022-04-01 15:12:04 +02:00
var resFloat = a * vec4<f32>(a >= vec4<f32>(0.0));
let isNaN = isnanVec4(a);
if (isNaN.r) {
resFloat.r = a.r;
}
if (isNaN.g) {
resFloat.g = a.g;
}
if (isNaN.b) {
resFloat.b = a.b;
}
if (isNaN.a) {
resFloat.a = a.a;
}
return resFloat;
2022-04-14 17:47:08 +02:00
`,Mde="return 1.0/sqrt(a);",Fde="return 1.0 / (1.0 + exp(-1.0 * a));",$de="return sin(a);",Pde=`
2022-04-01 15:12:04 +02:00
let e2x = exp(a);
return (e2x - 1.0 / e2x) / 2.0;
2022-04-14 17:47:08 +02:00
`,_de="return sqrt(a);",zde="return a * a;",Ode=`
2022-04-01 15:12:04 +02:00
let e2x = exp(-2.0 * abs(a));
return sign(a) * (1.0 - e2x) / (1.0 + e2x);
2022-04-14 17:47:08 +02:00
`,Dde="return f32(i32((a)));";function fo(e,t){switch(e){case 0:return hde;case 2:return fde;case 3:return mde;case 1:return cde;case 4:return t?Ade:yde;case 5:return xde;case 6:return gde;case 7:return bde;case 8:return vde;case 9:return wde;case 10:return kde;case 11:return Ide;case 14:return t?Tde:Sde;case 12:return t?Rde:Nde;case 13:return t?Ede:Cde;case 15:return Mde;case 18:return Fde;case 16:return $de;case 17:return Pde;case 19:return _de;case 20:return zde;case 21:return Ode;case 22:return Dde;default:throw new Error(`BinaryType ${e} is not implemented!`)}}function ss(e,t=!1){if(e===null)return null;if(e==="linear")return fo(8);if(e==="relu")return fo(12,t);if(e==="elu")return fo(4,t);if(e==="relu6")return fo(13,t);if(e==="prelu")return Wh(14,t);if(e==="sigmoid")return fo(18,t);if(e==="leakyrelu")return fo(14,t);throw new Error(`Activation ${e} has not been implemented for the WebGPU backend.`)}function Lde(e,t){if(Math.max(...e)>3)throw new Error("Cannot symbolically compute strides for rank > 4 tensor.");let r=e.length,n=e.map(s=>`${t}[${s}]`),a=new Array(r-1);a[r-2]=n[r-1];for(let s=r-3;s>=0;--s)a[s]=`(${a[s+1]} * ${n[s+1]})`;return a}function gr(e){if(e<=1)return"i32";if(e===2)return"vec2<i32>";if(e===3)return"vec3<i32>";if(e===4)return"vec4<i32>";throw Error(`GPU for rank ${e} is not yet supported`)}function pf(e,t){return e==="float32"?t?"vec4<f32>":"f32":e==="int32"||e==="bool"?t?"vec4<i32>":"i32":e}function yb(){return`
2022-04-01 15:12:04 +02:00
@stage(compute) @workgroup_size(workGroupSizeX, workGroupSizeY, workGroupSizeZ)
2022-04-11 17:45:24 +02:00
`}function Ui(){return`
2022-04-14 17:47:08 +02:00
${yb()}
2022-04-01 15:12:04 +02:00
fn main(@builtin(local_invocation_id) LocalId : vec3<u32>,
@builtin(global_invocation_id) GlobalId : vec3<u32>,
@builtin(num_workgroups) NumWorkgroups: vec3<u32>) {
localId = LocalId;
globalId = GlobalId;
numWorkgroups = NumWorkgroups;
2022-04-01 15:13:32 +02:00
`}function tt(){return`
2022-04-11 17:45:24 +02:00
${Ui()}
2022-04-01 15:12:04 +02:00
let index = getGlobalIndex();
2022-04-14 17:47:08 +02:00
`}function Bde(e,t,r,n=!1){let a=[];if(a.push(`
2022-04-01 15:13:32 +02:00
let workGroupSizeX = ${r.workGroupSize[0]}u;
let workGroupSizeY = ${r.workGroupSize[1]}u;
let workGroupSizeZ = ${r.workGroupSize[2]}u;
2022-04-01 15:12:04 +02:00
var<private> localId: vec3<u32>;
var<private> globalId: vec3<u32>;
var<private> numWorkgroups: vec3<u32>;
// Only used when the y/z dimension of workgroup size is 1.
fn getGlobalIndex() -> i32 {
if (numWorkgroups.y == 1u && numWorkgroups.z == 1u) {
return i32(globalId.x);
}
let localInvocationIndex = localId.z * workGroupSizeX * workGroupSizeY +
localId.y * workGroupSizeX + localId.x;
let workGroupID = (globalId - localId)/vec3<u32>(
workGroupSizeX, workGroupSizeY, workGroupSizeZ);
return i32((workGroupID.z * numWorkgroups.x * numWorkgroups.y +
workGroupID.y * numWorkgroups.x + workGroupID.x) *
(workGroupSizeX * workGroupSizeY * workGroupSizeZ) +
localInvocationIndex);
}
2022-04-01 15:13:32 +02:00
`),n===!0)return a.push(`
2022-04-01 15:12:04 +02:00
struct Uniform {
size : i32,
numChannels : i32,
outShapeStrides : vec2<i32>,
dispatchSize : vec3<u32>,
};
2022-04-14 17:47:08 +02:00
@group(0) @binding(0) var<storage, write> result: array<${pf(t.dtype,r.isVec4)}>;
2022-04-01 15:12:04 +02:00
@group(0) @binding(2) var<uniform> uniforms: Uniform;
2022-04-14 17:47:08 +02:00
`),[nw,a.join(`
`),aw(t.shape),r.getUserCode()].join(`
2022-04-11 17:45:24 +02:00
`);let s="struct Uniforms { NAN : f32, ";r.variableNames.forEach((d,h)=>{s+=`${d.charAt(0).toLowerCase()+d.slice(1)}Shape : ${gr(e[h].shape.length)}, `}),s+=`outShape : ${gr(t.shape.length)}, `;let i=t.shape.length-1;s+=`
outShapeStrides: ${gr(i)}, `,r.size&&(s+="size : i32, "),r.uniforms&&(s+=r.uniforms),s+="};",a.push(s),r.atomic?a.push(`
2022-04-01 15:12:04 +02:00
@group(0) @binding(0) var<storage, read_write> result: array<atomic<i32>>;
2022-04-01 15:13:32 +02:00
`):a.push(`
2022-04-14 17:47:08 +02:00
@group(0) @binding(0) var<storage, write> result: array<${pf(t.dtype,r.isVec4)}>;
2022-04-01 15:13:32 +02:00
`),r.variableNames.forEach((d,h)=>{a.push(`
2022-04-14 17:47:08 +02:00
@group(0) @binding(${1+h}) var<storage, read> ${d}: array<${pf(e[h].dtype,r.isVec4)}>;
2022-04-01 15:13:32 +02:00
`)}),s!==""&&a.push(`
@group(0) @binding(${1+r.variableNames.length}) var<uniform> uniforms: Uniforms;
2022-04-14 17:47:08 +02:00
`);let[o,l]=Hde(t.shape,r.dispatchLayout),u=[nw,a.join(`
`),aw(t.shape),o,Wde(t.shape.length)];if(r.atomic||u.push(Vde(t.shape,t.dtype,r.isVec4)),l===t.shape.length){let d=e.map(h=>Ude(h,t.shape,r.isVec4,r.dispatchLayout.x.length===t.shape.length)).join(`
2022-04-01 15:13:32 +02:00
`);u.push(d)}return u.push(r.getUserCode()),u.join(`
2022-04-14 17:47:08 +02:00
`)}var nw=`
2022-04-01 15:12:04 +02:00
// Checks whether coordinates lie within the bounds of the shape.
fn coordsInBounds2D(coord : vec2<i32>, shape : vec2<i32>) -> bool {
return all(coord >= vec2<i32>(0)) && all(coord < shape);
}
fn coordsInBounds3D(coord : vec3<i32>, shape : vec3<i32>) -> bool {
return all(coord >= vec3<i32>(0)) && all(coord < shape);
}
fn coordsInBounds4D(coord : vec4<i32>, shape : vec4<i32>) -> bool {
return all(coord >= vec4<i32>(0)) && all(coord < shape);
}
fn getIndexFromCoords1D(coord : i32, shape : i32) -> i32 {
return coord;
}
fn getIndexFromCoords2D(coords : vec2<i32>, shape : vec2<i32>) -> i32 {
return dot(coords, vec2<i32>(shape.y, 1));
}
fn getIndexFromCoords3D(coords : vec3<i32>, shape : vec3<i32>) -> i32 {
return dot(coords, vec3<i32>(shape.y * shape.z, shape.z, 1));
2022-02-10 18:27:21 +01:00
}
fn getIndexFromCoords4D(coords : vec4<i32>, shape : vec4<i32>) -> i32 {
return dot(coords, vec4<i32>(
shape.y * shape.z * shape.w, shape.z * shape.w, shape.w, 1));
}
fn idiv(a: i32, b: i32, sign: f32) -> i32 {
var res: i32 = a / b;
let mod: i32 = a % b;
if (sign < 0. && mod != 0) {
res = res - 1;
}
return res;
}
2022-03-07 19:24:06 +01:00
// NaN defination in IEEE 754-1985 is :
// - sign = either 0 or 1.
// - biased exponent = all 1 bits.
// - fraction = anything except all 0 bits (since all 0 bits represents infinity).
// https://en.wikipedia.org/wiki/IEEE_754-1985#Representation_of_non-numbers
fn isnan(val: f32) -> bool {
let floatToUint: u32 = bitcast<u32>(val);
return (floatToUint & 0x7fffffffu) > 0x7f800000u;
2022-02-10 18:27:21 +01:00
}
2022-03-07 19:24:06 +01:00
fn isnanVec4(val : vec4<f32>) -> vec4<bool> {
return vec4<bool>(isnan(val[0]), isnan(val[1]), isnan(val[2]), isnan(val[3]));
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`;function Wde(e){let t="";switch(e){case 0:case 1:t+=`
2022-02-10 18:27:21 +01:00
fn getOutputIndexFromCoords(coords : i32) -> i32 {
return coords;
}
`;break;case 2:t+=`
fn getOutputIndexFromCoords(coords : vec2<i32>) -> i32 {
return dot(coords, vec2<i32>(uniforms.outShapeStrides, 1));
}
`;break;case 3:t+=`
fn getOutputIndexFromCoords(coords : vec3<i32>) -> i32 {
return dot(coords, vec3<i32>(uniforms.outShapeStrides.x, uniforms.outShapeStrides.y, 1));
}
`;break;case 4:t+=`
fn getOutputIndexFromCoords(coords : vec4<i32>) -> i32 {
return dot(coords, vec4<i32>(
uniforms.outShapeStrides.x, uniforms.outShapeStrides.y, uniforms.outShapeStrides.z, 1));
}
2022-04-14 17:47:08 +02:00
`;break;default:w.assert(!1,()=>`Unsupported ${e}D shape`);break}return t}/**
 * Generates the shader functions that write to `result`.
 *
 * Always emits `setOutputAtIndex` and `setOutputAtIndexI32`, which convert
 * the value to the output storage type from `pf(t, r)`. For outputs of rank
 * 2 or more it also emits `setOutputAtCoords` and `setOutputAtCoordsI32`,
 * which flatten the coordinates with `getOutputIndexFromCoords`; in the vec4
 * variant that flat index is divided by 4.
 *
 * @param e Output shape (only its length is used).
 * @param t Output dtype.
 * @param r Truthy for the vec4 variant.
 * @returns Shader source for the setters.
 */function Vde(e,t,r){let n=e.length,a=pf(t,r),s;if(r?s=`fn setOutputAtIndex(flatIndex : i32, value : vec4<f32>) {
2022-04-01 15:13:32 +02:00
result[flatIndex] = ${a}(value);
2022-02-10 18:27:21 +01:00
}
fn setOutputAtIndexI32(flatIndex : i32, value : vec4<i32>) {
2022-04-01 15:13:32 +02:00
result[flatIndex] = ${a}(value);
}`:s=`fn setOutputAtIndex(flatIndex : i32, value : f32) {
result[flatIndex] = ${a}(value);
2022-02-10 18:27:21 +01:00
}
fn setOutputAtIndexI32(flatIndex : i32, value : i32) {
2022-04-01 15:13:32 +02:00
result[flatIndex] = ${a}(value);
2022-04-11 17:45:24 +02:00
}`,n>=2){let i=["d0","d1","d2","d3"].slice(0,n),o=gr(n);r?s+=`
2022-04-01 15:13:32 +02:00
fn setOutputAtCoords(${i.map(l=>`${l} : i32`).join(", ")}, value : vec4<f32>) {
let flatIndex = getOutputIndexFromCoords(${o}(${i.join(", ")}));
2022-02-10 18:27:21 +01:00
setOutputAtIndex(flatIndex / 4, value);
}
2022-04-01 15:13:32 +02:00
fn setOutputAtCoordsI32(${i.map(l=>`${l} : i32`).join(", ")}, value : vec4<i32>) {
let flatIndex = getOutputIndexFromCoords(${o}(${i.join(", ")}));
2022-02-10 18:27:21 +01:00
setOutputAtIndexI32(flatIndex / 4, value);
}
2022-04-01 15:13:32 +02:00
`:s+=`
fn setOutputAtCoords(${i.map(l=>`${l} : i32`).join(", ")}, value : f32) {
let flatIndex = getOutputIndexFromCoords(${o}(${i.join(", ")}));
2022-02-10 18:27:21 +01:00
setOutputAtIndex(flatIndex, value);
}
2022-04-01 15:13:32 +02:00
fn setOutputAtCoordsI32(${i.map(l=>`${l} : i32`).join(", ")}, value : i32) {
let flatIndex = getOutputIndexFromCoords(${o}(${i.join(", ")}));
2022-02-10 18:27:21 +01:00
setOutputAtIndexI32(flatIndex, value);
}
2022-04-14 17:47:08 +02:00
`}return s}/**
 * Generates all shader getters for one input: the coordinate getter from
 * `Gde`, plus the by-output getters from `jde` when the input's rank does
 * not exceed the output's rank.
 *
 * @param e Input descriptor (`name`, `shape`).
 * @param t Output shape.
 * @param r Truthy for the vec4 variant.
 * @param n Forwarded to `jde`.
 */function Ude(e,t,r,n){let a=Gde(e,r);return e.shape.length<=t.length&&(a+=jde(e,t,r,n)),a}/**
 * Generates the shader function `get<Name>(d0, ...)` that reads input `e` by
 * its own coordinates. A rank-0 input gets a parameterless getter that reads
 * element 0. Other ranks flatten the coordinates with
 * `getIndexFromCoords<rank>D` against `uniforms.<name>Shape`; in the vec4
 * variant the flat index is divided by 4.
 *
 * @param e Input descriptor (`name`, `shape`).
 * @param t Truthy for the vec4 variant.
 */function Gde(e,t){let r=e.name,n=e.shape.length,a=gr(n),s="get"+r.charAt(0).toUpperCase()+r.slice(1),i=["d0","d1","d2","d3"].slice(0,n),o=i.map(d=>`${d} : i32`).join(", ");if(n<1)return t?`
2022-04-01 15:13:32 +02:00
fn ${s}() -> vec4<f32> {
return vec4<f32>(${r}[0]);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
fn ${s}() ->f32 {
return f32(${r}[0]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let l=`uniforms.${r.charAt(0).toLowerCase()+r.slice(1)}Shape`,u=`${n}D`;return n===0&&(u="1D"),t?`
fn ${s}(${o}) -> vec4<f32> {
return vec4<f32>(${r}[getIndexFromCoords${u}(${a}(${i.join(",")}),
2022-02-10 18:27:21 +01:00
${l}) / 4]);
}
`:`
2022-04-01 15:13:32 +02:00
fn ${s}(${o}) -> f32 {
return f32(${r}[getIndexFromCoords${u}(${a}(${i.join(",")}),
2022-02-10 18:27:21 +01:00
${l})]);
}
2022-04-14 17:47:08 +02:00
`}function jde(e,t,r,n){let a=e.name,s=a.charAt(0).toUpperCase()+a.slice(1),i="get"+s+"ByOutput",o=e.shape.length,l=t.length,u=gr(l);if(w.arraysEqual(e.shape,t)&&n)return r?`
2022-04-01 15:13:32 +02:00
fn ${i}Index(globalIndex : i32) -> vec4<f32> {
return vec4<f32>(${a}[globalIndex]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coords : ${u}) -> vec4<f32> {
return vec4<f32>(${a}[${l>1?"getOutputIndexFromCoords(coords)":"coords"} / 4]);
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
fn ${i}Index(globalIndex : i32) -> f32 {
return f32(${a}[globalIndex]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coords : ${u}) -> f32 {
return f32(${a}[${l>1?"getOutputIndexFromCoords(coords)":"coords"}]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;let d=N.getBroadcastDims(e.shape,t),h=l-o,p="";if(o===0)return r?`
fn ${i}Index(globalIndex : i32) -> vec4<f32> {
return get${s}();
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coords : ${u}) -> vec4<f32> {
return get${s}();
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
fn ${i}Index(globalIndex : i32) -> f32{
return get${s}();
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coords : ${u}) -> f32{
return get${s}();
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`;l<2&&d.length>=1?p="coords = 0;":p=d.map(g=>`coords[${g+h}] = 0;`).join(`
2022-04-11 17:45:24 +02:00
`);let c="";if(l<2&&o>0)c="coords";else if(l>1){let g=gr(o),y=e.shape.map((A,x)=>`coords[${x+h}]`).join(", ");c=`${g}(${y})`}else c="coords";let f=`uniforms.${a.charAt(0).toLowerCase()+a.slice(1)}Shape`,m=`${o}D`;return r?`
2022-04-01 15:13:32 +02:00
fn ${i}Index(globalIndex : i32) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
var coords = getCoordsFromIndex(globalIndex);
2022-04-01 15:13:32 +02:00
${p}
return ${a}[getIndexFromCoords${m}(${c}, ${f}) / 4];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coordsIn : ${u}) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
var coords = coordsIn;
2022-04-01 15:13:32 +02:00
${p}
return ${a}[getIndexFromCoords${m}(${c}, ${f}) / 4];
2022-02-10 18:27:21 +01:00
}
`:`
2022-04-01 15:13:32 +02:00
fn ${i}Index(globalIndex : i32) -> f32 {
2022-02-10 18:27:21 +01:00
var coords = getCoordsFromIndex(globalIndex);
2022-04-01 15:13:32 +02:00
${p}
return f32(${a}[getIndexFromCoords${m}(${c}, ${f})]);
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
fn ${i}Coords(coordsIn : ${u}) -> f32 {
2022-02-10 18:27:21 +01:00
var coords = coordsIn;
2022-04-01 15:13:32 +02:00
${p}
return f32(${a}[getIndexFromCoords${m}(${c}, ${f})]);
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}/**
 * Generates the shader function `getOutputCoords` for a dispatch layout.
 *
 * When the layout's `x` group lists every output dimension, the coordinates
 * come from `getCoordsFromIndex(getGlobalIndex())`. Otherwise each of the
 * `x`, `y`, `z` groups is decoded from its own `globalId` component: a group
 * with one dimension uses the component directly, a larger group divides it
 * by the symbolic strides from `Lde`.
 *
 * @param e Output shape.
 * @param t Dispatch layout `{x, y = [], z = []}` of output dimension indices.
 * @returns `[shaderSource, rank]`, where `rank` is the number of dimensions
 *          covered by the layout.
 */function Hde(e,t){let{x:r,y:n=[],z:a=[]}=t,s=e.length;if(r.length===s)return[`fn getOutputCoords() -> ${gr(s)}{
2022-02-10 18:27:21 +01:00
let globalIndex = getGlobalIndex();
return getCoordsFromIndex(globalIndex);
}
2022-04-14 17:47:08 +02:00
`,s];let i="",o=[r,n,a],l=0;for(let p=0;p<o.length;p++){let c=o[p];if(c.length!==0)if(l+=c.length,c.length===1)i+=`let d${c[0]} = i32(globalId[${p}]);`;else{let f=Lde(c,"uniforms.outShape");i+=`var index${p} = i32(globalId[${p}]);`;for(let m=0;m<f.length;m++)i+=`let d${c[m]} = index${p} / ${f[m]};`,m===f.length-1?i+=`let d${c[m+1]} = index${p} - d${c[m]} * ${f[m]};`:i+=`index${p} = index${p} - d${c[m]} * ${f[m]};`}}let u=[];for(let p=0;p<l;p++)u.push(`d${p}`);let d=gr(l),h=`fn getOutputCoords() -> ${d} {
2022-04-01 15:13:32 +02:00
${i}
2022-04-14 17:47:08 +02:00
`;return u.length===0?h+=`return ${d}(0); }`:h+=`return ${d}(${u.join(",")}); }`,[h,l]}/**
 * Generates the shader function `getCoordsFromIndex`, which turns a flat
 * output index into coordinates. Rank 0 or 1 returns the index itself. Rank
 * 2 divides by the scalar `uniforms.outShapeStrides`. Higher ranks peel off
 * one coordinate per entry of `uniforms.outShapeStrides[i]`.
 *
 * @param e Output shape.
 * @returns Shader source for the helper.
 */function aw(e){let t=e.length;if(t<=1)return"fn getCoordsFromIndex(index : i32) -> i32 { return index; }";let r=w.computeStrides(e),n=gr(t),a=[];for(let i=0;i<t;i++)a.push(`d${i}`);if(r.length===1)return` fn getCoordsFromIndex(index : i32) -> vec2<i32> {
2022-02-10 18:27:21 +01:00
let d0 = index / uniforms.outShapeStrides; let d1 = index - d0 * uniforms.outShapeStrides;
return vec2<i32>(d0, d1);
2022-04-01 15:13:32 +02:00
}`;let s="var index2 = index;"+r.map((i,o)=>{let l=`let ${a[o]} = index2 / uniforms.outShapeStrides[${o}]`,u=o===r.length-1?`let ${a[o+1]} = index2 - ${a[o]} * uniforms.outShapeStrides[${o}]`:`index2 = index2 - ${a[o]} * uniforms.outShapeStrides[${o}]`;return`${l}; ${u};`}).join("");return`
fn getCoordsFromIndex(index : i32) -> ${n} {
${s}
return ${n}(${a.join(",")});
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
`}var T8={};Le(T8,{ArrayBufferToTypedArray:()=>C8,GPUBytesPerElement:()=>Qy,computeDispatch:()=>Oe,computeWorkGroupSizeForConv2d:()=>Ab,computeWorkGroupSizeForMatMul:()=>N8,computeWorkPerThreadForConv2d:()=>xb,flatDispatchLayout:()=>Xe,isWebGPUSupported:()=>bb,tilesFitEvenlyIntoShape:()=>Za});var So=e=>{let t=1;for(let r=0;r<e.length;r++)t*=e[r];return t};function Za(e,t){if(e.length!==t.length)throw new Error(`Cannot compute whether rank ${e.length} tiles fit evenly into rank ${t.length} shape - ranks must match.`);return t.every((r,n)=>r%e[n]===0)}function Oe(e,t,r=[1,1,1],n=[1,1,1]){let[a,s,i]=[Math.ceil(So(e.x.map(o=>t[o]))/(r[0]*n[0])),e.y?Math.ceil(So(e.y.map(o=>t[o]))/(r[1]*n[1])):1,e.z?Math.ceil(So(e.z.map(o=>t[o]))/(r[2]*n[2])):1];return[a,s,i]}function Ab(e,t){let r=So(e.x.map(a=>t[a])),n=So(e.y.map(a=>t[a]));return r<=4?[4,16,1]:n<=4?[16,4,1]:[16,16,1]}function N8(e,t,r){return e===1?[32,1,1]:r===1?[1,32,1]:[8,8,1]}function xb(e,t){let r=So(e.x.map(a=>t[a])),n=So(e.y.map(a=>t[a]));return r<=4?[1,2,1]:n<=4?[2,1,1]:[2,2,1]}function Xe(e){return{x:e.map((t,r)=>r)}}function Qy(e){if(e==="float32"||e==="int32"||e==="bool"||e==="string")return 4;if(e==="complex64")return 8;throw new Error(`Unknown dtype ${e}`)}function C8(e,t){if(t==="float32")return new Float32Array(e);if(t==="int32")return new Int32Array(e);if(t==="bool"||t==="string")return Uint8Array.from(new Int32Array(e));throw new Error(`Unknown dtype ${t}`)}function bb(){return(typeof window!="undefined"||typeof WorkerGlobalScope!="undefined")&&!!navigator.gpu}function E8(e,t,r,n){return w.assert(n%4===0&&e[0]===4,()=>"tileInner must be divisible by 4. And ColPerThread must be 4"),`
2022-04-01 15:13:32 +02:00
var<workgroup> mm_Asub : array<array<vec4<f32>, ${n/e[0]}>, ${t}>;
var<workgroup> mm_Bsub : array<array<vec4<f32>, ${r/e[0]}>, ${n}>;
2022-02-10 18:27:21 +01:00
let RowPerThread = ${e[1]};
let ColPerThread = ${e[0]};
2022-04-01 15:13:32 +02:00
let TileInner = ${n};
2022-02-10 18:27:21 +01:00
2022-04-11 17:45:24 +02:00
${Ui()}
2022-02-10 18:27:21 +01:00
let tileRow = ${t===1?"0":"i32(localId.y) * RowPerThread"};
let tileCol = i32(localId.x);
let globalRow = ${t===1?"0":"i32(globalId.y) * RowPerThread"};
let globalCol = i32(globalId.x);
let numTiles = (uniforms.dimInner - 1) / TileInner + 1;
var acc: array<vec4<f32>, RowPerThread>;
var ACached : vec4<f32>;
var BCached : array<vec4<f32>, 4>;
// Loop over shared dimension.
var globalColA = tileCol;
let RowPerThreadB = TileInner / i32(workGroupSizeY);
let tileRowB = i32(localId.y) * RowPerThreadB;
for (var t = 0; t < numTiles; t = t + 1) {
// Load one tile of A into local memory.
for (var innerRow = 0; innerRow < RowPerThread; innerRow = innerRow + 1) {
let inputRow = tileRow + innerRow;
let inputCol = tileCol;
mm_Asub[inputRow][inputCol] = mm_readA(globalRow + innerRow, globalColA, globalId);
}
globalColA = globalColA + TileInner / ColPerThread;
// Load one tile of B into local memory.
for (var innerRow = 0; innerRow < RowPerThreadB; innerRow = innerRow + 1) {
let inputRow = tileRowB + innerRow;
let inputCol = tileCol;
mm_Bsub[inputRow][inputCol] = mm_readB(t * TileInner + inputRow, globalCol, globalId);
}
workgroupBarrier();
// Compute acc values for a single thread.
for (var k = 0; k < TileInner / ColPerThread; k = k + 1) {
BCached[0] = mm_Bsub[k * ColPerThread][tileCol];
BCached[1] = mm_Bsub[k * ColPerThread + 1][tileCol];
BCached[2] = mm_Bsub[k * ColPerThread + 2][tileCol];
BCached[3] = mm_Bsub[k * ColPerThread + 3][tileCol];
for (var i = 0; i < RowPerThread; i = i + 1) {
ACached = mm_Asub[tileRow + i][k];
acc[i] = BCached[0] * ACached.x + acc[i];
acc[i] = BCached[1] * ACached.y + acc[i];
acc[i] = BCached[2] * ACached.z + acc[i];
acc[i] = BCached[3] * ACached.w + acc[i];
}
}
workgroupBarrier();
}
for (var innerRow = 0; innerRow < RowPerThread; innerRow = innerRow + 1) {
mm_write(globalRow + innerRow,
globalCol,
acc[innerRow], globalId);
}
2022-04-14 17:47:08 +02:00
}`}var qde=class{constructor(e,t,r,n=null,a=null,s=null){this.variableNames=["A","B"],this.uniforms="dimAOuter : i32, dimBOuter : i32, dimInner : i32,",this.workGroupSize=[8,8,1],this.isVec4=!0,this.outputShape=t,this.dispatchLayout={x:[2],y:[1],z:[0]},t[1]===1?this.elementsPerThread=[4,1,1]:this.elementsPerThread=[4,4,1],this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,this.elementsPerThread);let i=n!=null,o=s!=null;i&&this.variableNames.push("bias"),o&&this.variableNames.push("preluActivationWeights"),this.tileAOuter=t[1]===1?1:this.workGroupSize[1]*this.elementsPerThread[1],this.tileBOuter=this.workGroupSize[0]*this.elementsPerThread[0],this.tileInner=this.tileBOuter,this.aShape=e,this.addBias=i,this.activation=a,this.hasPreluActivationWeights=o,[this.fitA,this.fitB]=this.getShapeFit(),this.shaderKey=`matMulPackedVec4_${this.activation}_${this.fitA}_${this.fitB}_${this.elementsPerThread}`}getShapeFit(){let e=this.aShape[2],t=this.outputShape[2],r=[this.outputShape[0],e,t],n=[this.tileAOuter,this.tileInner],a=[this.tileInner,this.tileBOuter];return[Za(n,this.aShape.slice(1)),Za(a,r.slice(1))]}getUserCode(){let e=this.fitA?"return A[batch * batchASize + row * uniforms.dimInner / 4 + col]":`if (coordsInBounds2D(vec2<i32>(row, col * 4), vec2<i32>(uniforms.dimAOuter, uniforms.dimInner))) {
2022-04-01 15:12:04 +02:00
return A[batch * batchASize + row * uniforms.dimInner / 4 + col];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
return vec4<f32>(0.0)`,t=this.fitB?"return B[batch * batchBSize + row * uniforms.dimBOuter / 4 + col]":`if(coordsInBounds2D(vec2<i32>(row, col * 4), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
return B[batch * batchBSize + row * uniforms.dimBOuter / 4 + col];
2022-02-10 18:27:21 +01:00
}
2022-04-11 17:45:24 +02:00
return vec4<f32>(0.0)`,r="",n="";if(this.activation){let s=ss(this.activation,this.isVec4);this.hasPreluActivationWeights?r=`fn activation(a : vec4<f32>, outCoord : vec3<i32>) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${s}
}`:r=`
2022-02-10 18:27:21 +01:00
fn activation(a : vec4<f32>, outCoord : vec3<i32>) -> vec4<f32> {
2022-04-01 15:13:32 +02:00
${s}
}`,n="value = activation(value, outCoord);"}let a=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${r}
2022-02-10 18:27:21 +01:00
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> vec4<f32> {
let batchASize = uniforms.aShape[1] * uniforms.aShape[2] / 4;
let batch = i32(globalId.z);
${e};
}
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> vec4<f32> {
let batchBSize = uniforms.bShape[1] * uniforms.bShape[2] / 4;
let batch = i32(globalId.z);
${t};
}
fn mm_write(row : i32, col : i32, valueIn : vec4<f32>, globalId : vec3<u32>) {
if (row < uniforms.aShape[1] && col * 4 < uniforms.bShape[2])
{
var value = valueIn;
let batch = i32(globalId.z);
let outCoord = vec3<i32>(batch, row, col * 4);
2022-04-01 15:13:32 +02:00
${a}
${n}
2022-02-10 18:27:21 +01:00
setOutputAtCoords(outCoord[0], outCoord[1], outCoord[2], value);
}
}
2022-04-14 17:47:08 +02:00
${E8(this.elementsPerThread,this.tileAOuter,this.tileBOuter,this.tileInner)}
`}};function vb(e,t){let r=t[1]*e[1],n=t[0]*e[0],a=r>n?r:n;return`
2022-04-01 15:13:32 +02:00
var<workgroup> mm_Asub : array<array<f32, ${a}>, ${r}>;
var<workgroup> mm_Bsub : array<array<f32, ${n}>, ${a}>;
2022-04-11 17:45:24 +02:00
${Ui()}
2022-02-10 18:27:21 +01:00
let tileRow = i32(localId.y) * ${e[1]};
let tileCol = i32(localId.x) * ${e[0]};
let globalRow = i32(globalId.y) * ${e[1]};
let globalCol = i32(globalId.x) * ${e[0]};
2022-04-01 15:13:32 +02:00
let numTiles = (uniforms.dimInner - 1) / ${a} + 1;
2022-02-10 18:27:21 +01:00
var acc : array<array<f32, ${e[0]}>, ${e[1]}>;
var ACached : f32;
var BCached : array<f32, ${e[0]}>;
// Without this initialization strange values show up in acc.
for (var innerRow = 0; innerRow < ${e[1]}; innerRow = innerRow + 1) {
for (var innerCol = 0; innerCol < ${e[0]}; innerCol = innerCol + 1) {
acc[innerRow][innerCol] = 0.0;
}
}
2022-04-01 15:13:32 +02:00
let ColPerThreadA = ${a} / ${t[0]};
2022-02-10 18:27:21 +01:00
let tileColA = i32(localId.x) * ColPerThreadA;
2022-04-01 15:13:32 +02:00
let RowPerThreadB = ${a} / ${t[1]};
2022-02-10 18:27:21 +01:00
let tileRowB = i32(localId.y) * RowPerThreadB;
// Loop over shared dimension.
for (var t = 0; t < numTiles; t = t + 1) {
// Load one tile of A into local memory.
for (var innerRow = 0; innerRow < ${e[1]}; innerRow = innerRow + 1) {
for (var innerCol = 0; innerCol < ColPerThreadA; innerCol = innerCol + 1) {
let inputRow = tileRow + innerRow;
let inputCol = tileColA + innerCol;
mm_Asub[inputRow][inputCol] = mm_readA(
globalRow + innerRow,
2022-04-01 15:13:32 +02:00
t * ${a} + inputCol, globalId);
2022-02-10 18:27:21 +01:00
}
}
// Load one tile of B into local memory.
for (var innerRow = 0; innerRow < RowPerThreadB; innerRow = innerRow + 1) {
for (var innerCol = 0; innerCol < ${e[0]}; innerCol = innerCol + 1) {
let inputRow = tileRowB + innerRow;
let inputCol = tileCol + innerCol;
mm_Bsub[inputRow][inputCol] = mm_readB(
2022-04-01 15:13:32 +02:00
t * ${a} + inputRow,
2022-02-10 18:27:21 +01:00
globalCol + innerCol, globalId);
}
}
workgroupBarrier();
// Compute acc values for a single thread.
2022-04-01 15:13:32 +02:00
for (var k = 0; k < ${a}; k = k + 1) {
2022-02-10 18:27:21 +01:00
for (var inner = 0; inner < ${e[0]}; inner = inner + 1) {
BCached[inner] = mm_Bsub[k][tileCol + inner];
}
for (var innerRow = 0; innerRow < ${e[1]}; innerRow = innerRow + 1) {
ACached = mm_Asub[tileRow + innerRow][k];
for (var innerCol = 0; innerCol < ${e[0]}; innerCol = innerCol + 1) {
acc[innerRow][innerCol] = acc[innerRow][innerCol] + ACached * BCached[innerCol];
}
}
}
workgroupBarrier();
}
for (var innerRow = 0; innerRow < ${e[1]}; innerRow = innerRow + 1) {
for (var innerCol = 0; innerCol < ${e[0]}; innerCol = innerCol + 1) {
if ((globalCol + innerCol) < uniforms.dimBOuter &&
(globalRow + innerRow) < uniforms.dimAOuter) {
mm_write(globalRow + innerRow,
globalCol + innerCol,
acc[innerRow][innerCol], globalId);
}
}
}
}
2022-04-14 17:47:08 +02:00
`}function Kde(e){return`
2022-02-10 18:27:21 +01:00
let TileSize = ${e[0]*4};
var<workgroup> mm_Asub : array<vec4<f32>, ${e[0]}>;
2022-04-11 17:45:24 +02:00
${Ui()}
2022-02-10 18:27:21 +01:00
let tileCol = i32(localId.x);
let globalCol = i32(globalId.x);
let globalRow = i32(globalId.y);
let numTiles = (uniforms.dimInner - 1) / TileSize + 1;
// Without this initialization strange values show up in acc.
var acc = 0.0;
// Loop over shared dimension.
for (var t = 0; t < numTiles; t = t + 1) {
// Load one tile of A into local memory.
let colA = t * TileSize + tileCol * 4;
mm_Asub[tileCol] = vec4<f32>(mm_readA(globalRow, colA, globalId),
mm_readA(globalRow, colA + 1, globalId),
mm_readA(globalRow, colA + 2, globalId),
mm_readA(globalRow, colA + 3, globalId));
workgroupBarrier();
// Compute acc values for a single thread.
for (var k = 0; k < TileSize / 4; k = k + 1) {
let rowB = t * TileSize + k * 4;
let BCached = vec4<f32>(mm_readB(rowB, globalCol, globalId),
mm_readB(rowB + 1, globalCol, globalId),
mm_readB(rowB + 2, globalCol, globalId),
mm_readB(rowB + 3, globalCol, globalId));
let ACached = mm_Asub[k];
acc = acc + dot(ACached, BCached);
}
workgroupBarrier();
}
if (globalRow < uniforms.dimAOuter && globalCol < uniforms.dimBOuter) {
mm_write(globalRow, globalCol, acc, globalId);
}
}
2022-04-14 17:47:08 +02:00
`}var R8=class{constructor(e,t,r,n=!1,a=!1,s=null,i=null,o=null){this.variableNames=["A","B"],this.uniforms="dimAOuter : i32, dimBOuter : i32, dimInner : i32,",this.workGroupSize=[16,16,1],this.outputShape=t,this.dispatchLayout={x:[2],y:[1],z:[0]};let l=n?e[1]:e[2];this.workGroupSize=N8(t[1],l,t[2]),(t[1]===1||t[2]===1)&&(r=1),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[r,r,1]),w.arraysEqual(this.dispatch,[1,1,1])&&(r=1,this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[r,r,1]));let u=s!=null,d=o!=null;u&&this.variableNames.push("bias"),d&&this.variableNames.push("preluActivationWeights"),this.workPerThread=r,this.aShape=e,this.transposeA=n,this.transposeB=a,this.addBias=u,this.activation=i,this.hasPreluActivationWeights=d;let h=this.outputShape[2],p=this.transposeB?[this.outputShape[0],h,l]:[this.outputShape[0],l,h];[this.fitA,this.fitB]=this.getShapeFit(p),this.shaderKey=`matMulPacked_${this.workPerThread}_${n}_${a}_${this.activation}_${this.fitA}_${this.fitB}_${this.outputShape[1]>1}`}getShapeFit(e){let t=this.workGroupSize[1]*this.workPerThread,r=this.workGroupSize[0]*this.workPerThread,n=t>r?t:r;this.outputShape[1]===1&&(n*=4),w.assert(n%this.workGroupSize[0]===0&&n%this.workGroupSize[1]===0,()=>"tileInner must be multiple of workgroupsize.x and workgroupsize.y");let a=[t,n],s=[n,r];return[Za(a,this.aShape.slice(1)),Za(s,e.slice(1))]}getUserCode(){let e;this.transposeA===!1?e=this.fitA?"return A[batch * batchASize + row * uniforms.dimInner + col];":`if(coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimAOuter, uniforms.dimInner))) {
2022-04-01 15:12:04 +02:00
return A[batch * batchASize + row * uniforms.dimInner + col];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
return 0.0;`:e=this.fitA?"return A[batch * batchASize + col * uniforms.dimAOuter + row];":`if(coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimAOuter, uniforms.dimInner))) {
return A[batch* batchASize + col * uniforms.dimAOuter + row];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
return 0.0;`;let t;this.transposeB===!1?t=this.fitB?"return B[batch * batchBSize + row * uniforms.dimBOuter + col];":`if(coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
return B[batch * batchBSize + row * uniforms.dimBOuter + col];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:12:04 +02:00
return 0.0;`:t=this.fitB?"return B[batch * batchBSize + col * uniforms.dimInner + row];":`if(coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
return B[batch * batchBSize + col * uniforms.dimInner + row];
2022-02-10 18:27:21 +01:00
}
2022-04-11 17:45:24 +02:00
return 0.0;`;let r="",n="";if(this.activation){let s=ss(this.activation,!1);this.hasPreluActivationWeights?r=`fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${s}
}`:r=`
2022-02-10 18:27:21 +01:00
fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
2022-04-01 15:13:32 +02:00
${s}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,n="value = activation(value, outCoord);"}let a=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${r}
2022-02-10 18:27:21 +01:00
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
let batchASize = uniforms.aShape[1] * uniforms.aShape[2];
let batch = i32(globalId.z);
${e}
}
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
let batch = i32(globalId.z);
let batchBSize = uniforms.bShape[1] * uniforms.bShape[2];
${t}
}
fn mm_write(row : i32, col : i32, valueIn : f32, globalId : vec3<u32>) {
var value = valueIn;
let batch = i32(globalId.z);
let outCoord = vec3<i32>(batch, row, col);
2022-04-01 15:13:32 +02:00
${a}
${n}
2022-02-10 18:27:21 +01:00
setOutputAtCoords(batch, row, col, value);
}
2022-04-14 17:47:08 +02:00
${this.outputShape[1]>1?vb([this.workPerThread,this.workPerThread,1],this.workGroupSize):Kde(this.workGroupSize)}
`}};function Xde(){return`
2022-02-10 18:27:21 +01:00
var<workgroup> sumValues : array<f32, workGroupSizeX>;
2022-04-11 17:45:24 +02:00
${Ui()}
2022-02-10 18:27:21 +01:00
let coords = getOutputCoords();
let batch = coords[0];
let row = coords[1];
let col = coords[2];
var sum = 0.0;
let Length = uniforms.dimInner;
for (var k = i32(localId.x); k < Length; k = k + i32(workGroupSizeX)) {
let dataA = mm_readA(batch, row, k);
let dataB = mm_readB(batch, k, col);
sum = sum + dataA * dataB;
}
sumValues[localId.x] = sum;
workgroupBarrier();
for(var currentSize = workGroupSizeX / 2u; currentSize > 1u;
currentSize = currentSize / 2u) {
if (localId.x < currentSize)
{
sumValues[localId.x] = sumValues[localId.x] + sumValues[localId.x + currentSize];
}
workgroupBarrier();
}
if (localId.x == 0u) {
sum = sumValues[0] + sumValues[1];
mm_write(batch, row, col, sum);
}
}
2022-04-14 17:47:08 +02:00
`}var Zde=class{constructor(e,t=!1,r=!1,n=null,a=null,s=null){this.variableNames=["A","B"],this.uniforms="dimAOuter : i32, dimBOuter : i32, dimInner : i32,",this.workGroupSize=[256,1,1],this.outputShape=e,this.dispatchLayout={x:[],y:[1,2],z:[0]},this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize);let i=n!=null,o=s!=null;i&&this.variableNames.push("bias"),o&&this.variableNames.push("preluActivationWeights"),this.transposeA=t,this.transposeB=r,this.addBias=i,this.activation=a,this.hasPreluActivationWeights=o,this.shaderKey=`matMulReduce_${this.activation}_${t}_${r}`}getUserCode(){let e;this.transposeA===!1?e="return A[batch * batchASize + row * uniforms.dimInner + col];":e="return A[batch * batchASize + col * uniforms.dimAOuter + row];";let t;this.transposeB===!1?t="return B[batch * batchBSize + row * uniforms.dimBOuter + col];":t="return B[batch * batchBSize + col * uniforms.dimInner + row];";let r="",n="";if(this.activation){let s=ss(this.activation,!1);this.hasPreluActivationWeights?r=`fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${s}
}`:r=`
2022-02-10 18:27:21 +01:00
fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
2022-04-01 15:13:32 +02:00
${s}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,n="value = activation(value, outCoord);"}let a=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${r}
2022-02-10 18:27:21 +01:00
fn mm_readA(batch: i32, row : i32, col : i32) -> f32 {
let batchASize = uniforms.aShape[1] * uniforms.aShape[2];
${e}
}
fn mm_readB(batch: i32, row : i32, col : i32) -> f32 {
let batchBSize = uniforms.bShape[1] * uniforms.bShape[2];
${t}
}
fn mm_write(batch: i32, row : i32, col : i32, valueIn : f32) {
var value = valueIn;
let outCoord = vec3<i32>(batch, row, col);
2022-04-01 15:13:32 +02:00
${a}
${n}
2022-02-10 18:27:21 +01:00
setOutputAtCoords(batch, row, col, value);
}
2022-04-14 17:47:08 +02:00
${Xde()}
`}};function Yde(e){let t=e[1]/2,r=e[0],n=t>r?t:r;return`
2022-04-01 15:13:32 +02:00
var<workgroup> mm_Asub1 : array<array<f32, ${n}>, ${t}>;
var<workgroup> mm_Bsub1 : array<array<f32, ${r}>, ${n}>;
var<workgroup> mm_Asub2 : array<array<f32, ${n}>, ${t}>;
var<workgroup> mm_Bsub2 : array<array<f32, ${r}>, ${n}>;
2022-02-10 18:27:21 +01:00
// If the output size is small for matrix multiplication, avoid to use vec4
// and handle some elements per thread to optimally utilize the ALU.
// Introduces two shared memory buffers, some logical threads could handle
// arithmetic operations and others handle IO operations between barrier api,
// makes ALUs and load/store units work simultaneously, could improves
// the performance.
2022-04-11 17:45:24 +02:00
${Ui()}
2022-02-10 18:27:21 +01:00
let tileRow = i32(localId.y);
let tileCol = i32(localId.x);
let globalRow = i32(globalId.y);
let globalCol = i32(globalId.x);
// uniforms.dimInner should be greater than 0.
2022-04-01 15:13:32 +02:00
let numTiles = (uniforms.dimInner - 1) / ${n} + 1;
2022-02-10 18:27:21 +01:00
var acc = 0.0;
var globalColA = tileCol;
var globalRowB = tileRow;
for (var t = 0; t < numTiles; t = t + 1) {
if (t == 0) {
if (tileRow < ${t}) {
// Load one tile of A and B into local memory.
// globalRow is always greater than or equal tileRow.
mm_Asub1[tileRow][tileCol] =
mm_readA((globalRow - tileRow) / 2 + tileRow, globalColA, globalId);
2022-04-01 15:13:32 +02:00
globalColA = globalColA + ${n};
2022-02-10 18:27:21 +01:00
mm_Bsub1[tileRow][tileCol] = mm_readB(globalRowB, globalCol, globalId);
2022-04-01 15:13:32 +02:00
globalRowB = globalRowB + ${n};
2022-02-10 18:27:21 +01:00
}
} else {
if (tileRow < ${t}) {
// Load one tile of A and B into local memory.
// globalRow is always greater than or equal tileRow.
mm_Asub1[tileRow][tileCol] =
mm_readA((globalRow - tileRow) / 2 + tileRow, globalColA, globalId);
2022-04-01 15:13:32 +02:00
globalColA = globalColA + ${n};
2022-02-10 18:27:21 +01:00
mm_Bsub1[tileRow][tileCol] = mm_readB(globalRowB, globalCol, globalId);
2022-04-01 15:13:32 +02:00
globalRowB = globalRowB + ${n};
2022-02-10 18:27:21 +01:00
} else {
// Compute acc values for a single thread.
2022-04-01 15:13:32 +02:00
for (var k = 0; k < ${n}; k = k + 1) {
2022-02-10 18:27:21 +01:00
let subRow = tileRow - ${t};
if (subRow < 0) {
continue;
}
acc = acc + mm_Asub2[subRow][k] * mm_Bsub2[k][tileCol];
}
}
}
workgroupBarrier();
if (t != 0) {
t = t + 1;
}
if (t < numTiles) {
if (tileRow < ${t}) {
// Load one tile of A and B into local memory.
// globalRow is always greater than or equal tileRow.
mm_Asub2[tileRow][tileCol] =
mm_readA((globalRow - tileRow) / 2 + tileRow, globalColA, globalId);
2022-04-01 15:13:32 +02:00
globalColA = globalColA + ${n};
2022-02-10 18:27:21 +01:00
mm_Bsub2[tileRow][tileCol] = mm_readB(globalRowB, globalCol, globalId);
2022-04-01 15:13:32 +02:00
globalRowB = globalRowB + ${n};
2022-02-10 18:27:21 +01:00
} else {
// Compute acc values for a single thread.
2022-04-01 15:13:32 +02:00
for (var k = 0; k < ${n}; k = k + 1) {
2022-02-10 18:27:21 +01:00
let subRow = tileRow - ${t};
if (subRow < 0) {
continue;
}
acc = acc + mm_Asub1[subRow][k] * mm_Bsub1[k][tileCol];
}
}
}
workgroupBarrier();
}
let writeCol = (globalRow - tileRow) / 2 + tileRow - ${t};
if (tileRow >= ${t} && writeCol >= 0) {
mm_write(writeCol, globalCol, acc, globalId);
}
}
2022-04-14 17:47:08 +02:00
`}var Jde=class{constructor(e,t,r,n=null,a=null,s=null){this.variableNames=["A","B"],this.uniforms="dimAOuter : i32, dimBOuter : i32, dimInner : i32,",this.workGroupSize=[8,16,1],w.assert(e[1]<=16||t[2]<=16,()=>"This program can be only used when A width or B Height are small"),this.outputShape=r,this.dispatchLayout={x:[2],y:[1],z:[0]},this.dispatch=[Math.ceil(r[2]/this.workGroupSize[0]),Math.ceil(r[1]*2/this.workGroupSize[1]),r[0]];let i=n!=null;i&&this.variableNames.push("bias");let o=s!=null;o&&this.variableNames.push("preluActivationWeights"),this.addBias=i,this.activation=a,this.hasPreluActivationWeights=o,this.shaderKey=`matMulSmallOutputSize_${this.activation}`}getUserCode(){let e=`if (coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimAOuter, uniforms.dimInner))) {
2022-04-01 15:12:04 +02:00
return A[batch * batchASize + row * uniforms.dimInner + col];
2022-02-10 18:27:21 +01:00
}
return 0.0;`,t=`if (coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
2022-04-01 15:12:04 +02:00
return B[batch * batchBSize + row * uniforms.dimBOuter + col];
2022-02-10 18:27:21 +01:00
}
2022-04-11 17:45:24 +02:00
return 0.0;`,r="",n="";if(this.activation){let s=ss(this.activation,!1);this.hasPreluActivationWeights?r=`fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${s}
}`:r=`fn activation(a : f32, outCoord : vec3<i32>) -> f32 {
${s}
}`,n="value = activation(value, outCoord);"}let a=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${r}
2022-02-10 18:27:21 +01:00
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
let batchASize = uniforms.aShape[1] * uniforms.aShape[2];
let batch = i32(globalId.z);
${e}
}
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
let batch = i32(globalId.z);
let batchBSize = uniforms.bShape[1] * uniforms.bShape[2];
${t}
}
fn mm_write(row : i32, col : i32, valueIn : f32, globalId : vec3<u32>) {
if (coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimAOuter, uniforms.dimBOuter))) {
let batch = i32(globalId.z);
let outCoord = vec3<i32>(batch, row, col);
var value = valueIn;
2022-04-01 15:13:32 +02:00
${a}
${n}
2022-02-10 18:27:21 +01:00
setOutputAtCoords(batch, row, col, value);
}
}
2022-04-14 17:47:08 +02:00
${Yde(this.workGroupSize)}
`}};function qe(e){let{inputs:t,attrs:r}=e,{x:n}=t,{shape:a}=r,s=w.sizeFromShape(n.shape),i=w.inferFromImplicitShape(a,s),o=w.sizeFromShape(i);return w.assert(s===o,()=>`The new shape (${i}) has ${o} elements and the old shape (${n.shape}) has ${s} elements. The new shape and old shape must have the same number of elements.`),e.backend.incRef(n.dataId),{dataId:n.dataId,shape:i,dtype:n.dtype}}var Qde={kernelName:ul,backendName:"webgpu",kernelFunc:qe};function wb({a:e,b:t,transposeA:r,transposeB:n,backend:a,bias:s=null,preluActivationWeights:i=null,leakyreluAlpha:o=0,activation:l=null}){let u=e.shape.length,d=t.shape.length,h=r?e.shape[u-2]:e.shape[u-1],p=n?t.shape[d-1]:t.shape[d-2],c=r?e.shape[u-1]:e.shape[u-2],f=n?t.shape[d-2]:t.shape[d-1],m=e.shape.slice(0,-2),g=t.shape.slice(0,-2),y=w.sizeFromShape(m),A=w.sizeFromShape(g),x=Sl.assertAndGetBroadcastShape(e.shape.slice(0,-2),t.shape.slice(0,-2)).concat([c,f]);w.assert(h===p,()=>`Error in matMul: inner shapes (${h}) and (${p}) of Tensors with shapes ${e.shape} and ${t.shape} and transposeA=${r} and transposeB=${n} must match.`);let b=r?[y,h,c]:[y,c,h],v=n?[A,f,p]:[A,p,f],S=qe({inputs:{x:e},backend:a,attrs:{shape:b}}),T=qe({inputs:{x:t},backend:a,attrs:{shape:v}}),E=[S,T],R=Math.max(y,A),_=h%4===0&&f%4===0&&!r&&!n&&f>=32,M;c*f<=32?M=new Zde([R,c,f],r,n,s,l,i):!r&&!n&&(c<=16&&(f<=512||p>=2*f)||f<=16&&(c<=512||h>=2*c))?M=new Jde(b,v,[R,c,f],s,l,i):_?M=new qde(b,[R,c,f],Y().get("WEBGPU_MATMUL_WORK_PER_THREAD"),s,l,i):M=new R8(b,[R,c,f],Y().get("WEBGPU_MATMUL_WORK_PER_THREAD"),r,n,s,l,i);let I=[S,T];s&&I.push(s),i&&I.push(i);let z=[{type:"int32",data:[c]},{type:"int32",data:[f]},{type:"int32",data:[h]}];l==="leakyrelu"&&(z.push({type:"float32",data:[o]}),M.uniforms+=" alpha : f32,");let O=a.runWebGPUProgram(M,I,e.dtype,z),j=qe({inputs:{x:O},backend:a,attrs:{shape:x}});E.push(O);for(let X of E)a.disposeData(X.dataId);return j}function 
epe(e){let{inputs:t,backend:r,attrs:n}=e,{a,b:s,bias:i,preluActivationWeights:o}=t,{transposeA:l,transposeB:u,activation:d,leakyreluAlpha:h}=n;return wb({a,b:s,transposeA:l,transposeB:u,backend:r,bias:i,preluActivationWeights:o,leakyreluAlpha:h,activation:d})}var tpe={kernelName:Ms,backendName:"webgpu",kernelFunc:epe},sw=class{constructor(e,t,r){this.variableNames=["AReal","AImag","BReal","BImag"],this.workGroupSize=[128,1,1],this.size=!0,this.outputShape=N.assertAndGetBroadcastShape(t,r),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey=`binaryOpComplex_${e}`,this.op=e}getUserCode(){return`
2022-02-10 18:27:21 +01:00
fn binaryOpComplex(
areal : f32, aimag : f32, breal : f32, bimag : f32) -> f32 {
2022-04-14 17:47:08 +02:00
${Wh(this.op,!1)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if(index < uniforms.size) {
let areal = getARealByOutputIndex(index);
let aimag = getAImagByOutputIndex(index);
let breal = getBRealByOutputIndex(index);
let bimag = getBImagByOutputIndex(index);
setOutputAtIndex(index, binaryOpComplex(areal, aimag, breal, bimag));
}
}
2022-04-14 17:47:08 +02:00
`}},rpe=class{constructor(e,t,r,n){this.variableNames=["A","B"],this.size=!0;let a=256;this.workGroupSize=[a,1,1],this.outputShape=N.assertAndGetBroadcastShape(t,r),this.dispatchLayout=Xe(this.outputShape),this.lastDimensionSize=n?r[0]:t[0],this.lastDimensionSize<256?this.workPerThread=1:this.lastDimensionSize<512?this.workPerThread=2:this.workPerThread=4,this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.useSharedMemoryWithB=n,this.op=e,this.shaderKey=`binaryShared_${e}_${this.lastDimensionSize}_${this.useSharedMemoryWithB}`}getUserCode(){let e=this.lastDimensionSize>1?`coords[${this.outputShape.length-1}]`:"0",t=this.useSharedMemoryWithB?`let a = getAByOutputCoords(coords);
2022-02-10 18:27:21 +01:00
let b = sharedBuf[${e}];`:`let a = sharedBuf[${e}];
let b = getBByOutputCoords(coords);`;return`
fn binaryOperation(a : f32, b : f32) -> f32 {
2022-04-14 17:47:08 +02:00
${Wh(this.op,!1)}
2022-02-10 18:27:21 +01:00
}
var<workgroup> sharedBuf : array<f32, ${this.lastDimensionSize}>;
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Fill in the shared memory buffer. Here we need a loop to make sure
// that all data in A|B are uploaded when |sharedMemorySize| is larger
// than work group size.
for(var localIndex = i32(localId.x); localIndex < ${this.lastDimensionSize}; localIndex = localIndex + ${this.workGroupSize[0]}) {
2022-04-01 15:12:04 +02:00
sharedBuf[localIndex] = f32(${this.useSharedMemoryWithB?"B":"A"}[localIndex]);
2022-02-10 18:27:21 +01:00
}
workgroupBarrier();
for(var i = 0; i < ${this.workPerThread}; i = i + 1) {
let flatIndex = index * ${this.workPerThread} + i;
if(flatIndex < uniforms.size) {
let coords = getCoordsFromIndex(flatIndex);
${t}
setOutputAtIndex(flatIndex, binaryOperation(a, b));
}
}
}
2022-04-14 17:47:08 +02:00
`}},npe=class{constructor(e,t,r){this.variableNames=["A","B"],this.workPerThread=4,this.isVec4=!0,this.size=!0;let n=128;this.workGroupSize=[n,1,1],this.outputShape=N.assertAndGetBroadcastShape(t,r),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.op=e,this.shaderKey=`binaryVec4_${e}`}getUserCode(){return`
2022-02-10 18:27:21 +01:00
fn binaryOperation(a : vec4<f32>, b : vec4<f32>) -> vec4<f32> {
2022-04-14 17:47:08 +02:00
${Wh(this.op,this.isVec4)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let a = getAByOutputIndex(index);
let b = getBByOutputIndex(index);
setOutputAtIndex(index, binaryOperation(a, b));
}
}
2022-04-14 17:47:08 +02:00
`}},M8=class{constructor(e,t,r){this.variableNames=["A","B"],this.size=!0;let n=128;this.workGroupSize=[n,1,1],this.outputShape=N.assertAndGetBroadcastShape(t,r),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey=`binary_${e}`,this.op=e}getUserCode(){return`
2022-02-10 18:27:21 +01:00
fn binaryOperation(a : f32, b : f32) -> f32 {
2022-04-14 17:47:08 +02:00
${Wh(this.op,!1)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let a = getAByOutputIndex(index);
let b = getBByOutputIndex(index);
setOutputAtIndex(index, binaryOperation(a, b));
}
}
2022-04-14 17:47:08 +02:00
`}};function iw(e,t,r){if(w.arraysEqual(t,r)&&w.sizeFromShape(t)%4===0)return new npe(e,t,r);let n=t.length===1&&r.length>1&&t[0]<1024,a=r.length===1&&t.length>1&&r[0]<1024;return n||a?new rpe(e,t,r,a):new M8(e,t,r)}function Vn(e){let{inputs:t}=e,{x:r}=t;return e.backend.incRef(r.dataId),{dataId:r.dataId,shape:r.shape,dtype:r.dtype}}var ape={kernelName:pi,backendName:"webgpu",kernelFunc:Vn};function Cd(e){let{inputs:t,backend:r}=e,{real:n,imag:a}=t,s=r.makeTensorInfo(n.shape,"complex64"),i=r.tensorMap.get(s.dataId),o=Vn({inputs:{x:n},backend:r}),l=Vn({inputs:{x:a},backend:r});return i.complexTensorInfos={real:o,imag:l},s}var spe={kernelName:Xp,backendName:"webgpu",kernelFunc:Cd},Vh=class{constructor(e,t){this.variableNames=["A"],this.size=!0;let r=128;this.workGroupSize=[r,1,1],this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.op=t,this.shaderKey=`unary_${t}`}getUserCode(){return`
2022-02-10 18:27:21 +01:00
fn unaryOperation(a : f32) -> f32 {
2022-04-14 17:47:08 +02:00
${fo(this.op,!1)}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let a = getAByOutputIndex(index);
setOutputAtIndex(index, unaryOperation(a));
}
}
2022-04-14 17:47:08 +02:00
`}};function kr({opType:e,cpuKernelImpl:t,dtype:r}){return({inputs:n,backend:a})=>{let{x:s}=n,i=a,o=r||s.dtype;if(i.shouldExecuteOnCPU([s])&&t!=null){let u=i.tensorMap.get(s.dataId),d=t(u.values,o);return i.makeTensorInfo(s.shape,o,d)}let l=new Vh(s.shape,e);return i.runWebGPUProgram(l,[s],o)}}function jr({opSnippet:e,cpuKernelImpl:t,supportsComplex:r=!1,dtype:n}){return({inputs:a,backend:s})=>{let{a:i,b:o}=a,l=s;if(r&&i.dtype==="complex64"){let h=l.tensorMap.get(i.dataId),p=l.tensorMap.get(o.dataId),c,f;if(e!==0)[c,f]=[[h.complexTensorInfos.real,p.complexTensorInfos.real],[h.complexTensorInfos.imag,p.complexTensorInfos.imag]].map(g=>{let[y,A]=g,x={dataId:y.dataId,dtype:y.dtype,shape:i.shape},b={dataId:A.dataId,dtype:A.dtype,shape:o.shape},v=iw(e,i.shape,o.shape);return l.runWebGPUProgram(v,[x,b],Cr(y.dtype,A.dtype))});else{let g=new sw(17,i.shape,o.shape),y=new sw(18,i.shape,o.shape),A=[{dataId:h.complexTensorInfos.real.dataId,dtype:h.complexTensorInfos.real.dtype,shape:i.shape},{dataId:h.complexTensorInfos.imag.dataId,dtype:h.complexTensorInfos.imag.dtype,shape:i.shape},{dataId:p.complexTensorInfos.real.dataId,dtype:p.complexTensorInfos.real.dtype,shape:o.shape},{dataId:p.complexTensorInfos.imag.dataId,dtype:p.complexTensorInfos.imag.dtype,shape:o.shape}];c=l.runWebGPUProgram(g,A,"float32"),f=l.runWebGPUProgram(y,A,"float32")}let m=Cd({inputs:{real:c,imag:f},backend:l});return l.disposeData(c.dataId),l.disposeData(f.dataId),m}let u=n||Cr(i.dtype,o.dtype);if((i.dtype==="string"||o.dtype==="string"||l.shouldExecuteOnCPU([i,o]))&&t!=null){let h=l.tensorMap.get(i.dataId).values,p=l.tensorMap.get(o.dataId).values,c=i.dtype==="string"?N.fromUint8ToStringArray(h):h,f=i.dtype==="string"?N.fromUint8ToStringArray(p):p,[m,g]=t(i.shape,o.shape,c,f,u);return l.makeTensorInfo(g,u,m)}let d=iw(e,i.shape,o.shape);return 
l.runWebGPUProgram(d,[i,o],u)}}var{addImpl:ipe,ceilImpl:ope,concatImpl:lpe,equalImpl:upe,expImpl:dpe,expm1Impl:ppe,floorImpl:hpe,gatherNdImpl:cpe,gatherV2Impl:fpe,greaterEqualImpl:mpe,greaterImpl:gpe,lessEqualImpl:ype,lessImpl:Ape,logImpl:xpe,maxImpl:bpe,maximumImpl:vpe,minimumImpl:wpe,multiplyImpl:kpe,negImpl:Ipe,notEqualImpl:Spe,prodImpl:Tpe,rangeImpl:Npe,rsqrtImpl:Cpe,simpleAbsImpl:Epe,sliceImpl:Rpe,stridedSliceImpl:Mpe,stringNGramsImpl:Fpe,subImpl:$pe,tileImpl:Ppe,topKImpl:_pe,transposeImpl:zpe,uniqueImpl:BAe}=c0,Ope=kr({opType:0,cpuKernelImpl:Epe}),Dpe={kernelName:Lo,backendName:"webgpu",kernelFunc:Ope},Lpe=jr({opSnippet:1,cpuKernelImpl:ipe,supportsComplex:!0}),Bpe={kernelName:Ya,backendName:"webgpu",kernelFunc:Lpe},Wpe=class{constructor(e){this.workPerThread=4,this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e[0],this.variableNames=e.map((t,r)=>`T${r}`),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.shaderKey="addN"}getUserCode(){let e=[];this.variableNames.forEach(r=>{e.push(`let v${r} = get${r}ByOutputCoords(coords);`)});let t=this.variableNames.map(r=>`v${r}`).join(" + ");return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
for (var i = 0; i < ${this.workPerThread}; i = i + 1) {
let flatIndex = index * ${this.workPerThread} + i;
if (flatIndex < uniforms.size) {
let coords = getCoordsFromIndex(flatIndex);
${e.join(`
`)}
setOutputAtIndex(flatIndex, ${t});
}
}
}
2022-04-14 17:47:08 +02:00
`}};function Vpe(e){let{inputs:t,backend:r}=e,n=t;if(n.length===1)return Vn({inputs:{x:n[0]},backend:r});let a=n.map(o=>o.dtype).reduce((o,l)=>Cr(o,l)),s=n.map(o=>o.shape),i=new Wpe(s);return r.runWebGPUProgram(i,n,a)}var Upe={kernelName:qs,backendName:"webgpu",kernelFunc:Vpe},F8=class{constructor(e,t,r){this.workGroupSize=[64,1,1],this.variableNames=["x"],this.uniforms="axis : i32, infinityValue : f32,",this.size=!0;let n=[t];N.assertAxesAreInnerMostDims("arg"+r.charAt(0).toUpperCase()+r.slice(1),n,e.length),this.op=r==="min"?"<":">";let[a]=N.computeOutAndReduceShapes(e,n);this.outputShape=a.length===0?[1]:a,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,[1,1,1]),this.inputShape=e,this.shaderKey=`argMinMax${this.op}`}getUserCode(){let e=`
2022-02-10 18:27:21 +01:00
var<workgroup> xBestIndices : array<i32, ${this.workGroupSize[0]}>;
var<workgroup> xBestValues : array<f32, ${this.workGroupSize[0]}>;
2022-04-01 15:13:32 +02:00
`,t=(n,a)=>this.outputShape.length===1?n:`${n}[${a}]`,r=n=>this.inputShape.length===1?"uniforms.xShape":`uniforms.xShape[${n}]`;return`
2022-02-10 18:27:21 +01:00
fn DIV_CEIL(a : u32, b : u32) -> u32 {
return ((a - 1u) / b + 1u);
}
${e}
// In order to get a flattened index into the input tensor, we need to
// add back the index along the reduced dimension to |outputCoords|.
// This function outputs the offset to the first value along
// |axis| and the stride to get the next value of the input along |axis|.
fn getInputCoordInfo(outputIndex : i32) -> vec2<i32>{
let outputCoords = getCoordsFromIndex(outputIndex);
var i = ${this.outputShape.length-1};
var stride = 1;
var inputStride = 1;
var offset = 0;
for (var r = 1; r <= ${this.inputShape.length}; r = r + 1) {
2022-04-01 15:13:32 +02:00
let length = ${r(`${this.inputShape.length} - r`)};
2022-02-10 18:27:21 +01:00
if (${this.inputShape.length} - r == uniforms.axis) {
inputStride = stride;
} else {
offset = offset + ${t("outputCoords","i")} * stride;
i = i - 1;
}
stride = stride * length;
}
return vec2<i32>(offset, inputStride);
}
fn getInputIndex(coordInfo : vec2<i32>, index : i32) -> i32{
return coordInfo[0] + coordInfo[1] * index;
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
let outputIndex = index / i32(workGroupSizeX);
let coordInfo = getInputCoordInfo(outputIndex);
2022-04-01 15:13:32 +02:00
let Length = ${r("uniforms.axis")};
2022-02-10 18:27:21 +01:00
var bestIndex = i32(localId.x);
var bestValue = uniforms.infinityValue;
for (var k = i32(localId.x); k < Length && outputIndex < uniforms.size;
k = k + i32(workGroupSizeX)) {
2022-04-01 15:12:04 +02:00
let candidate = f32(x[getInputIndex(coordInfo, k)]);
2022-03-07 19:24:06 +01:00
if (!isnan(candidate) && candidate ${this.op} bestValue) {
2022-02-10 18:27:21 +01:00
bestValue = candidate;
bestIndex = k;
}
}
xBestValues[localId.x] = bestValue;
xBestIndices[localId.x] = bestIndex;
workgroupBarrier();
var reduceSize = min(u32(Length), workGroupSizeX);
for (var currentSize = reduceSize / 2u; reduceSize > 1u;
currentSize = reduceSize / 2u) {
let interval = DIV_CEIL(reduceSize, 2u);
if (localId.x < currentSize) {
let candidate = xBestValues[localId.x + interval];
if (candidate ${this.op} bestValue) {
bestValue = candidate;
xBestValues[localId.x] = bestValue;
xBestIndices[localId.x] = xBestIndices[localId.x + interval];
}
}
reduceSize = interval;
workgroupBarrier();
}
if (localId.x == 0u && outputIndex < uniforms.size) {
setOutputAtIndexI32(outputIndex, xBestIndices[localId.x]);
}
}
2022-04-14 17:47:08 +02:00
`}},Gpe=class{constructor(e,t){this.variableNames=["A"],this.workGroupSize=[16,16,1];let r=new Array(e.length);for(let n=0;n<r.length;n++)r[n]=e[t[n]];this.outputShape=r,this.dispatchLayout={x:[0],y:[1]},this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[1,1,1]),this.shaderKey="transposeShared"}getUserCode(){return`
2022-02-10 18:27:21 +01:00
let TILE_DIM = ${this.workGroupSize[0]};
var<workgroup> tile : array<array<f32, ${this.workGroupSize[0]+1}>, ${this.workGroupSize[0]}>;
2022-04-14 17:47:08 +02:00
${yb()}
2022-02-10 18:27:21 +01:00
fn main(@builtin(local_invocation_id) localId : vec3<u32>,
@builtin(workgroup_id) workgroupId : vec3<u32>) {
var x = i32(workgroupId.x) * TILE_DIM + i32(localId.x);
var y = i32(workgroupId.y) * TILE_DIM + i32(localId.y);
let width = uniforms.outShape[0];
let height = uniforms.outShape[1];
if (x < width && y < height) {
2022-04-01 15:12:04 +02:00
tile[localId.y][localId.x] = A[y * width + x];
2022-02-10 18:27:21 +01:00
}
workgroupBarrier();
x = i32(workgroupId.y) * TILE_DIM + i32(localId.x);
y = i32(workgroupId.x) * TILE_DIM + i32(localId.y);
if (x < height && y < width) {
setOutputAtIndex((y * height + x), tile[localId.x]
[localId.y]);
}
}
2022-04-14 17:47:08 +02:00
`}},jpe=class{constructor(e,t){this.variableNames=["A"],this.workPerThread=4,this.workGroupSize=[64,1,1],this.size=!0;let r=new Array(e.length);for(let n=0;n<r.length;n++)r[n]=e[t[n]];this.outputShape=r,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.newDim=t,this.shaderKey=`transpose_${t}`}getUserCode(){let e=gr(this.outputShape.length),t=Hpe(this.newDim);return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
for(var i = 0; i < ${this.workPerThread}; i = i + 1) {
let flatIndex = index * ${this.workPerThread} + i;
if(flatIndex < uniforms.size) {
let resRC = getCoordsFromIndex(flatIndex);
2022-04-01 15:12:04 +02:00
setOutputAtIndex(flatIndex, A[getIndexFromCoords${this.outputShape.length}D(
2022-02-10 18:27:21 +01:00
${e}(${t}), uniforms.aShape)]);
}
}
}
2022-04-14 17:47:08 +02:00
`}};function Hpe(e){let t=e.length;if(t>4)throw Error(`Transpose for rank ${t} is not yet supported`);let r=new Array(t);for(let n=0;n<e.length;n++)r[e[n]]=`resRC[${n}]`;return r.join()}function zl(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{perm:s}=n,i=r,o=a.shape.length,l=new Array(o);for(let d=0;d<l.length;d++)l[d]=a.shape[s[d]];if(r.shouldExecuteOnCPU([a])){let d=i.tensorMap.get(a.dataId).values,h=zpe(d,a.shape,a.dtype,s,l);return r.makeTensorInfo(l,a.dtype,h)}if(a.shape.length===2&&w.arraysEqual(s,[1,0])){let d=new Gpe(a.shape,s);return i.runWebGPUProgram(d,[a],a.dtype)}let u=new jpe(a.shape,s);return i.runWebGPUProgram(u,[a],a.dtype)}var qpe={kernelName:Oi,backendName:"webgpu",kernelFunc:zl};function Kpe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s}=n,i=w.parseAxisParam(s,a.shape),o=N.getAxesPermutation(i,a.shape.length),l=a,u=[];o!=null&&(l=zl({inputs:{x:a},backend:r,attrs:{perm:o}}),u.push(l),i=N.getInnerMostAxes(i.length,l.shape.length)),N.assertAxesAreInnerMostDims("argMax",[i[0]],l.shape.length);let d=new F8(l.shape,i[0],"max"),h=[{type:"int32",data:[i[0]]},{type:"float32",data:[Number.NEGATIVE_INFINITY]}],p=r.runWebGPUProgram(d,[l],"int32",h);return u.forEach(c=>r.disposeData(c.dataId)),p}var Xpe={kernelName:Ks,backendName:"webgpu",kernelFunc:Kpe};function Zpe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s}=n,i=w.parseAxisParam(s,a.shape),o=N.getAxesPermutation(i,a.shape.length),l=a,u=[];o!=null&&(l=zl({inputs:{x:a},backend:r,attrs:{perm:o}}),u.push(l),i=N.getInnerMostAxes(i.length,l.shape.length)),N.assertAxesAreInnerMostDims("argMin",[i[0]],l.shape.length);let d=new F8(l.shape,i[0],"min"),h=[{type:"int32",data:[i[0]]},{type:"float32",data:[Number.POSITIVE_INFINITY]}],p=r.runWebGPUProgram(d,[l],"int32",h);return u.forEach(c=>r.disposeData(c.dataId)),p}var Ype={kernelName:Du,backendName:"webgpu",kernelFunc:Zpe},$8=class{constructor(e,t){this.variableNames=["x"],this.uniforms="stride : vec2<i32>, pad : vec2<i32>, dilation : vec2<i32>, 
convDims : vec2<i32>, filterDims : vec2<i32>,",this.workGroupSize=[128,1,1],this.size=!0,this.outputShape=e.outShape,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey=`pool2D_${t}`,this.poolType=t}getUserCode(){let e="resultValue = max(value, resultValue);";this.poolType==="avg"&&(e="resultValue = resultValue + value; count = count + 1.0;");let t="resultValue";return this.poolType==="avg"&&(t="resultValue / count"),`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let batch = coords[0];
let xRCCorner = vec2<i32>(coords.yz) * uniforms.stride - uniforms.pad;
let xRCorner = xRCCorner.x;
let xCCorner = xRCCorner.y;
var resultValue = ${this.poolType==="avg"?"0.0":"-1.0 / pow(10.0, -20.0)"};
var count = 0.0;
for (var wR = 0; wR < uniforms.filterDims.x; wR = wR + uniforms.dilation.x) {
let xR = xRCorner + wR;
if (xR < 0 || xR >= uniforms.convDims.x) {
continue;
}
for (var wC = 0; wC < uniforms.filterDims.y; wC = wC + uniforms.dilation.y) {
let xC = xCCorner + wC;
if (xC < 0 || xC >= uniforms.convDims.y) {
continue;
}
let value = getX(batch, xR, xC, coords[3]);
${e}
}
}
setOutputAtIndex(index, ${t});
}
}
2022-04-14 17:47:08 +02:00
`}},P8=class{constructor(e){this.variableNames=["x"],this.uniforms="stride : vec2<i32>,",this.workGroupSize=[256,1,1],this.size=!0,this.outputShape=e.outShape,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="poolWithFilterSizeEqualsOne"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let batch = coords[0];
let d = coords[3];
let xRCCorner = coords.yz * uniforms.stride;
let xRCorner = xRCCorner.x;
let xCCorner = xRCCorner.y;
let value = getX(batch, xRCorner, xCCorner, d);
setOutputAtIndex(index, value);
}
}
2022-04-14 17:47:08 +02:00
`}};function Jpe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{filterSize:s,strides:i,pad:o,dimRoundingMode:l}=n,u=1,d=N.computePool2DInfo(a.shape,s,i,u,o,l);if(d.filterWidth===1&&d.filterHeight===1&&w.arraysEqual(d.inShape,d.outShape))return Vn({inputs:{x:a},backend:r});let h,p=[{type:"int32",data:[d.strideHeight,d.strideWidth]}];return d.filterHeight===1&&d.filterWidth===1?h=new P8(d):(h=new $8(d,"avg"),p.push({type:"int32",data:[d.padInfo.top,d.padInfo.left]},{type:"int32",data:[d.dilationHeight,d.dilationWidth]},{type:"int32",data:[d.inHeight,d.inWidth]},{type:"int32",data:[d.effectiveFilterHeight,d.effectiveFilterWidth]})),r.runWebGPUProgram(h,[a],a.dtype,p)}var Qpe={kernelName:Xs,backendName:"webgpu",kernelFunc:Jpe};function ehe(e){let{inputs:t,backend:r,attrs:n}=e,{a,b:s}=t,{transposeA:i,transposeB:o}=n;return wb({a,b:s,transposeA:i,transposeB:o,backend:r})}var the={kernelName:Zs,backendName:"webgpu",kernelFunc:ehe},rhe=class{constructor(e,t){this.variableNames=["source"],this.workPerThread=1,this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=t,this.rank=t.length,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.start=e,this.uniforms=`start : ${gr(e.length)}, `,this.shaderKey="slice"}getUserCode(){let e=gr(this.rank),t=nhe(this.rank),r;return this.start.length===1?r=this.outputShape.map((n,a)=>"sourceLoc = uniforms.start + coords;"):r=this.outputShape.map((n,a)=>`sourceLoc.${e2[a]} = uniforms.start[${a}] + coords.${e2[a]};`),`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
var sourceLoc : ${e};
let coords = getCoordsFromIndex(index);
2022-04-01 15:13:32 +02:00
${r.join(`
2022-02-10 18:27:21 +01:00
`)}
setOutputAtIndex(index, getSource(${t}));
}
}
2022-04-14 17:47:08 +02:00
`}},e2=["x","y","z","w","u","v"];function nhe(e){if(e===1)return"sourceLoc";if(e<=6)return e2.slice(0,e).map(t=>`sourceLoc.${t}`).join(",");throw Error(`Slicing for rank ${e} is not yet supported`)}function Ed(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{begin:s,size:i}=n,[o,l]=_t.parseSliceParams(a,s,i);if(_t.assertParamsValid(a,o,l),r.shouldExecuteOnCPU([a])||a.dtype==="string"){let h=r.tensorMap.get(a.dataId),p=Rpe(h.values,o,l,a.shape,a.dtype);return r.makeTensorInfo(l,a.dtype,p)}if(w.sizeFromShape(l)===0)return r.makeTensorInfo(l,a.dtype,[]);let u=new rhe(o,l),d=[{type:"int32",data:o}];return r.runWebGPUProgram(u,[a],a.dtype,d)}var ahe={kernelName:fl,backendName:"webgpu",kernelFunc:Ed},she=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockShape:s,crops:i}=n;w.assert(a.shape.length<=4,()=>"batchToSpaceND for rank > 4 with a WebGPU backend not implemented yet");let o=s.reduce((A,x)=>A*x),l=N.getReshaped(a.shape,s,o),u=N.getPermuted(l.length,s.length),d=N.getReshapedPermuted(a.shape,s,o),h=N.getSliceBeginCoords(i,s.length),p=N.getSliceSize(d,i,s.length),c=[],f=qe({inputs:{x:a},backend:r,attrs:{shape:l}}),m=zl({inputs:{x:f},backend:r,attrs:{perm:u}}),g=qe({inputs:{x:m},backend:r,attrs:{shape:d}}),y=Ed({inputs:{x:g},backend:r,attrs:{begin:h,size:p}});return c.push(f),c.push(m),c.push(g),c.forEach(A=>r.disposeData(A.dataId)),y},ihe={kernelName:Bo,backendName:"webgpu",kernelFunc:she},_8=jr({opSnippet:10,dtype:"bool",cpuKernelImpl:Spe}),ohe={kernelName:rl,backendName:"webgpu",kernelFunc:_8};function Uh(e){let{inputs:t,backend:r}=e,{input:n}=t,a=r.tensorMap.get(n.dataId);return Vn({inputs:{x:a.complexTensorInfos.real},backend:r})}var lhe={kernelName:ah,backendName:"webgpu",kernelFunc:Uh};function uhe(e,t){let r=new Vh(e.shape,22),n=t.runWebGPUProgram(r,[e],"int32");return{dataId:n.dataId,shape:n.shape,dtype:n.dtype}}function t2(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{dtype:s}=n;if(s==="complex64"){if(a.dtype==="complex64")return 
Vn({inputs:{x:a},backend:r});let i=Wt(a.shape),o=t2({inputs:{x:a},backend:r,attrs:{dtype:"float32"}}),l=Cd({inputs:{real:o,imag:i},backend:r});return i.dispose(),r.disposeData(o.dataId),l}if(a.dtype==="complex64"){let i=Uh({inputs:{input:a},backend:r}),o=t2({inputs:{x:i},backend:r,attrs:{dtype:s}});return r.disposeData(i.dataId),o}if(!w.hasEncodingLoss(a.dtype,s)){let i=Vn({inputs:{x:a},backend:r});return{dataId:i.dataId,shape:i.shape,dtype:s}}if(s==="int32")return uhe(a,r);if(s==="bool"){let i=r.makeTensorInfo([],"bool",w.getTypedArrayFromDType("bool",1)),o=_8({inputs:{a,b:i},backend:r});return r.disposeData(i.dataId),o}throw new Error(`Error in Cast: failed to cast ${a.dtype} to ${s}`)}var dhe={kernelName:Ys,backendName:"webgpu",kernelFunc:t2},phe=kr({opType:1,cpuKernelImpl:ope}),hhe={kernelName:Js,backendName:"webgpu",kernelFunc:phe},che=class{constructor(e){this.variableNames=["A"],this.uniforms="minVal : f32, maxVal : f32,",this.workPerThread=4,this.workGroupSize=[64,1,1],this.isVec4=!0,this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.shaderKey="clipVec4"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if(index < uniforms.size) {
let value = getAByOutputIndex(index);
var clampedValue : vec4<f32>;
for (var i = 0; i < 4; i = i + 1) {
2022-03-07 19:24:06 +01:00
if (isnan(value[i])) {
2022-02-10 18:27:21 +01:00
clampedValue[i] = value[i];
} else {
clampedValue[i] = clamp(value[i], uniforms.minVal, uniforms.maxVal);
}
}
setOutputAtIndex(index, clampedValue);
}
}
2022-04-14 17:47:08 +02:00
`}},fhe=class{constructor(e){this.variableNames=["A"],this.uniforms="minVal : f32, maxVal : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="clip"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if(index < uniforms.size) {
let value = getAByOutputIndex(index);
2022-03-07 19:24:06 +01:00
if (isnan(value)) {
2022-02-10 18:27:21 +01:00
setOutputAtIndex(index, value);
return;
}
setOutputAtIndex(index, clamp(value, uniforms.minVal, uniforms.maxVal));
}
}
2022-04-14 17:47:08 +02:00
`}};function mhe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{clipValueMin:s,clipValueMax:i}=n,o,l=[{type:"float32",data:[s]},{type:"float32",data:[i]}];return w.sizeFromShape(a.shape)%4===0?o=new che(a.shape):o=new fhe(a.shape),r.runWebGPUProgram(o,[a],a.dtype,l)}var ghe={kernelName:Ja,backendName:"webgpu",kernelFunc:mhe},yhe=class{constructor(e){this.uniforms="",this.workPerThread=4,this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=N.computeOutShape(e,1),this.variableNames=e.map((t,r)=>`T${r}`),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.offsetLength=e.length-1;for(let t=0;t<this.offsetLength;t++)this.uniforms+=`offset${t} : i32,`;this.shaderKey="concat"}getUserCode(){let e=[];if(this.offsetLength>0){e.push("if (yC < uniforms.offset0){ setOutputAtCoords(coords.x, coords.y, getT0(yR, yC)); }");for(let n=1;n<this.offsetLength;n++)e.push(`else if (yC < uniforms.offset${[n]}){ setOutputAtCoords(coords.x, coords.y, getT${n}(yR, yC - uniforms.offset${n-1})); }`);let t=this.offsetLength,r=this.offsetLength-1;e.push(`else { setOutputAtCoords(coords.x, coords.y, getT${t}(yR, yC - uniforms.offset${r})); }`)}else e.push("setOutputAtCoords(coords.x, coords.y, getT0(yR, yC));");return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
for(var i = 0; i < ${this.workPerThread}; i = i + 1) {
let flatIndex = index * ${this.workPerThread} + i;
if(flatIndex < uniforms.size) {
let coords = getCoordsFromIndex(flatIndex);
let yR = coords.x;
let yC = coords.y;
${e.join(`
`)}
}
}
}
2022-04-14 17:47:08 +02:00
`}};function w0(e){let{inputs:t,backend:r}=e,{input:n}=t,a=r.tensorMap.get(n.dataId);return Vn({inputs:{x:a.complexTensorInfos.imag},backend:r})}var Ahe={kernelName:eh,backendName:"webgpu",kernelFunc:w0};function r2(e,t,r){let n=e[0].dtype;if(n==="complex64"){let c=e.map(A=>Uh({inputs:{input:A},backend:r})),f=e.map(A=>w0({inputs:{input:A},backend:r})),m=r2(c,t,r),g=r2(f,t,r),y=Cd({inputs:{real:m,imag:g},backend:r});return c.forEach(A=>r.disposeData(A.dataId)),f.forEach(A=>r.disposeData(A.dataId)),r.disposeData(m.dataId),r.disposeData(g.dataId),y}let a=r.shouldExecuteOnCPU(e);if(n==="string"&&(a=!0),a){let c=e.map(b=>{let v=w.sizeFromShape(b.shape.slice(t));return qe({inputs:{x:b},backend:r,attrs:{shape:[-1,v]}})}),f=c.map(b=>({vals:r.readSync(b.dataId),shape:b.shape})),m=N.computeOutShape(c.map(b=>b.shape),1),g=c[0].shape[0]===1,y=lpe(f,m,n,g),A=N.computeOutShape(e.map(b=>b.shape),t),x=r.makeTensorInfo(A,n,y);return c.forEach(b=>r.disposeData(b.dataId)),x}let{tensors2D:s,outShape:i}=xhe(e,t,r),o=s.map(c=>c.shape),l=new yhe(o),u=[],d=new Array(o.length-1);if(d.length>0){d[0]=o[0][1],u.push({type:"int32",data:[d[0]]});for(let c=1;c<d.length;c++)d[c]=d[c-1]+o[c][1],u.push({type:"int32",data:[d[c]]})}let h=r.runWebGPUProgram(l,s,s[0].dtype,u);s.forEach(c=>r.disposeData(c.dataId));let p=qe({inputs:{x:h},backend:r,attrs:{shape:i}});return r.disposeData(h.dataId),p}function xhe(e,t,r){let n=N.computeOutShape(e.map(a=>a.shape),t);return{tensors2D:e.map(a=>qe({inputs:{x:a},backend:r,attrs:{shape:[w.sizeFromShape(a.shape.slice(0,t)),w.sizeFromShape(a.shape.slice(t))]}})),outShape:n}}function z8(e){let{inputs:t,backend:r,attrs:n}=e,{axis:a}=n,s=w.parseAxisParam(a,t[0].shape)[0],i=N.computeOutShape(t.map(u=>u.shape),s);if(w.sizeFromShape(i)===0)return r.makeTensorInfo(i,t[0].dtype,[]);let o=t.filter(u=>w.sizeFromShape(u.shape)>0);if(o.length===1)return Vn({inputs:{x:o[0]},backend:r});let l=o.map(u=>u.shape);return N.assertParamsConsistent(l,s),r2(o,s,r)}var 
bhe={kernelName:Wo,backendName:"webgpu",kernelFunc:z8},vhe=class{constructor(e,t=!1,r=null,n=!1,a=!1){this.variableNames=["x","W"],this.uniforms=`filterDims : vec2<i32>, pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>,
2022-04-11 17:45:24 +02:00
dimAOuter : i32, dimBOuter : i32, dimInner : i32,`,this.workGroupSize=[8,8,1],this.isVec4=!0,this.outputShape=e.outShape,w.assert(e.dataFormat==="channelsLast",()=>"TODO: NCHW is unimplemented"),this.dispatchLayout={x:[3],y:[1,2],z:[0]},this.outputShape[1]===1?this.elementsPerThread=[4,1,1]:this.elementsPerThread=[4,4,1],this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,this.elementsPerThread),this.convInfo=e,this.addBias=t,this.activation=r,this.hasPreluActivationWeights=n,this.hasLeakyreluAlpha=a,this.addBias&&this.variableNames.push("bias"),this.hasPreluActivationWeights&&this.variableNames.push("preluActivationWeights"),this.hasLeakyreluAlpha&&this.variableNames.push("leakyreluAlpha"),this.tileAOuter=this.outputShape[1]===1?1:this.workGroupSize[1]*this.elementsPerThread[1],this.tileBOuter=this.workGroupSize[0]*this.elementsPerThread[0],this.tileInner=this.tileBOuter,[this.fitA,this.fitB]=this.getShapeFit(),this.shaderKey=`conv2DMMVec4_${this.activation}_${this.fitA}_${this.fitB}_${this.elementsPerThread}`}getShapeFit(){let e=[this.tileAOuter,this.tileInner],t=[this.tileInner,this.tileBOuter],r=this.outputShape[1]*this.outputShape[2],n=this.outputShape[3],a=this.convInfo.filterHeight*this.convInfo.filterWidth*this.convInfo.inChannels;return[Za(e,[r,a]),Za(t,[a,n])]}getSampleAWithRemainder(e){return`let flatIndex${e} = getIndexFromCoords4D(coord, uniforms.xShape);
2022-02-10 18:27:21 +01:00
let divBy4Remainder${e} = flatIndex${e} % 4;
let divBy4Index${e} = flatIndex${e} / 4;
2022-04-01 15:12:04 +02:00
let curData${e} = x[divBy4Index${e}];
2022-02-10 18:27:21 +01:00
if (divBy4Remainder${e} == 0) {
temp = curData${e};
} else {
// TODO: This could end up being a redundant load with another one in
// the same shader invocation. Perhaps there's an opportunity for
// optimization
2022-04-01 15:12:04 +02:00
let nextData${e} = x[divBy4Index${e} + 1];
2022-02-10 18:27:21 +01:00
if (divBy4Remainder${e} == 1) {
temp = vec4<f32>(curData${e}.yzw, nextData${e}.x);
} else if (divBy4Remainder${e} == 2) {
temp = vec4<f32>(curData${e}.zw, nextData${e}.xy);
} else if (divBy4Remainder${e} == 3) {
temp = vec4<f32>(curData${e}.w, nextData${e}.xyz);
}
}
2022-04-14 17:47:08 +02:00
`}getUserCode(){let e=E8(this.elementsPerThread,this.tileAOuter,this.tileBOuter,this.tileInner),t=`let outRow = r / uniforms.outShape[2];
2022-02-10 18:27:21 +01:00
let outCol = r % uniforms.outShape[2];
let WRow = c / (uniforms.filterDims[1] * uniforms.xShape[3]);
let WCol = c / uniforms.xShape[3] % uniforms.filterDims[1];
let inChCoord = c % uniforms.xShape[3];
var coord = vec4<i32>(
batch,
outRow * uniforms.stride[0] + uniforms.dilation[0] * WRow - uniforms.pad[0],
outCol * uniforms.stride[1] + uniforms.dilation[1] * WCol - uniforms.pad[1],
inChCoord);
var resData = vec4<f32>(0.0);
${this.convInfo.inChannels%4===0?`// The bounds checking is always needed since we use it to pad zero for
// the 'same' padding type.
if (coordsInBounds4D(coord, uniforms.xShape)) {
2022-04-01 15:12:04 +02:00
resData = x[getIndexFromCoords4D(coord, uniforms.xShape) / 4];
2022-02-10 18:27:21 +01:00
} else {
resData = vec4<f32>(0.0); }`:`var temp = vec4<f32>(0.0);
${this.getSampleAWithRemainder(1)}
resData = temp;
if (WCol == (uniforms.filterDims[1] - 1)) {
coord = vec4<i32>(
coord.x, coord.y + 1, coord.z + 1 - uniforms.filterDims[1], 0);
${this.getSampleAWithRemainder(2)}
if (inChCoord == 0) {
resData = vec4<f32>(resData.xyz, temp.x);
} else if (inChCoord == 1) {
resData = vec4<f32>(resData.xy, temp.xy);
} else {
resData = vec4<f32>(resData.x, temp.xyz);
}
}
`}
2022-04-01 15:13:32 +02:00
return resData;`,r=this.fitA?`${t}`:`if (r < uniforms.dimAOuter && c < uniforms.dimInner) {
${t}
2022-02-10 18:27:21 +01:00
}
return vec4<f32>(0.0);
2022-04-01 15:13:32 +02:00
`,n=this.fitB?"return W[row * uniforms.dimBOuter / 4 + col];":`if(coordsInBounds2D(vec2<i32>(row, col * 4), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
2022-04-01 15:12:04 +02:00
return W[row * uniforms.dimBOuter / 4 + col];
2022-02-10 18:27:21 +01:00
}
return vec4<f32>(0.0);
2022-04-11 17:45:24 +02:00
`,a="",s="";if(this.activation){let o=ss(this.activation,this.isVec4);if(this.hasPreluActivationWeights)a=`fn activation(a : vec4<f32>, outCoord : vec4<i32>) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${o}
}`;else{if(this.hasLeakyreluAlpha)throw a=`fn activation(outCoord: vec4<f32>) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
let b = getLeakyreluAlphaByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${o}
}`,new Error("Leakyrelu is not supported.");a=`
2022-02-10 18:27:21 +01:00
fn activation(a : vec4<f32>, outCoord : vec4<i32>) -> vec4<f32> {
2022-04-01 15:13:32 +02:00
${o}
}`}s="value = activation(value, outCoord);"}let i=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${a}
2022-02-10 18:27:21 +01:00
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> vec4<f32> {
let r = row;
let c = col * 4;
var batch = i32(globalId.z);
${r}
}
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> vec4<f32> {
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}
fn mm_write(row : i32, col : i32, valueInput : vec4<f32>, globalId : vec3<u32>) {
var batch = i32(globalId.z);
var value = valueInput;
if (row < uniforms.dimAOuter && col * 4 < uniforms.dimBOuter)
{
let outCoord = vec4<i32>(
batch,
row / uniforms.outShape[2],
row % uniforms.outShape[2],
col * 4);
${i}
2022-04-01 15:13:32 +02:00
${s}
2022-02-10 18:27:21 +01:00
setOutputAtCoords(outCoord[0], outCoord[1], outCoord[2], outCoord[3],
value);
}
}
${e}
2022-04-14 17:47:08 +02:00
`}},whe=class{constructor(e,t=!1,r=null,n=!1){this.variableNames=["x","W"],this.uniforms="filterDims : vec2<i32>, pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>, dimAOuter : i32, dimBOuter : i32, dimInner : i32,",this.outputShape=e.outShape,w.assert(e.dataFormat==="channelsLast",()=>"TODO: NCHW is unimplemented"),this.dispatchLayout={x:[3],y:[1,2],z:[0]},this.workGroupSize=Ab(this.dispatchLayout,this.outputShape),this.elementsPerThread=xb(this.dispatchLayout,this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,this.elementsPerThread),t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),this.convInfo=e,this.addBias=t,this.activation=r,this.hasPreluActivationWeights=n,[this.fitA,this.fitB]=this.getShapeFit(),this.shaderKey=`conv2DMM_${this.elementsPerThread}_${this.activation}_${this.fitA}_${this.fitB}`}getShapeFit(){let e=this.workGroupSize[1]*this.elementsPerThread[1],t=this.workGroupSize[0]*this.elementsPerThread[0],r=e>t?e:t;w.assert(r%this.workGroupSize[0]===0&&r%this.workGroupSize[1]===0,()=>"tileInner must be multiple of workgroupsize.x and workgroupsize.y");let n=[e,r],a=[r,t],s=this.outputShape[1]*this.outputShape[2],i=this.outputShape[3],o=this.convInfo.filterHeight*this.convInfo.filterWidth*this.convInfo.inChannels;return[Za(n,[s,o]),Za(a,[o,i])]}getUserCode(){let e=vb(this.elementsPerThread,this.workGroupSize),t=`
2022-02-10 18:27:21 +01:00
let outRow = row / uniforms.outShape[2];
let outCol = row % uniforms.outShape[2];
let WRow = col / (uniforms.filterDims[1] * uniforms.xShape[3]);
let WCol = col / uniforms.xShape[3] % uniforms.filterDims[1];
let coord = vec4<i32>(
batch,
outRow * uniforms.stride[0] + uniforms.dilation[0] * WRow - uniforms.pad[0],
outCol * uniforms.stride[1] + uniforms.dilation[1] * WCol - uniforms.pad[1],
col % uniforms.xShape[3]);
// The bounds checking is always needed since we use it to pad zero for the
// 'same' padding type.
if(coordsInBounds4D(coord, uniforms.xShape)) {
2022-04-01 15:12:04 +02:00
return x[getIndexFromCoords4D(coord, uniforms.xShape)];
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
return 0.0;`,r=this.fitA?`${t}`:`if (row < uniforms.dimAOuter && col < uniforms.dimInner) {
2022-02-10 18:27:21 +01:00
${t}
}
return 0.0;
2022-04-01 15:13:32 +02:00
`,n=this.fitB?"return W[row * uniforms.dimBOuter + col];":`if(coordsInBounds2D(vec2<i32>(row, col), vec2<i32>(uniforms.dimInner, uniforms.dimBOuter))) {
2022-04-01 15:12:04 +02:00
return W[row * uniforms.dimBOuter + col];
2022-02-10 18:27:21 +01:00
}
return 0.0;
2022-04-11 17:45:24 +02:00
`,a="",s="";if(this.activation){let o=ss(this.activation,!1);this.hasPreluActivationWeights?a=`fn activation(a: f32, outCoord : vec4<i32>) -> f32 {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${o}
}`:a=`
2022-02-10 18:27:21 +01:00
fn activation(a : f32, outCoord : vec4<i32>) -> f32 {
2022-04-01 15:13:32 +02:00
${o}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,s="value = activation(value, outCoord);"}let i=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
${a}
2022-02-10 18:27:21 +01:00
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
var batch = i32(globalId.z);
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
}
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}
fn mm_write(row : i32, col : i32, valueInput : f32, globalId : vec3<u32>) {
var batch = i32(globalId.z);
var value = valueInput;
let outCoord = vec4<i32>(
batch,
row / uniforms.outShape[2],
row % uniforms.outShape[2],
col);
2022-04-01 15:13:32 +02:00
${i}
${s}
2022-04-01 15:12:04 +02:00
result[getIndexFromCoords4D(outCoord, uniforms.outShape)] = value;
2022-02-10 18:27:21 +01:00
}
${e}
2022-04-14 17:47:08 +02:00
`}},khe=class{constructor(e,t=!1,r=null,n=!1){this.variableNames=["x","W"],this.uniforms="filterDims : vec2<i32>, pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>,",this.workGroupSize=[128,1,1],this.outputShape=e.outShape,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),w.assert(e.dataFormat==="channelsLast",()=>"TODO: NCHW is unimplemented"),t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),this.convInfo=e,this.addBias=t,this.activation=r,this.hasPreluActivationWeights=n,this.shaderKey=`conv2DNaive_${this.activation}`}getUserCode(){let e="",t="";if(this.activation){let n=ss(this.activation);this.hasPreluActivationWeights?e=`fn activation(a : f32, outCoord : vec4<i32>) -> f32{
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}`:e=`
fn activation(a : f32, outCoord : vec4<i32>) -> f32{
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,t="value = activation(value, outCoord);"}let r=this.addBias?"value = value + getBiasByOutputCoords(outCoord);":"";return`
2022-02-10 18:27:21 +01:00
${e}
fn readInp(batch : i32, row : i32, col : i32, chan : i32) -> f32 {
let coord = vec4<i32>(batch, row, col, chan);
if(coordsInBounds4D(coord, uniforms.xShape)) {
return getX(batch, row, col, chan);
}
return 0.0;
}
fn readFilt(row : i32, col : i32, xChannel : i32, outChannel : i32) -> f32{
let coord = vec4<i32>(row, col, xChannel, outChannel);
if(coordsInBounds4D(coord, uniforms.wShape)) {
return getW(row, col, xChannel, outChannel);
}
return 0.0;
}
fn writeResult(batch : i32, row : i32, col : i32, chan : i32, value : f32) {
let coord = vec4<i32>(batch, row, col, chan);
if (coordsInBounds4D(coord, uniforms.outShape)) {
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
${t}
setOutputAtCoords(batch, row, col, chan, value);
}
}
2022-04-11 17:45:24 +02:00
${Ui()}
  // Direct (naive) convolution: accumulates every filter tap and every input
  // channel for the single output element addressed by getOutputCoords().
  // NOTE(review): Ui() is assumed to emit the `fn main(...) {` header, since
  // the only closing brace for main is the last line of this block.
  let coords = getOutputCoords();
  let batch = coords[0];
  let outChannel = coords[3];
  var acc = 0.0;
  for (var row = 0; row < uniforms.filterDims[0]; row = row + 1) {
    // The input row depends only on the filter row, so compute it once here
    // instead of once per input channel.
    let coordRow = coords[1] * uniforms.stride[0] + uniforms.dilation[0] * row - uniforms.pad[0];
    for (var col = 0; col < uniforms.filterDims[1]; col = col + 1) {
      // Likewise the input column depends only on the filter column.
      let coordCol = coords[2] * uniforms.stride[1] + uniforms.dilation[1] * col - uniforms.pad[1];
      for (var xChannel = 0; xChannel < uniforms.xShape[3]; xChannel = xChannel + 1) {
        // readInp / readFilt return 0.0 for out-of-range coordinates, which
        // is how the padding region is handled.
        let v = readInp(batch, coordRow, coordCol, xChannel);
        let f = readFilt(row, col, xChannel, outChannel);
        acc = acc + v * f;
      }
    }
  }
  writeResult(batch, coords[1], coords[2], outChannel, acc);
}
2022-04-14 17:47:08 +02:00
`}},Ihe=class{constructor(e,t){this.variableNames=["A"],this.uniforms=`pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>, outWidth : i32, itemsPerBlockRow : i32,
2022-04-01 15:13:32 +02:00
inChannels : i32,`,this.workPerThread=4,this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]),this.isChannelsLast=t,this.shaderKey=`im2col_${this.isChannelsLast}`}getUserCode(){let e=this.isChannelsLast?0:1,t=this.isChannelsLast?1:2;return`
${tt()}
  // im2col: every invocation fills ${this.workPerThread} consecutive elements
  // of the [blocks, patchSize] matrix. `blockIndex` selects the output pixel,
  // `pos` the position inside the flattened filter window.
  for (var i = 0; i < ${this.workPerThread}; i = i + 1) {
    let flatIndex = index * ${this.workPerThread} + i;
    let rc = getCoordsFromIndex(flatIndex);
    if (flatIndex < uniforms.size) {
      let blockIndex = rc[0];
      let pos = rc[1];
      let offsetY = blockIndex / uniforms.outWidth * uniforms.stride[1] - uniforms.pad[1];
      // The filter row is pos / itemsPerBlockRow (integer division) and must
      // be computed BEFORE scaling by the dilation. Without the parentheses
      // the expression is (dilation * pos) / itemsPerBlockRow, which selects
      // the wrong input row whenever dilation > 1.
      let d0 = offsetY + uniforms.dilation[1] * (pos / uniforms.itemsPerBlockRow);
      // Positions that fall into the padding region keep the value 0.0.
      var value = 0.0;
      if (d0 < uniforms.aShape[${e}] && d0 >= 0) {
        let offsetX = (blockIndex % uniforms.outWidth) * uniforms.stride[0] -
            uniforms.pad[0];
        let d1 = offsetX + uniforms.dilation[0] * ((pos %
            uniforms.itemsPerBlockRow) / uniforms.inChannels);
        let ch = pos % uniforms.inChannels;
        if (d1 < uniforms.aShape[${t}] && d1 >= 0) {
          value = getA(d0, d1, ch);
        }
      }
      setOutputAtIndex(flatIndex, value);
    }
  }
}
2022-04-14 17:47:08 +02:00
`}};function She({x:e,filter:t,convInfo:r,backend:n,bias:a=null,preluActivationWeights:s=null,leakyreluAlpha:i=0,activation:o=null}){let l=e.shape,u=r.dataFormat==="channelsLast",d=!1,h=!1,p=r.filterHeight===r.inHeight&&r.filterWidth===r.inWidth&&r.padInfo.type==="VALID",c,f;if(p){let y=r.inHeight*r.inWidth*r.inChannels;c=qe({inputs:{x:e},backend:n,attrs:{shape:[1,r.batchSize,y]}}),f=qe({inputs:{x:t},backend:n,attrs:{shape:[1,y,r.outChannels]}})}else{let y=u?l[0]*l[1]*l[2]:l[0]*l[2]*l[3];c=qe({inputs:{x:e},backend:n,attrs:{shape:[1,y,r.inChannels]}}),f=qe({inputs:{x:t},backend:n,attrs:{shape:[1,r.inChannels,r.outChannels]}})}let m=wb({a:c,b:f,transposeA:d,transposeB:h,backend:n,bias:a,activation:o,preluActivationWeights:s,leakyreluAlpha:i}),g=qe({inputs:{x:m},backend:n,attrs:{shape:r.outShape}});return n.disposeData(c.dataId),n.disposeData(f.dataId),n.disposeData(m.dataId),g}function The({x:e,filter:t,convInfo:r,backend:n,bias:a=null,preluActivationWeights:s=null,leakyreluAlpha:i=0,activation:o=null}){let{filterWidth:l,filterHeight:u,inChannels:d,strideWidth:h,strideHeight:p,padInfo:c,outWidth:f,outHeight:m,dilationWidth:g,dilationHeight:y,dataFormat:A}=r,x=A==="channelsLast",b=l*u*d,v=m*f,S=[v,b],T=!1,E=!1,R=[],_=qe({inputs:{x:e},backend:n,attrs:{shape:e.shape.slice(1)}}),M=qe({inputs:{x:t},backend:n,attrs:{shape:[1,b,-1]}});R.push(_),R.push(M);let I=new Ihe(S,x),z=[{type:"int32",data:[c.left,c.top]},{type:"int32",data:[h,p]},{type:"int32",data:[g,y]},{type:"int32",data:[f]},{type:"int32",data:[d*l]},{type:"int32",data:[d]}],O=n.runWebGPUProgram(I,[_],_.dtype,z),j=qe({inputs:{x:O},backend:n,attrs:{shape:[1,S[0],S[1]]}});R.push(O),R.push(j);let X=[1,S[0],S[1]],D=new R8(X,[1,v,r.outChannels],Y().get("WEBGPU_MATMUL_WORK_PER_THREAD"),T,E,a,o,s),Q=X[1],V=X[2],ee=r.outChannels,J=[{type:"int32",data:[Q]},{type:"int32",data:[ee]},{type:"int32",data:[V]}],se=[j,M];a&&se.push(a),s&&se.push(s),o==="leakyrelu"&&(z.push({type:"float32",data:[i]}),D.uniforms+=" alpha : 
f32,");let Z=n.runWebGPUProgram(D,se,j.dtype,J),ae=x?[1,m,f,r.outChannels]:[1,r.outChannels,m,f],de=qe({inputs:{x:Z},backend:n,attrs:{shape:ae}});R.push(Z);for(let Ae of R)n.disposeData(Ae.dataId);return de}function O8({x:e,filter:t,convInfo:r,backend:n,bias:a=null,preluActivationWeights:s=null,leakyreluAlpha:i=0,activation:o=null}){let l=a!=null,u=s!=null,d;if(r.filterHeight===r.inHeight&&r.filterWidth===r.inWidth&&r.padInfo.type==="VALID"||r.filterHeight===1&&r.filterWidth===1&&r.dilationHeight===1&&r.dilationWidth===1&&r.strideHeight===1&&r.strideWidth===1&&(r.padInfo.type==="SAME"||r.padInfo.type==="VALID"))return She({x:e,filter:t,convInfo:r,backend:n,bias:a,activation:o,preluActivationWeights:s,leakyreluAlpha:i});if(Y().getBool("WEBGPU_CONV_SEPARATE_IM2COL_SHADER")&&e.shape[0]===1)return The({x:e,filter:t,convInfo:r,backend:n,bias:a,preluActivationWeights:s,leakyreluAlpha:i,activation:o});let h=Y().getBool("WEBGPU_USE_NAIVE_CONV2D"),p=(r.inChannels%4===0||r.inChannels===3&&r.padInfo.type==="VALID")&&r.outChannels%4===0,c=[r.padInfo.top,r.padInfo.left],f=[{type:"int32",data:[r.filterHeight,r.filterWidth]},{type:"int32",data:[...c]},{type:"int32",data:[r.strideHeight,r.strideWidth]},{type:"int32",data:[r.dilationHeight,r.dilationWidth]}];if(h)d=new khe(r,l,o,u);else{p?d=new vhe(r,l,o,u):d=new whe(r,l,o,u);let g=r.outShape[1]*r.outShape[2],y=r.outShape[3],A=r.filterHeight*r.filterWidth*r.inShape[3];f.push({type:"int32",data:[g]},{type:"int32",data:[y]},{type:"int32",data:[A]})}let m=[e,t];return l&&m.push(a),u&&m.push(s),o==="leakyrelu"&&(f.push({type:"float32",data:[i]}),d.uniforms+=" alpha : f32,"),n.runWebGPUProgram(d,m,e.dtype,f)}function Nhe(e){let{inputs:t,attrs:r,backend:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dataFormat:l,dilations:u,dimRoundingMode:d}=r,h=N.convertConv2DDataFormat(l),p=N.computeConv2DInfo(a.shape,s.shape,i,u,o,d,!1,h);return O8({x:a,filter:s,convInfo:p,backend:n})}var 
Che={kernelName:Qs,backendName:"webgpu",kernelFunc:Nhe},Ehe=class{constructor(e){this.variableNames=["x","W"],this.uniforms="filterDims : vec2<i32>, pads : vec2<i32>, stride
2022-02-10 18:27:21 +01:00
// Matmul "A" operand loader for the conv2d-backprop-input shader.
// `row` indexes an output position (split into outRow / outCol by
// uniforms.outShape[2]); `col` indexes a filter tap and a channel (split via
// uniforms.filterDims[1] and uniforms.outBackprop[3]).
// Returns 0.0 when (row, col) is outside dimAOuter x dimInner, when the mapped
// source position lies outside uniforms.outBackprop, or when it is not a whole
// number after dividing by the stride (fract(...) > 0.0).
fn mm_readA(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
var batch = i32(globalId.z);
if (row < uniforms.dimAOuter && col < uniforms.dimInner) {
let outRow = row / uniforms.outShape[2];
let outCol = row % uniforms.outShape[2];
let WRow = col / (uniforms.filterDims[1] * uniforms.outBackprop[3]);
let WCol = col / uniforms.outBackprop[3] % uniforms.filterDims[1];
// Computed in f32 so that positions not divisible by the stride can be
// detected through their fractional part.
let xR = f32(outRow - uniforms.pads[0] + WRow) / f32(uniforms.stride[0]);
let xC = f32(outCol - uniforms.pads[1] + WCol) / f32(uniforms.stride[1]);
if (xR < 0.0 || xR >= f32(uniforms.outBackprop[1]) || fract(xR) > 0.0) {
return 0.0;
}
if (xC < 0.0 || xC >= f32(uniforms.outBackprop[2]) || fract(xC) > 0.0) {
return 0.0;
}
let coord = vec4<i32>(
batch,
i32(xR),
i32(xC),
col % uniforms.outBackprop[3]);
2022-04-01 15:12:04 +02:00
return x[getIndexFromCoords4D(coord, uniforms.xShape)];
2022-02-10 18:27:21 +01:00
}
return 0.0;
}
// Matmul "B" operand loader: reads the filter W with both spatial axes
// mirrored (filterDims - 1 - index). `row` encodes the filter tap and a
// channel index (row % outBackprop[3]); `col` is used as the third filter
// coordinate. Returns 0.0 outside dimInner x dimBOuter or when a mirrored
// coordinate would be negative.
fn mm_readB(row : i32, col : i32, globalId : vec3<u32>) -> f32 {
let coordX = uniforms.filterDims.x - 1 -
row / (uniforms.filterDims[1] * uniforms.outBackprop[3]);
let coordY = uniforms.filterDims.y - 1 -
(row / uniforms.outBackprop[3]) % uniforms.filterDims[1];
if (row < uniforms.dimInner && col < uniforms.dimBOuter &&
coordX >= 0 && coordY >= 0) {
let coord = vec4<i32>(coordX, coordY, col,
row % uniforms.outBackprop[3]);
2022-04-01 15:12:04 +02:00
return W[getIndexFromCoords4D(coord, uniforms.wShape)];
2022-02-10 18:27:21 +01:00
}
return 0.0;
}
// Matmul result writer: converts the matrix position (row, col) back into a
// 4-D output coordinate (batch from globalId.z, row split by outShape[2],
// col as the last axis) and stores the value there.
// NOTE(review): no bounds check is done here - presumably the matmul template
// emitted after this function only calls it for in-range rows/cols; confirm.
fn mm_write(row : i32, col : i32, valueInput : f32, globalId : vec3<u32>) {
var batch = i32(globalId.z);
var value = valueInput;
let outCoord = vec4<i32>(
batch,
row / uniforms.outShape[2],
row % uniforms.outShape[2],
col);
2022-04-01 15:12:04 +02:00
result[getIndexFromCoords4D(outCoord, uniforms.outShape)] = value;
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
${vb(this.elementsPerThread,this.workGroupSize)}
`}},Rhe=class{constructor(e){this.variableNames=["dy","W"],this.uniforms="filterDims : vec2<i32>, pads : vec2<i32>, stride : vec2<i32>, outBackprop : vec4<i32>,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e.inShape,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.isChannelsLast=e.dataFormat==="channelsLast",this.shaderKey=`conv2DDerInput_${this.isChannelsLast}`}getUserCode(){let e=this.isChannelsLast?1:2,t=this.isChannelsLast?2:3,r=this.isChannelsLast?3:1;return`
2022-04-01 15:13:32 +02:00
${tt()}
  // Naive conv2d-backprop-input: one invocation per element of dx.
  // tt() already opens the body of main (the other shaders in this file follow
  // it directly with statements), so no extra brace is added here.
  if (index < uniforms.size) {
    let coords = getCoordsFromIndex(index);
    let batch = coords[0];
    let d1 = coords[${r}];
    let dyCorner = vec2<i32>(coords[${e}], coords[${t}]) - uniforms.pads;
    let dyRCorner = dyCorner.x;
    let dyCCorner = dyCorner.y;
    // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1).
    // ? = to be determined. : = across all values in that axis.
    var dotProd = 0.0;
    for (var wR = 0; wR < uniforms.filterDims.x; wR = wR + 1) {
      // Done in f32 so that rows not aligned with the stride can be detected
      // through fract() and skipped.
      let dyR = (f32(dyRCorner) + f32(wR)) / f32(uniforms.stride.x);
      let wRPerm = uniforms.filterDims.x - 1 - wR;
      if (dyR < 0.0 || dyR >= f32(uniforms.outBackprop[1]) || fract(dyR) > 0.0 ||
          wRPerm < 0) {
        continue;
      }
      // dyR is a whole number at this point; convert it because tensor
      // coordinates are integers and WGSL has no implicit f32 -> i32 cast.
      let idyR = i32(dyR);
      for (var wC = 0; wC < uniforms.filterDims.y; wC = wC + 1) {
        let dyC = (f32(dyCCorner) + f32(wC)) / f32(uniforms.stride.y);
        let wCPerm = uniforms.filterDims.y - 1 - wC;
        if (dyC < 0.0 || dyC >= f32(uniforms.outBackprop[2]) ||
            fract(dyC) > 0.0 || wCPerm < 0) {
          continue;
        }
        let idyC = i32(dyC);
        for (var d2 = 0; d2 < uniforms.outBackprop[3]; d2 = d2 + 1) {
          // The condition is a literal true/false baked in when the shader
          // source is generated.
          if (${this.isChannelsLast}) {
            let xValue = getDy(batch, idyR, idyC, d2);
            let wValue = getW(wRPerm, wCPerm, d1, d2);
            dotProd = dotProd + xValue * wValue;
          } else {
            let xValue = getDy(batch, d2, idyR, idyC);
            let wValue = getW(wRPerm, wCPerm, d1, d2);
            dotProd = dotProd + xValue * wValue;
          }
        }
      }
    }
    setOutputAtIndex(index, dotProd);
  }
}
2022-04-14 17:47:08 +02:00
`}};function Mhe(e){let{inputs:t,backend:r,attrs:n}=e,{dy:a,filter:s}=t,{inputShape:i,strides:o,pad:l,dataFormat:u,dimRoundingMode:d}=n,h=N.convertConv2DDataFormat(u),p=N.computeConv2DInfo(i,s.shape,o,1,l,d,!1,h),c=[{type:"int32",data:[p.filterHeight,p.filterWidth]},{type:"int32",data:[p.filterHeight-1-p.padInfo.top,p.filterWidth-1-p.padInfo.left]},{type:"int32",data:[p.strideHeight,p.strideWidth]},{type:"int32",data:[p.batchSize,p.outHeight,p.outWidth,p.outChannels]}],f;if(Y().getBool("WEBGPU_USE_NAIVE_CONV2D_TRANSPOSE"))f=new Rhe(p);else{f=new Ehe(p);let m=p.inShape[1]*p.inShape[2],g=p.inShape[3],y=p.filterHeight*p.filterWidth*p.outChannels;c.push({type:"uint32",data:[m]},{type:"uint32",data:[g]},{type:"uint32",data:[y]})}return r.runWebGPUProgram(f,[a,s],"float32",c)}var Fhe={kernelName:ei,backendName:"webgpu",kernelFunc:Mhe},$he=kr({opType:2}),Phe={kernelName:ti,backendName:"webgpu",kernelFunc:$he},_he=kr({opType:3}),zhe={kernelName:ri,backendName:"webgpu",kernelFunc:_he},Ohe=class{constructor(e,t,r,n){this.variableNames=["Image","Boxes","BoxInd"],this.uniforms="extrapolationValue : f32,",this.workGroupSize=[64,1,1],this.size=!0;let[a]=t;this.outputShape=[a,r[0],r[1],e],this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.methodId=n==="bilinear"?1:0,this.cropHeightBiggerThan1=this.outputShape[1]>1,this.cropWidthBiggerThan1=this.outputShape[2]>1,this.shaderKey=`cropAndResize_${this.methodId}_${this.cropHeightBiggerThan1}_${this.cropWidthBiggerThan1}`}getUserCode(){let[e,t]=["f32(uniforms.imageShape[1] - 1)","f32(uniforms.imageShape[2] - 1)"],[r,n,a]=this.cropHeightBiggerThan1?[`(${e} / f32(uniforms.outShape[1] - 1))`,"(y2-y1) * height_ratio",`y1*${e} + f32(y)*(height_scale)`]:["0.0","0.0",`0.5 * (y1+y2) * ${e}`],[s,i,o]=this.cropWidthBiggerThan1?[`(${t} / f32(uniforms.outShape[2] - 1))`,"(x2-x1) * width_ratio",`x1*${t} + f32(x)*(width_scale)`]:["0.0","0.0",`0.5 * (x1+x2) * ${t}`];return`
2022-04-01 15:13:32 +02:00
${tt()}
  // Crop-and-resize: one invocation per output element (box, y, x, channel).
  if (index < uniforms.size) {
    let coords = getCoordsFromIndex(index);
    let height_ratio = f32(${r});
    let width_ratio = f32(${s});
    let b = coords[0];
    let y = coords[1];
    let x = coords[2];
    let d = coords[3];
    // get box vals
    let y1 = getBoxes(b, 0);
    let x1 = getBoxes(b, 1);
    let y2 = getBoxes(b, 2);
    let x2 = getBoxes(b, 3);
    // get image in batch index
    let bInd = i32(round(getBoxInd(b)));
    // bInd selects a source image, so it is validated against the image batch
    // size. outShape[0] is the number of boxes, which is unrelated to it.
    if(bInd < 0 || bInd >= uniforms.imageShape[0]) {
      return;
    }
    let height_scale = ${n};
    let width_scale = ${i};
    let in_y = ${a};
    // Sample positions outside the image produce the extrapolation value.
    if( in_y < 0.0 || in_y > ${e} ) {
      setOutputAtIndex(index, uniforms.extrapolationValue);
      return;
    }
    let in_x = ${o};
    if( in_x < 0.0 || in_x > ${t} ) {
      setOutputAtIndex(index, uniforms.extrapolationValue);
      return;
    }
    let sourceFracIndexCR = vec2<f32>(in_x,in_y);
    // methodId is baked in as a literal: 1 selects bilinear, anything else
    // nearest neighbour.
    if(${this.methodId} == 1) {
      // Compute the four integer indices.
      let sourceFloorCR = vec2<i32>(sourceFracIndexCR);
      let sourceCeilCR = vec2<i32>(ceil(sourceFracIndexCR));
      let topLeft = getImage(bInd, sourceFloorCR.y, sourceFloorCR.x, d);
      let bottomLeft = getImage(bInd, sourceCeilCR.y, sourceFloorCR.x, d);
      let topRight = getImage(bInd, sourceFloorCR.y, sourceCeilCR.x, d);
      let bottomRight = getImage(bInd, sourceCeilCR.y, sourceCeilCR.x, d);
      let fracCR = sourceFracIndexCR - vec2<f32>(sourceFloorCR);
      let top = topLeft + (topRight - topLeft) * fracCR.x;
      let bottom = bottomLeft + (bottomRight - bottomLeft) * fracCR.x;
      let newValue = top + (bottom - top) * fracCR.y;
      setOutputAtIndex(index, newValue);
    } else {
      // Compute the coordinates of the nearest neighbor point.
      let sourceNearestCR = vec2<i32>(floor(
          sourceFracIndexCR + vec2<f32>(0.5,0.5)));
      let newValue = getImage(
          bInd, sourceNearestCR.y, sourceNearestCR.x, d);
      setOutputAtIndex(index, newValue);
    }
  }
}
2022-04-14 17:47:08 +02:00
`}},Dhe=e=>{let{inputs:t,backend:r,attrs:n}=e,{image:a,boxes:s,boxInd:i}=t,{cropSize:o,method:l,extrapolationValue:u}=n,d=new Ohe(a.shape[3],s.shape,o,l),h=[{type:"float32",data:[u]}];return r.runWebGPUProgram(d,[a,s,i],"float32",h)},Lhe={kernelName:Uo,backendName:"webgpu",kernelFunc:Dhe},Bhe=class{constructor(e,t){this.variableNames=["x"],this.workGroupSize=[64,1,1],this.size=!0,this.uniforms="blockSize : i32,",this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey=`depthToSpace_${t}`,this.dataFormat=t}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Depth-to-space gather: for each output element, work out which input
// element it comes from. The ${this.get...()} placeholders expand to the
// coordinate / shape component matching the data format (NHWC or otherwise).
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let b = coords[0];
let h = ${this.getHeightCoordString()};
let w = ${this.getWidthCoordString()};
let d = ${this.getDepthCoordString()};
// Integer division gives the input pixel; the remainder is the position
// inside the blockSize x blockSize cell.
let in_h = h / uniforms.blockSize;
let offset_h = h % uniforms.blockSize;
let in_w = w / uniforms.blockSize;
let offset_w = w % uniforms.blockSize;
// The position inside the cell selects a slab of the input depth, one slab
// being as wide as the output depth.
let offset_d = (offset_h * uniforms.blockSize + offset_w) *
${this.getOutputDepthSize()};
let in_d = d + offset_d;
let rlt = ${this.getInputSamplingString()};
setOutputAtIndex(index, rlt);
}
2022-04-14 17:47:08 +02:00
}`}getHeightCoordString(){return this.dataFormat==="NHWC"?"coords[1]":"coords[2]"}getWidthCoordString(){return this.dataFormat==="NHWC"?"coords[2]":"coords[3]"}getDepthCoordString(){return this.dataFormat==="NHWC"?"coords[3]":"coords[1]"}getOutputDepthSize(){return this.dataFormat==="NHWC"?"uniforms.outShape[3]":"uniforms.outShape[1]"}getInputSamplingString(){return this.dataFormat==="NHWC"?"getX(b, in_h, in_w, in_d)":"getX(b, in_d, in_h, in_w)"}};function Whe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockSize:s,dataFormat:i}=n,o=a.shape[0],l=i==="NHWC"?a.shape[1]:a.shape[2],u=i==="NHWC"?a.shape[2]:a.shape[3],d=i==="NHWC"?a.shape[3]:a.shape[1],h=l*s,p=u*s,c=d/(s*s),f=i==="NHWC"?[o,h,p,c]:[o,c,h,p],m=[{type:"int32",data:[s]}],g=new Bhe(f,i);return r.runWebGPUProgram(g,[a],a.dtype,m)}var Vhe={kernelName:Go,backendName:"webgpu",kernelFunc:Whe},D8=class{constructor(e,t=!1,r=null,n=!1){this.variableNames=["x","W"],this.uniforms="pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>, inDims : vec2<i32>,",this.workGroupSize=[4,4,4],this.isVec4=!0,this.outputShape=e.outShape,this.dispatchLayout={x:[0,1],y:[2],z:[3]},this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[1,4,4]),w.assert(e.dataFormat==="channelsLast",()=>"TODO: NCHW is unimplemented"),t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),this.convInfo=e,this.addBias=t,this.activation=r,this.hasPreluActivation=n,this.shaderKey=`depthwise3x3_${r}`}getUserCode(){let e="",t="";if(this.activation){let n=ss(this.activation,this.isVec4);this.hasPreluActivation?e=`fn activation(a : vec4<f32>, outCoord : vec4<i32>) -> vec4<f32> {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}`:e=`
fn activation(a : vec4<f32>, outCoord : vec4<i32>) -> vec4<f32> {
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,t="dotProd[i] = activation(dotProd[i], coords);"}let r=this.addBias?"dotProd[i] = dotProd[i] + getBiasByOutputCoords(coords);":"";return`
2022-02-10 18:27:21 +01:00
${e}
2022-04-14 17:47:08 +02:00
${yb()}
2022-02-10 18:27:21 +01:00
// Depthwise 3x3 convolution on vec4 data. Each invocation handles output row
// `r`, four adjacent output columns starting at `c`, and the vec4 read at
// channel index d2; the batch index is fixed to 0.
// NOTE(review): the xVals[wR][k + wC] indexing below lines up only when
// adjacent outputs are one input column apart (stride 1, dilation 1) -
// presumably the caller selects this shader only in that case; confirm.
fn main(@builtin(global_invocation_id) globalId: vec3<u32>) {
let batch = 0;
let r = i32(globalId.x);
let c = i32(globalId.y) * 4;
let d2 = i32(globalId.z) * 4;
let xRCCorner = vec2<i32>(r, c) * uniforms.stride - uniforms.pad;
let d1 = d2;
let q = 0;
let xRCorner = xRCCorner.x;
let xCCorner = xRCCorner.y;
// The nine filter taps, stored row-major (index = wR * 3 + wC).
var wVals : array<vec4<f32>, 9>;
wVals[0] = getW(0, 0, d1, q);
wVals[1] = getW(0, 1, d1, q);
wVals[2] = getW(0, 2, d1, q);
wVals[3] = getW(1, 0, d1, q);
wVals[4] = getW(1, 1, d1, q);
wVals[5] = getW(1, 2, d1, q);
wVals[6] = getW(2, 0, d1, q);
wVals[7] = getW(2, 1, d1, q);
wVals[8] = getW(2, 2, d1, q);
// 3 rows x 6 columns of input: the highest column index used below is
// 3 + 2 = 5. Out-of-range positions are filled with zeros.
var xVals : array<array<vec4<f32>, 6>, 3>;
for (var wR = 0; wR < 3; wR = wR + 1) {
let xR = xRCorner + wR * uniforms.dilation[0];
for (var wC = 0; wC < 6; wC = wC + 1) {
let xC = xCCorner + wC * uniforms.dilation[1];
if (xR < 0 || xR >= uniforms.inDims[0] || xC < 0 || xC >= uniforms.inDims[1]) {
xVals[wR][wC] = vec4<f32>(0.0);
} else {
xVals[wR][wC] = getX(batch, xR, xC, d1);
}
}
}
// One accumulator per output column.
var dotProd : array<vec4<f32>, 4>;
dotProd[0] = vec4<f32>(0.0);
dotProd[1] = vec4<f32>(0.0);
dotProd[2] = vec4<f32>(0.0);
dotProd[3] = vec4<f32>(0.0);
for (var wR = 0; wR < 3; wR = wR + 1) {
for (var wC = 0; wC < 3; wC = wC + 1) {
let indexW = wR * 3 + wC;
dotProd[0] = dotProd[0] + xVals[wR][0 + wC] * wVals[indexW];
dotProd[1] = dotProd[1] + xVals[wR][1 + wC] * wVals[indexW];
dotProd[2] = dotProd[2] + xVals[wR][2 + wC] * wVals[indexW];
dotProd[3] = dotProd[3] + xVals[wR][3 + wC] * wVals[indexW];
}
}
// Write the four columns; the two placeholders expand to the optional bias
// and activation statements built in getUserCode().
for (var i = 0; i < 4; i = i + 1) {
let coords = vec4<i32>(batch, r, c + i, d2);
if (coordsInBounds4D(coords, uniforms.outShape)) {
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
${t}
setOutputAtCoords(coords[0], coords[1], coords[2], coords[3], dotProd[i]);
}
}
}
2022-04-14 17:47:08 +02:00
`}},L8=class{constructor(e,t=!1,r=null,n=!1){this.variableNames=["x","W"],this.uniforms=`pad : vec2<i32>, stride : vec2<i32>, dilation : vec2<i32>,
2022-04-01 15:12:04 +02:00
inDims : vec2<i32>, filterHeight : i32, filterWidth : i32,
2022-04-11 17:45:24 +02:00
channelMul : i32,`,this.workGroupSize=[256,1,1],this.outputShape=e.outShape,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),w.assert(e.dataFormat==="channelsLast",()=>"TODO: NCHW is unimplemented"),t&&this.variableNames.push("bias"),n&&this.variableNames.push("preluActivationWeights"),this.convInfo=e,this.addBias=t,this.activation=r,this.hasPreluActivation=n,this.shaderKey=`depthwise_${this.activation}`}getUserCode(){let e="",t="";if(this.activation){let n=ss(this.activation,!1);this.hasPreluActivation?e=`fn activation(a : f32, outCoord : vec4<i32>) -> f32 {
2022-02-10 18:27:21 +01:00
let b = getPreluActivationWeightsByOutputCoords(outCoord);
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}`:e=`
fn activation(a : f32, outCoord : vec4<i32>) -> f32 {
2022-04-01 15:13:32 +02:00
${n}
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
`,t="dotProd = activation(dotProd, coords);"}let r=this.addBias?"dotProd = dotProd + getBiasByOutputCoords(coords);":"";return`
2022-02-10 18:27:21 +01:00
${e}
// Bounds-checked store: writes `value` at (batch, row, col, chan) only when
// that coordinate lies inside uniforms.outShape.
fn writeResult(batch : i32, row : i32, col : i32, chan : i32,
    value : f32) {
  if (!coordsInBounds4D(vec4<i32>(batch, row, col, chan), uniforms.outShape)) {
    return;
  }
  setOutputAtCoords(batch, row, col, chan, value);
}
2022-04-11 17:45:24 +02:00
// Generic depthwise convolution: one invocation per output element. The
// output channel d2 maps to input channel d1 = d2 / channelMul and
// multiplier index q = d2 - d1 * channelMul.
${Ui()}
2022-02-10 18:27:21 +01:00
let coords = getOutputCoords();
let batch = coords[0];
let xRCCorner = vec2<i32>(coords.yz) * uniforms.stride - uniforms.pad;
let d2 = coords[3];
let d1 = d2 / uniforms.channelMul;
let q = d2 - d1 * uniforms.channelMul;
let inputRowStart = xRCCorner.x;
let inputColStart = xRCCorner.y;
// The *End values lie one dilation step past the last tap actually read
// (the loops stop at filterHeight - 1 / filterWidth - 1), so the fast-path
// test below is conservative.
let inputRowEnd = inputRowStart + uniforms.filterHeight *
uniforms.dilation[0];
let inputColEnd = inputColStart + uniforms.filterWidth *
uniforms.dilation[1];
// Convolve x(?, ?, d1) with w(:, :, d1, q) to get y(yR, yC, d2).
// ? = to be determined. : = across all values in that axis.
var dotProd = 0.0;
// Hoist the bounds check out of the loops for performance: when the whole
// filter window is inside the input, no per-tap check is needed.
if (inputRowStart >= 0 && inputColStart >= 0 &&
inputRowEnd < uniforms.inDims[0] &&
inputColEnd < uniforms.inDims[1]) {
// The loop bounds are read from uniforms (filterHeight / filterWidth),
// not baked into the shader source as constants.
for (var wR = 0; wR < uniforms.filterHeight; wR = wR + 1) {
let xR = inputRowStart + wR * uniforms.dilation[0];
for (var wC = 0; wC < uniforms.filterWidth; wC = wC + 1) {
let xC = inputColStart + wC * uniforms.dilation[1];
let xVal = getX(batch, xR, xC, d1);
let wVal = getW(wR, wC, d1, q);
dotProd = dotProd + xVal * wVal;
}
}
} else {
// Slow path: same accumulation, skipping taps that fall outside the input.
for (var wR = 0; wR < uniforms.filterHeight; wR = wR + 1) {
let xR = inputRowStart + wR * uniforms.dilation[0];
if (xR < 0 || xR >= uniforms.inDims[0]) {
continue;
}
for (var wC = 0; wC < uniforms.filterWidth; wC = wC + 1) {
let xC = inputColStart + wC * uniforms.dilation[1];
if (xC < 0 || xC >= uniforms.inDims[1]) {
continue;
}
let xVal = getX(batch, xR, xC, d1);
let wVal = getW(wR, wC, d1, q);
dotProd = dotProd + xVal * wVal;
}
}
}
2022-04-01 15:13:32 +02:00
${r}
2022-02-10 18:27:21 +01:00
${t}
writeResult(batch, coords[1], coords[2], d2, dotProd);
}
2022-04-14 17:47:08 +02:00
`}};function Uhe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s}=t,{strides:i,pad:o,dilations:l,dimRoundingMode:u}=n,d=l;d==null&&(d=[1,1]);let h=N.computeConv2DInfo(a.shape,s.shape,i,d,o,u,!0),p=[{type:"int32",data:[h.padInfo.top,h.padInfo.left]},{type:"int32",data:[h.strideHeight,h.strideWidth]},{type:"int32",data:[h.dilationHeight,h.dilationWidth]},{type:"int32",data:[h.inHeight,h.inWidth]}],c;return h.batchSize===1&&h.inHeight===h.outHeight&&h.inWidth===h.outWidth&&h.strideHeight===1&&h.strideWidth===1&&h.filterHeight===h.filterWidth&&h.inChannels===h.outChannels&&h.dilationHeight===1&&h.dilationWidth===1&&h.filterHeight===3&&h.inChannels%4===0?c=new D8(h):(c=new L8(h),p.push({type:"int32",data:[h.filterHeight]},{type:"int32",data:[h.filterWidth]},{type:"int32",data:[h.outChannels/h.inChannels]})),r.runWebGPUProgram(c,[a,s],a.dtype,p)}var Ghe={kernelName:ni,backendName:"webgpu",kernelFunc:Uhe},B8=jr({opSnippet:0,cpuKernelImpl:kpe,supportsComplex:!0}),jhe={kernelName:vi,backendName:"webgpu",kernelFunc:B8},Hhe=class{constructor(e,t){this.workGroupSize=[64,1,1],this.variableNames=["x"],this.uniforms="reduceSize : i32,",this.size=!0,this.inputShape=[e.batchSize,e.inSize];let[r]=N.computeOutAndReduceShapes(this.inputShape,[1]);this.outputShape=r.length===0?[1]:r,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,[1,1,1]),this.reduceType=t,this.shaderKey=`reduce_${t}`}getUserCode(){let e="",t="0.0";this.reduceType==="min"||this.reduceType==="max"?(e=`
2022-03-07 19:24:06 +01:00
if (isnan(candidate)) {
2022-02-10 18:27:21 +01:00
bestValue = uniforms.NAN;
2022-03-07 19:24:06 +01:00
} else if (!isnan(bestValue) && candidate ${this.reduceType==="min"?"<":">"} bestValue)
2022-04-01 15:13:32 +02:00
{ bestValue = candidate; }`,t="f32(x[offset])"):this.reduceType==="sum"||this.reduceType==="mean"?e=" bestValue = bestValue + candidate; ":this.reduceType==="prod"&&(e=" bestValue = bestValue * candidate; ",t="1.0");let r=this.reduceType==="mean"?"setOutputAtIndex(outputIndex, bestValue / f32(uniforms.reduceSize));":"setOutputAtIndex(outputIndex, bestValue);";return`
2022-02-10 18:27:21 +01:00
// Ceiling division for unsigned integers, written as (a - 1) / b + 1.
// NOTE(review): for a == 0u the subtraction wraps around, so the result is
// not 0 - the callers in this shader presumably never pass 0; confirm.
fn DIV_CEIL(a : u32, b : u32) -> u32 {
return ((a - 1u) / b + 1u);
}
${`
var<workgroup> xBestValues : array<f32, ${this.workGroupSize[0]}>;
`}
// Start offset, within the flattened input, of the run of reduceSize values
// that is reduced into the output element `outputIndex`.
fn getOffset(outputIndex : i32) -> i32 {
  let outputCoords = getCoordsFromIndex(outputIndex);
  return ${this.outputShape.length===1?"outputCoords":"outputCoords[0]"} * uniforms.reduceSize;
}
2022-04-01 15:13:32 +02:00
${tt()}
  // Reduction of uniforms.reduceSize values into one output element.
  // Phase 1: every invocation folds a strided subset of the values into
  //          bestValue using the reduce snippet built in getUserCode().
  // Phase 2: the per-invocation partial results are combined pairwise in
  //          workgroup memory until one value is left.
  // NOTE(review): this relies on one workgroup per output element - confirm
  // against the dispatch set up in the constructor.
  let outputIndex = index / i32(workGroupSizeX);
  let offset = getOffset(outputIndex);
  var bestValue = ${t};
  let Length = uniforms.reduceSize;
  for (var k = i32(localId.x); k < Length && outputIndex < uniforms.size;
      k = k + i32(workGroupSizeX)) {
    let candidate = f32(x[offset + k]);
    ${e}
  }
  xBestValues[localId.x] = bestValue;
  workgroupBarrier();
  var reduceSize = min(u32(Length), workGroupSizeX);
  for (var currentSize = reduceSize / 2u; reduceSize > 1u;
      currentSize = reduceSize / 2u) {
    // With an odd number of live values the middle one has no partner; using
    // ceil(reduceSize / 2) as the stride keeps it for the next round.
    let interval = DIV_CEIL(reduceSize, 2u);
    if (localId.x < currentSize) {
      let candidate = xBestValues[localId.x + interval];
      ${e}
      xBestValues[localId.x] = bestValue;
    }
    reduceSize = interval;
    workgroupBarrier();
  }
  // Only the first invocation of the group publishes the final value.
  if (localId.x == 0u && outputIndex < uniforms.size) {
    ${r}
  }
}
2022-04-14 17:47:08 +02:00
`}};function Gh(e,t,r,n,a){let s=e.shape.length,i=[],o=w.parseAxisParam(t,e.shape),l=o,u=N.getAxesPermutation(l,s),d=e;u!=null&&(d=zl({inputs:{x:e},attrs:{perm:u},backend:a}),l=N.getInnerMostAxes(l.length,s),i.push(d)),N.assertAxesAreInnerMostDims(n,l,s);let[h,p]=N.computeOutAndReduceShapes(d.shape,l),c=h;r&&(c=N.expandShapeToKeepDim(h,o));let f;if((n==="max"||n==="prod")&&a.shouldExecuteOnCPU([d])){let m=a.tensorMap.get(d.dataId).values;switch(n){case"max":let g=bpe(m,w.sizeFromShape(p),c,e.dtype);f=a.makeTensorInfo(c,e.dtype,g);break;case"prod":let{outVals:y,outShape:A,outDtype:x}=Tpe(d.shape,d.dtype,m,l);f=a.makeTensorInfo(A,x,y);break;default:throw new Error(`${n} CPU implementation is not yet supported.`)}}else{let m=w.sizeFromShape(p),g=w.sizeFromShape(d.shape)/m,y={windowSize:m,inSize:m,batchSize:g,outSize:1},A=n==="mean"?"float32":ch(e.dtype),x=[{type:"int32",data:[m]}],b=new Hhe(y,n),v=a.runWebGPUProgram(b,[d],A,x);i.push(v),f=qe({inputs:{x:v},attrs:{shape:c},backend:a})}return i.forEach(m=>a.disposeData(m.dataId)),f}function kb(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n;return Gh(a,s,i,"sum",r)}var qhe={kernelName:Fi,backendName:"webgpu",kernelFunc:kb};function Khe(e){let{inputs:t,backend:r,attrs:n}=e,{equation:a}=n,s=t,{allDims:i,summedDims:o,idDims:l}=N.decodeEinsumEquation(a,s.length);N.checkEinsumDimSizes(i.length,l,s);let{path:u,steps:d}=N.getEinsumComputePath(o,l),h=d.length,p=null,c=i.length,f=[];for(let m=0;m<h;++m){for(let g of d[m]){let{permutationIndices:y,expandDims:A}=N.getEinsumPermutation(c,l[g]),x;N.isIdentityPermutation(y)?x=s[g]:(x=zl({inputs:{x:s[g]},backend:r,attrs:{perm:y}}),f.push(x));let b=x.shape.slice();for(let v=0;v<A.length;++v)b.splice(A[v],0,1);w.arraysEqual(x.shape,b)||(x=qe({inputs:{x},backend:r,attrs:{shape:b}}),f.push(x)),p===null?p=x:(p=B8({inputs:{a:x,b:p},backend:r}),f.push(p))}m<h-1&&(u[m]>=0&&(p=kb({inputs:{x:p},backend:r,attrs:{axis:u[m]-(i.length-c),keepDims:!1}}),f.push(p)),c--)}for(let m of 
f)m!==p&&r.disposeData(m.dataId);return p}var Xhe={kernelName:Qp,backendName:"webgpu",kernelFunc:Khe},Zhe=kr({opType:4}),Yhe={kernelName:si,backendName:"webgpu",kernelFunc:Zhe},Jhe=jr({opSnippet:4,dtype:"bool",cpuKernelImpl:upe}),Qhe={kernelName:jo,backendName:"webgpu",kernelFunc:Jhe},W8=kr({opType:5,cpuKernelImpl:dpe,dtype:"float32"}),ece={kernelName:ii,backendName:"webgpu",kernelFunc:W8};function n2(e){let{inputs:t,attrs:r,backend:n}=e,{dim:a}=r,{input:s}=t,i=s.shape.length,o=s.shape.slice(),l=a;return a<0&&(w.assert(-(i+1)<=a,()=>`Axis must be in the interval [${-(i+1)}, ${i}]`),l=i+a+1),o.splice(l,0,1),qe({inputs:{x:s},backend:n,attrs:{shape:o}})}var tce={kernelName:Ho,backendName:"webgpu",kernelFunc:n2},rce=kr({opType:6,cpuKernelImpl:ppe}),nce={kernelName:qo,backendName:"webgpu",kernelFunc:rce},ace=class{constructor(e){this.variableNames=[],this.outputShape=[],this.uniforms="value : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="fill"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
// Fill: every in-range invocation writes the scalar uniform `value` to its
// own output element.
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
setOutputAtIndex(index, uniforms.value);
}
}
2022-04-14 17:47:08 +02:00
`}};function Rd(e){let{backend:t,attrs:r}=e,{shape:n,value:a}=r,{dtype:s}=r;if(s=s||w.inferDtype(a),s==="string"){let i=w.getArrayFromDType(s,w.sizeFromShape(n));return i.fill(a),t.makeTensorInfo(n,s,i)}else{let i=new ace(n),o=[{type:"float32",data:[a]}];return t.runWebGPUProgram(i,[],s,o)}}var sce={kernelName:Hu,backendName:"webgpu",kernelFunc:Rd},ice=class{constructor(e){this.outputShape=[],this.variableNames=["x"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="flipLeftRight"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
// Horizontal flip: each output element reads the input element whose index
// along axis 2 is mirrored (xShape[2] - 1 - coords[2]); the other three
// coordinates are passed through unchanged.
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let coordX = uniforms.xShape[2] - coords[2] - 1;
let outputValue = getX(coords[0], coords[1], coordX, coords[3]);
setOutputAtIndex(index, outputValue);
}
}
2022-04-14 17:47:08 +02:00
`}},oce={kernelName:Ko,backendName:"webgpu",kernelFunc:({inputs:e,backend:t})=>{let{image:r}=e,n=t,a=new ice(r.shape);return n.runWebGPUProgram(a,[r],r.dtype)}},lce=kr({opType:7,cpuKernelImpl:hpe}),uce={kernelName:oi,backendName:"webgpu",kernelFunc:lce},dce=jr({opSnippet:12,dtype:"int32"}),pce={kernelName:li,backendName:"webgpu",kernelFunc:dce},hce=(e,t,r,n,a)=>{let s=[n,...r];return a&&s.push(a),e.createBindGroup({layout:t,entries:s.map((i,o)=>({binding:o,resource:i}))})},V8=(e,t,r,n,a,s=!1)=>{let i={dtype:a.dtype,shape:a.shape},o=Bde(n,i,t,s),l=e.createShaderModule({code:o,label:t.constructor.name});return e.createComputePipeline({layout:r,compute:{module:l,entryPoint:"main"},label:t.constructor.name})};function U8(e,t,r,n="",a=""){return e.shaderKey+"_"+(e.workGroupSize?e.workGroupSize.join(","):"")+t.map(s=>s.length).join(",")+r.join(",")+e.variableNames.join(",")+n+a}function ow(e){let{externalImage:t,backend:r,attrs:n,outShape:a,useImport:s}=e,{numChannels:i}=n,o=w.sizeFromShape(a),l=w.computeStrides(a),u=r.makeTensorInfo(a,"int32"),d=r.getFromPixelsProgram(s?"import":"copyExternal");d.updateOutputShape(a);let h=[u.shape],p=[u.dtype,s?"import":"copyExternal"],c=U8(d,h,p),f=d.getLayout(r.device),m=r.getAndSavePipeline(c,()=>V8(r.device,d,f.pipelineLayout,[],u,!0));d.setPipeline(m),s||r.queue.copyExternalImageToTexture({source:t,origin:{x:0,y:0}},{texture:d.makeInputTexture(r.device,a[1],a[0])},[a[1],a[0]]);let g=r.tensorMap.get(u.dataId);g.bufferInfo.buffer=r.acquireBuffer(g.bufferInfo.byteSize);let y=[o,i,...l,...d.dispatch];d.setUniform(r.device,y);let A;if(s){let x={source:t};A=r.device.importExternalTexture(x)}else A=d.inputTexture.createView();return r.runFromPixelsProgram(d,g.bufferInfo.buffer,f,A,u.dataId),u}var cce={kernelName:Pp,backendName:"webgpu",kernelFunc:fce},lu;function fce(e){let{inputs:t,backend:r,attrs:n}=e,{pixels:a}=t,{numChannels:s}=n;if(a==null)throw new Error("pixels passed to tf.browser.fromPixels() can not be null");let i=typeof 
HTMLVideoElement!="undefined"&&a instanceof HTMLVideoElement,o=typeof HTMLImageElement!="undefined"&&a instanceof HTMLImageElement,l=typeof HTMLCanvasElement!="undefined"&&a instanceof HTMLCanvasElement||typeof OffscreenCanvas!="undefined"&&a instanceof OffscreenCanvas,u=typeof ImageBitmap!="undefined"&&a instanceof ImageBitmap,[d,h]=i?[a.videoWidth,a.videoHeight]:[a.width,a.height],p=[h,d,s];if(Y().getBool("WEBGPU_USE_IMPORT")&&i)return ow({externalImage:a,backend:r,attrs:n,outShape:p,useImport:!0});if((i||o)&&(lu==null&&(lu=document.createElement("canvas").getContext("2d")),lu.canvas.width=d,lu.canvas.height=h,lu.drawImage(a,0,0,d,h),a=lu.canvas),u||l||i||o)return ow({externalImage:a,backend:r,attrs:n,outShape:p,useImport:!1});let c=a.data,f=c;if(s!=null&&s!==4){f=new Uint8Array(a.width*a.height*s);let y=c.length,A=0;for(let x=0;x<y;x++)x%4<s&&(f[A++]=c[x])}let m=r.makeTensorInfo(p,"int32"),g=r.tensorMap.get(m.dataId);return g.values=new Int32Array(f),r.maybeReleaseBuffer(m.dataId),r.uploadToGPU(m.dataId),m}var mce=class{constructor(e,t,r,n,a){this.uniforms="varianceEpsilon : f32,",this.workGroupSize=[128,1,1],this.size=!0,this.variableNames=["x","mean","variance"],N.assertAndGetBroadcastShape(e,t),N.assertAndGetBroadcastShape(e,r),this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),n!=null&&(N.assertAndGetBroadcastShape(e,n),this.variableNames.push("offset")),a!=null&&(N.assertAndGetBroadcastShape(e,a),this.variableNames.push("scale")),this.offsetShape=n,this.scaleShape=a,this.shaderKey="batchNorm"}getUserCode(){let e="0.0";this.offsetShape!=null&&(e="getOffsetByOutputIndex(index)");let t="1.0";return this.scaleShape!=null&&(t="getScaleByOutputIndex(index)"),`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size)
{
let xValue = getXByOutputIndex(index);
let meanValue = getMeanByOutputIndex(index);
let varianValue = getVarianceByOutputIndex(index);
let offsetValue = ${e};
let scaleValue = ${t};
let inv = scaleValue * inverseSqrt(varianValue + f32(uniforms.varianceEpsilon));
setOutputAtIndex(index,dot(vec3<f32>(xValue, -meanValue, offsetValue), vec3<f32>(inv, inv, 1.0)));
}
}
2022-04-14 17:47:08 +02:00
`}},gce={kernelName:ui,backendName:"webgpu",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{x:n,scale:a,offset:s,mean:i,variance:o}=e,{varianceEpsilon:l}=t,u=r,d=[n,i,o],h=null;s!=null&&(h=s.shape,d.push(s));let p=null;a!=null&&(p=a.shape,d.push(a));let c=new mce(n.shape,i.shape,o.shape,h,p),f=[{type:"float32",data:[l]}];return u.runWebGPUProgram(c,d,n.dtype,f)}};function yce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s,bias:i,preluActivationWeights:o}=t,{strides:l,pad:u,dataFormat:d,dilations:h,dimRoundingMode:p,activation:c,leakyreluAlpha:f}=n,m=N.convertConv2DDataFormat(d),g=N.computeConv2DInfo(a.shape,s.shape,l,h,u,p,!1,m);return O8({x:a,filter:s,convInfo:g,backend:r,bias:i,preluActivationWeights:o,leakyreluAlpha:f,activation:c})}var Ace={kernelName:Fs,backendName:"webgpu",kernelFunc:yce};function xce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,filter:s,bias:i,preluActivationWeights:o}=t,{strides:l,pad:u,dilations:d,dimRoundingMode:h,activation:p,leakyreluAlpha:c}=n,f=d;f==null&&(f=[1,1]),w.assert(N.eitherStridesOrDilationsAreOne(l,f),()=>`Error in depthwiseConv2d: Either strides or dilations must be 1. 
Got strides ${l} and dilations '${f}'`);let m=N.computeConv2DInfo(a.shape,s.shape,l,f,u,h,!0),g=[a,s],y=i!=null,A=o!=null;y&&g.push(i),A&&g.push(o);let x=[{type:"int32",data:[m.padInfo.top,m.padInfo.left]},{type:"int32",data:[m.strideHeight,m.strideWidth]},{type:"int32",data:[m.dilationHeight,m.dilationWidth]},{type:"int32",data:[m.inHeight,m.inWidth]}],b;return m.batchSize===1&&m.inHeight===m.outHeight&&m.inWidth===m.outWidth&&m.strideHeight===1&&m.strideWidth===1&&m.filterHeight===m.filterWidth&&m.inChannels===m.outChannels&&m.dilationHeight===1&&m.dilationWidth===1&&m.filterHeight===3&&m.inChannels%4===0?b=new D8(m,y,p,A):(b=new L8(m,y,p,A),x.push({type:"int32",data:[m.filterHeight]},{type:"int32",data:[m.filterWidth]},{type:"int32",data:[m.outChannels/m.inChannels]})),p==="leakyrelu"&&(x.push({type:"float32",data:[c]}),b.uniforms+=" alpha : f32,"),r.runWebGPUProgram(b,g,"float32",x)}var bce={kernelName:$s,backendName:"webgpu",kernelFunc:xce},vce=class{constructor(e,t){this.variableNames=["A","indices"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=t,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey=`gathernd_${e}`,this.sliceDim=e,this.uniforms=`sliceDim : i32, strides : ${gr(e)},`}getUserCode(){let e;return this.sliceDim>1?e="uniforms.strides[j]":e="uniforms.strides",`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
var flattenIndex = 0;
for (var j = 0; j < uniforms.sliceDim; j = j + 1) {
let indexTemp = i32(round(getIndices(coords[0], j)));
let strideNum = ${e};
flattenIndex = flattenIndex + indexTemp * strideNum;
}
setOutputAtIndex(index, getA(flattenIndex, coords[1]));
}
}
2022-04-14 17:47:08 +02:00
`}};function wce(e){let{inputs:t,backend:r}=e,{params:n,indices:a}=t,s=a.shape,i=s[s.length-1],o=w.sizeFromShape(n.shape),[l,u,d,h]=N.prepareAndValidate(n,a),p=qe({inputs:{x:a},backend:r,attrs:{shape:[u,i]}}),c=qe({inputs:{x:n},backend:r,attrs:{shape:[w.sizeFromShape(n.shape)/d,d]}});if(r.shouldExecuteOnCPU([n,a])||n.dtype==="string"){let A=r.readSync(a.dataId),x=r.bufferSync(n),b=cpe(A,x,n.dtype,u,i,d,h,n.shape,o);return r.makeTensorInfo(l,n.dtype,b.values)}let f=new vce(i,[u,d]),m=[{type:"int32",data:[i]},{type:"int32",data:h}],g=r.runWebGPUProgram(f,[c,p],c.dtype,m),y=qe({inputs:{x:g},backend:r,attrs:{shape:l}});return r.disposeData(p.dataId),r.disposeData(c.dataId),r.disposeData(g.dataId),y}var kce={kernelName:Zo,backendName:"webgpu",kernelFunc:wce},Ice=class{constructor(e,t){this.variableNames=["A","indices"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e.slice(),this.aShape=e,this.outputShape=t,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="gather"}getUserCode(){let e=Sce(this.aShape);return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let resRC = getCoordsFromIndex(index);
2022-04-01 15:12:04 +02:00
let indexZ = i32(getIndices(resRC.x, resRC.z));
let inBounds = select(0.0, 1.0, indexZ >= 0 && indexZ < uniforms.aShape[2]);
setOutputAtIndex(index, inBounds * getA(${e}));
2022-02-10 18:27:21 +01:00
}
}
2022-04-14 17:47:08 +02:00
`}};function Sce(e){let t=["resRC.x","resRC.y","resRC.z","resRC.w"],r=[];for(let n=0;n<e.length;n++)n===2?r.push("indexZ"):r.push(`${t[n]}`);return r.join()}function G8(e){let{inputs:t,backend:r,attrs:n}=e,{x:a,indices:s}=t,{axis:i,batchDims:o}=n,l=w.parseAxisParam(i,a.shape)[0],u=N.segment_util.collectGatherOpShapeInfo(a,s,l,o),d=w.sizeFromShape(s.shape),h=[],p=qe({inputs:{x:a},backend:r,attrs:{shape:[u.batchSize,u.outerSize,u.dimSize,u.sliceSize]}}),c=qe({inputs:{x:s},backend:r,attrs:{shape:[u.batchSize,d/u.batchSize]}});h.push(p),h.push(c);let f=[u.batchSize,u.outerSize,d/u.batchSize,u.sliceSize];if(r.shouldExecuteOnCPU([a,s])){let A=r.tensorMap.get(c.dataId).values,x=We(c.shape,c.dtype,A),b=r.tensorMap.get(p.dataId).values,v=We(p.shape,p.dtype,b),S=fpe(v,x,f);return h.forEach(T=>r.disposeData(T.dataId)),r.makeTensorInfo(u.outputShape,S.dtype,S.values)}let m=new Ice(p.shape,f),g=r.runWebGPUProgram(m,[p,c],p.dtype);h.push(g);let y=qe({inputs:{x:g},backend:r,attrs:{shape:u.outputShape}});return h.forEach(A=>r.disposeData(A.dataId)),y}var Tce={kernelName:Xo,backendName:"webgpu",kernelFunc:G8},Nce=jr({opSnippet:5,cpuKernelImpl:gpe,dtype:"bool"}),Cce={kernelName:Yo,backendName:"webgpu",kernelFunc:Nce},Ece=jr({opSnippet:6,dtype:"bool",cpuKernelImpl:mpe}),Rce={kernelName:di,backendName:"webgpu",kernelFunc:Ece};function Mce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{alpha:s}=n,i=[{type:"float32",data:[s]}],o=new Vh(a.shape,14);return o.uniforms="alpha : f32,",r.runWebGPUProgram(o,[a],"float32",i)}var 
Fce={kernelName:hi,backendName:"webgpu",kernelFunc:Mce},$ce=jr({opSnippet:7,dtype:"bool",cpuKernelImpl:Ape}),Pce={kernelName:Jo,backendName:"webgpu",kernelFunc:$ce},_ce=jr({opSnippet:8,dtype:"bool",cpuKernelImpl:ype}),zce={kernelName:Qo,backendName:"webgpu",kernelFunc:_ce},Oce=kr({opType:9,cpuKernelImpl:xpe}),Dce={kernelName:ci,backendName:"webgpu",kernelFunc:Oce},Lce=jr({opSnippet:9,dtype:"bool"}),Bce={kernelName:el,backendName:"webgpu",kernelFunc:Lce},Wce=kr({opType:10}),Vce={kernelName:Yu,backendName:"webgpu",kernelFunc:Wce};function j8(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{reductionIndices:s,keepDims:i}=n;return Gh(a,s,i,"max",r)}var Uce={kernelName:fi,backendName:"webgpu",kernelFunc:j8},Gce=jr({opSnippet:15,cpuKernelImpl:vpe}),jce={kernelName:mi,backendName:"webgpu",kernelFunc:Gce};function Hce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{filterSize:s,strides:i,pad:o,dimRoundingMode:l}=n,u=1,d=N.computePool2DInfo(a.shape,s,i,u,o,l),h,p=[];if(d.filterHeight===1&&d.filterWidth===1){if(w.arraysEqual(d.inShape,d.outShape))return Vn({inputs:{x:a},backend:r});h=new P8(d),p.push({type:"int32",data:[d.strideHeight,d.strideWidth]})}else h=new $8(d,"max"),p.push({type:"int32",data:[d.strideHeight,d.strideWidth]},{type:"int32",data:[d.padInfo.top,d.padInfo.left]},{type:"int32",data:[d.dilationHeight,d.dilationWidth]},{type:"int32",data:[d.inHeight,d.inWidth]},{type:"int32",data:[d.effectiveFilterHeight,d.effectiveFilterWidth]});return r.runWebGPUProgram(h,[a],a.dtype,p)}var qce={kernelName:gi,backendName:"webgpu",kernelFunc:Hce};function Kce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{keepDims:s,axis:i}=n;return Gh(a,i,s,"mean",r)}var Xce={kernelName:yi,backendName:"webgpu",kernelFunc:Kce};function Zce(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n;return Gh(a,s,i,"min",r)}var 
Yce={kernelName:Ai,backendName:"webgpu",kernelFunc:Zce},Jce=jr({opSnippet:16,cpuKernelImpl:wpe}),Qce={kernelName:xi,backendName:"webgpu",kernelFunc:Jce},efe=class{constructor(e,t,r){this.uniforms="",this.variableNames=["x"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=t.map((n,a)=>n[0]+e[a]+n[1]),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.xShape=e,t.map((n,a)=>{this.uniforms+=` pad${a} : vec2<i32>,`}),this.offset=r==="reflect"?0:1,this.shaderKey=`mirrorPad_${r}`}getUserCode(){let e=this.xShape.length,t=this.xShape.map((l,u)=>`uniforms.pad${u}[0]`).join(","),r=this.xShape.map((l,u)=>`uniforms.pad${u}[0] + uniforms.xShape${e>1?`[${u}]`:""
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
2022-04-01 15:13:32 +02:00
let start = ${i}(${t});
let end = ${i}(${r});
2022-02-10 18:27:21 +01:00
var outC = getCoordsFromIndex(index);
for (var i = 0; i < ${e}; i = i + 1) {
2022-04-01 15:13:32 +02:00
if (${s} < ${n}) {
${s} = ${n} * 2 - ${s} - ${this.offset};
} else if(${s} >= ${a}) {
${s} = (${a} - 1) * 2 - ${s} + ${this.offset};
2022-02-10 18:27:21 +01:00
}
}
let coords = outC - start;
2022-04-01 15:13:32 +02:00
setOutputAtIndex(index, getX(${o}));
2022-02-10 18:27:21 +01:00
}
}
2022-04-14 17:47:08 +02:00
`}},tfe={kernelName:bi,backendName:"webgpu",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{x:n}=e,{paddings:a,mode:s}=t,i=r,o=a.map(u=>({type:"int32",data:[u[0],u[1]]})),l=new efe(n.shape,a,s);return i.runWebGPUProgram(l,[n],n.dtype,o)}};function rfe(e){let{inputs:t,backend:r}=e,{x:n}=t;if(r.shouldExecuteOnCPU([n])){let s=r.tensorMap.get(n.dataId),[i,o]=Ipe(s.values,n.shape,n.dtype);return r.makeTensorInfo(o,n.dtype,i)}let a=new Vh(n.shape,11);return r.runWebGPUProgram(a,[n],n.dtype)}var nfe={kernelName:tl,backendName:"webgpu",kernelFunc:rfe};function afe(e){console.warn("tf.nonMaxSuppression() in webgpu locks the UI thread. Call tf.nonMaxSuppressionAsync() instead");let{inputs:t,backend:r,attrs:n}=e,{boxes:a,scores:s}=t,{maxOutputSize:i,iouThreshold:o,scoreThreshold:l}=n,u=r.readSync(a.dataId),d=r.readSync(s.dataId),{selectedIndices:h}=qn.nonMaxSuppressionV3Impl(u,d,i,o,l);return r.makeTensorInfo([h.length],"int32",new Int32Array(h))}var sfe={kernelName:nl,backendName:"webgpu",kernelFunc:afe};function ife(e){console.warn("tf.nonMaxSuppression() in webgpu locks the UI thread. 
Call tf.nonMaxSuppressionAsync() instead");let{inputs:t,backend:r,attrs:n}=e,{boxes:a,scores:s}=t,{maxOutputSize:i,iouThreshold:o,scoreThreshold:l,softNmsSigma:u}=n,d=r.readSync(a.dataId),h=r.readSync(s.dataId),p=i,c=o,f=l,m=u,{selectedIndices:g,selectedScores:y}=qn.nonMaxSuppressionV5Impl(d,h,p,c,f,m);return[r.makeTensorInfo([g.length],"int32",new Int32Array(g)),r.makeTensorInfo([y.length],"float32",new Float32Array(y))]}var ofe={kernelName:al,backendName:"webgpu",kernelFunc:ife};function Lf(e){let{inputs:t,backend:r}=e,{x:n}=t;if(n.dtype==="complex64"){let a=Uh({inputs:{input:n},backend:r}),s=Lf({inputs:{x:a},backend:r}),i=w0({inputs:{input:n},backend:r}),o=Lf({inputs:{x:i},backend:r}),l=Cd({inputs:{real:s,imag:o},backend:r});return r.disposeData(a.dataId),r.disposeData(s.dataId),r.disposeData(i.dataId),r.disposeData(o.dataId),l}else return Rd({attrs:{shape:n.shape,dtype:n.dtype,value:n.dtype==="string"?"":0},backend:r})}var lfe={kernelName:kl,backendName:"webgpu",kernelFunc:Lf};function H8(e){let{inputs:t,backend:r}=e,{x:n}=t;if(n.dtype==="string")throw new Error("onesLike is not supported under string dtype");if(n.dtype==="complex64"){let a=Uh({inputs:{input:n},backend:r}),s=H8({inputs:{x:a},backend:r}),i=w0({inputs:{input:n},backend:r}),o=Lf({inputs:{x:i},backend:r}),l=Cd({inputs:{real:s,imag:o},backend:r});return r.disposeData(a.dataId),r.disposeData(s.dataId),r.disposeData(i.dataId),r.disposeData(o.dataId),l}else return Rd({attrs:{shape:n.shape,dtype:n.dtype,value:1},backend:r})}var ufe={kernelName:sl,backendName:"webgpu",kernelFunc:H8};function dfe(e){let{inputs:t,backend:r,attrs:n}=e,{axis:a}=n;if(t.length===1)return n2({inputs:{input:t[0]},backend:r,attrs:{dim:a}});let s=t[0].shape,i=t[0].dtype;t.forEach(d=>{w.assertShapesMatch(s,d.shape,"All tensors passed to stack must have matching shapes"),w.assert(i===d.dtype,()=>"All tensors passed to stack must have matching dtypes")});let o=[],l=t.map(d=>{let h=n2({inputs:{input:d},backend:r,attrs:{dim:a}});return 
o.push(h),h}),u=z8({inputs:l,backend:r,attrs:{axis:a}});return o.forEach(d=>r.disposeData(d.dataId)),u}var pfe={kernelName:ol,backendName:"webgpu",kernelFunc:dfe},hfe=class{constructor(e,t){this.variableNames=["x"],this.uniforms="constantValue : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=t.map((r,n)=>r[0]+e[n]+r[1]),this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),t.map((r,n)=>{this.uniforms+=` pad${n} : vec2<i32>,`}),this.xShape=e,this.shaderKey="pad"}getUserCode(){let e=this.xShape.length,t=gr(e),r=this.xShape.map((u,d)=>`uniforms.pad${d}[0]`).join(","),n=this.xShape.map((u,d)=>`uniforms.pad${d}[0] + uniforms.xShape${e>1?`[${d}]`:""}`).join(","),a=e>1?`${t}(${r})`:`${r}`,s=e>1?`${t}(${n})`:`${n}`,i=e>1?"any(outC < start)":"outC < start",o=e>1?"any(outC >= end)":"outC >= end",l=e>1?["coords[0]","coords[1]","coords[2]","coords[3]"].slice(0,e):"coords";return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
2022-04-01 15:13:32 +02:00
let start = ${a};
let end = ${s};
2022-02-10 18:27:21 +01:00
let outC = getCoordsFromIndex(index);
2022-04-01 15:13:32 +02:00
if (${i} || ${o}) {
2022-02-10 18:27:21 +01:00
setOutputAtIndex(index, uniforms.constantValue);
} else {
let coords = outC - start;
setOutputAtIndex(index, getX(${l}));
}
}
}
2022-04-14 17:47:08 +02:00
`}},q8=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{paddings:s,constantValue:i}=n;if(s.every(u=>w.arraysEqual(u,[0,0])))return Vn({inputs:{x:a},backend:r});if(w.sizeFromShape(a.shape)===0){let u=s.map((d,h)=>d[0]+a.shape[h]+d[1]);return Rd({backend:r,attrs:{shape:u,value:i,dtype:a.dtype}})}let o=[{type:"float32",data:[i]}];s.map(u=>o.push({type:"int32",data:[u[0],u[1]]}));let l=new hfe(a.shape,s);return r.runWebGPUProgram(l,[a],a.dtype,o)},cfe={kernelName:wi,backendName:"webgpu",kernelFunc:q8},ffe=jr({opSnippet:13}),mfe={kernelName:ki,backendName:"webgpu",kernelFunc:ffe};function gfe(e){let{inputs:t,backend:r}=e,{x:n,alpha:a}=t,s=new M8(14,n.shape,a.shape);return r.runWebGPUProgram(s,[n,a],"float32")}var yfe={kernelName:Ii,backendName:"webgpu",kernelFunc:gfe};function Afe(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{axis:s,keepDims:i}=n;return Gh(a,s,i,"prod",r)}var xfe={kernelName:ll,backendName:"webgpu",kernelFunc:Afe},bfe=e=>{let{backend:t,attrs:r}=e,{start:n,stop:a,step:s,dtype:i}=r,o=Npe(n,a,s,i);return t.makeTensorInfo([o.length],i,o)},vfe={kernelName:ed,backendName:"webgpu",kernelFunc:bfe},K8=jr({opSnippet:3}),wfe={kernelName:ai,backendName:"webgpu",kernelFunc:K8},kfe=kr({opType:12}),Ife={kernelName:Si,backendName:"webgpu",kernelFunc:kfe},Sfe=kr({opType:13}),Tfe={kernelName:Ni,backendName:"webgpu",kernelFunc:Sfe},Nfe=class{constructor(e,t,r){this.variableNames=["x"],this.uniforms="adjustHeightWidth : vec2<f32>, halfPixelCenters : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=[e[0],t,r,e[3]],this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="resizeBilinear"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let b = coords[0];
let d = coords[3];
let rc = coords.yz;
let effectiveInSize = vec2<f32>(
f32(uniforms.xShape.y) - uniforms.adjustHeightWidth[0],
f32(uniforms.xShape.z) - uniforms.adjustHeightWidth[1]);
let effectiveOutSize = vec2<f32>(
f32(uniforms.outShape.y) - uniforms.adjustHeightWidth[0],
f32(uniforms.outShape.z) - uniforms.adjustHeightWidth[1]);
let effectiveInputOverOutputRatioRC =
effectiveInSize / effectiveOutSize;
// Fractional source index
let sourceFracIndexRC =
(vec2<f32>(rc) + vec2<f32>(uniforms.halfPixelCenters)) *
effectiveInputOverOutputRatioRC - vec2<f32>(uniforms.halfPixelCenters);
// Compute the four integer indices.
let sourceFloorRC = vec2<i32>(sourceFracIndexRC);
let sourceCeilRC = vec2<i32>(
min(vec2<f32>(uniforms.xShape.yz) - vec2<f32>(1.0), ceil(sourceFracIndexRC)));
let topLeft = getX(b, sourceFloorRC.x, sourceFloorRC.y, d);
let bottomLeft = getX(b, sourceCeilRC.x, sourceFloorRC.y, d);
let topRight = getX(b, sourceFloorRC.x, sourceCeilRC.y, d);
let bottomRight = getX(b, sourceCeilRC.x, sourceCeilRC.y, d);
let fracRC = sourceFracIndexRC - vec2<f32>(sourceFloorRC);
let top = topLeft + (topRight - topLeft) * fracRC.y;
let bottom = bottomLeft + (bottomRight - bottomLeft) * fracRC.y;
let newValue = top + (bottom - top) * fracRC.x;
setOutputAtIndex(index, newValue);
}
}
2022-04-14 17:47:08 +02:00
`}};function Cfe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a}=t,{alignCorners:s,size:i,halfPixelCenters:o}=n,[l,u]=i,d=s&&l>1?1:0,h=s&&u>1?1:0,p=[{type:"float32",data:[d,h]},{type:"float32",data:[o?.5:0]}],c=new Nfe(a.shape,l,u);return r.runWebGPUProgram(c,[a],"float32",p)}var Efe={kernelName:Ti,backendName:"webgpu",kernelFunc:Cfe},Rfe=class{constructor(e,t,r,n){this.variableNames=["x"],this.uniforms="adjustHeightWidth : vec2<f32>, roundBase : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=[e[0],t,r,e[3]],this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.halfPixelCenters=n,this.shaderKey=`resizeNearest_${n}`}getUserCode(){let e;return this.halfPixelCenters?e="max((vec2<f32>(rc) + vec2<f32>(0.5)) * effectiveInputOverOutputRatioRC, vec2<f32>(0.0))":e="vec2<f32>(rc) * effectiveInputOverOutputRatioRC",`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let b = coords[0];
let d = coords[3];
let rc = coords.yz;
let effectiveInSize = vec2<f32>(
f32(uniforms.xShape.y) - uniforms.adjustHeightWidth[0],
f32(uniforms.xShape.z) - uniforms.adjustHeightWidth[1]);
let effectiveOutSize = vec2<f32>(
f32(uniforms.outShape.y) - uniforms.adjustHeightWidth[0],
f32(uniforms.outShape.z) - uniforms.adjustHeightWidth[1]);
let effectiveInputOverOutputRatioRC =
effectiveInSize / effectiveOutSize;
// Fractional source index
let sourceFracIndexRC = ${e};
// Compute the coordinators of nearest neighbor point.
let inputShapeRC = vec2<f32>(f32(uniforms.xShape.y), f32(uniforms.xShape.z));
let sourceNearestRC = vec2<i32>(
min(inputShapeRC - 1.0, floor(sourceFracIndexRC + uniforms.roundBase)));
let newValue = getX(b, sourceNearestRC.x, sourceNearestRC.y, d);
setOutputAtIndex(index, newValue);
}
}
2022-04-14 17:47:08 +02:00
`}};function Mfe(e){let{inputs:t,backend:r,attrs:n}=e,{images:a}=t,{alignCorners:s,halfPixelCenters:i,size:o}=n,[l,u]=o,d=s&&l>1?1:0,h=s&&u>1?1:0,p=[{type:"float32",data:[d,h]},{type:"float32",data:[s?.5:0]}],c=new Rfe(a.shape,l,u,i);return r.runWebGPUProgram(c,[a],a.dtype,p)}var Ffe={kernelName:rd,backendName:"webgpu",kernelFunc:Mfe},$fe=class{constructor(e,t){this.outputShape=[],this.variableNames=["x"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.uniforms=`centerX : f32, centerY : f32, sinRadians : f32,
2022-04-01 15:12:04 +02:00
cosRadians : f32,`,this.shaderKey="rotate",this.outputShape=e,typeof t=="number"?(this.uniforms+=" fillValue : f32,",this.fillSnippet="var outputValue = uniforms.fillValue;",this.shaderKey+="_float"):(this.uniforms+=" fillValue : vec3<f32>,",this.fillSnippet="var outputValue = uniforms.fillValue[coords[3]];",this.shaderKey+="_vec3")}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
let coordXFloat = (f32(coords[2]) - uniforms.centerX) *
uniforms.cosRadians - (f32(coords[1]) - uniforms.centerY) *
uniforms.sinRadians;
let coordYFloat = (f32(coords[2]) - uniforms.centerX) *
uniforms.sinRadians + (f32(coords[1]) - uniforms.centerY) *
uniforms.cosRadians;
let coordX = i32(round(coordXFloat + uniforms.centerX));
let coordY = i32(round(coordYFloat + uniforms.centerY));
${this.fillSnippet}
if(coordX >= 0 && coordX < uniforms.xShape[2] && coordY >= 0 &&
coordY < uniforms.xShape[1]) {
outputValue = getX(coords[0], coordY, coordX, coords[3]);
}
setOutputAtIndex(index, outputValue);
}
}
2022-04-14 17:47:08 +02:00
`}},Pfe={kernelName:Il,backendName:"webgpu",kernelFunc:({inputs:e,attrs:t,backend:r})=>{let{image:n}=e,{radians:a,fillValue:s,center:i}=t,o=r,l=new $fe(n.shape,s),[u,d]=N.getImageCenter(i,n.shape[1],n.shape[2]),h=[{type:"float32",data:[u]},{type:"float32",data:[d]},{type:"float32",data:[Math.sin(a)]},{type:"float32",data:[Math.cos(a)]}];return typeof s=="number"?h.push({type:"float32",data:[Number.parseFloat(s.toFixed(2))]}):h.push({type:"float32",data:s}),o.runWebGPUProgram(l,[n],n.dtype,h)}},_fe=kr({opType:15,cpuKernelImpl:Cpe}),zfe={kernelName:Ci,backendName:"webgpu",kernelFunc:_fe},Ofe=class{constructor(e,t,r,n,a,s,i){this.variableNames=["updates","indices"],this.workGroupSize=[64,1,1],this.atomic=!0,this.outputShape=s,this.type=i,this.dispatchLayout=Xe(e),this.dispatch=Oe(this.dispatchLayout,e,this.workGroupSize),this.sliceDimGreaterThanOne=t>1,this.shaderKey=`scatter_${r}_${n}_${this.sliceDimGreaterThanOne}_${i}`;let o=gr(a.length);this.uniforms=`sliceDim : i32, strides: ${o}, size: i32,`,this.updatesRank=n,this.indicesRank=r}getUserCode(){let e="";this.indicesRank===1?e="coords[0]":this.indicesRank===2&&(e="coords[0], j");let t=`getIndices(${e})`,r=this.sliceDimGreaterThanOne?"uniforms.strides[j]":"uniforms.strides",n="",a="",s="";this.updatesRank===1?(n="coords[0]",a="flattenedIndex",s=`
2022-02-10 18:27:21 +01:00
fn getUpdatesCoordsFromFlatIndex(index : i32) -> i32 {
return index;
}
2022-04-01 15:13:32 +02:00
`):this.updatesRank===2&&(n="coords[0], coords[1]",a="vec2<i32>(flattenedIndex, coords[1])",s=`
2022-02-10 18:27:21 +01:00
fn getUpdatesCoordsFromFlatIndex(index : i32) -> vec2<i32> {
let d0 = index / uniforms.updatesShape[1];
let d1 = index - d0 * uniforms.updatesShape[1];
return vec2<i32>(d0, d1);
}
2022-04-01 15:13:32 +02:00
`);let i=`getUpdates(${n})`,o=this.type==="int32"?"atomicAdd(&(result[flatIndex]), i32(updateValue));":`
2022-04-01 15:12:04 +02:00
var assumed = atomicLoad(&(result[flatIndex]));
2022-02-10 18:27:21 +01:00
var success = 0;
for (; success == 0;) {
let new = bitcast<f32>(assumed) + updateValue;
let newI32 = bitcast<i32>(new);
2022-04-01 15:12:04 +02:00
let resValue = atomicCompareExchangeWeak(&(result[flatIndex]), assumed, newI32);
2022-02-10 18:27:21 +01:00
assumed = resValue[0];
success = resValue[1];
}
`;return`
2022-04-01 15:13:32 +02:00
${s}
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let coords = getUpdatesCoordsFromFlatIndex(index);
var flattenedIndex = 0;
for (var j = 0; j < uniforms.sliceDim; j = j + 1) {
let indexInside = i32(round(${t}));
2022-04-01 15:13:32 +02:00
flattenedIndex = flattenedIndex + indexInside * ${r};
2022-02-10 18:27:21 +01:00
}
2022-04-01 15:13:32 +02:00
let updateValue = ${i};
let flatIndex = getOutputIndexFromCoords(${a});
2022-02-10 18:27:21 +01:00
2022-04-01 15:13:32 +02:00
${o}
2022-02-10 18:27:21 +01:00
}
2022-04-14 17:47:08 +02:00
}`}};function Dfe(e){let{inputs:t,backend:r,attrs:n}=e,{indices:a,updates:s}=t,{shape:i}=n,{sliceRank:o,numUpdates:l,sliceSize:u,strides:d,outputSize:h}=N.calculateShapes(s,a,i),p=[h/u,u];if(h===0)return r.makeTensorInfo(i,a.dtype);let c=qe({inputs:{x:a},backend:r,attrs:{shape:[l,o]}}),f=qe({inputs:{x:s},backend:r,attrs:{shape:[l,u]}}),m=f.dtype,g=Rd({backend:r,attrs:{shape:p,value:0,dtype:m}}),y=w.sizeFromShape(f.shape),A=[{type:"int32",data:[o]},{type:"int32",data:d},{type:"int32",data:[y]}],x=new Ofe(f.shape,o,c.shape.length,f.shape.length,d,p,m),b=r.runWebGPUProgram(x,[f,c],m,A,g),v=qe({inputs:{x:b},backend:r,attrs:{shape:i}});return r.disposeData(c.dataId),r.disposeData(f.dataId),r.disposeData(b.dataId),v}var Lfe={kernelName:hl,backendName:"webgpu",kernelFunc:Dfe},Bfe=class{constructor(e,t,r){this.variableNames=["c","a","b"],this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=t,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.cRank=e,this.rank=r,this.shaderKey="select"}getUserCode(){let e,t;if(this.rank>4)throw Error(`Where for rank ${this.rank} is not yet supported`);if(this.rank===1)t="resRC",e="resRC";else{let r=["resRC.x","resRC.y","resRC.z","resRC.w"],n=[],a=[];for(let s=0;s<this.outputShape.length;s++)a.push(`${r[s]}`),s<this.cRank&&n.push(`${r[s]}`);e=n.join(),t=a.join()}return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
if (index < uniforms.size) {
let resRC = getCoordsFromIndex(index);
let cVal = getC(${e});
if (cVal >= 1.0) {
setOutputAtIndex(index, getA(${t}));
} else {
setOutputAtIndex(index, getB(${t}));
}
}
}
2022-04-14 17:47:08 +02:00
`}};function Wfe(e){let{inputs:t,backend:r}=e,{condition:n,t:a,e:s}=t,i=new Bfe(n.shape.length,a.shape,a.shape.length);return r.runWebGPUProgram(i,[n,a,s],Cr(a.dtype,s.dtype))}var Vfe={kernelName:cl,backendName:"webgpu",kernelFunc:Wfe},Ufe=kr({opType:18}),Gfe={kernelName:Ri,backendName:"webgpu",kernelFunc:Ufe},jfe=kr({opType:16}),Hfe={kernelName:Ei,backendName:"webgpu",kernelFunc:jfe},qfe=kr({opType:17}),Kfe={kernelName:ml,backendName:"webgpu",kernelFunc:qfe},X8=jr({opSnippet:2,cpuKernelImpl:$pe,supportsComplex:!0}),Xfe={kernelName:_i,backendName:"webgpu",kernelFunc:X8};function Zfe(e){let{inputs:t,backend:r,attrs:n}=e,{logits:a}=t,{dim:s}=n,i=w.parseAxisParam([s],a.shape),o=j8({inputs:{x:a},backend:r,attrs:{reductionIndices:i,keepDims:!1}}),l=N.expandShapeToKeepDim(o.shape,i),u=qe({inputs:{x:o},backend:r,attrs:{shape:l}}),d=X8({inputs:{a,b:u},backend:r}),h=W8({inputs:{x:d},backend:r}),p=kb({inputs:{x:h},backend:r,attrs:{axis:i,keepDims:!1}}),c=qe({inputs:{x:p},backend:r,attrs:{shape:l}}),f=K8({inputs:{a:h,b:c},backend:r});return r.disposeData(o.dataId),r.disposeData(u.dataId),r.disposeData(d.dataId),r.disposeData(h.dataId),r.disposeData(p.dataId),r.disposeData(c.dataId),f}var Yfe={kernelName:$i,backendName:"webgpu",kernelFunc:Zfe},Jfe=e=>{let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{blockShape:s,paddings:i}=n;w.assert(a.shape.length<=4,()=>"spaceToBatchND for rank > 4 with a WebGPU backend not implemented yet");let o=s.reduce((y,A)=>y*A),l=[[0,0]];l.push(...i);for(let y=1+s.length;y<a.shape.length;++y)l.push([0,0]);let u=[],d=q8({inputs:{x:a},backend:r,attrs:{paddings:l,constantValue:0}}),h=N.getReshaped(d.shape,s,o,!1),p=N.getPermuted(h.length,s.length,!1),c=N.getReshapedPermuted(d.shape,s,o,!1),f=qe({inputs:{x:d},backend:r,attrs:{shape:h}}),m=zl({inputs:{x:f},backend:r,attrs:{perm:p}}),g=qe({inputs:{x:m},backend:r,attrs:{shape:c}});return 
u.push(d),u.push(f),u.push(m),u.forEach(y=>r.disposeData(y.dataId)),g},Qfe={kernelName:gl,backendName:"webgpu",kernelFunc:Jfe},eme=class{constructor(e,t,r,n,a,s,i=!0){this.variableNames=["updates","indices","defaultValue"],this.workGroupSize=[64,1,1],this.workPerThread=4,this.size=!0,this.outputShape=s,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]);let o=t>1;this.shaderKey=`scatter_${r}_${n}_${o}`;let l=gr(a.length);this.uniforms=`updateSize : i32, sliceDim : i32, strides: ${l},`;let u="";r===1?u="i":r===2&&(u="i, j"),this.indicesSnippet=`getIndices(${u})`;let d="";n===1?d="i":n===2&&(d="i, coords[1]"),this.updatesSnippet=`getUpdates(${d})`,this.strideString=o?"uniforms.strides[j]":"uniforms.strides"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Scatter body: every invocation handles workPerThread consecutive output
// elements, starting at globalIndex.
let globalIndex = index * ${this.workPerThread};
if (globalIndex < uniforms.size) {
// One lane per handled element: the running sum of matching updates and a
// flag recording whether any update matched that element.
var sum = vec4<f32>(0.0);
var found = vec4<bool>(false);
for (var i = 0; i < uniforms.updateSize; i = i + 1) {
// Collapse the index tuple of update i into a single offset by weighting
// each component with its stride.
var flattenedIndex = 0;
for (var j = 0; j < uniforms.sliceDim; j = j + 1) {
let indexInside = i32(round(${this.indicesSnippet}));
flattenedIndex = flattenedIndex + indexInside * ${this.strideString};
}
// Add update i to every handled element whose first output coordinate equals
// the flattened index.
for (var innerIndex = 0; innerIndex < ${this.workPerThread}; innerIndex = innerIndex + 1) {
let curIndex = globalIndex + innerIndex;
let coords = getCoordsFromIndex(curIndex);
if (flattenedIndex == coords[0]) {
sum[innerIndex] = sum[innerIndex] + ${this.updatesSnippet};
found[innerIndex] = true;
}
}
}
// Write back: mix() is given a weight of 1.0 where an update matched (selects
// the sum) and 0.0 otherwise (selects the default value).
for (var innerIndex = 0; innerIndex < ${this.workPerThread}; innerIndex = innerIndex + 1) {
let curIndex = globalIndex + innerIndex;
// The last invocation may cover elements past the end of the output.
if (curIndex < uniforms.size)
{
setOutputAtIndex(curIndex, mix(getDefaultValue(), sum[innerIndex], f32(found[innerIndex])));
}
}
}
2022-04-14 17:47:08 +02:00
}`}};function tme(e){let{inputs:t,backend:r,attrs:n}=e,{sparseIndices:a,sparseValues:s,defaultValue:i}=t,{outputShape:o}=n,{sliceRank:l,numUpdates:u,strides:d,outputSize:h}=N.calculateShapes(s,a,o),p=!1,c=[{type:"int32",data:[u]},{type:"int32",data:[l]},{type:"int32",data:d}],f=new eme(u,l,a.shape.length,s.shape.length,d,[h,1],p),m=r.runWebGPUProgram(f,[s,a,i],s.dtype,c),g=qe({inputs:{x:m},backend:r,attrs:{shape:o}});return r.disposeData(m.dataId),g}var rme={kernelName:lh,backendName:"webgpu",kernelFunc:tme};function nme(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{numOrSizeSplits:s,axis:i}=n,o=w.parseAxisParam(i,a.shape)[0],l=N.prepareSplitSize(a,s,o),u=a.shape.length,d=new Array(u).fill(0),h=a.shape.slice();return l.map(p=>{let c=[...h];c[o]=p;let f=Ed({inputs:{x:a},backend:r,attrs:{begin:d,size:c}});return d[o]+=p,f})}var ame={kernelName:yl,backendName:"webgpu",kernelFunc:nme},sme=kr({opType:19}),ime={kernelName:Mi,backendName:"webgpu",kernelFunc:sme},ome={kernelName:od,backendName:"webgpu",kernelFunc:({inputs:e,backend:t})=>{let{x:r}=e,n=t,a=new Vh(r.shape,20);return n.runWebGPUProgram(a,[r],r.dtype)}},lme=jr({opSnippet:11}),ume={kernelName:Pi,backendName:"webgpu",kernelFunc:lme},dme=class{constructor(e){this.variableNames=["x"],this.workPerThread=1,this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]);let t=gr(this.outputShape.length);this.uniforms=`begin : ${t}, strides : ${t}, `,this.shaderKey="stridedSlice"}getUserCode(){let e=this.outputShape.length,t="";if(e===1)t="coords * uniforms.strides + uniforms.begin";else{let r=0;t=this.outputShape.map((n,a)=>(r++,this.outputShape.length===1?`coords * uniforms.strides[${a}] + uniforms.begin[${a}]`:`coords[${r-1}] * uniforms.strides[${a}] + uniforms.begin[${a}]`)).join(",")}return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Strided-slice body: one output element per invocation; invocations past the
// end of the output do nothing.
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
// The interpolated argument list is built in getUserCode and maps each output
// coordinate to coords * uniforms.strides + uniforms.begin.
setOutputAtIndex(index, getX(${t}));
}
}
2022-04-14 17:47:08 +02:00
`}};function pme(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{begin:s,end:i,strides:o,beginMask:l,endMask:u,ellipsisMask:d,newAxisMask:h,shrinkAxisMask:p}=n,{finalShapeSparse:c,finalShape:f,isIdentity:m,sliceDim0:g,isSimpleSlice:y,begin:A,end:x,strides:b}=_t.sliceInfo(a.shape,s,i,o,l,u,d,h,p),v;if(m)v=qe({inputs:{x:a},backend:r,attrs:{shape:f}});else if(g||y){w.assert(a.shape.length>=1,()=>`Input must have rank at least 1, got: ${a.shape.length}`);let S=_t.computeOutShape(A,x,b),T=Ed({inputs:{x:a},backend:r,attrs:{begin:A,size:S}});v=qe({inputs:{x:T},backend:r,attrs:{shape:f}}),r.disposeData(T.dataId)}else if(r.shouldExecuteOnCPU([a])){let S=r.readSync(a.dataId),T=We(a.shape,a.dtype,S),E=Mpe(c,T,b,A);v=r.makeTensorInfo(f,a.dtype,E.values)}else{let S=new dme(c),T=[{type:"int32",data:A},{type:"int32",data:b}],E=r.runWebGPUProgram(S,[a],a.dtype,T);v=qe({inputs:{x:E},backend:r,attrs:{shape:f}}),r.disposeData(E.dataId)}return v}var hme={kernelName:Al,backendName:"webgpu",kernelFunc:pme};function cme(e){let{inputs:t,backend:r,attrs:n}=e,{separator:a,nGramWidths:s,leftPad:i,rightPad:o,padWidth:l,preserveShortSequences:u}=n,{data:d,dataSplits:h}=t,p=r.readSync(d.dataId),c=r.readSync(h.dataId),[f,m]=Fpe(p,c,a,s,i,o,l,u);return[r.makeTensorInfo([f.length],"string",f),r.makeTensorInfo(h.shape,"int32",m)]}var fme={kernelName:uh,backendName:"webgpu",kernelFunc:cme},mme=kr({opType:21}),gme={kernelName:zi,backendName:"webgpu",kernelFunc:mme},yme=class{constructor(e,t){this.variableNames=["A"],this.workGroupSize=[64,1,1],this.size=!0;let r=new Array(e.length);for(let n=0;n<r.length;n++)r[n]=e[n]*t[n];this.outputShape=r,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.rank=this.outputShape.length,this.shaderKey="tile"}getUserCode(){let e=Ame(this.rank,"uniforms.");return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Tile body: one output element per invocation; invocations past the end of
// the output do nothing.
if (index < uniforms.size) {
let resRC = getCoordsFromIndex(index);
// The interpolated argument list takes each output coordinate modulo the
// matching input dimension, so the input repeats along every axis.
setOutputAtIndex(index, getA(${e}));
}
}
2022-04-14 17:47:08 +02:00
`}};function Ame(e,t=""){if(e>=5)throw Error(`Tile for rank ${e} is not yet supported`);if(e===1)return`(resRC % ${t}aShape)`;let r=["resRC.x","resRC.y","resRC.z","resRC.w"],n=[];for(let a=0;a<e;a++)n.push(`(${r[a]} % ${t}aShape[${a}])`);return n.join()}function xme(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{reps:s}=n;if(r.shouldExecuteOnCPU([a])||a.dtype==="string"||a.shape.length>=5){let o=r.readSync(a.dataId),l=a.dtype==="string"?o.map(h=>w.decodeString(h)):o,u=We(a.shape,a.dtype,l),d=Ppe(u,s);return r.makeTensorInfo(d.shape,d.dtype,d.values)}let i=new yme(a.shape,s);return r.runWebGPUProgram(i,[a],a.dtype)}var bme={kernelName:Qa,backendName:"webgpu",kernelFunc:xme},vme=class{constructor(e){this.variableNames=["x","indices"],this.workGroupSize=[256,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.uniforms=`inputSize : i32, firstPass : i32, negativeInf : f32,
2022-04-01 15:12:04 +02:00
dir : i32, inc : i32,`,this.shaderKey="swap"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Swap step: each invocation decides which index of one compared pair ends up
// in its own output slot.
if (index < uniforms.size) {
let outC = getCoordsFromIndex(index);
let batch = outC[0];
let elemIdx = outC[1];
// We compare elements pair-wise within a group of size 2 * inc.
// The comparing rule for each group alternates between ascending
// and descending. Within each group, we compare each pair at
// positions i and i+inc. To decide whether an element at position i
// is x0 or x1, we mod it by 2 * inc, if the result is smaller than
// inc, it is in the first half of the group, we denote it as x0,
// otherwise we denote it as x1.
// For example, as shown in the Bitonic top K paper referenced
// above, Figure5(a) shows that element[1] is in the second half of
// the group when group size is 2, but it is in the first half of
// the group when group size is 4.
let isFirstInPair = elemIdx % (2 * uniforms.inc) < uniforms.inc;
// i is the position of the first element of the pair, whichever half this
// invocation sits in.
var i = 0;
if (isFirstInPair) {
i = elemIdx;
} else {
i = elemIdx - uniforms.inc;
}
// On the first pass the positions themselves serve as element indices; on
// later passes the indices are read from the indices input.
var i0 = 0;
if (uniforms.firstPass == 1) {
i0 = i;
} else {
i0 = i32(getIndices(batch, i));
}
var i1 = 0;
if (uniforms.firstPass == 1) {
i1 = i + uniforms.inc;
} else {
i1 = i32(getIndices(batch, i + uniforms.inc));
}
// Indices at or beyond inputSize are not read from x; they compare as
// uniforms.negativeInf instead.
var x0 = f32(0.0);
var x1 = f32(0.0);
if (i0 < uniforms.inputSize) {
x0 = getX(batch, i0);
} else {
x0 = uniforms.negativeInf;
}
if (i1 < uniforms.inputSize) {
x1 = getX(batch, i1);
} else {
x1 = uniforms.negativeInf;
}
// The comparison direction alternates between consecutive groups of size dir.
let reverse = elemIdx % (2 * uniforms.dir) >= uniforms.dir;
// Equal values are ordered by index: x0 counts as greater when i1 > i0.
let isGreater = x0 > x1 || (x0 == x1 && i1 > i0);
if (reverse == isGreater) {
// Elements in opposite order of direction
let iTemp = i0;
i0 = i1;
i1 = iTemp;
}
// Each invocation writes only its own slot of the pair.
if (isFirstInPair) {
setOutputAtIndex(index, f32(i0));
} else {
setOutputAtIndex(index, f32(i1));
}
}
}
2022-04-14 17:47:08 +02:00
`}},wme=class{constructor(e){this.variableNames=["x","indices"],this.workGroupSize=[256,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.uniforms="inputSize : i32, firstPass : i32, k : i32,",this.shaderKey="merge"}getUserCode(){return`
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Merge step: each invocation compares one pair of candidates that lie k
// positions apart and keeps the index of the larger value.
if (index < uniforms.size) {
let outC = getCoordsFromIndex(index);
let batch = outC[0];
let elemIdx = outC[1];
// The output size is half of the previous size.
// If the previous sequence is | | | | _ _ _ _ | | | | _ _ _ _
// (k=4), we only need to output the indices at positions |, the
// indices at positions _ can be thrown away, see Figure5(b) After
// Phase 2 (Merge phase) in the Bitonic Top K paper referenced
// above.
// For example, the paper shows we only need to output the orange
// bars. The output sequence should look like this | | | | | | | |.
// Because the sequence is halved, to map the output index back to
// the previous sequence to find the corresponding value, we need
// to double the index. When we double the index, we basically
// interpolate a position, so 2i looks like
// | _ | _ | _ | _ | _ | _ | _. We move the | to the first k
// position of each 2k positions by - elemIdx % k. E.g. for output
// at index 4,5,6,7, we want to get the corresponding element at
// original index 8,9,10,11, for output at index 8,9,10,11,
// we want to get the corresponding element at original index
// 16,17,18,19, so on and so forth.
var i = 0;
if (elemIdx < uniforms.k) {
i = elemIdx;
} else {
i = elemIdx * 2 - elemIdx % uniforms.k;
}
// On the first pass the positions themselves serve as element indices; on
// later passes the indices are read from the indices input.
var i0 = 0;
if (uniforms.firstPass == 1) {
i0 = i;
} else {
i0 = i32(getIndices(batch, i));
}
var i1 = 0;
if (uniforms.firstPass == 1) {
i1 = i + uniforms.k;
} else {
i1 = i32(getIndices(batch, i + uniforms.k));
}
let x0 = getX(batch, i0);
// When i1 is at or beyond inputSize, x1 takes the value of x0, so the
// comparison below selects i0.
var x1 = f32(0.0);
if (i1 < uniforms.inputSize) {
x1 = getX(batch, i1);
} else {
x1 = x0;
}
// Keep the index of the larger value; i0 is kept when the values are equal.
if (x0 >= x1) {
setOutputAtIndex(index, f32(i0));
} else {
setOutputAtIndex(index, f32(i1));
}
}
}
2022-04-14 17:47:08 +02:00
`}};function uu(e,t){t!==null&&e.disposeData(t.dataId)}function lw(e){let t=1;for(;t<e;)t*=2;return t}function kme(e){let{inputs:t,backend:r,attrs:n}=e,{x:a}=t,{k:s,sorted:i}=n,o=a.shape,l=o[o.length-1];if(r.shouldExecuteOnCPU([a])){let b=r.readSync(a.dataId),[v,S]=_pe(b,o,a.dtype,s,i);return[r.makeTensorInfo(v.shape,v.dtype,v.values),r.makeTensorInfo(S.shape,S.dtype,S.values)]}if(s===0)return o[o.length-1]=0,[r.makeTensorInfo(o,a.dtype,[]),r.makeTensorInfo(o,"int32",[])];if(l===1)return[a,Rd({attrs:{shape:o,dtype:"int32",value:0},backend:r})];let u=w.sizeFromShape(o)/l,d=qe({inputs:{x:a},attrs:{shape:[u,l]},backend:r}),h=lw(s),p=lw(l),c=null,f=()=>c===null?[d,d]:[d,c],m=(b,v,S)=>{let T=f(),E=new vme(S),R=[{type:"int32",data:[l]},{type:"int32",data:[c===null?1:0]},{type:"float32",data:[Number.NEGATIVE_INFINITY]},{type:"int32",data:[b]},{type:"int32",data:[v]}],_=c;c=r.runWebGPUProgram(E,T,"int32",R),uu(r,_)};for(let b=1;b<h;b*=2){let v=b*2;for(let S=b;S>=1;S/=2)m(v,S,[u,p])}for(let b=p;b>h;b/=2){let v=f(),S=new wme([u,b/2]),T=[{type:"int32",data:[l]},{type:"int32",data:[c===null?1:0]},{type:"int32",data:[h]}],E=c;c=r.runWebGPUProgram(S,v,"int32",T),uu(r,E);let R=h/2,_=R*2;for(let M=R;M>=1;M/=2)m(_,M,c.shape)}let g=c;c=Ed({inputs:{x:c},backend:r,attrs:{begin:0,size:[u,s]}}),uu(r,g);let y=G8({inputs:{x:d,indices:c},backend:r,attrs:{axis:1,batchDims:1}});uu(r,d);let A=o.slice(0,-1);A.push(s),g=c,c=qe({inputs:{x:c},attrs:{shape:A},backend:r}),uu(r,g);let x=y;return y=qe({inputs:{x:y},attrs:{shape:A},backend:r}),uu(r,x),[y,c]}var Ime={kernelName:bl,backendName:"webgpu",kernelFunc:kme},Sme=class{constructor(e){this.variableNames=["Image","Transforms"],this.uniforms="interpolationModeId : i32, fillModeId : i32, fillValue : f32,",this.workGroupSize=[64,1,1],this.size=!0,this.outputShape=e,this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize),this.shaderKey="transform"}getUserCode(){return`
2022-02-10 18:27:21 +01:00
// Maps a computed input coordinate onto an axis of length len according to
// uniforms.fillModeId. The host kernel encodes the fill mode as constant = 1,
// reflect = 2, wrap = 3 and nearest = 4. For ids 2, 3 and 4 the result is
// clamped to [0, len - 1]; any other id returns the coordinate unchanged.
fn mapCoord(outCoord : f32, len : f32) -> f32{
var inCoord = outCoord;
// Fill mode 2 (reflect).
if(uniforms.fillModeId == 2) {
if (inCoord < 0.0) {
// An axis with at most one element has only coordinate 0.
if (len <= 1.0) {
inCoord = 0.0;
} else {
// sz2 is twice the axis length; coordinates are shifted by whole multiples
// of it.
let sz2 = 2.0 * len;
if (inCoord < sz2) {
inCoord = sz2 * f32(i32(f32(-inCoord / sz2))) +
inCoord;
}
if (inCoord < -len) {
inCoord = inCoord + sz2;
} else {
inCoord = -inCoord - 1.0;
}
}
} else if (inCoord > len - 1.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
let sz2 = 2.0 * len;
inCoord = inCoord - sz2 * f32(i32(f32(inCoord / sz2)));
// Values left in the upper half [len, sz2) are flipped back into the axis.
if (inCoord >= len) {
inCoord = sz2 - inCoord - 1.0;
}
}
}
return clamp(inCoord, 0.0, len - 1.0);
// Fill mode 3 (wrap).
} else if (uniforms.fillModeId == 3) {
if (inCoord < 0.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
let sz = len - 1.0;
inCoord = inCoord + len * (f32(i32(f32(-inCoord / sz))) + 1.0);
}
} else if (inCoord > len - 1.0) {
if (len <= 1.0) {
inCoord = 0.0;
} else {
let sz = len - 1.0;
inCoord = inCoord - len * f32(i32(f32(inCoord / sz)));
}
}
return clamp(inCoord, 0.0, len - 1.0);
// Fill mode 4 (nearest): clamp to the closest valid coordinate.
} else if (uniforms.fillModeId == 4) {
return clamp(outCoord, 0.0, len - 1.0);
}
// Any other fill mode: the coordinate is returned as is, and out-of-range
// positions are handled by the caller's read.
return outCoord;
}
// Reads one channel of the image at (coordY, coordX). Coordinates that fall
// outside the image rows or columns yield uniforms.fillValue instead.
fn readWithFillValue(batch : i32, coordY : i32, coordX : i32,
channel : i32) -> f32 {
let rowInside = 0 <= coordY && coordY < uniforms.imageShape[1];
let colInside = 0 <= coordX && coordX < uniforms.imageShape[2];
if (!(rowInside && colInside)) {
return uniforms.fillValue;
}
return getImage(batch, coordY, coordX, channel);
}
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// Transform body: one output element per invocation.
if (index < uniforms.size) {
let coords = getCoordsFromIndex(index);
var outputValue : f32;
// Output coordinates are read as (batch, y, x, channel).
let batch = coords[0];
let x = coords[2];
let y = coords[1];
let channel = coords[3];
let xf = f32(x);
let yf = f32(y);
// Eight coefficients per batch entry, used below as the rows (a1 a2 a3),
// (b1 b2 b3) and (c1 c2 1) of a projective mapping.
let a1 = getTransforms(batch, 0);
let a2 = getTransforms(batch, 1);
let a3 = getTransforms(batch, 2);
let b1 = getTransforms(batch, 3);
let b2 = getTransforms(batch, 4);
let b3 = getTransforms(batch, 5);
let c1 = getTransforms(batch, 6);
let c2 = getTransforms(batch, 7);
let projection = c1 * xf + c2 * yf + 1.0;
// A zero denominator has no source position, so the fill value is written.
if (projection == 0.0) {
outputValue = uniforms.fillValue;
} else {
// Source position for this output pixel, then adjusted per fill mode.
let inX = (a1 * xf + a2 * yf + a3) / projection;
let inY = (b1 * xf + b2 * yf + b3) / projection;
let mapX = mapCoord(inX, f32(uniforms.imageShape[2]));
let mapY = mapCoord(inY, f32(uniforms.imageShape[1]));
// Interpolation mode 1 is nearest neighbour (the host passes 1 for "nearest"
// and 2 otherwise); every other value takes the bilinear branch.
if (uniforms.interpolationModeId == 1) {
let coordY = i32(round(mapY));
let coordX = i32(round(mapX));
outputValue = readWithFillValue(batch, coordY, coordX,
channel);
} else {
// Bilinear: blend the four surrounding pixels, first along x on the floor
// and ceil rows, then along y.
let yFloor = floor(mapY);
let xFloor = floor(mapX);
let yCeil = yFloor + 1.0;
let xCeil = xFloor + 1.0;
let valueYFloor = (xCeil - mapX) *
readWithFillValue(batch, i32(yFloor), i32(xFloor), channel) +
(mapX - xFloor) *
readWithFillValue(batch, i32(yFloor), i32(xCeil), channel);
let valueYCeil = (xCeil - mapX) *
readWithFillValue(batch, i32(yCeil), i32(xFloor), channel) +
(mapX - xFloor) *
readWithFillValue(batch, i32(yCeil), i32(xCeil), channel);
outputValue = (yCeil - mapY) * valueYFloor +
(mapY - yFloor) * valueYCeil;
}
}
setOutputAtIndex(index, outputValue);
}
}
2022-04-14 17:47:08 +02:00
`}};function Tme(e){let{inputs:t,backend:r,attrs:n}=e,{image:a,transforms:s}=t,{interpolation:i,fillMode:o,fillValue:l,outputShape:u}=n,[d,h,p,c]=a.shape,[f,m]=u!=null?u:[h,p],g=[d,f,m,c],y=new Sme(g),A=i==="nearest"?1:2,x;switch(o){case"constant":x=1;break;case"reflect":x=2;break;case"wrap":x=3;break;case"nearest":x=4;break;default:x=1;break}let b=[{type:"int32",data:[A]},{type:"int32",data:[x]},{type:"float32",data:[l]}];return r.runWebGPUProgram(y,[a,s],"float32",b)}var Nme={kernelName:vl,backendName:"webgpu",kernelFunc:Tme};function Cme(e){let{inputs:t,backend:r,attrs:n}=e,{value:a}=t,{axis:s}=n;s<0&&(s+=a.shape.length);let i=a,o=i.shape.length,l=a.shape[s],u=new Array(o-1),d=0;for(let m=0;m<o;m++)m!==s&&(u[d++]=i.shape[m]);let h=[],p=new Array(o).fill(0),c=i.shape.slice();c[s]=1;let f=new Array(l);for(let m=0;m<f.length;m++){p[s]=m;let g=Ed({inputs:{x:i},backend:r,attrs:{begin:p,size:c}}),y=qe({inputs:{x:g},backend:r,attrs:{shape:u}});f[m]=y,h.push(g)}return h.forEach(m=>r.disposeData(m.dataId)),f}var Eme={kernelName:wl,backendName:"webgpu",kernelFunc:Cme},Rme=[tpe,Dpe,Bpe,Upe,Xpe,Ype,Qpe,the,ihe,dhe,hhe,ghe,spe,bhe,Che,Fhe,Phe,zhe,Lhe,Vhe,Ghe,Xhe,Yhe,Qhe,ece,tce,nce,sce,oce,cce,uce,pce,gce,Ace,bce,kce,Tce,Cce,Rce,ape,Ahe,Fce,Pce,zce,Dce,Bce,Vce,Uce,jce,qce,Xce,Yce,Qce,tfe,jhe,nfe,sfe,ofe,ohe,ufe,pfe,cfe,mfe,yfe,xfe,vfe,lhe,wfe,Ife,Tfe,Qde,Efe,Ffe,Pfe,zfe,Lfe,Vfe,Gfe,Hfe,Kfe,ahe,hme,fme,Yfe,Qfe,rme,ame,ime,ome,ume,Xfe,qhe,gme,bme,Ime,Nme,qpe,Eme,lfe];for(let e of Rme)Gn(e);var Mme=class{constructor(e){this.device=e,this.numUsedBuffers=0,this.numFreeBuffers=0,this.freeBuffers=new Map,this.usedBuffers=new Map,this.numBytesUsed=0,this.numBytesAllocated=0}acquireUploadBuffer(e,t){return this.acquireBuffer(e,t,!0)}acquireBuffer(e,t,r=!1){let n=uw(e,t);if(this.freeBuffers.has(n)||this.freeBuffers.set(n,[]),this.usedBuffers.has(n)||this.usedBuffers.set(n,[]),this.numBytesUsed+=e,this.numUsedBuffers++,this.freeBuffers.get(n).length>0){this.numFreeBuffers--;let 
s=this.freeBuffers.get(n).shift();return this.usedBuffers.get(n).push(s),s}this.numBytesAllocated+=e;let a=this.device.createBuffer({mappedAtCreation:r,size:e,usage:t});return this.usedBuffers.get(n).push(a),a}releaseBuffer(e,t,r){if(this.freeBuffers.size===0)return;let n=uw(t,r);this.freeBuffers.has(n)||this.freeBuffers.set(n,[]),this.freeBuffers.get(n).push(e),this.numFreeBuffers++,this.numUsedBuffers--;let a=this.usedBuffers.get(n),s=a.indexOf(e);if(s<0)throw new Error("Cannot release a buffer that was never provided by this buffer manager");a.splice(s,1),this.numBytesUsed-=t}releaseUploadBuffer(e,t,r){e.mapAsync(GPUMapMode.WRITE).then(()=>{this.releaseBuffer(e,t,r)},n=>{})}getNumUsedBuffers(){return this.numUsedBuffers}getNumFreeBuffers(){return this.numFreeBuffers}dispose(){this.freeBuffers.forEach((e,t)=>{e.forEach(r=>{r.destroy()})}),this.usedBuffers.forEach((e,t)=>{e.forEach(r=>{r.destroy()})}),this.freeBuffers=new Map,this.usedBuffers=new Map,this.numUsedBuffers=0,this.numFreeBuffers=0,this.numBytesUsed=0,this.numBytesAllocated=0}};function uw(e,t){return`${e}_${t}`}var Z8=class{constructor(){this.outputShape=[0],this.variableNames=[],this.workGroupSize=[256,1,1],this.lastUniformData=[],this.inputTexture=null,this.layout=null,this.lastPixelSize={width:0,height:0},this.disposed=!1,this.shaderKey="fromPixels",this.useImport=!1}updateOutputShape(e){w.arraysEqual(this.outputShape,e)||(this.outputShape=e,this.workPerThread=e[2],this.dispatchLayout=Xe(this.outputShape),this.dispatch=Oe(this.dispatchLayout,this.outputShape,this.workGroupSize,[this.workPerThread,1,1]))}makeFromPixelsSource(){let e=this.useImport?"textureLoad(src, vec2<i32>(coords.yx));":"textureLoad(src, vec2<i32>(coords.yx), 0)";return`
2022-02-10 18:27:21 +01:00
// Source pixels at binding 1 of group 0: an external texture when useImport
// is set, otherwise a regular 2D float texture.
@binding(1) @group(0) var src: ${this.useImport?"texture_external":"texture_2d<f32>"};
2022-04-01 15:13:32 +02:00
${tt()}
2022-02-10 18:27:21 +01:00
// fromPixels body: each invocation handles one pixel and writes numChannels
// consecutive output values starting at flatIndexBase.
let flatIndexBase = index * uniforms.numChannels;
for (var i = 0; i < uniforms.numChannels; i = i + 1) {
let flatIndex = flatIndexBase + i;
if (flatIndex < uniforms.size) {
// The texel is addressed with the first two output coordinates swapped
// (coords.yx) in the interpolated textureLoad call.
let coords = getCoordsFromIndex(flatIndexBase);
let values = ${e};
2022-04-01 15:12:04 +02:00
result[flatIndex] = i32(floor(255.0 * values[i]));
2022-02-10 18:27:21 +01:00
}
}
}
2022-04-14 17:47:08 +02:00
`}getUserCode(){return this.makeFromPixelsSource()}setPipeline(e){this.pipeline=e}setUniform(e,t){if(!this.uniform){let r=e.createBuffer({size:t.length*4,usage:GPUBufferUsage.UNIFORM|GPUBufferUsage.COPY_DST});this.uniform=r}!t||t.length===this.lastUniformData.length&&t.every((r,n)=>r===this.lastUniformData[n])||(e.queue.writeBuffer(this.uniform,0,new Uint32Array(t)),this.lastUniformData=t)}makeInputTexture(e,t,r){return(!this.inputTexture||this.lastPixelSize.width!==t||this.lastPixelSize.height!==r)&&(this.inputTexture&&this.inputTexture.destroy(),this.inputTexture=e.createTexture({size:[t,r],format:"rgba8unorm",usage:GPUTextureUsage.COPY_DST|GPUTextureUsage.RENDER_ATTACHMENT|GPUTextureUsage.TEXTURE_BINDING}),this.lastPixelSize.width=t,this.lastPixelSize.height=r),this.inputTexture}dispose(){this.disposed||(this.uniform&&this.uniform.destroy(),this.inputTexture&&this.inputTexture.destroy(),this.disposed=!0)}getLayout(e){return this.layout===null&&(this.layout=this.createTextureLayout(e)),this.layout}createTextureLayout(e){let t=[];t.push({binding:0,visibility:GPUShaderStage.COMPUTE,buffer:{type:"storage"}}),t.push({binding:1,visibility:GPUShaderStage.COMPUTE,texture:{}}),t.push({binding:2,visibility:GPUShaderStage.COMPUTE,buffer:{}});let r=e.createBindGroupLayout({entries:t}),n=e.createPipelineLayout({bindGroupLayouts:[r]});return{bindGroupLayout:r,pipelineLayout:n}}},Fme=class extends Z8{constructor(){super(...arguments),this.layout=null,this.useImport=!0}getUserCode(){return this.makeFromPixelsSource()}getLayout(e){return this.layout===null&&(this.layout=this.createTextureImportLayout(e)),this.layout}createTextureImportLayout(e){let t=[];t.push({binding:0,visibility:GPUShaderStage.COMPUTE,buffer:{type:"storage"}}),t.push({binding:1,visibility:GPUShaderStage.COMPUTE,externalTexture:{}}),t.push({binding:2,visibility:GPUShaderStage.COMPUTE,buffer:{}});let 
r=e.createBindGroupLayout({entries:t}),n=e.createPipelineLayout({bindGroupLayouts:[r]});return{bindGroupLayout:r,pipelineLayout:n}}},$me=Y().getNumber("WEBGPU_CPU_HANDOFF_SIZE_THRESHOLD"),dw=(e,t)=>{let r=e.limits.maxComputeWorkgroupsPerDimension,n=t.dispatchLayout,a=t.dispatch;if(a.every(i=>i<=r))return a;w.assert(a[0]>r&&n.y===void 0&&n.z===void 0,()=>"Dispatch size exceeds WebGPU limits in Y or Z dimension.");let s=Math.ceil(Math.sqrt(a[0]));return s>r?(s=Math.ceil(Math.cbrt(a[0])),w.assert(s<=r,()=>"Total dispatch size exceeds WebGPU maximum."),[s,s,s]):[s,s,1]},Y8=class extends Fu{constructor(e,t=!1){if(super(),this.commandQueueOwnedIds=new WeakSet,this.tensorDisposalQueue=[],this.uniformDisposalQueue=[],this.stagingDisposalQueue=[],this.disposed=!1,this.uploadWaitMs=0,this.downloadWaitMs=0,this.dispatchNumberInEncoder=0,!bb())throw new Error("WebGPU is not supported on this device");this.layoutCache={},this.pipelineCache={},this.device=e,this.queue=e.queue,this.currentCommandEncoder=null,this.currentComputePass=null,this.supportTimeQuery=t,this.bufferManager=new Mme(this.device),this.tensorMap=new qp(this,br()),this.supportTimeQuery&&(this.querySet=this.device.createQuerySet({type:"timestamp",count:2})),Y().getBool("WEBGPU_USE_PROFILE_TOOL")&&(this.dummyCanvas=document.createElement("canvas"),this.dummyCanvas.width=1,this.dummyCanvas.height=1,this.dummyContext=this.dummyCanvas.getContext("webgpu"),this.dummyContext.configure({device:e,format:"bgra8unorm"}),document.body.appendChild(this.dummyCanvas))}nextDataId(){return Y8.nextDataId++}floatPrecision(){return 32}defaultGpuBufferUsage(){return 
GPUBufferUsage.STORAGE|GPUBufferUsage.COPY_SRC|GPUBufferUsage.COPY_DST}flushDisposalQueue(){this.tensorDisposalQueue.forEach(e=>{this.maybeReleaseBuffer(e),this.tensorMap.delete(e)}),this.uniformDisposalQueue.forEach(e=>this.bufferManager.releaseBuffer(e.buffer,e.byteSize,e.usage)),this.stagingDisposalQueue.forEach(e=>this.bufferManager.releaseUploadBuffer(e.buffer,e.byteSize,e.usage)),this.tensorDisposalQueue=[],this.uniformDisposalQueue=[],this.stagingDisposalQueue=[]}disposeData(e,t=!1){if(this.tensorMap.has(e)){let r=this.tensorMap.get(e);if(r.refCount--,!t&&r.refCount>
2022-04-01 15:13:32 +02:00
${n.shape}`);if(a.shape.length!==1)throw new Error(`Input shape should be a vector but received shape
2022-04-14 17:47:08 +02:00
${a.shape}`);if(s.shape.length!==1)throw new Error(`Target shape should be a vector but received shape ${s.shape}`);let i=t.dataIdMap.get(n.dataId).id,o=t.dataIdMap.get(a.dataId).id,l=t.dataIdMap.get(s.dataId).id,u=n.shape[0],d=w.sizeFromShape(s.shape),h=t.makeOutput([u,d],n.dtype),p=t.dataIdMap.get(h.dataId).id,c=t.makeOutput([d],s.dtype),f=t.dataIdMap.get(c.dataId).id,m=t.makeOutput([3],"int32"),g=t.dataIdMap.get(m.dataId).id;qT(i,o,l,u,p,f,g);let y=t.readSync(m.dataId),A;switch(y[0]){case 0:{A=N.getSparseReshapeMultipleNegativeOneOutputDimErrorMessage(y[1],y[2]);break}case 1:{A=N.getSparseReshapeNegativeOutputDimErrorMessage(y[1],y[2]);break}case 2:A=N.getSparseReshapeEmptyTensorZeroOutputDimErrorMessage();break;case 3:{let x=Array.from(t.readSync(a.dataId)),b=Array.from(t.readSync(c.dataId));A=N.getSparseReshapeInputOutputMultipleErrorMessage(x,b);break}case 4:{let x=Array.from(t.readSync(a.dataId)),b=Array.from(t.readSync(c.dataId));A=N.getSparseReshapeInputOutputMismatchErrorMessage(x,b);break}default:A=""}if(t.disposeData(m.dataId),A)throw t.disposeData(h.dataId),t.disposeData(c.dataId),new Error(A);return[h,c]}var pye={kernelName:id,backendName:"wasm",setupFunc:uye,kernelFunc:dye},KT;function XT(e){KT=e.wasm.cwrap("SparseSegmentReduction",null,["number","number","number","number","number","number","number","number","number"])}function ZT(e,t){let{backend:r,inputs:n}=e,{data:a,indices:s,segmentIds:i}=n,o=s.shape[0],l=r.readSync(i.dataId,o-1,o)[0],u=o>0?l+1:0;if(u<0)throw new Error(N.getSparseSegmentReductionNegativeSegmentIdsErrorMessage());let d=a.shape.slice();d[0]=u;let h=r.dataIdMap.get(a.dataId).id,p=r.dataIdMap.get(s.dataId).id,c=r.dataIdMap.get(i.dataId).id,f=r.makeOutput(d,a.dtype),m=r.dataIdMap.get(f.dataId).id,g=r.makeOutput([4],"int32"),y=r.dataIdMap.get(g.dataId).id;KT(h,Vt[a.dtype],a.shape[0],p,c,m,y,t,0);let A=r.readSync(g.dataId),x;switch(A[0]){case 0:{x=N.getSparseSegmentReductionNegativeSegmentIdsErrorMessage();break}case 
1:{x=N.getSparseSegmentReductionNonIncreasingSegmentIdsErrorMessage();break}case 2:x=N.getSparseSegmentReductionSegmentIdOutOfRangeErrorMessage(A[1],A[2]);break;case 3:x=N.getSparseSegmentReductionIndicesOutOfRangeErrorMessage(A[1],A[2],A[3]);break;default:x=""}if(r.disposeData(g.dataId),x)throw r.disposeData(f.dataId),new Error(x);return f}function hye(e){return ZT(e,!0)}var cye={kernelName:ih,backendName:"wasm",setupFunc:XT,kernelFunc:hye};function fye(e){return ZT(e,!1)}var mye={kernelName:oh,backendName:"wasm",setupFunc:XT,kernelFunc:fye};function gye(e){let{inputs:t,attrs:r,backend:n}=e,{x:a}=t,{numOrSizeSplits:s,axis:i}=r,o=w.parseAxisParam(i,a.shape)[0],l=N.prepareSplitSize(a,s,o),u=new Array(a.shape.length).fill(0),d=a.shape.slice();return l.map(h=>{let p=[...d];p[o]=h;let c=zo({inputs:{x:a},attrs:{begin:u,size:p},backend:n});return u[o]+=h,c})}var yye={kernelName:yl,backendName:"wasm",kernelFunc:gye},Aye=Ir(Mi),xye=Ir(od),bye=!0,vye=Hr(Pi,bye),YT;function wye(e){YT=e.wasm.cwrap(Di,null,["number","number","number","number"])}function kye(e){let{backend:t,inputs:r,attrs:n}=e,{alpha:a}=n,{x:s}=r,i=t.dataIdMap.get(s.dataId).id,o=t.makeOutput(s.shape,s.dtype),l=t.dataIdMap.get(o.dataId).id;return YT(i,a,Vt[s.dtype],l),o}var Iye={kernelName:Di,backendName:"wasm",setupFunc:wye,kernelFunc:kye},JT;function Sye(e){JT=e.wasm.cwrap(Al,null,["number","array","number","array","array","array","array","array","number","number"])}function Tye(e){let{backend:t,inputs:r,attrs:n}=e,{x:a}=r,{begin:s,end:i,strides:o,beginMask:l,endMask:u,ellipsisMask:d,newAxisMask:h,shrinkAxisMask:p}=n,{finalShapeSparse:c,finalShape:f,isIdentity:m,sliceDim0:g,isSimpleSlice:y,begin:A,end:x,strides:b}=_t.sliceInfo(a.shape,s,i,o,l,u,d,h,p),v;if(m)v=en({inputs:{x:a},backend:t,attrs:{shape:f}});else if(g||y){w.assert(a.shape.length>=1,()=>`Input must have rank at least 1, got: ${a.shape.length}`);let 
S=_t.computeOutShape(A,x,b),T=zo({inputs:{x:a},backend:t,attrs:{begin:A,size:S}});v=en({inputs:{x:T},backend:t,attrs:{shape:f}}),t.disposeData(T.dataId)}else{let S=t.makeOutput(c,"float32"),T=t.dataIdMap.get(
");return}console.error(text)}function threadAlert(){var text=Array.prototype.slice.call(arguments).join(" ");postMessage({cmd:"alert",text:text,threadId:Module["_pthread_self"]()})}var err=threadPrintErr;self.alert=threadAlert;Module["instantiateWasm"]=((info,receiveInstance)=>{var instance=new WebAssembly.Instance(Module["wasmModule"],info);receiveInstance(instance);Module["wasmModule"]=null;return instance.exports});self.onmessage=(e=>{try{if(e.data.cmd==="load"){Module["wasmModule"]=e.data.wasmModule;Module["wasmMemory"]=e.data.wasmMemory;Module["buffer"]=Module["wasmMemory"].buffer;Module["ENVIRONMENT_IS_PTHREAD"]=true;if(typeof e.data.urlOrBlob==="string"){importScripts(e.data.urlOrBlob)}else{var objectUrl=URL.createObjectURL(e.data.urlOrBlob);importScripts(objectUrl);URL.revokeObjectURL(objectUrl)}WasmBackendModuleThreadedSimd(Module).then(function(instance){Module=instance})}else if(e.data.cmd==="run"){Module["__performance_now_clock_drift"]=performance.now()-e.data.time;Module["__emscripten_thread_init"](e.data.threadInfoStruct,0,0,1);Module["establishStackSpace"]();Module["PThread"].receiveObjectTransfer(e.data);Module["PThread"].threadInit();try{var result=Module["invokeEntryPoint"](e.data.start_routine,e.data.arg);if(Module["keepRuntimeAlive"]()){Module["PThread"].setExitStatus(result)}else{Module["__emscripten_thread_exit"](result)}}catch(ex){if(ex!="unwind"){if(ex instanceof Module["ExitStatus"]){if(Module["keepRuntimeAlive"]()){}else{Module["__emscripten_thread_exit"](ex.status)}}else{throw ex}}}}else if(e.data.cmd==="cancel"){if(Module["_pthread_self"]()){Module["__emscripten_thread_exit"](-1)}}else if(e.data.target==="setimmediate"){}else if(e.data.cmd==="processThreadQueue"){if(Module["_pthread_self"]()){Module["_emscripten_current_thread_process_queued_calls"]()}}else if(e.data.cmd==="processProxyingQueue"){if(Module["_pthread_self"]()){Module["_emscripten_proxy_execute_queue"](e.data.queue)}}else{err("worker.js received unknown command 
"+e.data.cmd);err(e.data)}}catch(ex){err("worker.js onmessage() captured an uncaught exception: "+ex);if(ex&&ex.stack)err(ex.stack);if(Module["__emscripten_thread_crashed"]){Module["__emscripten_thread_crashed"]()}throw ex}});`,Zye=Oo(iR()),nN=class extends Fu{constructor(e){super(),this.wasm=e,this.dataIdNextNumber=1,this.wasm.tfjs.initWithThreadsCount(aN),i2=this.wasm.tfjs.getThreadsCount(),this.dataIdMap=new qp(this,br())}write(e,t,r){let n={id:this.dataIdNextNumber++};return this.move(n,e,t,r,1),n}numDataIds(){return this.dataIdMap.numDataIds()}async time(e){let t=w.now();return e(),{kernelMs:w.now()-t}}move(e,t,r,n,a){let s=this.dataIdNextNumber++;if(n==="string"){let u=t;this.dataIdMap.set(e,{id:s,stringBytes:u,shape:r,dtype:n,memoryOffset:null,refCount:a});return}let i=w.sizeFromShape(r),o=i*w.bytesPerElement(n),l=this.wasm._malloc(o);this.dataIdMap.set(e,{id:s,memoryOffset:l,shape:r,dtype:n,refCount:a}),this.wasm.tfjs.registerTensor(s,i,l),t!=null&&this.wasm.HEAPU8.set(new Uint8Array(t.buffer,t.byteOffset,o),l)}async read(e){return this.readSync(e)}readSync(e,t,r){let{memoryOffset:n,dtype:a,shape:s,stringBytes:i}=this.dataIdMap.get(e);if(a==="string")return(t==null||t===0)&&(r==null||r>=i.length)?i:i.slice(t,r);t=t||0,r=r||w.sizeFromShape(s);let o=w.bytesPerElement(a),l=this.wasm.HEAPU8.slice(n+t*o,n+r*o);return Qye(l.buffer,a)}disposeData(e,t=!1){if(this.dataIdMap.has(e)){let r=this.dataIdMap.get(e);if(r.refCount--,!t&&r.refCount>0)return!1;this.wasm._free(r.memoryOffset),this.wasm.tfjs.disposeData(r.id),this.dataIdMap.delete(e)}return!0}refCount(e){return this.dataIdMap.has(e)?this.dataIdMap.get(e).refCount:0}incRef(e){let t=this.dataIdMap.get(e);t!=null&&t.refCount++}floatPrecision(){return 32}getMemoryOffset(e){return this.dataIdMap.get(e).memoryOffset}dispose(){this.wasm.tfjs.dispose(),"PThread"in this.wasm&&this.wasm.PThread.terminateAllThreads(),this.wasm=null}memory(){return{unreliable:!1}}makeOutput(e,t,r){let 
n;if(r==null)n=this.write(null,e,t);else{let a=this.dataIdNextNumber++;n={id:a},this.dataIdMap.set(n,{id:a,memoryOffset:r,shape:e,dtype:t,refCou
2022-02-10 18:27:21 +01:00
// Vertex shader: forwards the texture coordinate and emits the vertex
// position, with its y component multiplied by flipY.
precision highp float;
attribute vec2 pos;
attribute vec2 uv;
varying vec2 vUv;
uniform float flipY;
void main(void) {
vUv = uv;
gl_Position = vec4(pos.x, pos.y*flipY, 0.0, 1.);
}
2022-04-14 17:47:08 +02:00
`;var iN=`
2022-02-10 18:27:21 +01:00
// Colour matrix filter (alpha-aware variant).
// m holds a 4x5 matrix in row order: every output channel is a weighted sum of
// the sampled r, g, b, a values plus the constant stored in the fifth column.
precision highp float;
varying vec2 vUv;
uniform sampler2D texture;
uniform float m[20];
void main(void) {
  vec4 src = texture2D(texture, vUv);
  // one matrix row per output channel, evaluated left to right
  float red   = m[0]  * src.r + m[1]  * src.g + m[2]  * src.b + m[3]  * src.a + m[4];
  float green = m[5]  * src.r + m[6]  * src.g + m[7]  * src.b + m[8]  * src.a + m[9];
  float blue  = m[10] * src.r + m[11] * src.g + m[12] * src.b + m[13] * src.a + m[14];
  float alpha = m[15] * src.r + m[16] * src.g + m[17] * src.b + m[18] * src.a + m[19];
  gl_FragColor = vec4(red, green, blue, alpha);
}
2022-04-14 17:47:08 +02:00
`,oN=`
2022-02-10 18:27:21 +01:00
// Colour matrix filter (variant that leaves alpha untouched).
// Only the r, g, b weights and the constant of the first three matrix rows are
// read: m[3], m[8], m[13] and the whole fourth row are ignored here.
precision highp float;
varying vec2 vUv;
uniform sampler2D texture;
uniform float m[20];
void main(void) {
  vec4 src = texture2D(texture, vUv);
  float red   = m[0]  * src.r + m[1]  * src.g + m[2]  * src.b + m[4];
  float green = m[5]  * src.r + m[6]  * src.g + m[7]  * src.b + m[9];
  float blue  = m[10] * src.r + m[11] * src.g + m[12] * src.b + m[14];
  // alpha is copied straight from the sampled texel
  gl_FragColor = vec4(red, green, blue, src.a);
}
2022-04-14 17:47:08 +02:00
`,lN=`
2022-02-10 18:27:21 +01:00
// Pixelate filter: every fragment samples the texture at the origin of the
// size-wide cell that contains its own coordinate.
precision highp float;
varying vec2 vUv;
uniform vec2 size;
uniform sampler2D texture;
// snap a coordinate down to the nearest multiple of the cell extent
vec2 pixelate(vec2 point, vec2 cell) {
  vec2 index = floor(point / cell);
  return index * cell;
}
void main(void) {
  vec2 snapped = pixelate(vUv, size);
  gl_FragColor = vec4(0.0) + texture2D(texture, snapped);
}
2022-04-14 17:47:08 +02:00
`,uN=`
2022-02-10 18:27:21 +01:00
// Blur filter: 15 weighted taps taken along the direction given by px,
// seven on each side of the centre, with weights mirrored around the centre tap.
// NOTE(review): presumably the host runs this once per axis with px set accordingly - confirm.
precision highp float;
varying vec2 vUv;
uniform sampler2D texture;
uniform vec2 px;
void main(void) {
  vec4 sum = vec4(0.0);
  // taps before the centre, farthest first
  sum += texture2D(texture, vUv + (-7.0 * px)) * 0.0044299121055113265;
  sum += texture2D(texture, vUv + (-6.0 * px)) * 0.00895781211794;
  sum += texture2D(texture, vUv + (-5.0 * px)) * 0.0215963866053;
  sum += texture2D(texture, vUv + (-4.0 * px)) * 0.0443683338718;
  sum += texture2D(texture, vUv + (-3.0 * px)) * 0.0776744219933;
  sum += texture2D(texture, vUv + (-2.0 * px)) * 0.115876621105;
  sum += texture2D(texture, vUv + (-1.0 * px)) * 0.147308056121;
  // centre tap
  sum += texture2D(texture, vUv) * 0.159576912161;
  // taps after the centre, nearest first
  sum += texture2D(texture, vUv + (1.0 * px)) * 0.147308056121;
  sum += texture2D(texture, vUv + (2.0 * px)) * 0.115876621105;
  sum += texture2D(texture, vUv + (3.0 * px)) * 0.0776744219933;
  sum += texture2D(texture, vUv + (4.0 * px)) * 0.0443683338718;
  sum += texture2D(texture, vUv + (5.0 * px)) * 0.0215963866053;
  sum += texture2D(texture, vUv + (6.0 * px)) * 0.00895781211794;
  sum += texture2D(texture, vUv + (7.0 * px)) * 0.0044299121055113265;
  gl_FragColor = sum;
}
2022-04-14 17:47:08 +02:00
`,dN=`
2022-02-10 18:27:21 +01:00
// 3x3 convolution filter.
// m is the kernel in row order: m[0..2] top row, m[3..5] middle row,
// m[6..8] bottom row. px is the step, in texture coordinates, that is added to
// or subtracted from vUv to reach the eight neighbouring samples.
// The alpha of the result is taken from the centre sample, not from the kernel.
precision highp float;
varying vec2 vUv;
uniform sampler2D texture;
uniform vec2 px;
uniform float m[9];
void main(void) {
vec4 c11 = texture2D(texture, vUv - px); // top left
vec4 c12 = texture2D(texture, vec2(vUv.x, vUv.y - px.y)); // top center
vec4 c13 = texture2D(texture, vec2(vUv.x + px.x, vUv.y - px.y)); // top right
vec4 c21 = texture2D(texture, vec2(vUv.x - px.x, vUv.y) ); // mid left
vec4 c22 = texture2D(texture, vUv); // mid center
vec4 c23 = texture2D(texture, vec2(vUv.x + px.x, vUv.y) ); // mid right
vec4 c31 = texture2D(texture, vec2(vUv.x - px.x, vUv.y + px.y) ); // bottom left
vec4 c32 = texture2D(texture, vec2(vUv.x, vUv.y + px.y) ); // bottom center
vec4 c33 = texture2D(texture, vUv + px ); // bottom right
// each sample is paired with the kernel entry at the same grid position;
// m[2] belongs to the top right sample c13 (the centre sample c22 is used
// only once, with m[4])
gl_FragColor =
c11 * m[0] + c12 * m[1] + c13 * m[2] +
c21 * m[3] + c22 * m[4] + c23 * m[5] +
c31 * m[6] + c32 * m[7] + c33 * m[8];
// keep the original opacity of the centre texel
gl_FragColor.a = c22.a;
}
2022-04-14 17:47:08 +02:00
`;var Cb=(e,t,r)=>{let n=new RegExp("\\b"+t+" \\w+ (\\w+)","ig");e.replace(n,(a,s)=>(r[s]=0,a))},Eb=class{constructor(t,r,n){fe(this,"uniform",{});fe(this,"attribute",{});fe(this,"gl");fe(this,"id");fe(this,"compile",(t,r)=>{let n=this.gl.createShader(r);return n?(this.gl.shaderSource(n,t),this.gl.compileShader(n),this.gl.getShaderParameter(n,this.gl.COMPILE_STATUS)?n:(ie(`filter: gl compile failed: ${this.gl.getShaderInfoLog(n)}`),null)):(ie("filter: could not create shader"),null)});this.gl=t;let a=this.compile(r,this.gl.VERTEX_SHADER),s=this.compile(n,this.gl.FRAGMENT_SHADER);if(this.id=this.gl.createProgram(),!(!a||!s)){if(!this.id){ie("filter: could not create webgl program");return}if(this.gl.attachShader(this.id,a),this.gl.attachShader(this.id,s),this.gl.linkProgram(this.id),!this.gl.getProgramParameter(this.id,this.gl.LINK_STATUS)){ie(`filter: gl link failed: ${this.gl.getProgramInfoLog(this.id)}`);return}this.gl.useProgram(this.id),Cb(r,"attribute",this.attribute);for(let i in this.attribute)this.attribute[i]=this.gl.getAttribLocation(this.id,i);Cb(r,"uniform",this.uniform),Cb(n,"uniform",this.uniform);for(let i in this.uniform)this.uniform[i]=this.gl.getUniformLocation(this.id,i)}}};function pN(){let e=0,t=null,r=!1,n=-1,a=[null,null],s=[],i=null,o=null,l=qr(100,100),u={},d={INTERMEDIATE:1},h=l.getContext("webgl");if(!h){ie("filter: cannot get webgl context");return}this.gl=h;function p(A,x){if(!(A===l.width&&x===l.height)){if(l.width=A,l.height=x,!i){let b=new Float32Array([-1,-1,0,1,1,-1,1,1,-1,1,0,0,-1,1,0,0,1,-1,1,1,1,1,1,0]);i=h.createBuffer(),h.bindBuffer(h.ARRAY_BUFFER,i),h.bufferData(h.ARRAY_BUFFER,b,h.STATIC_DRAW),h.pixelStorei(h.UNPACK_PREMULTIPLY_ALPHA_WEBGL,!0)}h.viewport(0,0,l.width,l.height),a=[null,null]}}function c(A,x){let b=h.createFramebuffer();h.bindFramebuffer(h.FRAMEBUFFER,b);let v=h.createRenderbuffer();h.bindRenderbuffer(h.RENDERBUFFER,v);let S=h.createTexture();return 
h.bindTexture(h.TEXTURE_2D,S),h.texImage2D(h.TEXTURE_2D,0,h.RGBA,A,x,0,h.RGBA,h.UNSIGNED_BYTE,null),h.texParameteri(h.TEXTURE_2D,h.TEXTURE_MAG_FILTER,h.LINEAR),h.texParameteri(h.TEXTURE_2D,h.TEXTURE_MIN_FILTER,h.LINEAR),h.texParameteri(h.TEXTURE_2D,h.TEXTURE_WRAP_S,h.CLAMP_TO_EDGE),h.texParameteri(h.TEXTURE_2D,h.TEXTURE_WRAP_T,h.CLAMP_TO_EDGE),h.framebufferTexture2D(h.FRAMEBUFFER,h.COLOR_ATTACHMENT0,h.TEXTURE_2D,S,0),h.bindTexture(h.TEXTURE_2D,null),h.bindFramebuffer(h.FRAMEBUFFER,null),{fbo:b,texture:S}}function f(A){return a[A]=a[A]||c(l.width,l.height),a[A]}function m(A=0){if(!o)return;let x=null,b=null,v=!1;e===0?x=t:x=f(n).texture||null,e++,r&&!(A&d.INTERMEDIATE)?(b=null,v=e%2===0):(n=(n+1)%2,b=f(n).fbo||null),h.bindTexture(h.TEXTURE_2D,x),h.bindFramebuffer(h.FRAMEBUFFER,b),h.uniform1f(o.uniform.flipY,v?-1:1),h.drawArrays(h.TRIANGLES,0,6)}function g(A){if(u[A])return o=u[A],h.useProgram((o?o.id:null)||null),o;if(o=new Eb(h,sN,A),!o)return ie("filter: could not get webgl program"),null;let x=Float32Array.BYTES_PER_ELEMENT,b=4*x;return h.enableVertexAttribArray(o.attribute.pos),h.vertexAttribPointer(o.attribute.pos,2,h.FLOAT,!1,b,0*x),h.enableVertexAttribArray(o.attribute.uv),h.vertexAttribPointer(o.attribute.uv,2,h.FLOAT,!1,b,2*x),u[A]=o,o}let y={colorMatrix:A=>{let x=new Float32Array(A);x[4]/=255,x[9]/=255,x[14]/=255,x[19]/=255;let b=x[18]===1&&x[3]===0&&x[8]===0&&x[13]===0&&x[15]===0&&x[16]===0&&x[17]===0&&x[19]===0?oN:iN,v=g(b);!v||(h.uniform1fv(v.uniform.m,x),m())},brightness:A=>{let x=(A||0)+1;y.colorMatrix([x,0,0,0,0,0,x,0,0,0,0,0,x,0,0,0,0,0,1,0])},saturation:A=>{let x=(A||0)*2/3+1,b=(x-1)*-.5;y.colorMatrix([x,b,b,0,0,b,x,b,0,0,b,b,x,0,0,0,0,0,1,0])},desaturate:()=>{y.saturation(-1)},contrast:A=>{let x=(A||0)+1,b=-128*(x-1);y.colorMatrix([x,0,0,0,b,0,x,0,0,b,0,0,x,0,b,0,0,0,1,0])},negative:()=>{y.contrast(-2)},hue:A=>{A=(A||0)/180*Math.PI;let 
x=Math.cos(A),b=Math.sin(A),v=.213,S=.715,T=.072;y.colorMatrix([v+x*(1-v)+b*-v,S+x*-S+b*-S,T+x*-T+b*(1-T),0,0,v+x*-v+b*.143,S+x*(1-S)+b*.14,T+x*-T+b*-.283,0,0,v+x*-v+b*-(1-v),S+x*-S+b*S,T+x*(1-T)+b*T,0,0,0,0,0,1,0])},desaturateLuminance:()=>{y.colorMatrix([.2764723,.929708
2022-04-01 15:13:32 +02:00
M ${d.box[0]+d.box[2]/2} ${d.box[1]}
2022-02-10 18:27:21 +01:00
C
2022-04-01 15:13:32 +02:00
${h} ${d.box[1]},
${h} ${d.box[1]+d.box[3]},
${d.box[0]+d.box[2]/2} ${d.box[1]+d.box[3]}
2022-02-10 18:27:21 +01:00
`),f=new Path2D(`
2022-04-01 15:13:32 +02:00
M ${d.box[0]} ${d.box[1]+d.box[3]/2}
2022-02-10 18:27:21 +01:00
C
2022-04-01 15:13:32 +02:00
${d.box[0]} ${p},
${d.box[0]+d.box[2]} ${p},
${d.box[0]+d.box[2]} ${d.box[1]+d.box[3]/2}
2022-04-14 17:47:08 +02:00
`);a.stroke(f),a.stroke(c)}if(n.drawGaze&&((o=(i=d.rotation)==null?void 0:i.gaze)==null?void 0:o.strength)&&((u=(l=d.rotation)==null?void 0:l.gaze)==null?void 0:u.bearing)&&d.annotations.leftEyeIris&&d.annotations.rightEyeIris&&d.annotations.leftEyeIris[0]&&d.annotations.rightEyeIris[0]){a.strokeStyle="pink",a.fillStyle="pink";let h=[d.annotations.leftEyeIris[0][0]+Math.sin(d.rotation.gaze.bearing)*d.rotation.gaze.strength*d.box[3],d.annotations.leftEyeIris[0][1]+Math.cos(d.rotation.gaze.bearing)*d.rotation.gaze.strength*d.box[2]];q5(a,[d.annotations.leftEyeIris[0][0],d.annotations.leftEyeIris[0][1]],[h[0],h[1]],4);let p=[d.annotations.rightEyeIris[0][0]+Math.sin(d.rotation.gaze.bearing)*d.rotation.gaze.strength*d.box[3],d.annotations.rightEyeIris[0][1]+Math.cos(d.rotation.gaze.bearing)*d.rotation.gaze.strength*d.box[2]];q5(a,[d.annotations.rightEyeIris[0][0],d.annotations.rightEyeIris[0][1]],[p[0],p[1]],4)}}}}}async function qd(e,t,r){var s;let n=Ut(xr,r);if(!t||!e)return;let a=On(e);if(!!a){a.lineJoin="round";for(let i=0;i<t.length;i++){if(a.strokeStyle=n.color,a.fillStyle=n.color,a.lineWidth=n.lineWidth,a.font=n.font,n.drawBoxes&&t[i].box&&((s=t[i].box)==null?void 0:s.length)===4&&(Va(a,t[i].box[0],t[i].box[1],t[i].box[2],t[i].box[3],n),n.drawLabels&&(n.shadowColor&&n.shadowColor!==""&&(a.fillStyle=n.shadowColor,a.fillText(`body ${100*t[i].score}%`,t[i].box[0]+3,1+t[i].box[1]+n.lineHeight,t[i].box[2])),a.fillStyle=n.labelColor,a.fillText(`body ${100*t[i].score}%`,t[i].box[0]+2,0+t[i].box[1]+n.lineHeight,t[i].box[2]))),n.drawPoints&&t[i].keypoints)for(let o=0;o<t[i].keypoints.length;o++)!t[i].keypoints[o].score||t[i].keypoints[o].score===0||(a.fillStyle=n.useDepth&&t[i].keypoints[o].position[2]?Wa(t[i].keypoints[o].position[2]||0):n.color,jl(a,t[i].keypoints[o].position[0],t[i].keypoints[o].position[1],0,n));if(n.drawLabels&&t[i].keypoints){a.font=n.font;for(let o of 
t[i].keypoints)!o.score||o.score===0||(a.fillStyle=n.useDepth&&o.position[2]?Wa(o.position[2]):n.color,a.fillText(`${o.part} ${Math.trunc(100*o.score)}%`,o.position[0]+4,o.position[1]+4))}if(n.drawPolygons&&t[i].keypoints&&t[i].annotations)for(let o of Object.values(t[i].annotations))for(let l of o)E9(a,l,n)}}}async function Kd(e,t,r){let n=Ut(xr,r);if(!t||!e)return;let a=On(e);if(!!a){a.lineJoin="round",a.font=n.font;for(let s of t){if(n.drawBoxes&&(a.strokeStyle=n.color,a.fillStyle=n.color,Va(a,s.box[0],s.box[1],s.box[2],s.box[3],n),n.drawLabels&&(n.shadowColor&&n.shadowColor!==""&&(a.fillStyle=n.shadowColor,a.fillText(`hand:${Math.trunc(100*s.score)}%`,s.box[0]+3,1+s.box[1]+n.lineHeight,s.box[2])),a.fillStyle=n.labelColor,a.fillText(`hand:${Math.trunc(100*s.score)}%`,s.box[0]+2,0+s.box[1]+n.lineHeight,s.box[2])),a.stroke()),n.drawPoints&&s.keypoints&&s.keypoints.length>0)for(let i of s.keypoints)a.fillStyle=n.useDepth?Wa(i[2]||0):n.color,jl(a,i[0],i[1],0,n);if(n.drawLabels&&s.annotations){let i=(o,l)=>{if(!o||o.length===0||!o[0])return;let u=o[o.length-1][2]||0;a.fillStyle=n.useDepth?Wa(u):n.color,a.fillText(l,o[o.length-1][0]+4,o[o.length-1][1]+4)};a.font=n.font,i(s.annotations.index,"index"),i(s.annotations.middle,"middle"),i(s.annotations.ring,"ring"),i(s.annotations.pinky,"pinky"),i(s.annotations.thumb,"thumb"),i(s.annotations.palm,"palm")}if(n.drawPolygons&&s.annotations){let i=o=>{if(!(!o||o.length===0||!o[0]))for(let l=0;l<o.length;l++){a.beginPath();let u=o[l][2]||0;a.strokeStyle=n.useDepth?Wa(l*u):n.color,a.moveTo(o[l>0?l-1:0][0],o[l>0?l-1:0][1]),a.lineTo(o[l][0],o[l][1]),a.stroke()}};a.lineWidth=n.lineWidth,i(s.annotations.index),i(s.annotations.middle),i(s.annotations.ring),i(s.annotations.pinky),i(s.annotations.thumb)}}}}async function Xd(e,t,r){let n=Ut(xr,r);if(!t||!e)return;let a=On(e);if(!!a){a.lineJoin="round",a.font=n.font;for(let s of 
t)if(n.drawBoxes){if(a.strokeStyle=n.color,a.fillStyle=n.color,Va(a,s.box[0],s.box[1],s.box[2],s.box[3],n),n.drawLabels){let i=`${s.label} ${Math.round(100*s.score)}%`;n.shadowColor&&n.shadowColor!==""&&(a.fillStyle=n.shadowColor,a.fillText(i,s.box[0]+3,1+s.box[1]+n.lineHeight,s.box[2])),a.fil
2022-02-10 18:27:21 +01:00
/9j/4AAQSkZJRgABAQEAYABgAAD/4QBoRXhpZgAATU0AKgAAAAgABAEaAAUAAAABAAAAPgEbAAUA
AAABAAAARgEoAAMAAAABAAIAAAExAAIAAAARAAAATgAAAAAAAABgAAAAAQAAAGAAAAABcGFpbnQu
bmV0IDQuMi4xMwAA/9sAQwAGBAUGBQQGBgUGBwcGCAoQCgoJCQoUDg8MEBcUGBgXFBYWGh0lHxob
IxwWFiAsICMmJykqKRkfLTAtKDAlKCko/9sAQwEHBwcKCAoTCgoTKBoWGigoKCgoKCgoKCgoKCgo
KCgoKCgoKCgoKCgoKCgoKCgoKCgoKCgoKCgoKCgoKCgoKCgo/8AAEQgBAAEAAwEhAAIRAQMRAf/E
AB8AAAEFAQEBAQEBAAAAAAAAAAABAgMEBQYHCAkKC//EALUQAAIBAwMCBAMFBQQEAAABfQECAwAE
EQUSITFBBhNRYQcicRQygZGhCCNCscEVUtHwJDNicoIJChYXGBkaJSYnKCkqNDU2Nzg5OkNERUZH
SElKU1RVVldYWVpjZGVmZ2hpanN0dXZ3eHl6g4SFhoeIiYqSk5SVlpeYmZqio6Slpqeoqaqys7S1
tre4ubrCw8TFxsfIycrS09TV1tfY2drh4uPk5ebn6Onq8fLz9PX29/j5+v/EAB8BAAMBAQEBAQEB
AQEAAAAAAAABAgMEBQYHCAkKC//EALURAAIBAgQEAwQHBQQEAAECdwABAgMRBAUhMQYSQVEHYXET
IjKBCBRCkaGxwQkjM1LwFWJy0QoWJDThJfEXGBkaJicoKSo1Njc4OTpDREVGR0hJSlNUVVZXWFla
Y2RlZmdoaWpzdHV2d3h5eoKDhIWGh4iJipKTlJWWl5iZmqKjpKWmp6ipqrKztLW2t7i5usLDxMXG
x8jJytLT1NXW19jZ2uLj5OXm5+jp6vLz9PX29/j5+v/aAAwDAQACEQMRAD8A+qaKACigApGOKAML
Xp8xlF5A7V4X8RtYs7PzfNImnx8sa8Kp9z3q2tEgp6angWs62ZZ5CTGoJ6DArGNz5p+UrID6EUrF
PUlW1EuN0XNW7PQ2L5j3JnoKXN0KijqNP0eYoqXBdgPuuo+ZPeupisWn2Jd4+0r924XgsQOCff3/
AJ1FzRKxDqGii6m3siiQ8F1XGfXI6YNWLfRbiRQMkcZI9fpTDluT2/h6Qy8gDPbtmtG38JeY480Z
5zSLUTZg8M28YwYxjAArXtdPt402qgHbpSaLWhma3o0Uqk7Nx9DWLaaVblgPs6qRyds2M/gRSQp9
zZOni2iWS2hlQ+kjYz9OMGrdjq89vIPPVhj+8M/lQyDq9P1WOYBlMZz1AOD+VdDaTiReOKulK0jO
tHmi0WDTlr0TyxRVhT8tJjIX+9SUxHXUV553BRQAVBcPhSBTSuxPY86+IGti0s5I7dsORy9fM3i6
8e8mfDO5P90ZrWWiJicNPpZZtxV/xrW0jQt4DOv6Vk2dEEdTY6BHuB25rpbPSo0QARjP0qTRI17W
wA/hFaMWmoQMgflQXYsDS142rU9tpqqenfNA7GgtihxkdKuRW6qMY/GkDZY8sY4Ap4hXbyB+VArk
EtuH4wPyrk/EGkOm+a3jw3suRQLc5i38SX9hJ9nnY+XnBUdPyNdFY6pa3KkkAE9l6f8AfJ/pSJT6
GhDmI+Zb4ZRycdv6ium0nUhKFydrelTsNnS2829RnrVgV6NKXNG55lWPLIM81Op+WrZkRMfmNNzT
A7GivPO4KKAEY4XNYWt3vkwPg4OK0giJdjw/xrqhm87Zs8tc7pX5A+leSajf6aHYJ50kn4AZpTep
rBWRm2Vobm4BXfyehPFdnpmnBFUY5rI2SN63tlToK0YI+KZpFF+3QdavwoKTLtoW0Toaswpk5pCb
LCxipAhoIuP2dKevHXoaYDylRyxhlwRQI4nxVoCXWZI1GfpXGtbSWjYPGP73+NIGupt6TqMsLruZ
ih4xnP5V09mQ+JLd8gn0xSYJnVaVdkook69K34zuUGunDS3Rx4qOzHVIp4rrOMY3NJQI7GivPO8K
KAILt9kZrz3xlebYiu8KCCWb0XvW0NFch6ysfO3jLVjfXLIn+pQkKorl7WxNxIPl71g2dUUdpo+l
pBGvHPet23iC8ihFosrxirkHQUFo0IF4FXI1O726CpKLacCrMJoJLYHAPpTwucHpSRJJ5e4AZI9x
UqpxzVpCuOC8cUpQUMRnXttuB4rjNdsYyeVwfXpmpGmcvcQyafMCFJjPY10eg34BUg4DcZP8jUO4
HaRq3lLNF+IHet7R7jz7c56rwa2wz9+xhiVeFy/T1PFegeaNPWigDsc0ZrzzvDNIaAM7VpNqdegr
xL4l6kywyRhseZ19lrdfAZL4jxYg3Fw20d63tJsdrDI5rm3Z3R0R0Mce1eKnQYAplIkWrMJ45oZS
NO3PHbNXIyfpSGWowSOasxLUiZdjFSqtNEMkUemKlAGKsRJjAppFAiORMjmsTVrNZEO4cfSoZSOD
1eJ7WXBUzQZ+7nkfSo7e2Ei+ZaMzxntjBX2NSU1Y6/wxqojiEFzkA8KTXYaUoWRyv3W5rSjpNHPX
+BmpSg8V6J5gUUAdhRXnneFFAGHrTfu5PpXzj8S70/aZtxzztXFbv4DKHxHI+H4GZiz9zxXXW8G3
GBXMjvLRXAx0oPGPSmMVeOnWrMTYpFI0bcg1fh54xmgovRcD3qxETSIZcRvzp+/BpEkqsBUqsM9K
q4Em4Gkxk0yRGXrVW6i8yFhkg+tJjRxGsWrxllkUMh9eK5uMz6bcebbnfG33kPcVkay2OntPKuo0
nhXI67c8qa7Lw3c+adjcEDGK1paSRhVV4s6A0or0jyRRQ1AHX0V553hRQBz+vNtt5z3xXzX8Qbdm
uic5YnOMdK3l8JnTXvlbwpYl+WySOgrp5YfLOOB9O1c62O7qQkc+9RsKChFPWp4DluOlSykaNruH
ArUgHShFNF2NT1qxGO3NBmyxGcE1N2560CFzjrUysO9JAPDDjFOVuKoQuSRTWouBkazbCa3cd8cV
wF7IISQccHBzUSWpV9C3o1x5b5GAjdQD1rs9DjC3kckbEhqKfxIzn8LOupRXqnkPccBSkUAzraK8
87wooA5rxMSI3HqK8B8bQl9Q8sffY5b/AAraXwkUviNrw9pH2W1ViMMRTdRjw4HpWNtDti9TPc4P
FQs2M5qdyyMHLcfjV63HTAoBGtap0wK0YxigpsuRDtVhVYd6GQydVwwIqdRnqKCR23I5pCMUW6gD
YNKuetAEise9KTxQBWuFyhrznxNZkXjFeN3I+tTIZg2OqmzmxNF0PO3vXp/g2+hukVl4zyPanTXv
JmVR+60dpThXpnlPceopWFAbnV0V553hSGgRynjC5FujOey14Ssp1HxNmTnc+a3kvcIpv37HoEYQ
QmMdVHSsnVbYJF5jVk0dsNzlruVIsl2wKxbjWrVHILjg1CRbZJb+ILHPzyhfStODWLQgFJFYd+el
UJM27HUIXxhga1Y5lLVLKLkMnoauxnPPrSEx7ShF+Y/n2qrc6xBbhizDAqkK1zJuvG9nbg8ZA681
ly/Ei052RO3uKAsZlx8QGd8xxvt9Aa1NH8dK7AXMcip64zigdkdrZX8F7EJLdwwNXMkrz1qRMRly
CK4TxmpidWI49felPYSOMmi80NIoOV6qRzXYeA5SskYPfirpfEjGr8LPWVHyD6U4CvQPL3ZItOYc
UDOoNFeed4Uhpks4H4iE/Z5MeleMeGULeLgjds10S+BGdL+Jc9OSBU2Huc5Nc74yvUtrcDBrJnZF
63PJdXvLy/lKWw46bvQVz82jXhkLO5Y+9ZlsYthcRnbIjY9R3q3awTRkEM3WmJI6C0ea3dGRsr1x
XY6TqW9FLHnjrUs0izpLK5DDjofSta3ckH09KRUkZuuTvFGdvPauE1Y3U6Mqbssf/rUxHPTaJPK2
ZmJPbBqzY6DCZh5xJC9s9aBJHU6dpemJjfEmfetJtI0+VPkUr/unFOxdiextHs33W07YHQHk11mk
Xb3KbZ1xIvcd6LEyWho4Nct41sTPYb16ipexCPPZN+wYGCvH1rrPAEJmvkPoc1VL4kZVvgZ6yFwK
cBXoHkkqinFaVyzo80GuE7WJRQSziPiGdthK5HQV4x4J/wBI8WPIewNdEvgRNL42emO/yj1UHNef
eNpRczbC+I17DvWT2OqJxc0sMK4TCisy41q0hfEkqj8aixdwTXNOlwvmqD9anS9tXH7uVG+hosO4
/wC0oOhrR0+6G4YNIEzsNEuCxAPNdjZruA4xxUmjINSjURksOlcbqFykbnjFA1sYGoassaknCqO5
rl7rxhGm7yBnBxuJq0rkSlYpw+NLlsfd5P8AerVsvHEqSBHwPVgcgVpyMyVXU3rXxcHYETAk+hru
/DWti6ZSTyOKzZqndHaxvvUGq2rQ+dYyqR24qWI8dvbr7LqDxyDAzXpvw6FvIxePGSM06Xxoyr/A
zviKFHNegeX1J41zUhXioGbuaSuM6wpCaBHG/EcA6HN/exxXjXw2jL67cv8A3Qa6H8CFR+NnoWpO
I4XI44rxLxrqjQzSEsQM1gdSPM9U1uR1YbmWIdXHf2rmpIb67YS28UrRlsLI3c/jW0VZGUpO5pW1
jfLNOjahawzwReYI5cjzMkDavHJ5/SrVv9uhtPtVxCPLBwzxnlT9KGghLU3tKvvPjHzbl7EGuisJ
GRxWLOg7nRXJEbDjmvSNK+aFSfSoZr0KutRkphc4NcRrdkVjL9aVio7Hk3iqS8ubhrWzUlsZY9kG
cZNc5D4aee5MclzJIFTzHAO0MfatqSOWu7bFS1srDUZEis0vIZoUxPvfcC+4/dx2xjr712XiTwXb
WmlQ6hol3cRhoFd4rlg3zY5wR0GelavQwjq7GD4etdVvSnk2wAB+9v8A8mvcfA2kXiRo0/UdcDis
ZnTTulqeoWqbUAJqWUb42X1FZlnjfjSwlGrr5S/eNdD4RkvLAAQ4yRyaUZcruVKl7TQ9I0G+mnzH
ckFwM8VuIK7ac3KF2eXiKapz5UWYxipNtMyNejNch0jSar3cjR27uoyQCRVRWom9DxTx54gu5fMi
lbKdMVjfCZPNlv5v9rFbVHpYqjGzbOn8SzFI9o715L4u0r7arYzk+lYdTqSujy7U/C0u4vHk+WwO
xuh9q3J9dgvbdVukMV1EwbDDgn04rZMwlHoZ+orZ6hfQ3RWVnQYCgZAq+8U0ln5NtBsV2yxYcfgK
JtW0CnB31LlroVwJ1nQLGDjeP7w+lb0dsFxjrWB0tHS6NuWPJ6A16ToUm63T3Gallr4S7cxiTjrX
PaxaF7dlVeSMUhxZ5jd+H7qCa4eF3DSE5x3zXN3Wk6jbyeaiFWUY6ZyPStYS5SalPmVipFbX0E4c
W0alvmPHJrag0rVvEE6LdljGpG2NRtQD+tW5XMI0uU9M8NeFo9PiQhecDIIrtrOMIoG3H4VlJm9t
C6CB06VPGM1IHLeItGS6uw+ORT7e3jsbQvj7gzUNam0JaWE+HN7NqOqX80n3FO1RXo8YzXdS+BHk
4z+KyzGPapcU2YIv7qQtiuaxvcaWqG4O6FwfSrS1JbPnrxoxkv7qIfejcitj4V2f2exumI+8+aKn
xHTT+G5d8Txlm4rjLxMsQwzWT3OiK0Mm6sEkVsAcjFc1d+FEmlGwEDPQVopaEuOpr6f4ZWNAu3tW
vHpAj5ZQcUFIWaDjGMVUMQ3cVDBmvbhY7QAV2nh+T/R1yeKhlrY31+b61FcQK6nIoJMi401WblRi
qr6PCw5UYq9y+YgOgWzNkRrx3xWjp+nx2v3FQcelAbmko9anQ4GBUNisPHWr1qMrQhS2K11HvmYV
hamcxSRZ5xRIqluS/DKAQQXZxyXrvo2FdlL4EeZjH+/ZbjNSZpswLNBrE1Gt7VE4ODVIlnh/j61F
j4lmeTGyUbq6LwdEqWbeX0YbhSqfEddP4Bddj4JIrhL5d8h7VjI6oLQqKNzelWre3yc4/ClFjaL6
wqBxxUUxwCKu5BmXRA6c+9ZjP83FSBoQuPs4BrsNBlUW659KmRrDY6G1lyQtW3Hy0lqQ1qVJnAbm
oy3b9KYJCqRj3o4zRctIlhjLHmpSuOBRbQOpLGpPFaES7UqkZzKN1KsEc87/AHUUmvPLTVGv72aQ
k7WJwKmRrQ3ud74Ltilgz4++2a6iNDXdS0gjyMU71my7GpqTbxSbMki3SViajTTHqkSeR/GeyZmg
nQHkEE1S+F+oPPavBL96I4/Cia1udVF+4dVrkW+Fq8+v4tjMDWUkdVJ6WM0cNV+F+MVmjUcZgqnP
1qpNNnkcVRLiZtxIS1UzzIF7mghlxUZpVQdq6nTVdAoAOKzkbQWhvwM6gMM1twOJYx3NOJE11Kt1
H1/pVVlwBkk+9NocXoOQ45FPj+fkUJFF2NSB700v/hTEty5ZpkjvVyUgcCq6GM9zC14/8Se6GcZQ
1574Xs5WkI2HBPHFQ1dm1KSSZ7Rotn9l0+KPHIHNacae1dy0Vjxaj5ptlhVp+2s2CJ9ppCKzuWNx
zSFc1SYrHNeNdIGpaYw25ZeRXmvheyk0jVpEdcLJ0q3ZxNKTa0O3vQHg/DNcHrsJDmsmjspnNzNt
fFIJ24GazOhC+azDmgZIOOKBsp3J2qSaZodubq58yQ4QAnmhGT3NO18pb7BORmu205LfYpyKVkWp
Oxr5gKYWoIZWgfGfloFq1qTPLubnGO1RPtxg4P0oBAkY/hBz6VNDDkZ6AU0W2WSdqkdKr9ZOaGSj
VtcLHmnOcgmmYvcz7mBLy3MbdD1q9ouiRK6bUAVeelOC1InPlidSsWMDFOCEdq3uefykqrinYqGy
rFvApMVka2DAowKAsMkRXQqwyDXn/iWyitNQ3qPl6itIvRoF8RXinW4tQ6HI6GuW8SIVBPalc6qe
5x9x97r3qruwTjrWZ0ksZ9TUmcDNAmZ9/wAoao63rR0+w22MLPtAzt6mghmfofiB76LdJBJBIp5D
d/oa7bSdWLIPnpDi9TM8TeKdas51XTbIyxd3J/pXS+E/EFxqNoFu7do5OmD60maHWrnZyDRkn/69
MlEyOR0xntVoNx+FUgYjPxg4FLCuWDZyKQr2RoRnP0qO+nEFpJITgAUzLqZnhu6+0rknOTXpOmwJ
Fbrt5yMmnHYyr6Oxb2ijaKLnPYMClwKQWK3n0hn+lachHOJ9pNNN0apQFzsY10a4v4hXQh0xpieQ
MA1XLZNjhK80cT8OdV+3Wl3A7ZZJCw+hrR1qLcjZ/CsbnfHRnFXseHJArOYYbrUs1uPhYbuatqFP
ByfSkMq3UIINYkto+87Tx6GkSxfsDbflGD7CtTw/pk4nzITtPIFMFudsukh4Rxz71paTpKwP5jcn
0qTRy0NORMDgVCqewoJTJgAoxjntTiTu7fWmFxAcnn1q3EPl+X8KZMi4gKqB1Peob/Tv7Us5bfeU
yOoq4R5nYxqT5I8xieH9J1DTbvyJELRg8ODwa9Ms5mSFV9BWiptbnNVrKdmif7Q1KLg96XIZc5Is
pNL5pqeUrmMtZs0jzV08phchaY00zH1p2ZNxjS1g+LdJOt6U9ssmxjyGp2urDjLlaZzng/wUPDqz
TSTmWeTrjpVjVk3Rvjr2rnqQ5dDvo1XUd2cTqSNk9OKxXGCeKxZ1DAxHTr2q5C/y8GokUhsz54qu
uCxzSQjQ0+FZblR2ro4bZYiMVQ0dBb7Qi5x0qzuG5QOh71LYErDufpSeWrHnimIXbjkUjLkH1Hem
gGxryc+tXI19KYmWegq9YLiLJ7mtqS945cS7QsWehqxA9dEjz4krPSxyZqbFFhGxUm6smjRM55Lk
HvSvNxXTY57kLT+9MNwKdhXGm5FIbkU7Bca1wMEVhaiuQcVhXWiZ14R6tHGanGBI2OtYkqEHjgVy
s9ErEeo6UBsHipKEZs5qpPdRxcbhx70NCSuybTNWihc5brW9Fq6vjMnFSdEIdDRi8RRKygZbHFbu
m6nb3RA3gMegNJhOm0jbXGOoxTuCc1Rz3FyoGKawz9KaAVcZqeMgCmIkB4FaUTbYwB6V00Fuzixb
0SFMuDU8Mlbs4UPeXHeiOXkUrDuXYnyKk3cVk0ap6HMxxketSMhrcwRC0dMMZFMQ3yzSeVQAeUaz
9Vj8uPd271nVV4m+GdpnHX67pCeKyLtBtNcR6xlk9RVeWTb3qRnO6trgttyIfm71z7ai8j7/AJmN
DNqUVa5Yi1AnjynHuBV+11YJhWWXcP8AZNSzqgmaEerSsf3NtIQP4mGKtRavdRgMIpVI9KjU0a7n
R6T43uYQI7qN2Tpkqciu503VVuQGAYZHQjFVc4alPlZrpKGAznpTwxOc9+lWjIlUACnM4XApiLNk
nmvnsK0NvpXZRVonmYqV52GsmanhXitTmFkSiJTSAvwrxUxXIrJ7miOfjf1pzNWxkRlqYWpgJupu
6gQbuahvIxPA6eo4pNXVioS5WmefakGhndH4INZs5DJXA10PaTurmLO21uKpSZqGMoXGnRzBiyjd
9Kx5rcQS428fSkjanLoaOliHGZFB56VswW+mtPufcBsGOAfmxz+tFkd8HpoaUx09FAtFY8DO71qb
Sms/Nb7RbecG6AEjFLS5c78t+p0djpVs9wsyQiJAdyr1rW+zqjErzSe559Sbk9S3C+MA1bjbgE1S
MSXzMVG0vNUI2tPKrAuCMnrVzNd0PhR49W/O2xrHmp4TxVMzQshpIzzQBehqesnuaI5VGzT2bitz
FEbNTC1ADS1JupgG6l3UAc14s04yR/aYRll+8BXCtLncDXFWjys9TCz5oW7GddH5qqNzWDOgQnC8
VSuo1kHzAGkPYopEY2+RWxV23Vzj5G/Kg3jWaNazhZuqNXS6TaKhB2c0jR1nJWOlhOxRxU4YkCgx
Y0OQatQyDbyaaFYe8uF4NY3iC9ltbVGj43NTIL3h7WzMihjzXVQXYYDdW9Cf2WcOJpfaRZ3g9KsQ
mupnCLIabGeaAL0LcVY3cVmzRHIxtUhetzEjZqjLUAIWpN1ArhupwagAfDKQ3Q1594v0c2bm6tx+
5Y8j+6ayrR5onThp8s7dzkZjuqAAmuBnqC7c0iwgtzSA0rWzjfGRW3ZadDu4AoNYo2rfS4v7orSh
05UA2r0pDbsTm29KRottBNyJ0wpJ9KhD7f6U0ikNWffIFBz60zVUW52ow4UcUN6EPcx44WsbgOmd
ua7TT5Bd24KHnFKnLlZFSN4koluLdueRWvp14swweG9DXoxldHlTjYtzGoo25qzEvwtUxas2jRPQ
5CNqkLVsYoYzUzdQA3dSFqBBmnqaBhuqhriCXTpVIzxUz+Fl03aSPI9QTypW2/dz0qKNw3SvOPZR
Mqin8VLKRcs3O4Cuk0w/MDjt1NBtHY6O2IIHY1pxgFaETIRwMkjtVSUEk4570MlFW5bap6dKzWm8
1tqH8aY+hp2FvGoGayNevVt7/ap4xzUvYjqTLtvLPcvJxSaVcyWsxTnFZlnT2t15xHmCtOBYwQy4
B9q7cPO+jPPxFO2qLEj5HWo42+aus4HpoX4W4FTF+KlotbHII9SFuK0MUNZqiLUDE3UbqBBupwag
Bc1DefPbyD/ZND2KjujyPWlKzuPesRZjHJXms9lMuw3StjnmphKDSLTJ7OfE3JrpbO4GQc9qlnRA
3LO82k5NbFvdADkjBoCSHyXIIIzgVQvdRigT7wzjgUzO1jHknlvG7qnp61etYFQDIpCZoqVijzXn
3iC8EmsOuaCGb/heR/s0ijkVv6fbxy3QMg5xmsnuX0Ldzut3+UYTPWk+2GJSe+M1pFtamcldalmx
1eO4XaThhWnC+TXqR2PHqL3maUJ4qRjxSEjj42qXdxVmaGs1MJoATfSbqBAG5p6mgAzTJTmNvpQU
tzzHXY83D/U1zF5FhjgV5r3Pa6FMsV5HWnLe7RhqBRdmTwagN2d2K2rPU1C5LAnPrUs6Iysbdrq6
f3gK0BrUKj/WClY05iM6xLOcQAj3NT29uznfKSzHuadzNu7NSBFjHNSm5VO9IRnajqoWMhTzXFtA
bvUfMduSeg702Qz0rS7FbTToQFwzjJqaGTFyfK5PQViyzUuFmuIdgGABya5u/vTaN5cnUHFUmLoZ
zyskwlgJweSK6zQdUEwVJeGr0aUrxPLxEfe0OrhPAqVjxWhznGRtUwatDK4jNxURbmkAm6jNABup
6tQAFqhupNtu59qUnZFwV5JHnWsHdIx96w5lz15rzT2uhRmt85xWbcxMnUGmZlB0bdxmrNvFIcfM
350mWjbs7YkDJY/jW5ZWW4jikWkdNp9mqYJFaJdEHHakUULu/VB1rLn1Ld/FgetMGYd/qWSQmSa0
/AemS32pfa7piLeLkg9z6UmQtz0W7uQ2cZx0A9BVzR7cAea6j2rPqX0L99KRat5A6Dk1wOoKZ52a
YfMORTYRLujiGWEq6/NWza2yKQVHNdOHerRy4laJo6TTnbbtb8KuM3Fdh5z3OJjbmpt3FaMxAtUZ
agBN1GaQBzTwaAAms3VbjERUGsa07RsdeFpuUuY4jUjljWTKK4j02RE4IpJYFk6imQkVl0xWarsO
mAEcUi0bNnZBR0rWtoguMCkUi21wI161mXuocEKaYXMS4u+pY/hVCSWSY4HT0pEmlouiSahdpEBl
mOceleiwWcNjClvHgJH97Hc1EmVFFi3Czy7mwIl/WtJbjP7uLgd/apQ2VNVvtsBhiPzdK5S4nAuR
nqOCaTGi9pcytPlU+XpmumtWII44rah8ZjiNIXRuWeNvvViQ/LXpJWPJbu7nCRvVkNxVsxBmqJmo
EPiXca0YLMuOlJsuKuPlsSi5IrNuG8s4HWs5VEkbwoOTKsk+FJY4rC1K53k1xTk5O7PSpwVNWRzt
4cms+WpKICtSLTETQj5q0YeBSGiys23pUguGxQMq3E59ayrm4x3yaAKiRtO2WPHcmhruKFxFajzZ
ScA44qRHoXhuMaLpxaUg6hcDLMf4F9KlhuDeXGASIl+8azZslYma68y48m1+7nFW5rtbRNhb5z1p
iMKbUg0zuW4A4rPgb7VdKXOMmpA7HRbMS7nUYiUda0lkQOBngVrS+JGdbWLRt2bAx5BqeQ/LXpnj
PQ4GJ+ashuK0MhWaoWcA0AaOmASMK7jRNPWYBmHyiuepO2x10qfcv6vYxCzYqoGK4HVYVTJrmb5l
c6oaM5TUJ8EgGsG4kLNUHT0M64OaqMMikSRsuKbnFMRLG3zVehOaGNE445NNlnVFpDMu6uie9Vo1
8z5mOAOST2pDK91cNN+5tsrH3PrW54a06KxT7fdrlh/q1Pc+tJ6IUdZGvHPLezMcnBOWbsPap5r3
ylFtbdT1xUWNWzU0/Zbwlgfmx8zGsHWtRHmMqE59aAMyNifvHPc1f0gtPdqkY5JosJHeNci2tktY
2022-04-14 17:47:08 +02:00
euPnNY+oXWZEVJNrZ9aun8SIq/CzodHuriIokhDIR1ronbKZr0o6o8ipoz//2Q==`,pg=`
2022-02-10 18:27:21 +01:00
/9j/4AAQSkZJRgABAQAAAQABAAD/2wBDAAsICAoIBwsKCQoNDAsNERwSEQ8PESIZGhQcKSQrKigk
JyctMkA3LTA9MCcnOEw5PUNFSElIKzZPVU5GVEBHSEX/2wBDAQwNDREPESESEiFFLicuRUVFRUVF
RUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUVFRUX/wAARCASwBLADASIA
AhEBAxEB/8QAGwABAAIDAQEAAAAAAAAAAAAAAAEDAgQFBgf/xABDEAEAAgECBAMECQIDBgUFAQAA
AQIDBBEFEiExE0FRBiJhcRQjMkJSgZGhsWLBJDNyFSVTY3OSNEPR4fAHFjWCokT/xAAYAQEAAwEA
AAAAAAAAAAAAAAAAAQIDBP/EACARAQEBAQADAQEBAQEBAAAAAAABAhEDITFBEjJRIhP/2gAMAwEA
AhEDEQA/APqYAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAKNTq8OkxzfNkisQC8eb1XtRNbzXT4q7eU2nu0MntRq/D8StMccvW29ZmdvgjsTyvZjxOLj
+s8WLxn8TFPXs6Oj9oct7c14rkxz22nrB2I49KOdTjelmszfmpMeUxv/AA28OqwZ4icWWtt/SUi4
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAmdo3nsPNe0Pt
Fh09Z0+DNWL7+9O/7A3eJcZppsV5raI27esvH6jX5ddM25p79Ilo59VbUZOe2Tm/PeGvfPfT2iKR
PLv1+DO678XmW/a97U6TtOyzTbTF538/T9WjTNecm9a7126tqk3rSYxY5ta1plRZqZNXGjyZcPXl
mZmsx+qjBrsuO16xM7eXRt04JrdTltk5OWJnfaWf0a2lty5MdZnfzSn+WOHiOutFpjHa9e8bQ2fp
+alYy462pk7zXbuxjPesbRS0f6ZZV1ET1tErzXFLHo+A+1ddZf6NrI8PJHa1vN6iJi0bxMTHwfOa
zhzd61v1846utwniM6DUdb3nBaNrVmd9vjC/ZVePYirBqMWppz4rxaPgtEAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAItaK1m09ojcHnvarjM8P0vh49+a/eY8ng9D
h1fGM1rxjtGPfvbzdbjuTJxHX48cTPNltM/KsS9Dw7S49Jp6UpHaGe2vjz1y9J7LYK13vHWe7bj2
ex1tvM80ekuxW3RnW3Vm6P5jRx8H0+OYmMcb+bapo8GKPdpC6bQwtdHU8JpWkdJ/JweL6e23iU67
d4dubSqyVi9Zi0bwIs68XGp36TtEq7ZJmZmevzdbifCKWtbJinkt6eTgZPFw32t+sRurbWVzxs1y
Rv6T8V1NZNPtfq0seTm+Kevr+SZuxXjvaPiV8N4viycto9HseG6+uu08W6Rkj7UPmFck1tE1nlmP
Ld3eA8V8HVVi1pjq6Ma/pnqce/ERMTETHaUrKgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAADW19+TQ5p/p2bLS4v04Zmt5VjeQeJ4bjnLqsupv+Ka1+ERLv4reTmcNxcuC
vy3l0qdI2hlr66sT02ot0ZV7qqrInruzrVZLGSZ37JjqgYTG0K5lbaFVhDT1Ub456RPweY4hixWi
eSdpjvD1eWejz3FNHWYtkpvFo9EIseb3tS3SerOms22rfpPqZKzvvHSYUz70TExG6Gdbs2rljeJ/
Mx5L0vEzPaelnOi98c9J2bFNTFpit47+a+PVUvx9T9nOIfT+GV5p3yY/ds67wvsXqpxau+G09Lx+
r3TqrEAQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADV4ljnLw3U0jvO
O0fs2lWqyUw6XLkyfYrWZkHldBEV09eveG3Fq1mI3jd4vPrOIaid8G9MP3Y38k6fNrt/rMk9Ou8s
tfXXn49rGWInuy8SO/k5Gl1E3rG/fzbOe94wTy99mbRvTrMOOvNfJWsesywniukrG/jU6fF43WYN
TmtEeJtEQ06aSmK2+bNtEd+qfSO17unF9Hmvy1y13XWyVmN4tExLxVK8PmNq5NrT58zawam+m/yc
0Xj8NpRYSvQZ7xEOdqI3rPozxayNRXe0ct/ON03jmrKB5nV4q1yTO20Obmv4c+cx8HoeI6WZpNoj
q83niYmYscU0r8aJ6T1n49zeJ+Meqm1drb9J+Kd5p136StGVem9l9TbHxLDFp7W7+sS+q1nesT6w
+PcAzVjiGHftzQ+v4f8AJpv6On8jH9ZgIAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAABp8VrW/C9TW0ztOO3b5Nxp8VmI4bn37TWYB8f1HFtTfUfR9FWJmsdZ9I7MtJxDX5s
d8ta1y0xzteaR2277rcuhycP12SceLxMeWNpjttHwlu8I0mfQ1y+D7k5YmJmY36T36Ka43z/AF1t
cI1ds+qxVj7/AEej19PCw9HJ4NoK4OIU5Y35YmZdzVTGebVZabx5jJS+Tmns81rNLm1Wrzc9rVw4
Yibbem72mXTTS0w0M3BvEta1bWrM95ie5EanY87wXgNOL6XPfxraXLhra/W28bR/dzYzarBqJxRe
bzE7Rt5vWU9n8mPHOGmS0Ypnea1naJb+k9ncNLR7u2y/WcxXO4TOoyUrN6zD0FaW5Y3hu49FiwUi
KxCvLMR0hlW0jn6ukWw3iXjOJzbDlneOj3GaN6zDzfFOH+LE7SRGo83XNSZ2lbG2/WfdlvaT2cy6
rNFInlrv1mfJ37cK4PwTTxOoidRm2+/2/KFuyMp47XB4LivXiunrH2b2iH2qn2K/J8x4fGDNxTSZ
9Nh8OviRvTyfT6xtWI+DeXs9MNZubypASqAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAOZx6/LoOWPvWiHTcf2hiZ0e8fc2mf1E5+vP/AEeuSd7RC2uKtI6QjHfeINTfwtPf
Jvty9WPfbt/lucP03gxfJf7d/wBoReYpm97zaNeLb4Ims9Nt94auDjem1Wo5PFi1onylS+1o7l8V
bxvtupjDMdNkYtXS1+Stt+m63xImEJ4xjHER2ZxMUjeUTO3VRmydBbjLJqPi08mbeVOXJPq1sl5Q
Vbkz9+rRy35rxHqzmZlVEe/Ez5LRlW5iyfR6zffaIjq1OSNZps2a21rZInafSPJhxGMl9LStLRWM
lorM/A4dkrWbYfLZC2W/7K6eubX6b4RzT+W76K8b7G6X62cu3Sten59nsm3j+OXz3/0ANGIAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA0OIYfpOHPijvNNo+fdvtXJO18k/
/OwPFYbz2ls3jx8VqW6xMdWPEdP9D4lkx/dt79flLLHbkxTPwY6nt2512ORTRzE2x4/dpE7cvkme
E4IrW3hRMxO8THRtU1FKWtvtvK2upx22rzRCtXkqzh2jtF7ZbT122b01ndnpuWuP3Z3+Ky20qDVv
fauzVy3mejZzNK8dVjqi87KLRLYtXruqvXzkQp7Qoid88R6rcl+WGlW0/Sa22mfhCZOq2x082ix6
jkm822pO8VrPdr4dNObVeDo8XW3uzMbzK+mvxT7szE27cvnu9j7PcNjSaXx8mOIzZevbrEeic5tN
+SZnpt8J4fHD9HXHO3PPW0x/DeBtJxx29vaAJQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAKNRim9Z5e89Nl4DzXtVh5babURHrSf7f3ec1+qnDorWrvvt5Pccb0n0zhmWk
Rvevv1+cPE2rGTFNZU26PFfxwa5dVkjelI2772nZnX6bbrEUq3o0d678u8wmuDL2ittvVjXdneeK
cGv4jpJ6U56+kS7+j118+GLXpakzHaWlp9NNY3tv+bbiYiNoQy1y30uyZJlrWmZnuym6q1iIJnop
yW2Te8bdWnnypQqzZOadokiIpSZntWN5lrxki19vNRxrUeBwnNNd+fJEY6/OejXLn3Xe/wDp9wyn
E8uo4lqqxblv7lJ26T6vpD5X7G8QycKzeBMbzMRM1/FH/wA/h9QwZ6ajDXLitvWzRgsAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAeL45w+dDrZvWv1OWd4+E+j2jX
12jx67TWw5Y6T2nzifU+rZ1y9eHwzDYxxEy18+DJodXfT5o96vafWPVbjyxDn1OOzHudbM0rt2UW
iI69mVtRXZq5tREb9VUoy2iIlRbJ0UX1VZ6btTLrI7V6yk62M2oisT1c7JmtkttVMUyZp6x0beDS
RWOvdKijDimvWd3G9pNRMfRcNfvZOb9Hpb0itJeP47k/3hgjaZnbaP1XxWW3T0movbNS0W645nbf
0nrMPpXs3xamoxdJiLbe/X1n8Uf3fKsOTw4jbaXo+EarJhtGTHMxeJ6xH7Sti9Zaj6x3HM4NxXFx
DS1mtoi8dJrv2l011QAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AGjxLhODieOIye7kr9m8d4eM4to9RwjPXFa0ZIvG9bR0fQXmPbDFvTTZPOJmEWS/V8bs9R43NxLL
G8eFbePg1bajU5/s0l1ceKLx1hbjwRE9mOpx0y2uRTSZsm3PMw2aaKtIjo6kYo9EXpET0hVLXxYK
xC6MZvyx1lFs0RHfaPiCnU12pLyHGNDbUajBekWma2npWN3p8+opa20e9LSyZLxExTlpM+vdOdcZ
a9tPS8MyUvFrzWlI6727u1pYxYrbVmb7x+TQx6au3Nqcl7/0rcmW9axGnwZJj1novmxnZXV0fFp4
ZxLBPgTGK8xzXr5fOH0bFlpmxVyY7Rato3iYfNuG2x56Wrqa8s2jz+7Lu8O12bS6jkwzN6THNNI6
tvrN68Y4rxlx1vHa0bskAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAA4XtTTm0OKfTJ/aXdcL2pyRGjwU362yb7fkJz9eTxxyZJjyltRXzUZK7TFtl9Lbwy06YzrHwa+
fJFd/wCVt8m0bQ0eS2qzcm+1K/an+zNZFL5M1pjFXeI72ky48eGnPkvNp27+TPU6nHpMfLXaIjpE
erk5dRMxOfN1mPeisfshW1ne1a1577Y6x5R3U0zze31FOWI6ze0byU098kRlzbxM9qrMlPDpyRMR
Md5Vt/Ihp5898mWZm1pjftE91uCt7fCI7dWeHDEW3t723l6rslqxWZnasR+SYhFbzhnfxJ2jyeq9
lcGXWZcmW0zWKxHLaI7794eJx5fpfEKabT8t8l5isddo3l9S4VjrwrRUwzSJt3tav3pdOL6Y6dXD
j8HFWm+/KsU4NRXPvtWazHquWVAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAa+fXYNP9u8b+kdZBsDkZOO135cWOZn4y5Wu4xqctbe9y19Kp4njt6vi+PDm8DFMWybbzPlV
5PiGtz67UxbNbeKTtWIjaIXYpnwuaftT5tXJT3vmi1pMsrU5qIrG1V1a+5DCa7b9GFbRr5J6Wnbt
Cu+Wmk0m8956z8ZWZNorbfzcbX5rZslazPux3hUt41NTntktObJ13+zX1bek01r4/HzVm0bxPXy/
+bNfDgjVa2uOY92kdfg6ufJOKvLXtttVVSqbcta2vM7zXtHpLQy5ZtMd+vWd+7Zy3mdJHXra3f0c
vUarw7zFY5rT2hH1Lavnrgx81p3U49Pk4nE5L35MO/StfNRXR5tXnrS8W67WvfyiPSPi7uLHFK1p
jrtSsbR5Lc4RzsXBaYreP4l45esRD2HD9fnw6evvWvO3Tfr0aGk0U55ra0TFInv6uzgrXFXlx0i0
77RPlC83Yj+JW7oddqr6vHzTTw9/f6dod+L1t9m0T8pcbFSmPHER3892W0zPuz+jSbVvidkcqmfP
Sel7bekrI4n4dZnPWIrHeYnZee2Wpy8dEaml4npNZblw5qzb8M9JbYgAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAABEzFYmZnaI7yCXL1XGa0jJXT0571nbee27DiXEprp8nhbxG20W8
5cbD0ikfnKO+urTPvjoZdXqctdsmTaPSvRpWmsdZ6yztfaGplvv3lWW1tyRlz1x0vkn7Vo5atTNe
Y0+1o79V2KsZsvX7Ne5mwxnyTNvsx2iGneM/rCdRSuOsTasTt5kRFtpjqmOH4t4nk7estiMNa97R
Hwhna0iuKTEdmGWa4672nZtRele1N59Zlq6vLOSsYorEc07qcW65euzRvtXvPZy52naZ7ujr6fXV
rWdukREK8+njHgmZmPc67bq6ivVWhxxgxZLztNrT1mZ/SP4VZs0zaOvfp84WUtNsXLvtv3699+rU
z7+Jtt5qURqMnPpctaR1rMSw4ZoK57eNk6xHaJRh97Ltt7lo5Z+L1HAPZvVauZ2nFTSzMTzeJEz8
to6xPfvsZntPZ9rXxabmxzefdrv0j1dXh/BcmstW1qxTHHasR3+b0GPhGl+kWmd64dNEVjf73T7X
y8vy+Ddx6O3iRakxTH5RXrMw1/lX+3Itw2MFIraN48qRHdZi0cUjmmPen9noox1iO0fNzdXEYrTt
stcmd9aX0bJ+HePmiKTitO8TMLZ1cVjrMfqpz6ys4pjfrPRWZ9rXXptUit6zO+23VyaRHEc05L1/
w9J9ys/en1ljqdVbwYw452tlnl3jyjzbmmiMeKtYjpEbLeTXPUU8ee/+qjJpsV5rbkrFqzE1tEbT
DpYNbW21Mnu29fKWna0KbqTdjXXjld0cvQ63ltGHNPSfs2n+HUbS9c2s2UASqAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAOVxPWe99HpP8ArmP4b+r1EabT3yT3iOkesvMVtN7za07zad5l
XV5GmM9vVfEstvDx0jtaVVMlq+UJ18b5cMRvPeSuK87bUt+i2Z3PtG7zXpjkzXt6R+TXyTMzvM7t
ydHqZ+zhv1+Cv/ZuqvPTHMfOYaTMil1a1K2vHSLTELq2v+KWzThGo84rH5rq8JzedqR+ZeI7WnOS
34pYTafWXR/2Pln/AMyrKOCWnvmiPyR6O1y9585lhWJvl557Q6eo4T4dYiMvW3b3UanhldHpJtGX
e09unmjsT7eb1l4trI2t0hsZfrdNO0bzy+nzU20/+NmkzO9esz+TZxWis9dttvPv+Tn21jjaW8zn
26bTG3mp1M/Wzv3t0jyWXiKZJmsTERaZhXXDbNl8WaztWenxZLstPp5pau8frDtVrNMM5cfTfpMf
3aunxxbes9d/R09Dp8ebJi09ptFr3jtt2WyrW9wy1Jx132mK+Xq9PotT0iIU19ntLtExa3T47T+q
6nBaYvsZstZ+cT/LeMnUi0TXffo1s2m8Ws2/OIMWk5Jib5L328rS2t94Sh5TV4ppklpW6PT6rh+P
NbebTHyas8E081mZy5P2W6OFhjxNTE/hr/LoRO0Kvo9dPqctKzMxEx1la5t3tdnjnMs4noievcrO
yZjeFF1OSnNV0OG62cn1GWffj7Mz5w05joovzY7xes7TE7w0xrjPeex6Ua+j1UarBFu1o6Wj0lsN
3JfQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACrU5o0+nvlt92P3BxuM6nxNRGCs+7Tv8
2hToxm1r3m9utrTvMsonqyt7XTmcja0u3O6FMfi5t/u0/lzdJM81p9O3zdvHTwsUR5+bfPqOfX1h
dqV+3O7bs1+T31oqmI3TEM4rvCdkDGIIhlFd2daboS0NXG2bD6bufxXU1vlmu/u4us/N0+L1tTSx
kr9qk7w89j1FNZMV3jxLzvaJ8mer+LSOZqK2xZotbvljfr/89U453rXt9lse081xZtNjx7TGKu0t
DHlrevSevaN5Y6+tJ8c7VRNMt63n3ub+6/R54rERMztDYy4a5omclYmfxKcenrjtHLvtPrCnVmdb
eFe3JXmjy6eS/DrMuLVYsta9Mdt++6qLxO+0dEc8UmInr18iUfReHcXrqccb9Z27Q61Lb13eJ9nc
1Z35rTvE9avY4bTkpG8xEfB05vYxqybc07R281naGMREdoT5JQqy9mply7Q3bV3iXG1eXw7TWSka
c258t7+tpT5/BjT7MfHqndz12Z+M4lMMKyziUJJiN1WSu9fku23RaOgKNJqbaTU1t9yelo+D0cTE
xEx1iXmM1Nt3W4PqvFweDaffx9vjDbGvxz+TP66QDRiAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAOJxzU73rp6z296zsZMkYsdr2naKxvLyObNOfNfJbvad1dXkaeOdpvsc2yuZVzfbfqybutwu
s5s8R92J3dvJb3tnO4HSMegtmt3nfZvYp8SZl0z45NfSK7onH1bNcfRFqnUKJr0Y7dVtq7prjEsK
0XVpEM6028mW20IHK41aPo3J6zs4ODhdcvPnvExFevNXpMOrxi/PlrTee7PLX6Pwa09uaNlKtHg9
dM3z5d7ReOu02nu0JzZMfblrv5R5uvrcdImZ26T1mYhxs1Os7RH93PZ7axuafNfLitvbaYU3yZYt
PXs9NwHhui1HBa5LVicsb81onrEuVqNNSuS8Y67dZ6xPZa59Il9uX41vEitImZme3q2Kxbxora0T
Md/ROSa4Ztkj7c9OafL5LuGYubmyX3iu/TfbdSfVnpvZLT/XZK233+Mbbva1xRXyiPk8pwbH4N6T
adq5a71n0tD1WDL4tPe6Xr0tDpz8YVnJHWEXYxbqlBedoef4tW0XraO09HdyztSZcbUz43C+ee9b
SVMaeOfqq7+jGckQ1Yz7+7v2RN/WXPXZPjci2+2yyJaVMuy+uSJlA2d+pNoVRbeDcSxyTE+TDDlt
pdRXLTynrHrDOyiyZeVFnY9TjvXJjres71tG8MnJ4Nqt4tp7T1jrV1nRL1x2cvABKAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAHJ49qfD09cNZ97JPX5PPw2uI6j6Vrsl/ux7tfk1mWr7dOM8iLdm
vfebREefRsWldw7SxqNbWbR7lPesrn3Vteo7dYjDpMGCvfbeXQ0uLlxRLRxROfUc34p6fCHYrXlr
EejqrjY8uzCYW7MZjdVKqK9VlaxCYrsnYExBMRMJRPZA8/xPHtmpP9W2xx76vhWOInvt/C7ike7N
vwzE9kcapGfhlevTaFbFo8RqJ5vy8/RoW09ek0msxHfp3dzNoLzp4zUmZpMbT8HJyYJi20X2n0lh
ZY1li/RaidBF4w2mK3jrHaFGp1lN+tptPp5IjBkid5mIp16TKu0abBPv33vPlM7z+iPdFNcWXU5I
tkrNce/b1W5db1nTaf3ax9q0fxDW1ebNk2phty1mOu09VOm8W19orEz23j1TwfSeERFuEYMddptW
d43dvBn21eKJ75KbW+cf/JcTgMxXTb3nbljz+TpcPmc2uyZO1KRtVtGVdi0bx07qJnllsRO6rNTe
N4XVamsy8mnvPwc3R2jPwe8TPbdlxXNOPSZfhWWpwO85OFzv57qrODkzeHntSe8Sn6Rv0a3EZ218
8nXekfr1a0ZLVnqx19dWb6demXybOO7lYMvNMdW9S/VVLo0us7tPHdtUtEwJiZU3jq2Jhham8CVG
PNODNTJXvWd3qcWSubFXJWd4tG8PK3pPd1OB6veLaa89Y61/u2xfxh5c/rsgNHOAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAANLimq+i6O0xPv392rdeZ4rq/pOqnlnelOkIt5F8Z7Wj27I2I6sb25YY
V1ImY3dbQ08LRc23vZp2j5OJG+XJWle9p2h6HHtbJXFT7OOIpX+7TxT31j5rycdTh+Dpz+XaG/sw
w18PHWseULN2trBE9UcrJKBhFU7JAQi0dEomegNDUYovM7x3jb5tO1ZvpbaTLtzRExWfWPJ08kbT
Ex5NXWYYyV5omYtHWJieyeDzuizfRs19Jn6TM7Ru1uMcJxZqTkw+5f4ebqa7SV1MR4tdrx2vEfy1
axqsNOTLjnLXytVXi3Xj8+nmsxTLM16d5npPyUzpekTtSK+U7vS6vQ/SYmK1vWPS1HOn2dvvvvE/
tDO5XlcO+LbfHSd/W3o6/BdDOXPTnj3Kz38rS6Wm4FNrRyRzTH3p6RH/AKvR8L4dXSzE3jmtHn5I
mbfqLV+m4dbLSsZInHjr3iI6zLpYaxS01rHuxHRHiT9mv6s67Vj1aqL6326MrWiYa+/Q54BxPaGe
XRZpj8MquB4+Xg8zPnB7SX30to379GxpK1xcHiKz5IS8xr8PLPixH2bftLTy05o6dHYyVjLhy0t1
izjZa3pMVv3iO/qz1G2L+NbSajbNyW7xLsY8kTDz+fJXFqKZN4iZnafi6WHL0iYlStI7OO+7axW2
crFl7dW9jvE9ULN+J3ZbdFGOy+AYWpEqN7afNXLj+1Wd23KrJVMvCzseh0+auow1yU7WhY4fCdV4
OadPefcvPuz6S7jol649Tl4AJVAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAV581NPhtkvO0R+4NPi2
r8DB4dJ9+/7Q83Po2NTqLanNbLfvPaPSFDHV66sZ5ET0hRknyW2lTtMyouz0c8usx2n7s7vScKwx
zc1vu/y85p+maJh6Th+SOWeveXR4/wDLm8v+nX5mUWa9bbrInolmu5jdTNkxYFk2Isr3TuCzeGMz
+THdEyDDJO9Ja823rt2XWnya946pGvktDXta0ztWu/ybvLE9dkcoOf4GbJPWK1j49VmLh9JtE33v
Mevb9G7WsW8l1ccREISophiJ2jpDYpijbaOjOuOJ8ujOdqxsgVcsUjaETYvbaFFrgu5lVsm0yUtu
ryg43H5m+GIj1XcJzePoL4pnrWGtxmfchr8JvfHS1622if3QljzTTLes+qrNjrkiYtCzPMxnm095
YZJ6boS5teB49Tqscza97VtvWvlv8V/FOF34RrIxTM2xXjelp/eHoeA6XnzReY3ivX/0dfivDcfE
9HbDbaLx1pb0lOs+jO7K8Lis3cN+0NKcd9PmthzV5clJ2mF9J9GHHVL108dm1SznYr/Ft0tuhLb8
mNohFbMhLWy0mJ3rPXvDvcO1karBG8/WV6Wj+7kWrvDDBlvpdRGSnbzj1hpjX4z8mOx6UYYstc2O
uSk71tG7Ns5AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACZ2jeXneJ62dVl5KT9VTt8Z9W9xbWclPo+O
fft9qfSHEU1pv48ftYST23ZTDC/p0YtlVuvVjMbM5+LCZjYGWGdrTPxiHY4ffaf3cjTxz1v6xMS6
Olty2iXVj/Dk8n+ndrkhnGRo1v8AFdW3RCrZ5uiYsqrboncSu508yjmZRYQt50TfowYTbYGVrKrT
uTZjvukQnYhMIGVY2ZxPVWyrHVCWzXpVXkt3TE7Va+W4K7X3jv1auTNy3jdba0RZpamfroQN7Hk3
6wr1GTaN2OOJiu6Mu98NvgDi8Wy74d/yZ8PiPAiO2zU4nb6qIn1bugjfFE/ASp1ke9u15mbbRDZ1
Mb823kx0Ontn1OOkedoJCvT8I03gaKsz9q/WW+isRWsVjtHRKyrhe0XCfpWL6Vgr9fjjrEfeh5fF
feH0V5Dj3DPoOo+k4a/U5J6xH3ZZ7z3228evytOk7NvFbo0cdols47bSybt7HbddHVqUs2aW3Qnq
xVeu8LILR3SlZw3V/R8nhXn6u0/pLuPMXjeHT4Zruf6jLPvR9mZ8/g1xrvpz+TH7HUAaMAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAABRq9VXSYJyW79qx6yvmdo3l5viGs+maqYrO+OnSvx+KLeLZz2te1rZL2v
ed7WneZYWnZl5K72YV1xEyxmeqJljzIEWlVkszvbZp5soN3h2SJz3pP3odCnuWmPRxuERfJrZmtZ
mtY96fR28kbX3dXj/wAuTyf6bmK+9YX1s0cNtm3Sd4LFY2K23W1s16StiUJW7bp22RW3RluBuruz
mWEgrmCGWyNkoExKE1QlPmsqRDKeyBjaejWy2W3ttDUyz1QKslvehVqKTNosyyTvELabXptIJpaP
B39Ia2mz+JGpr51jdZefDx2hzuHZObNq58poJaGtjxJ2+LoaKP8ADRPo5+T3skx5OhpOmC0fBNQ0
5yTbn+bt8A0u9raiY6RHLVwY62mI6zMvaaHBGn0mPHt1iN5+aYVsACBXqMFNTgviyxvW0bSsAeE1
mkvw7V2w5Ote9besJx2er4rw2nEdNNekZa9aW9JeQjnxZLYskTW9Z2mJY7zz26fHrrdpbZsY7NGt
mxjvso1b9NmUwpx33XRO4K7VUTE1nmrvEx1bVo2VWiJE/XY4frY1WPlt0y17x6/FuPM0m+HJGTHO
1qu9pNVXVYt46Xj7VfRtnXXL5MfzexsALsgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAHM4jxOMFJphmJv529Dq
ZLfjDjPEIx450+K3v2+1MeUOHSOWFc3nJkmZnf4yujpVlqunOeFpV2nctLCZUXRM7MJtsWlRkv3Q
ky5NmpWt9RnrixVm17TtEQnJabXisRMzPSIew9n+CRoccajURvqLx5/chfOest642OGcIpoOG2w7
ROW9d72+LQvXevyejcPUU5M+SvpLeOataraw2a0dLbLqTtK1G3Es4lVWWUSoldFtmcXUbpidgXzK
GEW3TuCUSncnsDFMMLSms9EC6J6FpVzbZE5ALy0809ZbFr9GtfrEoFMzuuwz0Ueey3HbaBLDXe7i
tMOfwWnP9I+NZbuttvhs1uBRtXPb4SDm3iIvf57N7Dbl0VrS5+XrltEd+Z1Jx7cNms9N4TURRw3T
+PrcO3WszEvZOD7P6aYiMlvu16S7y1QAIAABxOPcLnUY/pWCv1tI96I+9DtgmXl68Biy7/NtUu3+
O8HnFa2s0tfd75KR5fFyMWTdhrPHVnX9R0cd21S3Rzsdm1iuqs256wrmGcT0RYSx5d047X02SMmO
esd49YRE9WcdSXhZ2O1p89NRji9J+cei1xMc3wXi+KZj1j1dTTaqmor06WjvWW+ddcu8XK8BZmAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAMMmWmKu952UZ9XFZmuP3revlDTtzWnmvO8q3XGmfHb9ZanV3yxtWeWn7y4es
vPNtDqZJ6Ts5mppvdl/XXRMyfGvSNlu/RVvtOzLfoipLT1VTKbSpvfogRkvtDVyZOhkyvQcA4Dzz
XV6yvTvTHMfvK+c9U3rkW+zvA/D21urr789cdZ8vi9KDb45rejl8Rry6iJ/FV1HP4vXbBTJEfYt1
+UpiHM295bXsqrO9l8QkZ0lZEqqLeyBZHZLGvZkhIndADKJ3TMoqWQMZ6pjsxll2jsCLSrmU2lFY
36gieyu0LJk3jbsga0wdqzK20QpyztQGprL/AFMrOE05NLkt6qdVWZxNrSe5o9vWBLiUjnzXn0vL
q555dHt8HOwV928/1z/LpzXxbYccRvzTB+jucOwxh0dI22mY3ltIrHLWIjyjZKyoAAAAACJiJjaY
3iXleM8InR5J1GniZw2n3oj7s/8Ao9Wi9a3rNbRE1mNpifNFnVs65XhcWTdt47bnFuF24dm8TFEz
p7T0/pn0a+HJux1OOrOux08d1ndqY7tillVkzExLOk7yd4YxGwluViJhE45raL0na0dtlWO0+bZr
1TKi+2zptZGTamT3b/tLacvJjiY3XaTWdYxZZ6/dtPm1zrv1z78fPcbwC7EAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABhkyV
xUm152iAZWtFazNp2iGhm1Vss8uP3aevnKrNntqLdelI7VRHRnrX/HRjx/tZREVjZXeybW6KbWZt
pCZ6S08tN7Nmbb7zCrJtyoS5145bSx5mWafelr3tsKmS/o08uXyhlly7RPV2+AcBnPNdZrK+53pS
fP4ytnPVda4y4BwHxOXV6uvu96Unz+MvVxG0bQRG0bR2G0nHLb2gCUDX12LxtFmpHeazt82wT1gH
mMN4tWs+rcr2aEV8DU5sM/cvO3yb+O0csLUTSdrLphRE8tlkZI7Atr2ZMazDJVKTYSCawi7Ksq7z
1QERvLK3ZGPrKbyCrbdnMcsbeaa18/RhvvM7oGEwTG0JmYYTIML22a2e28xELM19oURPNO4lOem+
n3ZY5+prVnMc2GYU4/L4A0a15cNf6rz/AC6fC6+NxCPOuOu/5tHJTbHj+F5/l1+BYumXJMd9o3/d
MRXYASgAAAAAAABhlxUz4rY8lYtS0bTEvH8R4ffhmo6bzhtPu29Pg9mq1Gnx6rDbFmrzVsizq2df
zXkMWTeIbNL7tbXaHLwzUctvexWn3bmPL8WFnHVL326VZ91MfFVjvvVlz79kLrcf2m7j7bNHH3bl
J2SirLQoy4t1++7G0dBC/RanxI8PJPv18/WG241+alovSdrV6w6mDNGfFF4/OPSW2b1zeTPL1aAs
zAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAVZ9RXBTe3WZ7R6iZOpzZq4ac1p+UermZMl89+a/byj0Ra9815ted59PQ32hlrXXRjH
DpCLX6ML5NlNsm/ZRqstfdXzbsZt06sLZNvNB1Za8RDWyZdo7q8udq5Mu/mIMt4md2lmy7JzZuWJ
dHgfBL8RvGo1MTXTxPSPx/8AstJ1XWpIs4BwSdbeNVqq/URPu0n73/s9hEREbRG0QUpWlYrWIisR
tER5JbSccur2gCUAAAAPM8Sry8Uyz67fwuxbzVPGsE49XGbvF42V4M0TEL33ERnktsxpk3sumK2j
admFdPFZ33VS2Mdui2J3UU6LYlFSsN2O5NkCyJ6K7T1TEsbAsxdpReerKkTFGMxvYEz0rsqtbbpC
b2VT1QEzuwtbaGUxspuJU3neWdKoiu8rq12gCI92YatLcublnzbEz1aOptyZqTuDHLfxN6R0+t5X
qdJhjBp6UiPLeXl9NSMnEKxHa1+bb8nrlvxUAAAAAAAAAAABTqtNj1eC2LLXeto/R43VabJw/VTh
ydY+7b1h7ho8V4dXiGlmvbJXrS3xRZ1fGv5rzeHN02bEW3cys3xZJx5ImtqztMS3MeTeGFjqlb2O
8btql3NpbZtYsnSBLeiWfdTjtutid+ghherHS5p0+f3vsX6T8Fkw181d4lMvEWdnHaGnw/UeNh5L
T7+PpPxbjdyWcvAAQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAo1Oprgr63ntAmTqdRqK4K9etp7Q5d7Wy2m953lNrWyWm953mVd77R0
Za1104xxlN9lV8qnJl2a9s3xUXX2ybsJyRDWtl3YWydEC+2VRkzeW6q+T4tbJm+KRdfK1cmWZnlr
vNp7RC/R6HU8SycmCk7ed57Q9ZwvgOn4fEXtHi5/O9o7fJaZ6z1uRyOEezVstq6jiEbV71xevzer
rWtKxWsRFY6REeSRrJxz22gCUAAAAAANbX6aNVpL0npMRvWfSXlKamsRMVvXm+EvZXjmpaPWHzfL
oNRjzXicfWJ8phfPxFejx72x7xMzK+sXiNoiXlq+Pi6fWV/VfTNqfLJl/WTg9Pji8R70LqvMV1Gq
j/zcv6yz+lanzzZP1lWpelTET6S81Gp1P/Gyf90s412rjtnyfqql6asREdWM9+jz9eJ6yP8Az7uh
odZqMt458tpB1JvEViI3/RhzRt13/R1MNaziiZiJn5K9ZNceKZiIiQcu/WekT+iYrWI3lzdTrs+8
8uW0fJzcur1Np/zsn6g79phVaIeetqNR/wAXJ/3SwnUaj/i5P+6UD0ldonum161h5mNRqP8Ai5P1
lNtRqJjacuT9Qd22WN5aGeZyZd/KHJy59RHbLf8AVq31Gp/4uT9ZEvS8Lr/vSs2npzRtL1z53wK+
oza/HW2XJNd99pmX0Rb8VAAAAAAAAAAAAAAcHj/C5yV+l4I9+v24jzj1cLFk8nu5jeNpeW41wmdL
knU6ev1Vp96sfdn/ANFdTrXG+eq1q5F2LLtbZoY8m8d11bbSydErsYsm+zZrO/zcnBm226uhiyRK
EtrvCrJDOJTeu8A1MWX6Lqq5N/dnpb5O5ExMbx2cPNTeJb/DM/iYPDtPvY+nzhri/jDy5/W6AuwA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAa2p1UYo5adbz+xbxMlvqJ1OqjDHLXree0ejmzNrWm953tPmTPWbWneZ7yoy5YhjrXXTjH8s75N
mtkyxt0VZM2/m175N1V03yTKubMLXVXybeYLLX2VXy7eam+b0bOg4VquJW+rry4/O9uyZOq3UjVm
9r25axMzPaIdvhns1kzbZddM0p5Y47z8/R2+HcF03Doi1a8+Xzvbv+TotJnjDXkt+K8ODHp8cY8N
IpSO0RCwF2YAAAAAAAAACvUZYw6fJkntWN3k8dfHz2vLucdz8mkjFE9bz1+UOZosX1UzPm0nqI/W
MYo9FlcPNklfFGeH/NshLGun+Cz6PtHZtVZWlRLS+jxPkRpIn7rdoupHTdA5s6SI+7H6Mfo+32Y2
+To3neSIiZ7A0IjPXpXLePlMotGW3272t85datKzHZjbTVnsDj+FG/2Y/RlGP4R+jo20u7H6N1Ql
o+H8I/REY957R+jpfReiK6eOYHLtj2tttH6KrY/6Y/R2c+kjeJiFVtLG24hxpw7/AHY/RRkw9O37
O99Hrt1YX0tfOBLjcGp4XF8c+u8fs9c4dcVcGemSI61nd3IneN1orQAAAAAAAAAAAAABFqxes1tE
TE9JiUgPKcX4RbRXnNgiZwWnrH4XPi28PdXpW9JraImsxtMS8pxXhF9DecuGJtgmf+1TWW2N/la1
L7N7T5e3Vy6W3hsYcvLbqzbO9jvvCzvDR0+XeO7crO6FmGSvRThy/RtVXJ92elvk2rRvDUzU7pl4
izsd2J3jeBpcNz+Lg5LT7+Pp+Xk3W7js5eAAgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADs0NTrN96Yp6edkW8Wzm6+LNTq4pvTHO9vOfRoWtt
1mes95YWvs1s2fZldddOczLPLn2ju0MmebT3YZc2/mpm3qqllN1drsbZIhr3yzvtHf4AsvlYYseb
V5Yx4KTe0+UQ6nDvZ3UazbJqd8OKeu33peq0eh0+hxcmnxxWPOfOfm0mP+steT/ji8N9mKY9suum
L37+HHaPm9DSlaVitKxWsdohI0Y22gAgAAAAAAAAAABXnyRhw3yT92Nwef4xm8bVzET0rPJH5d12
CvLhho3rN9RWs9Z23n5y6O21YhrVYbdGOCfrrLPJRpv863zVS6FS09SvZj3lVZZRdPSqmnSWdrIE
ebOkK4ldTsgW1WKqd1oMZhEVZyRAImOjGI6rJ7IiATNd46qL02bHkiaxaoNGY2n4ImPgtyV2n0Vo
Gvlx7x2beiyTk08RPevSVUxux00+Fn2n7N+n5rRFb4AAAAAAAAAAAAAAACLVres1tETWekxKQHlu
L8InR2nPp43wz3j8P/s5dLveWrFqzW0bxPeJeV4xwmdFec+CJnDM9Y/CrY1xv8qvTZ+WYdbDk5oh
5zHk283U0eo3jaZZ2N5XYjrCnLSJhOK+8d1kxvCqzSwZvousrb7k9LfJ3nB1OLeJdLhufx9LEWn3
6e7LXN9Ofy5/W4AuxAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAETaKxMzO0Qi9646Ta07RDmZ9VbPbaOlI7Qi3i+c3TPUaqcu9adKfy0722ZXvFa9
XO1OrjrESxt66ZJmcjPUanlidmhkzTZVfLN5VWvsC2b7R3U3yqrZZtO1esz2h2+F+zWTUcuXXTNM
feKR3n5+iZLVbqRzNJo9TxHLyaekz62ntD1fDOA6fQbZL7Zc/wCKY6R8odLBgxabFGPDSKUjyiFj
SZkYa3aALKAAAAAAAAAAAAAADQ4pl2pTFH3p3n5Q33E12Tn1eSfKscsLZ+orS00eJqbW+Lfnu1tF
XaJnZsz3WpCfsyp00fWSvmPdVYOmSUDd8kR3InoQosy7JmUX7MdwZ17ro7KKT1XRPRAsrO0rYndr
79V1ZBaQiJ6JgCSIJASwrO07MpV2nqBlrv1a1o2bf2qtfLXaQUTO0sb05o3jv3ZXhjS20xEphW5h
yeJjjf7UdJWNKLziyRePsz0lux1SgAQAAAAAAAAAAAAAADG9K5KTS8Rato2mJZAPIcU4ZbQZuekT
OC3afT4NXFkmlntc2GmoxWx5K71tG0vHa/RX0GpmlutJ61t6wrY2xr8dXS5uesN+tt4ef0eaa223
2dnHk3juyreM81OaFGiy/RtZET9jJ7s/2bdutd2jqKeic3iNTsd8a2h1H0jTVtP2o6W+bZbOO+gA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABje9cdJt
adohGTLXFTmvO0fy52bJfU23t0pHaqLeL5xdK9Rnvqb+cUjtCi94xxvK3JetKuHrdZvaa1ljb10y
cnIs1Wt3naJc++TmVWvMz1YWybfMGdsm3eWek0mo4jm8PT0mfW3lDf4V7P5tdMZdRviwfvZ6/TaX
DpMMYsFIpWPTzXmf+steT8jn8L4Dp+HxF77Zc/4pjpHydYGjC3oAAAAAAAAAAAAAAAAADG9opS1p
7RG7zszN6WtPe0zLua+3Joss/wBOzhzG2OsL5+IrY09dsSyYRijbHEMvOChb7KjF0yS2LQ169Mso
S24noyrPVXWejNVKbTuw3T3REdQWU6LYlVvsyiUDPfqupPRr79VuOQX1lZEqoZxIMksd0gT2VT0l
bPZVbuCaW8i8bwr32WxbcGnkjaZa9p2ndv5qbw5+aNugLItF6TEtvTX5sMb969HMpfazc0d9stqe
vVZDdAQAAAAAAAAAAAAAAAADV1+iprtPOO/2u9bektoB4TJTJpNRbHkja1Z6uto8viVht+0HDvpG
H6Tjj6zHHvbecONw7Ltfkmeqmo6Ma69DXbbZTkr1mGWO3RneOaGbZRoM30fVzSelMnT83aef1FZ7
x3h1tBqfpGnjmn369LNc3sc3kzy9bQCzIAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAa+q1dNNXr7157VhGp1Xh70x+9f9ocy283m1p5rz3mVbrjXHjt91lz
5c9+fJ1nyjyhdM8lZlOOIiqrUXikd+kMreunnI5XEdX4dZiZcG+XmtNl/F83PeeWWHDOGanieSKY
q+5H2rz2hMzWd1Iqx1yajJXHhrNrW6REeb1nCPZumn2z62Ivl7xTyr/6uhwzhGn4Zj2xxzZJ+1kn
vLoNJnjHW7TbbsAszAAAAAAAAAAAAAAAAAAAAaPFrbaSK/itEOXt0rDf4xb/ACa/GZacRvaF58Q2
IjasQnzPIhCU92tMbZGzHmotG10C6nZkwpPRmipIllEbMIZIE7solgmJBnCyk9VMM6z1BtVllEqK
z0WRILYlluriWcSDJVbusV27gwInaSWM9ECyZ3hqamnSWxFmOSOaqRx725bNnSZNs9J+OynVY+WZ
YYr7TE+nVaIr0Ais81Yn1hKAAAAAAAAAAAAAAAAAABExvG09peU4nov9n66L0j6q/WPg9Y1OJaON
ZpL0+9HWs/EWzeVz9PbmrEtnyc3h9reHy26TWdnSr2YX6657ijLXpLX0+onSamL/AHJ6W+Tbv2aW
ekTv16JzeI1Ox6KJiYiY7Slz+E6jxdN4dp3vj6fl5Og2clnKACAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACZ2jeQRMxEbzO0Q08uqtkma4ulfO3r8lefUePMxWf
cjy9WvlzVxV6T1Z61/x0Y8f7Wc7Ur1lqVy+LqOWJ2hp6rXddon5rOF1tfmz5OkT0qzb8dWbxjp1c
biuuilJ5Z6r+IcQrixzEy8zl1E6rNt1tMztFY81sztU1eRucN4ffi2p5esRM72n0h7rS6XFo8FcO
CkVpX082nwXh3+z9FWLxHi36328vg6TZyW9ABAAAAAAAAAAAAAAAAAAAAAADj8Unm1tK/hqppHvw
y1k8/EMk+m0GOPeafiFpCZYwolnXspvHvLa9mF46gmnZmwozRUiUCBKYYsoBLOFbKAX0llEqqyzi
QXRLOJVRLOOwLIljZMEgrlhKyYYTAK5nZPN0RZjugUanHzVlz6xtLq361c+9eXItPpXX0dubTU+E
bL2lw2++O1fSW6m/VYAISAAAAAAAAAAAAAAAAAp1GbwcfTreelYEydcuMcRrM/L9nnlsV6wqpi2r
tv133mfWVkRyRtEdGFva7MzkYZNoamWN4bV4mYa9qztKIujhVppxGI8r1mJegeZpknBqKZY+7L0t
LRekWrO8TG8Ns/HJ5ZypAWZAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAADS12fp4VJ6z9qVuq1HgUiI+3bpDl589cOKZmevqprXPTbx477rDJlrhr1nq4+s182tMRP
RqaziXiZJrWekNG17ZbxWJ336M5LXRbI3dLTJrs07RMY6fan1dHLrowY+X7MVjt6N3R6Kul0EbWm
s7bz8Z+LnabQX43r7Y53php/mXj+Dnv0f1JO1x/8ZxbUzj02O15mfLtD13AvZqnDds+pmMmo26el
XX0Wh0/D8EYtNjilY7+s/NstpOOTW7QBKgAAAAAAAAAAAAAAAAAAAAAADG88tLW9I3BwJtz6nNf1
vK/DHVqYJ3pzT5y3MPZeojOWMQylEKpTVjZnDCwkqzYQyRRICATCITAJZQxhMAshnEq4ZQC2srKq
qrIBZCWNZZgwswmFloVyCu0dFcx1WyrtCBhv5NTPHXds2U5o3hIz4ffbPt+KHUcTSW5c9Jme0u2v
VYAKpAAAAAAAAAAAAAAAAYZctcVOa35R6tLrltN795/YvknNqrfhpPLH92V5isd9mWq6fHjk6rn0
ZxG8KK5Jm/wbVZiYZtqrmkqL023bkxvCiY3lJHNyRG81mHS4Rn5sNsNp64+3yaWaNrzOzHBl+i6q
mT7s9J+S+ay8mex6EIneN47SNXKAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAImYiJme0JafEs3h6fkidrZOn5eaLeJk7eOdm1Hi2vmtPTry/CHmOJcUvmvOPF1n09Pm
6HF9ZGm01qxO3R5vSY7XwzmzTy47zzTEd7en5Mfvt2/PURWdo3tvPrPlKymbktFqTtMTvHzbOLDG
f63JXbFX7FdnoODcDprZpq9TjiMMTvSn4vj8l5fxnrk91saPSa7i2hpOfbTVt5x1m0fLydzR6PDo
dPGHBXasd585n1lsRERG0dIF5OOe6tAEqgAAAAAAAAAAAAAAAAAAAAAAADX11+TRZrf0y2Gjxe22
gtH4piP3TPpXKwxtjhuYo9xq442iIblI2pC1RET2ILd9kxCqRjZmwlCSEohIJAQAAJZISDKGUd2M
MoBnVbVVCyAWVWeSuqyOwIlXZZKue4MJV2WWYT2QKbKL9YlfdRdIo35b7/Hd3KTzUrPrDh27uxpb
c2mpPwX/ABX9XAKpAAAAAAAAAAAAAACekTIp1eTwtJmv+GkyJn1oafeazbfpMzLR4jq/o8b823zX
6XNF8ERCvTcNpxLV5LauvPhx9Irv3lhztdtv8TtaWLicXrt03jzjzb2k1nid56ty3s/w+a7Uwzjn
1raejlarhmbhl/FpbxMO/fzj5p/ixSeXOvTtRfeI280ZI26tfDm3pWe63LaZx7qtGvniJ6tPLvOK
fOa9WzbJvTbza02jl3n5SSljscK1MajSxWZ96nSW88xw/VfQ9XMT9nfa3yemid43jtLeXsce88qQ
EqAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADia3UTm1l4j7OP3Y/u
7Vp2rM+kPJW1PhYcmS0+9MzKm/jbwz31weMzbV8UppazPL9q0/BF4rk1GLDSNqxPWPhCnHmnNrtT
qPKteWPm6U6OdHaZvO+SaRNvhv12Ub/q3FhtrNVj0uKOt56z6R5y9zix1w4qY6RtWsREOJ7L6OKa
S2rvX6zNM7T6Vh3mmZyOfya7eACzIAAAAAAAAAAAAAAAAAAAAAAAAAAczjVvqMVfW/8AZ03I41bf
Lp6/OVs/UVrY47NyOzUxd4bUJpEbb3Z7IiOrKIVSjZhMLJYyhKIgmGUQSDESIEbJEgQmCITEAmGU
IiGUAyhZVhDOoM4Wx2VQtqBKuyyWEgqlhKyyuyBVaGtkbNmvk7A15l1eH2300R6TMORPSXT4ZO+O
8fFefEX63gEAAAAAAAAAAAAAAAq1WPxdLlp+Kkx+y1Fvsz8gjhaDauGK8sx07y3OE3m1tT6RaP4c
vU6yMNKUx73zT0ilY3l2eF6a+m0kRl/zbzz3+Ez5M8z26fJruW6wzYq5sV8d43raNpZjRzPPaTmx
5b6bJ9rHO3zb2WJ8GWPEscY9bgzxH2t62n19GWW0eHOzHU5XbjXZ1x8WTnz2iZ7S2M1IjH2+LX0V
KTqs8zO9ot0j8nUthi1J3UaOFMTfLFo6xMbS9BwHWTqdHOO8+/hnln5eTjYMFo1WTH5VnePzXcIm
2k4zlpPSmXy/hfF5eMfJns69OA2cgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAADG/2LfJ874rW845mubliY7bPoto5qzHrDz0+yePNF41OotaJ7RWNtpV1OtfHqZ715fhu
j8adNpcVfeyzE2/vLuanhOu1nEctIxTTFa/+ZPbZ3eHcF0vDbTfFE2yzG03t32+DokynXl9+leDB
TTYKYccbUpWIhYCzEAAAAAAAAAAAAAAAAAAAAAAAAAAAAcXjE/4zDH9M/wAu04XF5/3jj/0f3Wz9
RUYmzDWxS2I7FSyjuzY1ZKpRKEygEwiWUIkGIk2QJNhKQhMIhkCYZQxhlAMoZwwZwgWQshVCyATL
CWc9ldpBhZXLOVdpQK7NfJPRdaWvknoDVvPvOnwuel4+TlXn3nS4VPvXj4QtEV0wAAAAAAAAAAAA
AAAAAVV02CmTxK4qRf8AFFeq0AAAanEsfPpZmO9Ji0NDLfkwdOsulrumiyzHlVzJrz4Ovoy26vB8
cTBa9NffLtMY77Rv8Yegx5ImkKdJoY1HC81Y+3OSbVn0mGGkmbY45u6tnrrTOu2xGO0RxCd+nNVj
qKxTV1vH2pjaGtnyzXXYdo96ZmGXEMk15b7/AGZiVerWPTYckZcNbx5wzc7hGbnxXxzPWk7x8pdF
0S9jh1OXgAlUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAcPjEf4/FP9H93ccXjMf4vDP9Mx+62fqKrx+S+GvibEFSsqyYwlVK
ZYsmIMoRKYJQIPIEiQ2ATCUQygCGUIhMAyhnDCGUIFkLIV1ZxIMpVWWSrsCuyqyyyq09ECq8tfJK
66jJ2Bp5J6upwn7dv9Lk5J951uE/av8AJaIrqAAAAAAAAAAAAAAAAAAAAAAq1Mc2myxPnWf4cmtu
XT9fR0tffk0WSe28bfq5Wbamm3326MtunwfK6PCv/AxPraZ/dz9PO97/AOqf5dHhdZrw7Dv3mOb9
XOxRFM+avpe38mvkPHf/AFWlrKba7Tzt99ZxKkfR7euyNXMTrtPHfa0z+zPiM/UR8Zj+Wbdu8HpN
M2bfzrV13M4dO2pyR61dNvj44/J/oAWZgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADj8bj63BPzdhyeNx0wz8ZWz9RWri7Nmv
VrYu0NmqaRZHZlDGGSiwxZSgCEkCBCQSCQBMJRCYgEsoYx3Z17AlMIhlCBnDOGEM4AlhZZKq4KrK
7LLKrIFN2vdfZReAaObu6/CO9vk5OePR1uEd7fJeIrqAIAAAAAAAAAAAAAAAAAAAAGtxCk5NFliI
3mI32+XVyNTyZOHTee946PQKPoeDffw4777eW/yVs60xv+ZxOnr4Okx1t05KRv8Ao41Z5q3yed5m
XY1szXRZ5jvFJ/hxItP0aOSN9q7yrtr4f2tHFM5+KT16Yq/vK/iGSbXw4vO14UcPx5MGfNbPG18m
1oj4THRsTw7VanPXVYpi3gzMcnrvCnG11JOupwuN8+a3pEQ6jT4divjxWnJExa09pbjbM5HHu90A
JUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAHM41H1GOf6nTc/jEf4Ws+lls/UX45uGekNujTwdm5RNIthKIZKLDFlsiQIShIC
EgCUJ7AmGTGO7IDzZQhMSDJMMYZQgZwzhhDOATuqssmVdgVWVWWyqtCBTeVF19lF+wNLNG7q8I+9
8nLyupwnt+S8RXUAQAAAAAAAAAAAAAAAAAAAAAAItWL1mto3iY2lyrcLyUxzix2ia2nvPeK+jrCL
OrTVnxpanhuPPemSs8l6RtE7dJj0ldpNP9GwRSZ3neZmV4cR/Vs4AJQAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAANHi1d9H
M+kt5ra+vPoskfDdOfqK4mn7Q3aNHBPZu0W0RdDOGFWcKLCJZeTGQQlCQSgASBsCYZQxhlAJTAmA
TsmAgGcM4YQyjsgRLC3VnaVcgwsrt3Z2V2QK7tbJ1bN5a9waeWO7p8Knt8nNyebpcK8vkvlFdQBA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAK9RXmwZI+ErEWjesx6wQeZwejeo0cccuW8
elpblJaaRGxVnCuss4ZrMvJEgCAASISCQIBlCYYpieoM0wx8k7gzIRueYM4Z79FcSy3QEsLJmWFp
BjaVVpZWlXMoGNmvkXXlr3kGtknu6XCf7OXkl1OEdl8orqgIAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAHmskcmtzV/rls0U62OXiWX4zErcc9GmkRfWVkSqqziWayxCPIANwBIhIJSxS
CRG6dwZwlhEs4BluMdzfqgZxLLdXuy3AmVdpZTKuZBjaVVpWWV2QlhZRdfZRcGpl7urwfrzfJy8r
rcH61vPyWitdMAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAHA4nHLxKZ9awnH2ZcY
jbW459aq8fZpfiI2IZwrqzhmsz3Ebm4JN0AMhCQSIASndiAziWUSriWcAyRujc80DM3RCfIETLCW
UsZEsJYSslXZAwlTddPZTkBp5e7r8Gj6rJPxhx8k9Xa4PG2C8/FaK10QAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAcfjcbZMFvnDWx9m5x2PqcNvS+zSxT7sNPxH62YZQwqzhRZO6UCB
KUAJTux3SDIRuAncQAmJZRLBMSgZ7iIAZRKd2DICUSlAljLCYWMLIFVukNfI2bNbIDTyT7zu8Ijb
Sz/qcG/2nf4T/wCE/wD2WnxWt4AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAHL9oL
+Hw2cm28VvEuPptfgyVj6yIn0no7/FtJfW8NzYMe3PaPd39d3iMug1WktNc2C9dvPbeP1aZ9xF+v
T471tHu2iflK2HkqWmvaZj5Surqc9Ps5bx+alTHqYHm68S1Vf/NmfnC2vGNTXvyT84Ql6A3cSvHM
sfaxVn5Ssrxyv3sM/lKB1xza8bwT3pePyWV4tpZ+/MfOEjfGrXiGlt2zV/PotrqcN/s5aT/+wLRj
FontMSlAlKEgndO6IAZQljDIEgeQljLCzOVdkCu/SGrkbF56NPNeKxMzMRHxENe0+89DwuNtHHzl
5PJr8NcnLW3Pbf7r1nCZm2gpae8zMrz4i/W6AgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAETETG0xukB4HVaeMHEtRi26RedvkyjBSfX9W77QYvC4xz7dMlYlrU7M929dWJLFc6aPK0q
7YLxPS0S22FlP6q38Zac0yR92s/KVc3tHfFf8tpbcsLRvB/dR/8ALLVnU0r9uL1+dZI1mnmdvGpv
6TOy6ym+Oto2tWJ+cJ/tW+KLK5KW+zes/KU7tG+h01p64qx8Y6NXNo6Y+uPJlp8rLf0rfG7MXtHa
0x8pZxqs9e2a8f8A7Oj7HaTHn0+f6RWM23LETfr6vRW4PoL99NT8ui7F4+vEdXXtnt+fVbXjGsr/
AOZE/OsPS29nuH27YrV+VpeV9pdPXhOtw49NG9Mld55+vXcTPd42I47qo7xSfyWV9oM8d8VJ/VxM
d8l46xWF9cV7en6o/qLfxp2I9ob+eCv/AHMo9op89P8A/wBORGmyT5R+qfo2X8P7n9Q/jTsx7RR5
6ef+4/8AuHftg/8A6cWcOSO9J/WEbWr3pY7Efzp2Lcfv5YK/9zWy8d1E/ZpSv5Oba1/+Hb9lc+LP
bFt87I7E/wAabWbiurvEx4nL/pjZzc2bJkn372t85ZXx55/BX85lucC0vPxnTxlnnjm32mOiZqUu
LJ2p4TwnVavNWaYbRTfre0bQ99pcH0bT0xb78vmtiIiNojaErMwAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAHnfarF7umzRHaZrLjYrdIen9ocPi8JyTt1xzF4eUw23rCm3R4r6bMy
wt6kdTaWLdjswmNoZontsCm0K5XWjopnuDC0dGpqG5bs08/daKV672MjbSaif6oh6Z5f2LtvptRX
0tEvUN3Jfo8f7cYve0eX4zV7B5z20xc/C8eSPuZIRficfXlcPaG7ino08HWIbePpLF2NuiyOyrHK
3fZFSwuovHVfaVF4QK5YWTM9UT0EKry6Ps1Tn4zjn8NZn9nOtLseydObiWW34cf918fWfk+PYANn
KAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAq1WKM+ly4p+/WYeBxTNd6zG0xO0
vobw3FcP0bi2em20Tbmj5Srr418V9sa2Z7qKyzi07MXUylhaU7yjqhLCeiq3ddaFNxFYW7NLNG8t
zya+WO6Va9J7FW66mvwidnrXiPY3Ny8RyUn71Jj9Ht3RPjk19HK9pMHj8D1ER3rHN+jqqtTjjNps
uOe16zAifXzfTz7kNyndpYazS9qT0mszDdoxrsi6m8LazMq6zDOsq1ZEyrt1WWlXaUCqyq0rbKbi
Fdp6PReyFd8uqv8ACsfy83aXrPZHHto89/xX2/SP/dpj6y8vx6EBq5gAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAB5n2q03LfDqqx39y39npmlxbS/TOG5se29tuavzgWzeV4mtui2
O3RRSY2hdVhqO2MvI36iu9lUsrSrvDHn6spnmSiq5jooyV6tq1VV69RC32byTh43h8otMx+r6I+Z
aK/g8TwX7bXh9Mid4iW+fjl8n1ICWb57xLBOm4zqse20Tbmj8+qKdnS9q8PhcTw5tumSm0/OHMxz
0Za+uzx3sX1t0Zxurr1ZxvspWiZYWZbsbT0QK7KLrZVZJFaqt5vbezNOTg9J/FaZeJns93wCvLwb
T/GJn92uGHldIBowAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADuAPA67F9H4l
qMW20VvO3yRWW97T4fC4rXJHSMtI/WGhVlue3b473K2KzMML4+62tujG9pnozXaOSOVFMnVbmq1t
trJRW5E7wwvUxTvCyY6CHOt7moxz6Wh9PxTzYaT61h8x1MbZK/OH0zTf+Fxf6I/htj45vL9WgLMn
mvbPFvocGWO9L7fq85p5maw9d7VYvE4JkmPu2if3eW0+PasdFNOnxfF1Y2hlykRsmY+LJ0MZjZXa
eq2eyi8oQTO0KLdZWzPRjWu6VaqtHR73g0bcI0sf0Q8Nkq93wqNuFaWP+XDTDDytwBowAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAef9q8HNpcGaI60vtPyl56k9Iew49j8ThGe
PwxFv0l4zH2U26fDfTYiyJljvsjf4sm6vJ1hrXjq2MkqLdZEVbgbMx0auGdmzNt6iHN1Ub5af6of
TdPG2nxx6Vj+HzaaTm1+nx/iyVj930ysbViPRrj45vL9SAuyc7j1efguqj+jd4/T33rD3HEcPj8O
1GP8WOY/Z4TTT7sKadHhbcsZnaCJ3TPZk6VdrKbTutmP0U2nqgrGOsr8deiuI2X09EqKM1dt3uuG
f/jdN/06/wAPE546S9rwud+Gaaf+XH8NMMPK2wGjAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAABrcRp4nDtRWPPHP8PCYusPoWSvNjtX1iYfPuWaXtX8MzCuvjfw32siu8ptXoxi
0wy5t4YulReqmazu2skbquURWFInddM7VYRGyL291KFnCcfj8e0le/Lbmn8n0N4b2Ur4nHLWmPsY
5e5a5+OXyXugBZmiY3iY9Xz7NjnTa3Ph/BeYj5PoTxftFg8Hjk2iOmWkW/Psrr418V5WrWd2faFc
V2jdnEMXWxntupmN7NiYU27iWML6dVMVnddjgVqMsdHr+CW5uE6f4Rt+7yuSsTDv+zWXn0WTHP3L
/tK+GHl+O0A1c4AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA8Dn93W56/wDM
t/L3z59qp24jn+OS38lnpr4r7ZxHQ2TEstt3PXUrt27K57rr1VT0BjKnJPRbMqMs7QlV2fYvHvrd
VknyrEfu9m8f7FZI8fVU85iJewbT45NfQBKo817W4eulzxHaZrL0rje09ItwqbfhtBVs3leai8RD
KLw1sduesL606dWFdsZT1jdhNeq6K9DlhCVUU6s4jZnt1YzAhnM71dH2bycmszY/K1d/0c6OzY4R
fwuK4p8rTstn6z8k7HrwGzkAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAHz3
Vxvr80/8y38voTwGpj/F5/8AqT/JfjTx/WVeyY6FPspc9dZPVXaOq2WEwIUTVRmjo2rNfLHRI3vZ
DJycXtX8dZh7t879nsnhcbwz23tt+r6I2nxyb+gCVBzuPY/E4PqI9K7ui19fTxNBnp60n+Aj5/pJ
3jZu1aOnnltMNussdfXbm+l3ZM9URHREdZVXTuT1Nk7boQiOkJw28PU47/htEp5eivJPLMTCZ9Vv
x7mJ3iJ9UqNHk8XR4b+tIXuhxAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAD
weqjbWZ4/wCZP8vePCaz/wDIaiP+Zb+UX408f0r9lOxWOifJhXWjfyYWllPRXYQxnrCrJHRd3YZI
6A1NJecHEsN/S0T+76bE7xE+r5dk93LW3pL6ZpMni6PDf8VIn9m2fjm8s9rgFmQxvHNS0esbMiew
PnHLyai9fS0w2aNfUTtrs3+uf5bGPqy068fF227KtSsdFlKqNGMV6myyY6sbdIQI8tlOWOi6Jhhk
j3RD0vA8nicMx9etZmHRcT2Zyb6XNT8N9/2dt0T449T2AJVAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAHhdfG3E9TH9cvdPEcXjk4zqI/q3L8aeP6xr2TsxpLOekMK6mFo6qpXSrm
OqBixvHSVmzC4OfqK7S9/wAByeLwbTW9K7fo8Fqo6Paeyl+fglI/Da0NcMPK7QC7AAB8313TiOf/
AKk/y2MHWrX4jG3E9R/1Lfyv0/aFNOrHxuU7LI7MMayGTVlHWUXhNe6Z6wIUsb9d1m20q7dkDpez
N9tRqKT5xEvRvKez9+Xis1/FSYerb5+OTyf6AFlAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAB43j9eXjN/jWJ/Z7J5L2mry8Upb8VIF8f6aGOey2eynHvOy7bowrrYSxZSwQJ2YXZ
92N4BoanrEvVexmTm4blr+HJ/aHltRHSXofYm/1Wrp5RaJaYY+X49WA0c4AD51xONuKan/qW/lbp
+0MOLRtxbU/9SU4J7KadWPjep2WQrr2WRPRk1TvsndXMpiRCb9FNu0rbTuqvKBscCjfi9PhWZeue
V9n434rafTHL1TfPxy+T/QAszAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAHmv
avHtfTZfnV6VxPajHzcNrf8ABeJFs/XnMcr4no18c+6vr2YadkY2YM57sEDLyY37Mo7MMnYGlqO0
vQ+xNfqNVb1tEfs87qZ2rL0/sVX/AHdnt65P7Q0wx8vx6UBo5wAHz/jUbcX1PT78qtO2vaCnJxjP
8Zif2amnnspp04+OjWejKJ6MKdmcMmyJn4m5ZHzEVPMwtJv0VZLbQDqezcb8RzT6Y/7vUPM+ytZt
n1OTyiIh6Ztn45N/6AFlAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABocbxeLw
nUR5xXm/Rvq8+OMuDJjntaswEeBxT0bNZ6NatZpNqz3rO0rqsdO3PxlaWEMpY+aqWXkryT0ZT2V3
7A0dVPuy9f7G124NM/iyT/Z4zWT7sw957MYfB4Fp4/FE2/WWmGHldcBowAAeM9qKcvFeb8VIly9P
0nq7ntbTbVYL+tJj93CwT76unR4/jo0nozhhTsy3Y1sWljM9Ce7HyQIm3RRlttVbaWrnt0Sh6n2U
x8vD8mSfv3/h3XN4Bi8Lg2nj8Uc36y6TeOPXugCUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAPD8RxeBxXUU26Tbmj8+quro+02Lw+I4ssdslNvzhzazvDPbq8d7GW7Dfqz2VzG
0s2qd+iu/Zn5Ksk9BVztX1mI8930zh2LwOHabH+HHWP2fNYp4+vwYvxXiP3fUqxtWIjyjZtj45/L
faQFmQADzftfj3w6fJ6WmHmsP23rvaqnNwqLfhvEvIYZ+sV038bo0noy36MK9oZQxrdMyrlnMbMZ
QKrS1M07zEestq/RRjr4utwY/wAV4j91p9V18fQdJj8LR4ccfdpEfsuREbREJbuMAAAAAAAAAAAA
BAJAAAAEAJEAJQAJQAJEAJQAJQAJEACUJAQlAJEAJQAJQJAAAEAJEAJBAAAJAABAJEJAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABwvanDzaPFmjvjv8A
tLztJ3h7HjGHx+FainnFeaPnHV4vFbeIU038VbHeGF+kso7Mb9mTdhKnLK3dRm7SIrHhGPxeP6Sv
9cT/AHfSnz72Zx+J7Q45/BWZ/Z9BbZ+OXyfQBZQABzeP4/E4NqI9Ii36S8Ng/wAx9C4jTxOH6ivr
jn+Hz3B/mQi/GvjdCnWNlsdI2V07LIlg6USrt2ZzZXMoFV+zPhGLxeOaavpbm/RVltEN72Yx+Jxm
b7dKUmf7L5+s9/HtRA2cqRACRACRACRACUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAACQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAQCQQCRACRACRCQBCQBCQB
ACRACRACRACRACL1i9LVntMbPATTwdRkxT3pea/u+gPE8Xx+DxrPHlaYt+qNfGvjvtXXsi0dOrKk
dEXjZg6VMtbP2bMtXUdpEV0/Y2nNxbNf8OP+727xvsXH+N1U/wBEfy9k3nxyb+gCVQAGOWvNivX1
rMPnGGOXNNfOJ2fSZ6w+dZKeHxDPX8N7R+6L8a+L63KdoZ7q6zvEMpnowdKJ6ywmWUyqvIKM0vQ+
x+D6rU55+9aKx+TzWa36vbezmDwODYenW+95/Nphj5L6dQBo5wAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAEgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACAEiAAAEoA
AAAAAAAAAAAAAEAkEAkRuAkQbgkQAkQAkQAkQAl5T2nx8nEMOT8dNv0l6pwfarHvpcGWPu32/WCr
YvK4mOem6b9mGKd4Z3idmFdka0y1c892zfpMtLPaNpEV6D2Kj/Eauf6YeweQ9ieuTVz8K/3evbT4
5NfQBKoAA8FxCvJxrUx/XMvevD8Zry8fz/Haf2RfjTx/6RSOnRMyypHu9kXjowrqVSrvPRnZVl6V
kK0775MsUjvadn0nT4ow6bFijtSsVfPuFYvpPGtNTy54mfy6vorXDm8l9pEC7JIgBIgBIgBIgBIg
BIgBIhIAgBIhIAgBIgBIIBIAAhIAhIAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJAAAAAAAAAAAAAAA
AAAAAAAAABAJQkAEAAAAAAAAAAjc3BIjdG4Mkbo5kcwMjdhzHMDPc3V8xzAs3N1fMjmBZubq+Y5g
Wbm6vmOYFm5ur5jmBZubq+Y5gWbm6vmOYFm5ur5jmBZubq+Y5gWbm6vmTzAz3N2HMnmBlu5ftFTx
OEZJ/DMW/d0t2rxKni8N1FPWkiZ9eS08e7Cy8dGGn6UhZaJljXZGnmc3UT3dPP2cnUT78xCIV6j2
H/8A9c/6f7vXPI+w8bU1U+vL/d63du5NfUiDcVSIAS8b7RV5eOb/AIqRL2TyXtNX/e2KfXH/AHlF
+NPH/pr4+2xcxx0hFpY11K7R16KM32ZWz3UaidqSgrc9kcPicWyZJjfw6T+727y3sXh2xarN+K0V
h6lvPjj3e0ASqAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJQAAAAAkQAkQAkAAAAAAAAAAAAAAA
EgAAAAAAAAAAAAAAAAAAAAAgAAABKDcAN0bgkY8xzAyRux5kcwM9zdXNkTcFm6OZXzMeYFvMibKu
ZHMC2bo51U2RuC2bom6rc3BZzom6sBZzI52ADPnOdggFnMc6skFnMc6rc3BbznOp3RzAv50c6nml
HMC/nOf4qOY5wX85zqOc5wbHOc7X5znBsc6edr85zg2ec52vzpi4NjmY5bROG+/bllVzsNTk5dLl
n0pP8BHmMHWNmzt0aum8obm08vVjfrtnxztR0mXHzTvaZdjVRMTLkZo6yiFen9iZ2pqY/wBP93rN
3kPY+/LfPX1rE/u9XzN3HfqzdO6vmTuIZ7m7Hc3Bnu8t7TR/vHBP9E/y9Pu837SV31umn+if5Rfi
/j/01MMb1hjkrtKzBG0bMsmOZY11tOYamr6Und0LUc7XT7u3rJPqL8er9lcPhcFpbzyWm39v7O00
+FYvA4Zpsc94xxu227jv1IAgAAAAAAAAABKAAAASgASgBIgBIgBIgBIhIAAAAAAAAAAAAAAAAAAC
UACUJAAAAAAAAAAAABIAAAAAAAAAAAAAAAAAAAAg3AEbomQZbo3YzLGbAz3RNlc3YzcFs2YzdVN2
M2Bdzom6nmNwW86JurTAMuY3REJ2BB1ZRVMVBhsbSsiqeUFXLucq3lTygp5TlXcpygp5TlXcpygp
5TlXcqOUFXKjlXcrGYBXysdlswiYBVMdUTCyY6sZBWxlnMMZgGLGZZSwkDdHMiWO4MuY5mEyjcFn
N1OdVzHMC3nTzqeY5gX85zqOZPMC+Lqdbk20eb/RKOZr8QybaK/XvtH7iZ9aGlp2luzT3fg19NHS
OjbmPcYX67XH1XSZ9XIzRvMuzrK7zLkZYmYnciunb9lZ5dTk+OP+71cXeP8AZnJ/ip2nf3J/l6iL
/Fu5L9bMWZczXi6YuIbEWTzKIuyiwLt3nuO25uI4a/hx7/rLuczg8TicvFLbfdpEK6+NPH/phhjo
stLGkctUWnoxrrU3j1cnWTzZq1jzl1clo5Zcu8c+txR63iP3Tn6pv4+g4o5cVI9IiGe7CJ2iE7t3
GyN2O6dwSINwSISAlAAlACRAAlAAlACRACRCQAAAAAAAAAASgASISAAAAAAAAAAAAACQAAAAAAAA
AAAAAASAAAAAAAAAAAAAAAAIAAAQCAJljuljsCJlhMs9mOwMJYys5TkBVsjZdyHICrZPKt5E8oK4
qmKrOVOwMIqyirPY2Bjyp2ZbAI2NmSARsbMgEbI2ZAMdjZICNkbMkSCNmOzJEgx2YyzljMAwlhKy
WEwCuWErJhhMArlhLOWEgxljMpljIImWMyTKJA3N0IBO5vux3NwZbnMx3NwZczT4jf3MdPW27a3a
fJOq1XNP2KdIRfi+J2trSYfcjeF+Wm1OicVeWIiN9kai8xjY12ORqultnI1Ecsujq79XP1FovWYI
rTgeq+j8QrWZ+3Mx+r2UXeC0WG2Ti2kiN5mL807eUREvbzbaejefHJv62Iv8WUXa0WTFhVtRdlF2
rz9WUXBtc7jR9dqc2T1ttHyhvZMvJitb0jdq6XHNcNenWVN3028U99WRj6Kb02be3Tq18/SN2Lpc
3UdN9nOmZrqKX/DaJ/d0svvTLRzV3jomK6+Pd1vvWJj0ZczT0mXxNJht60hfFnQ4qu3N1cWTEgs3
Tur5k7gz3N2O5uDM3Y7m4MtxBuCQASIASIASAAAAAAACRCQAAAAAAAAEoSAAAAAAAAAAAlAAlCQA
AAAAAAAAAAASAAAAAAAAAAAAIASgAAAEJAQJQCNkbMgGOyOVnsAw5TlZ7GwMOVPKy2NgY7GzIBGx
skA2AAAAAAAAAAQkBAEghEskAxYzDPZGwK5hjMLJhjMAqmGEwumrCagomFcw2JqqtUFEsLLrV82F
o7gqljKyYYTGwMZRKUSCAQAboJnaN5Bjkneu0d5W4ccViIiOzHFWbTzNumP1Zarr8eeRMbxDW1Mx
NO67NbkhzNVnmInqzaOZrL93JyZeV0M1++7S02jvxDWxhxx033tPpC8Z6rrezWjmZyazJG2/u03h
2vFibTHoqvamiwVwY+nLGzV0+SZ1Mx8G0/45tOhzJ5lXMc3UVXRdlF1HP+iYsDPLPPy49/tz1+Te
pSIr0ho6ak5Ms5J8o2q6NImOrHV7XX488ypzTtHXo0s9t6zG7c1G1qz6ubeZiZ3UatXJG3yauSO7
cvMTEx5tPLb3prPRMVr0HB8vicNxf0+7+kt+LOJwTJyY/Bnz3tH93X36N58cWvq6LSyiyndMSlC7
mZcymLJiwLosmJVRLKLAtiU7q4lMSCzc3YxJuDMRuAlKAEgAAAlAkAAAAAABKAEgAAAAAJAAAAAA
AAAAAAAEgAAAAAAAAAAAAAkAAAAAAAAEAAAAAAAAAAAAAAAAAAAAAhIAAACAAAASgAAAAAAEAAAA
hGzJAImGMwzQDDZjNVuyNgUTVhNGxysZqDVmiu1G5NN2M4waM0+DCaN2cbGcQNGaMZq3JxMJxA1J
qx2bU4kU09slorWNwa20z02RXHbJbl26QvtFovbHWkxEdJt5y2MOHlr2U1W3jx+1hiw8vSO63lmI
XRTaEWmtY6snRHO1VpmJ+DjavpSZl2s8b7y4HFcnh0n0gha5ebJN55KRM2mdoiPN6fh+kpwXh0Wy
RHj5Otp/s5Ps1p62y31+em9aTMYt/OfVfxTiPjZ52naI7fBrI5t66xz5+a1rW7yx0eSL6iZjtEOX
qNbSletom3lENjh2fbHzbbWt3iVozruc+5ztWubf4M4ybpQ2Oboyrva0Vjza8WdDR4OkXt3n9ldX
kaePP9VtYqctYhdvt5oivTeCZ2YOxXk6ubqMfV0b9mrljfqlFcq88k7z2U5axeItDa1OPessuC8P
ya7XRWYnwqdbT/ZMilvIu4dpslNdixXja8Y5tt85djZdbDWnGOesRtXFtuw6T27No5Kx2OrKYQlC
ExKJgBnEpiyvdlEgsizKLKollFgWxLKJVRLKJBbEp3VxLKJBnuMWQJEbpBIAAAJAAAABIAAAAAAA
lAJAAAAAAAAAAAAAASAAAAAAAAAAAAAJAAAABAJABAlAAAAAAAAAAAAAAAAAAAAAAAAIAAAAAAAA
AAABAJQAAAAgAABAAI2EoBGyJhkgGPKxmqxAKpownHC+YRMdN5BrTj67R3bOn01o7p01Iv71u89o
b9a7LfBTfS1vWI2jf12VfQPSW8KX2mas+NC2iv6xMNfJpMnLtEbuuxtMRCtzF55NR5rPps1N/ctP
y6uHreE6nXZ4pak48X3rT06fB7fNeI33cbX6mI32R/MWu7XF116aDSRhxbRERs8f499bkyZeeKae
kzE2mdon81/tfxDLGOunwbzlzbx08oaHBvZHJlx48mrvaa94pu04y617576rNGLRRM0397JEd/lu
9Dw/S3x4qxffo6mm4NjwUiKY4iI9Ib1dHFY6QIaNabbrYrLfrpJtaK1rMzPZb/s+05IpP59OyLeJ
k7eNfRaOc1ue32I7fGXYpi5Y77M8OGMeOKxHSFsU3Y29deZMzirl6dlVvhLatCjJHeYQv1rXnps1
8k9/VsW6qLVmZIi1rzitlvFKRvaZ2h6TSaenC9FFY+3brM+sqeG8Prp4+kZ+lvuxPkr1mqm95nfp
DXM459676a2q1dsV7XietvNno78+CJn1cjX6mOeIm0bR33dfRU5NJjidt9t5afjG/V6JZ7I2QMNh
nyo2BhsMuVG3wAhMSbbQRAMolnE+iuGUSCyJZRKuGUSCyJZK4llEgyZMYTuCUsYSCQASISAAAlCQ
AAAAAAEoASCASAAAAAAAAAAAAlACRACQAAAAAAAAAEgCEoASCAAAAAAAAAAAAAAAAAAAAAAABAAA
AAAAAAAISAIAAAAAAQAAACASgAAAQJAQAAhIDHZhln3do7z0WS18mWsajHjmes7pg3dNi5aRMNqO
yvDHTpPRaigHZhN4hHRlaVN59JY3zRENLUavaO+yq0iNVlitJ6vNcR1MVi0zO0era1/Ea0rPvbz5
PM5MWp45qvo2GZrhmfrsnpHpHzTCseEcM/2vrr8Q1Eb4qzy44nziPN63HpYiIiI7LNHoqabBTFii
IpSNohuVxrKtWMEejPwY9G1FFmHB4mWJn7MdfnIM9JpIx15to5pbUaas/a6rqViI7MxPxqX0UT1r
O3wVzpbR2hviP5i03Y5s6a879FNtHljydhExCv8AMTPJXBnRZbz0iG5ptFjwe/l96zctMVamTJtE
yTMibu1VrdTzRMR0j0ed4lr64MVpm0RERvMz5NvX62uOJ69XhOKX1HH9bHDtFvNYnfJeOy0Z2ojX
6jjnEq6fRUmccTvN/J9H0eKcOnx45neaxEbubwHgOHg+milI3vP2resu3Wu0JQmITsmISDHZHKz2
JgFc1RMLJhGwK9iIZ7MZgEdgmAEwyiWCdwWRLKJVxKYsC2JTuriWUSDNlEsIlMAySx3SCRCQSIAS
AAACRACQAAAAAAASIASAAAAAAAAAAAAAAACRACRACQASIAAAAAAAAAAAAAAAAAAAAAAAAQCUAAAA
AAAAAAIAAAAAAAAQAAAAAACBICBICAAEJAQJQCJcLjuS2ny6fPG/LWdpd1o8T0X07SXx/e7wCdJx
Wa0jmneHQpxPDMdZmJfNtZm49weZrh0/j4o7VtSZ2+Uw0/8A7o49k92vBLc/ntFohFW9PqGXimOI
6Tu1L8T3eCx6r2t1O3JwvHjifO99v7t/Bwf2l1PXU6rS6eJ8qUm8x+so5TsekzcSjbvs4mt4rzW5
K2mbT0itesy2cHsvbvqtbmyz5xERWP2jd1tJwrTaONsOKtZ8585+cnDrzmn4Rq+IZObUROHD32n7
Vv8A0ej0uhxaXFGPFSK1j0bkY4jyZRVZVXFGUVWbGwKsk8mObekNrSW3pWf1a2aYjHbm7bNnQ1id
PW0TvuDdhJEbQABMsLW2R0ZTMQrvfbz2YWzVhpanUxEd0dWkW5c8R5uXxDX1w4pnfr5Q19XxKuOJ
2neXltVqtVxbV/RdJ715+1bypANfiOu1HENV9C0MTfNeesx2rD1PAeBYuE6aKx72W3W9/WVnBuB4
eF4dqRzZbdb5J72l160WVK02ZxCYhOwI23TsnY2BGxsnYBjsiYZsZBjMMZZSgGEolMsQDdG6NwZ7
piVe6YkFsSziVMWZRILolMSriWUSCyJTuwhMSDMRCQSI3SAlACRCQAAEoAEoASAAAAAAAAACUACR
ACQAAAAAAAAAAAAASAAAAAAAAAAAAAAAAAAACAAAAAAAAAAAAAABAAAAAAAAAAAAACBKAAAAAAAQ
JQAAAhICEbJAYTWJ7wx8KvpC0BV4ceieWGewDHlNmWwCNjZICNhIDmcZredBecdpiY69FXCOLW+i
UiZidukulmxxlx2paN4mNng+K4+I8Hy2yaTfl37TXetoCPfRxfp1qi3F48ofKMvtvxak8s6LDv61
rZji9rPaLUf5PC+bfttS0q8q3p9W/wBrRMdpUZuKdN99nzvFqPbTVz7nD8OKs+do2/mW3h4D7Xaq
ZnPrtNpqz35aRaYOHY9Zk4pNt9rR+rl6zi+OnS+WN57Rv1lXp/YrNaYtruL6zNPnGO3hxP6O5w/2
f0HDuun09Yv55Le9afznqcOvO4tBreMTHu30unnva0bWt8on+70nDuE4OHYYx4Kbesz3tPrMuhGO
IjpDOKrK9YVpsyiGUQnYGOyUgI2SlAIEmwMWMs9kTAMJYzDOYRMArmGErZhhMArlHmzmGMwDE3Ts
bAbs4swj5pgFkSziVcM4BZEsolXDKAZwyhjCYBkACQhIAAAAAAAJAAAAAAAAAAAAAAAAAAAShIAA
AAAAAAJAAAAAAAAAAAAAABAJEAAAAAAAAAAAAAAAIEoBKAAAAAAAAAAAAAAABAlAAAAAAAIAAAAA
BAkBAkBAkBAlACEgMZjdjbFW8bWrEx8YWANb6Fp+bfwab+vLDKMFK9qxH5L0bAr8OPRPKz2AY7J2
SbAjYZAI2E7AIEgIEgIEgMdkSy2NgY7MdlmyNoBXsxmFuyNgVTVjNV3KjlBRNTlXTVHKCrlIqt5T
lBhEMohlFerLlBjEMohMVTEARDKCITsAk2AEgAAAkAAAAAAAAAAAAAAAAAAAAAAAASAAAAAAAAD/
2022-04-14 17:47:08 +02:00
2Q==`;async function MAe(e){let t=(a,s="application/octet-stream")=>fetch(`data:${s};base64,${a}`).then(i=>i.blob()),r,n;switch(e.config.warmup){case"face":r=await t(dg);break;case"body":case"full":r=await t(pg);break;default:r=null}if(r){let a=await createImageBitmap(r);n=await e.detect(a,e.config),a.close()}return n}async function FAe(e){return new Promise(t=>{let r;switch(e.config.warmup){case"face":r="data:image/jpeg;base64,"+dg;break;case"full":case"body":r="data:image/jpeg;base64,"+pg;break;default:r=null}let n;if(typeof Image!="undefined")n=new Image;else if(he.Image)n=new he.Image;else return;n.onload=async()=>{let a=qr(n.naturalWidth,n.naturalHeight);if(!a)ie("Warmup: Canvas not found"),t(void 0);else{let s=a.getContext("2d");s&&s.drawImage(n,0,0);let i=await e.image(a),o=await e.detect(i.tensor,e.config);t(o)}},r?n.src=r:t(void 0)})}async function $Ae(e){let t=a=>Buffer.from(a,"base64"),r;e.config.warmup==="face"?r=t(dg):r=t(pg);let n;if("node"in Ue){let a=(void 0).decodeJpeg(r),s=a.expandDims(0);e.tf.dispose(a),n=await e.detect(s,e.config),e.tf.dispose(s)}else e.config.debug&&ie("Warmup tfjs-node not loaded");return n}async function PAe(e){let t;return typeof createImageBitmap=="function"?t=await MAe(e):typeof Image!="undefined"||he.Canvas!==void 0?t=await FAe(e):t=await $Ae(e),t}async function L9(e,t){let r=oe();return e.state="warmup",t&&(e.config=Ut(e.config,t)),!e.config.warmup||e.config.warmup.length===0||e.config.warmup==="none"?{face:[],body:[],hand:[],gesture:[],object:[],performance:e.performance,timestamp:oe(),persons:[],error:null}:new Promise(async n=>{let a=await PAe(e),s=oe();e.config.debug&&ie("warmup",e.config.warmup,Math.round(s-r),"ms"),e.emit("warmup"),n(a)})}var 
Jd,ac,sc,hg,s3=class{constructor(t){fe(this,"version");fe(this,"config");fe(this,"result");fe(this,"state");fe(this,"process");fe(this,"tf");fe(this,"env");fe(this,"draw");fe(this,"models");fe(this,"events");fe(this,"faceTriangulation");fe(this,"faceUVMap");fe(this,"performance");hp(this,Jd,void 0);hp(this,ac,void 0);hp(this,sc,void 0);fe(this,"gl");fe(this,"analyze",(...t)=>{if(!pp(this,ac))return;let r=this.tf.engine().state.numTensors,n=pp(this,Jd);cp(this,Jd,r);let a=r-n;a!==0&&ie(...t,a)});hp(this,hg,t=>{if(!pp(this,sc))return null;if(!t)return"input is not defined";if(this.env.node&&!(t instanceof rt))return"input must be a tensor";try{this.tf.getBackend()}catch(r){return"backend not loaded"}return null});fe(this,"similarity",r3);fe(this,"distance",nc);fe(this,"match",n3);fe(this,"emit",t=>{var r;this.events&&this.events.dispatchEvent&&((r=this.events)==null||r.dispatchEvent(new Event(t)))});this.env=he,bs.wasmPath=Hh["tfjs-core"].includes("-")?"https://vladmandic.github.io/tfjs/dist/":`https://cdn.jsdelivr.net/npm/@tensorflow/tfjs-backend-wasm@${T2}/dist/`,bs.modelBasePath=he.browser?"../models/":"file://models/",bs.backend=he.browser?"humangl":"tensorflow",this.version=Mb,Object.defineProperty(this,"version",{value:Mb}),this.config=JSON.parse(JSON.stringify(bs)),Object.seal(this.config),this.config.cacheModels=typeof indexedDB!="undefined",t&&(this.config=Ut(this.config,t)),fN(this.config),this.tf=Ue,this.state="idle",cp(this,Jd,0),cp(this,ac,!1),cp(this,sc,!1),this.performance={},this.events=typeof EventTarget!="undefined"?new EventTarget:void 0,this.models=new 
rc,this.draw={options:xr,canvas:(r,n)=>Z5(r,n),face:(r,n,a)=>Hd(r,n,a),body:(r,n,a)=>qd(r,n,a),hand:(r,n,a)=>Kd(r,n,a),gesture:(r,n,a)=>Zd(r,n,a),object:(r,n,a)=>Xd(r,n,a),person:(r,n,a)=>X5(r,n,a),all:(r,n,a)=>Y5(r,n,a)},this.result={face:[],body:[],hand:[],gesture:[],object:[],performance:{},timestamp:0,persons:[],error:null},this.process={tensor:null,canvas:null},this.faceTriangulation=SC,this.faceUVMap=TC,this.gl=Ct,this.emit("create")}reset(){let t=this.config.backend;this.config=JSON.parse(JSON.stringify(bs)),this.config.backend=t}validate(t){return G1(bs,t||this.config)}now(){return oe()}image(t,r=!0){return Fd(t,this.config,r)}async segmentation(t,r){return S9(t,r,this.config)}enhance(t){return m5(t)}compare(t,r){return cN(this.config,t,r)}async init(){await
2022-02-10 18:27:21 +01:00
/**
* @license
* Copyright 2017 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2018 Google LLC
*
* Use of this source code is governed by an MIT-style
* license that can be found in the LICENSE file or at
* https://opensource.org/licenses/MIT.
* =============================================================================
*/
/**
* @license
* Copyright 2018 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* =============================================================================
*/
/**
* @license
* Copyright 2018 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2019 Google LLC
*
* Use of this source code is governed by an MIT-style
* license that can be found in the LICENSE file or at
* https://opensource.org/licenses/MIT.
* =============================================================================
*/
/**
* @license
* Copyright 2019 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* =============================================================================
*/
/**
* @license
* Copyright 2019 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2020 Google Inc. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2020 Google LLC
*
* Use of this source code is governed by an MIT-style
* license that can be found in the LICENSE file or at
* https://opensource.org/licenses/MIT.
* =============================================================================
*/
/**
* @license
* Copyright 2020 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2020 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2020 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the License);
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an AS IS BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2021 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2021 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2021 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the License);
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an AS IS BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2022 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* @license
* Copyright 2022 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the 'License');
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an 'AS IS' BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* Human main module
* @default Human Library
* @summary <https://github.com/vladmandic/human>
* @author <https://github.com/vladmandic>
* @copyright <https://github.com/vladmandic>
* @license MIT
*/
/**
* @license
* Copyright 2018 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/** @license See the LICENSE file. */