diff --git a/assets/index-BbCFr5ZN.js b/assets/index-BbCFr5ZN.js new file mode 100644 index 0000000000000000000000000000000000000000..7db25fb6398f881f9eaab0873dfc911380a57a3c --- /dev/null +++ b/assets/index-BbCFr5ZN.js @@ -0,0 +1,2787 @@ +(function(){const A=document.createElement("link").relList;if(A&&A.supports&&A.supports("modulepreload"))return;for(const $ of document.querySelectorAll('link[rel="modulepreload"]'))g($);new MutationObserver($=>{for(const N of $)if(N.type==="childList")for(const Z of N.addedNodes)Z.tagName==="LINK"&&Z.rel==="modulepreload"&&g(Z)}).observe(document,{childList:!0,subtree:!0});function r($){const N={};return $.integrity&&(N.integrity=$.integrity),$.referrerPolicy&&(N.referrerPolicy=$.referrerPolicy),$.crossOrigin==="use-credentials"?N.credentials="include":$.crossOrigin==="anonymous"?N.credentials="omit":N.credentials="same-origin",N}function g($){if($.ep)return;$.ep=!0;const N=r($);fetch($.href,N)}})();var bh={},pf={"./node_modules/onnxruntime-web/dist/ort-wasm-simd-threaded.jsep.wasm":(ke,A,r)=>{ke.exports=r.p+"ort-wasm-simd-threaded.jsep.wasm"},"./node_modules/onnxruntime-web/dist/ort.bundle.min.mjs?46eb":(ke,A,r)=>{ke.exports=r.p+"ort.bundle.min.mjs"},"?2ce3":()=>{},"?7a2c":()=>{},"?a42a":()=>{},"?2b25":()=>{},"?569f":()=>{},"?3f59":()=>{},"?154a":()=>{},"./node_modules/@huggingface/jinja/dist/index.js":(ke,A,r)=>{r.r(A),r.d(A,{Environment:()=>Ze,Interpreter:()=>at,Template:()=>ct,parse:()=>_e,tokenize:()=>x});var g=Object.freeze({Text:"Text",NumericLiteral:"NumericLiteral",BooleanLiteral:"BooleanLiteral",NullLiteral:"NullLiteral",StringLiteral:"StringLiteral",Identifier:"Identifier",Equals:"Equals",OpenParen:"OpenParen",CloseParen:"CloseParen",OpenStatement:"OpenStatement",CloseStatement:"CloseStatement",OpenExpression:"OpenExpression",CloseExpression:"CloseExpression",OpenSquareBracket:"OpenSquareBracket",CloseSquareBracket:"CloseSquareBracket",OpenCurlyBracket:"OpenCurlyBracket",CloseCurlyBracket:"CloseCurlyBracket",Comma:"Comma",Dot:"Dot",Colon:"Colon",Pipe:"Pipe",CallOperator:"CallOperator",AdditiveBinaryOperator:"AdditiveBinaryOperator",MultiplicativeBinaryOperator:"MultiplicativeBinaryOperator",ComparisonBinaryOperator:"ComparisonBinaryOperator",UnaryOperator:"UnaryOperator",Set:"Set",If:"If",For:"For",In:"In",Is:"Is",NotIn:"NotIn",Else:"Else",EndIf:"EndIf",ElseIf:"ElseIf",EndFor:"EndFor",And:"And",Or:"Or",Not:"UnaryOperator",Macro:"Macro",EndMacro:"EndMacro"}),$=Object.freeze({set:g.Set,for:g.For,in:g.In,is:g.Is,if:g.If,else:g.Else,endif:g.EndIf,elif:g.ElseIf,endfor:g.EndFor,and:g.And,or:g.Or,not:g.Not,"not in":g.NotIn,macro:g.Macro,endmacro:g.EndMacro,true:g.BooleanLiteral,false:g.BooleanLiteral,none:g.NullLiteral,True:g.BooleanLiteral,False:g.BooleanLiteral,None:g.NullLiteral}),N=class{constructor(O,le){this.value=O,this.type=le}};function Z(O){return/\w/.test(O)}function j(O){return/[0-9]/.test(O)}var y=[["{%",g.OpenStatement],["%}",g.CloseStatement],["{{",g.OpenExpression],["}}",g.CloseExpression],["(",g.OpenParen],[")",g.CloseParen],["{",g.OpenCurlyBracket],["}",g.CloseCurlyBracket],["[",g.OpenSquareBracket],["]",g.CloseSquareBracket],[",",g.Comma],[".",g.Dot],[":",g.Colon],["|",g.Pipe],["<=",g.ComparisonBinaryOperator],[">=",g.ComparisonBinaryOperator],["==",g.ComparisonBinaryOperator],["!=",g.ComparisonBinaryOperator],["<",g.ComparisonBinaryOperator],[">",g.ComparisonBinaryOperator],["+",g.AdditiveBinaryOperator],["-",g.AdditiveBinaryOperator],["*",g.MultiplicativeBinaryOperator],["/",g.MultiplicativeBinaryOperator],["%",g.MultiplicativeBinaryOperator],["=",g.Equals]],T=new Map([["n",` +`],["t"," "],["r","\r"],["b","\b"],["f","\f"],["v","\v"],["'","'"],['"','"'],["\\","\\"]]);function b(O,le={}){return O.endsWith(` +`)&&(O=O.slice(0,-1)),O=O.replace(/{#.*?#}/gs,"{##}"),le.lstrip_blocks&&(O=O.replace(/^[ \t]*({[#%])/gm,"$1")),le.trim_blocks&&(O=O.replace(/([#%]})\n/g,"$1")),O.replace(/{##}/g,"").replace(/-%}\s*/g,"%}").replace(/\s*{%-/g,"{%").replace(/-}}\s*/g,"}}").replace(/\s*{{-/g,"{{")}function x(O,le={}){const Q=[],we=b(O,le);let Se=0;const We=qe=>{let tt="";for(;qe(we[Se]);){if(we[Se]==="\\"){if(++Se,Se>=we.length)throw new SyntaxError("Unexpected end of input");const st=we[Se++],ft=T.get(st);if(ft===void 0)throw new SyntaxError(`Unexpected escaped character: ${st}`);tt+=ft;continue}if(tt+=we[Se++],Se>=we.length)throw new SyntaxError("Unexpected end of input")}return tt};e:for(;Se0){Q.push(new N(st,g.Text));continue}}We(st=>/\s/.test(st));const tt=we[Se];if(tt==="-"||tt==="+"){const st=Q.at(-1)?.type;if(st===g.Text||st===void 0)throw new SyntaxError(`Unexpected character: ${tt}`);switch(st){case g.Identifier:case g.NumericLiteral:case g.BooleanLiteral:case g.NullLiteral:case g.StringLiteral:case g.CloseParen:case g.CloseSquareBracket:break;default:{++Se;const ft=We(j);Q.push(new N(`${tt}${ft}`,ft.length>0?g.NumericLiteral:g.UnaryOperator));continue}}}for(const[st,ft]of y)if(we.slice(Se,Se+st.length)===st){Q.push(new N(st,ft)),Se+=st.length;continue e}if(tt==="'"||tt==='"'){++Se;const st=We(ft=>ft!==tt);Q.push(new N(st,g.StringLiteral)),++Se;continue}if(j(tt)){const st=We(j);Q.push(new N(st,g.NumericLiteral));continue}if(Z(tt)){const st=We(Z),ft=Object.hasOwn($,st)?$[st]:g.Identifier;ft===g.In&&Q.at(-1)?.type===g.Not?(Q.pop(),Q.push(new N("not in",g.NotIn))):Q.push(new N(st,ft));continue}throw new SyntaxError(`Unexpected character: ${tt}`)}return Q}var v=class{type="Statement"},L=class extends v{constructor(O){super(),this.body=O}type="Program"},K=class extends v{constructor(O,le,Q){super(),this.test=O,this.body=le,this.alternate=Q}type="If"},se=class extends v{constructor(O,le,Q,we){super(),this.loopvar=O,this.iterable=le,this.body=Q,this.defaultBlock=we}type="For"},oe=class extends v{constructor(O,le){super(),this.assignee=O,this.value=le}type="Set"},V=class extends v{constructor(O,le,Q){super(),this.name=O,this.args=le,this.body=Q}type="Macro"},U=class extends v{type="Expression"},H=class extends U{constructor(O,le,Q){super(),this.object=O,this.property=le,this.computed=Q}type="MemberExpression"},I=class extends U{constructor(O,le){super(),this.callee=O,this.args=le}type="CallExpression"},S=class extends U{constructor(O){super(),this.value=O}type="Identifier"},w=class extends U{constructor(O){super(),this.value=O}type="Literal"},P=class extends w{type="NumericLiteral"},F=class extends w{type="StringLiteral"},ae=class extends w{type="BooleanLiteral"},ie=class extends w{type="NullLiteral"},ye=class extends w{type="ArrayLiteral"},ge=class extends w{type="TupleLiteral"},re=class extends w{type="ObjectLiteral"},Me=class extends U{constructor(O,le,Q){super(),this.operator=O,this.left=le,this.right=Q}type="BinaryExpression"},pe=class extends U{constructor(O,le){super(),this.operand=O,this.filter=le}type="FilterExpression"},Ce=class extends U{constructor(O,le){super(),this.iterable=O,this.test=le}type="SelectExpression"},Ae=class extends U{constructor(O,le,Q){super(),this.operand=O,this.negate=le,this.test=Q}type="TestExpression"},Pe=class extends U{constructor(O,le){super(),this.operator=O,this.argument=le}type="UnaryExpression"},Je=class extends U{constructor(O=void 0,le=void 0,Q=void 0){super(),this.start=O,this.stop=le,this.step=Q}type="SliceExpression"},je=class extends U{constructor(O,le){super(),this.key=O,this.value=le}type="KeywordArgumentExpression"};function _e(O){const le=new L([]);let Q=0;function we(it,vt){const Ft=O[Q++];if(!Ft||Ft.type!==it)throw new Error(`Parser Error: ${vt}. ${Ft.type} !== ${it}.`);return Ft}function Se(){switch(O[Q].type){case g.Text:return tt();case g.OpenStatement:return st();case g.OpenExpression:return ft();default:throw new SyntaxError(`Unexpected token type: ${O[Q].type}`)}}function We(...it){return Q+it.length<=O.length&&it.some((vt,Ft)=>vt!==O[Q+Ft].type)}function qe(...it){return Q+it.length<=O.length&&it.every((vt,Ft)=>vt===O[Q+Ft].type)}function tt(){return new F(we(g.Text,"Expected text token").value)}function st(){we(g.OpenStatement,"Expected opening statement token");let it;switch(O[Q].type){case g.Set:++Q,it=Nt(),we(g.CloseStatement,"Expected closing statement token");break;case g.If:++Q,it=ss(),we(g.OpenStatement,"Expected {% token"),we(g.EndIf,"Expected endif token"),we(g.CloseStatement,"Expected %} token");break;case g.Macro:++Q,it=Ts(),we(g.OpenStatement,"Expected {% token"),we(g.EndMacro,"Expected endmacro token"),we(g.CloseStatement,"Expected %} token");break;case g.For:++Q,it=Ps(),we(g.OpenStatement,"Expected {% token"),we(g.EndFor,"Expected endfor token"),we(g.CloseStatement,"Expected %} token");break;default:throw new SyntaxError(`Unknown statement type: ${O[Q].type}`)}return it}function ft(){we(g.OpenExpression,"Expected opening expression token");const it=As();return we(g.CloseExpression,"Expected closing expression token"),it}function Nt(){const it=As();if(qe(g.Equals)){++Q;const vt=Nt();return new oe(it,vt)}return it}function ss(){const it=As();we(g.CloseStatement,"Expected closing statement token");const vt=[],Ft=[];for(;!(O[Q]?.type===g.OpenStatement&&(O[Q+1]?.type===g.ElseIf||O[Q+1]?.type===g.Else||O[Q+1]?.type===g.EndIf));)vt.push(Se());if(O[Q]?.type===g.OpenStatement&&O[Q+1]?.type!==g.EndIf)if(++Q,qe(g.ElseIf))we(g.ElseIf,"Expected elseif token"),Ft.push(ss());else for(we(g.Else,"Expected else token"),we(g.CloseStatement,"Expected closing statement token");!(O[Q]?.type===g.OpenStatement&&O[Q+1]?.type===g.EndIf);)Ft.push(Se());return new K(it,vt,Ft)}function Ts(){const it=or();if(it.type!=="Identifier")throw new SyntaxError("Expected identifier following macro statement");const vt=Er();we(g.CloseStatement,"Expected closing statement token");const Ft=[];for(;We(g.OpenStatement,g.EndMacro);)Ft.push(Se());return new V(it,vt,Ft)}function ms(it=!1){const vt=it?or:As,Ft=[vt()],Ys=qe(g.Comma);for(;Ys&&(++Q,Ft.push(vt()),!!qe(g.Comma)););return Ys?new ge(Ft):Ft[0]}function Ps(){const it=ms(!0);if(!(it instanceof S||it instanceof ge))throw new SyntaxError(`Expected identifier/tuple for the loop variable, got ${it.type} instead`);we(g.In,"Expected `in` keyword following loop variable");const vt=As();we(g.CloseStatement,"Expected closing statement token");const Ft=[];for(;We(g.OpenStatement,g.EndFor)&&We(g.OpenStatement,g.Else);)Ft.push(Se());const Ys=[];if(qe(g.OpenStatement,g.Else))for(++Q,++Q,we(g.CloseStatement,"Expected closing statement token");We(g.OpenStatement,g.EndFor);)Ys.push(Se());return new se(it,vt,Ft,Ys)}function As(){return tr()}function tr(){const it=Tr();if(qe(g.If)){++Q;const vt=Tr();if(qe(g.Else)){++Q;const Ft=Tr();return new K(vt,[it],[Ft])}else return new Ce(it,vt)}return it}function Tr(){let it=Gr();for(;qe(g.Or);){const vt=O[Q];++Q;const Ft=Gr();it=new Me(vt,it,Ft)}return it}function Gr(){let it=Ns();for(;qe(g.And);){const vt=O[Q];++Q;const Ft=Ns();it=new Me(vt,it,Ft)}return it}function Ns(){let it;for(;qe(g.Not);){const vt=O[Q];++Q;const Ft=Ns();it=new Pe(vt,Ft)}return it??Mr()}function Mr(){let it=Lt();for(;qe(g.ComparisonBinaryOperator)||qe(g.In)||qe(g.NotIn);){const vt=O[Q];++Q;const Ft=Lt();it=new Me(vt,it,Ft)}return it}function Lt(){let it=Cr();for(;qe(g.AdditiveBinaryOperator);){const vt=O[Q];++Q;const Ft=Cr();it=new Me(vt,it,Ft)}return it}function Kr(){const it=qr();return qe(g.OpenParen)?Pr(it):it}function Pr(it){let vt=new I(it,Er());return qe(g.OpenParen)&&(vt=Pr(vt)),vt}function Er(){we(g.OpenParen,"Expected opening parenthesis for arguments list");const it=Hr();return we(g.CloseParen,"Expected closing parenthesis for arguments list"),it}function Hr(){const it=[];for(;!qe(g.CloseParen);){let vt=As();if(qe(g.Equals)){if(++Q,!(vt instanceof S))throw new SyntaxError("Expected identifier for keyword argument");const Ft=As();vt=new je(vt,Ft)}it.push(vt),qe(g.Comma)&&++Q}return it}function dr(){const it=[];let vt=!1;for(;!qe(g.CloseSquareBracket);)qe(g.Colon)?(it.push(void 0),++Q,vt=!0):(it.push(As()),qe(g.Colon)&&(++Q,vt=!0));if(it.length===0)throw new SyntaxError("Expected at least one argument for member/slice expression");if(vt){if(it.length>3)throw new SyntaxError("Expected 0-3 arguments for slice expression");return new Je(...it)}return it[0]}function qr(){let it=or();for(;qe(g.Dot)||qe(g.OpenSquareBracket);){const vt=O[Q];++Q;let Ft;const Ys=vt.type!==g.Dot;if(Ys)Ft=dr(),we(g.CloseSquareBracket,"Expected closing square bracket");else if(Ft=or(),Ft.type!=="Identifier")throw new SyntaxError("Expected identifier following dot operator");it=new H(it,Ft,Ys)}return it}function Cr(){let it=Dr();for(;qe(g.MultiplicativeBinaryOperator);){const vt=O[Q];++Q;const Ft=Dr();it=new Me(vt,it,Ft)}return it}function Dr(){let it=Lr();for(;qe(g.Is);){++Q;const vt=qe(g.Not);vt&&++Q;let Ft=or();if(Ft instanceof ae?Ft=new S(Ft.value.toString()):Ft instanceof ie&&(Ft=new S("none")),!(Ft instanceof S))throw new SyntaxError("Expected identifier for the test");it=new Ae(it,vt,Ft)}return it}function Lr(){let it=Kr();for(;qe(g.Pipe);){++Q;let vt=or();if(!(vt instanceof S))throw new SyntaxError("Expected identifier for the filter");qe(g.OpenParen)&&(vt=Pr(vt)),it=new pe(it,vt)}return it}function or(){const it=O[Q];switch(it.type){case g.NumericLiteral:return++Q,new P(Number(it.value));case g.StringLiteral:return++Q,new F(it.value);case g.BooleanLiteral:return++Q,new ae(it.value.toLowerCase()==="true");case g.NullLiteral:return++Q,new ie(null);case g.Identifier:return++Q,new S(it.value);case g.OpenParen:{++Q;const vt=ms();if(O[Q].type!==g.CloseParen)throw new SyntaxError(`Expected closing parenthesis, got ${O[Q].type} instead`);return++Q,vt}case g.OpenSquareBracket:{++Q;const vt=[];for(;!qe(g.CloseSquareBracket);)vt.push(As()),qe(g.Comma)&&++Q;return++Q,new ye(vt)}case g.OpenCurlyBracket:{++Q;const vt=new Map;for(;!qe(g.CloseCurlyBracket);){const Ft=As();we(g.Colon,"Expected colon between key and value in object literal");const Ys=As();vt.set(Ft,Ys),qe(g.Comma)&&++Q}return++Q,new re(vt)}default:throw new SyntaxError(`Unexpected token: ${it.type}`)}}for(;Q=0?(le=(le??=0)<0?Math.max(O.length+le,0):Math.min(le,O.length),Q=(Q??=O.length)<0?Math.max(O.length+Q,0):Math.min(Q,O.length)):(le=(le??=O.length-1)<0?Math.max(O.length+le,-1):Math.min(le,O.length-1),Q=(Q??=-1)<-1?Math.max(O.length+Q,-1):Math.min(Q,O.length-1));const We=[];for(let qe=le;Se*qele.toUpperCase())}var Oe=class{type="RuntimeValue";value;builtins=new Map;constructor(O=void 0){this.value=O}__bool__(){return new Ve(!!this.value)}},Xe=class extends Oe{type="NumericValue"},ee=class extends Oe{type="StringValue";builtins=new Map([["upper",new Ne(()=>new ee(this.value.toUpperCase()))],["lower",new Ne(()=>new ee(this.value.toLowerCase()))],["strip",new Ne(()=>new ee(this.value.trim()))],["title",new Ne(()=>new ee(Ee(this.value)))],["length",new Xe(this.value.length)],["rstrip",new Ne(()=>new ee(this.value.trimEnd()))],["lstrip",new Ne(()=>new ee(this.value.trimStart()))]])},Ve=class extends Oe{type="BooleanValue"},Re=class extends Oe{type="ObjectValue";__bool__(){return new Ve(this.value.size>0)}builtins=new Map([["get",new Ne(([O,le])=>{if(!(O instanceof ee))throw new Error(`Object key must be a string: got ${O.type}`);return this.value.get(O.value)??le??new Ue})],["items",new Ne(()=>new ve(Array.from(this.value.entries()).map(([O,le])=>new ve([new ee(O),le]))))]])},te=class extends Re{type="KeywordArgumentsValue"},ve=class extends Oe{type="ArrayValue";builtins=new Map([["length",new Xe(this.value.length)]]);__bool__(){return new Ve(this.value.length>0)}},Ke=class extends ve{type="TupleValue"},Ne=class extends Oe{type="FunctionValue"},Ue=class extends Oe{type="NullValue"},ze=class extends Oe{type="UndefinedValue"},Ze=class{constructor(O){this.parent=O}variables=new Map([["namespace",new Ne(O=>{if(O.length===0)return new Re(new Map);if(O.length!==1||!(O[0]instanceof Re))throw new Error("`namespace` expects either zero arguments or a single object argument");return O[0]})]]);tests=new Map([["boolean",O=>O.type==="BooleanValue"],["callable",O=>O instanceof Ne],["odd",O=>{if(O.type!=="NumericValue")throw new Error(`Cannot apply test "odd" to type: ${O.type}`);return O.value%2!==0}],["even",O=>{if(O.type!=="NumericValue")throw new Error(`Cannot apply test "even" to type: ${O.type}`);return O.value%2===0}],["false",O=>O.type==="BooleanValue"&&!O.value],["true",O=>O.type==="BooleanValue"&&O.value],["none",O=>O.type==="NullValue"],["string",O=>O.type==="StringValue"],["number",O=>O.type==="NumericValue"],["integer",O=>O.type==="NumericValue"&&Number.isInteger(O.value)],["iterable",O=>O.type==="ArrayValue"||O.type==="StringValue"],["mapping",O=>O.type==="ObjectValue"],["lower",O=>{const le=O.value;return O.type==="StringValue"&&le===le.toLowerCase()}],["upper",O=>{const le=O.value;return O.type==="StringValue"&&le===le.toUpperCase()}],["none",O=>O.type==="NullValue"],["defined",O=>O.type!=="UndefinedValue"],["undefined",O=>O.type==="UndefinedValue"],["equalto",(O,le)=>O.value===le.value],["eq",(O,le)=>O.value===le.value]]);set(O,le){return this.declareVariable(O,mt(le))}declareVariable(O,le){if(this.variables.has(O))throw new SyntaxError(`Variable already declared: ${O}`);return this.variables.set(O,le),le}setVariable(O,le){return this.variables.set(O,le),le}resolve(O){if(this.variables.has(O))return this;if(this.parent)return this.parent.resolve(O);throw new Error(`Unknown variable: ${O}`)}lookupVariable(O){try{return this.resolve(O).variables.get(O)??new ze}catch{return new ze}}},at=class{global;constructor(O){this.global=O??new Ze}run(O){return this.evaluate(O,this.global)}evaluateBinaryExpression(O,le){const Q=this.evaluate(O.left,le);switch(O.operator.value){case"and":return Q.__bool__().value?this.evaluate(O.right,le):Q;case"or":return Q.__bool__().value?Q:this.evaluate(O.right,le)}const we=this.evaluate(O.right,le);switch(O.operator.value){case"==":return new Ve(Q.value==we.value);case"!=":return new Ve(Q.value!=we.value)}if(Q instanceof ze||we instanceof ze)throw new Error("Cannot perform operation on undefined values");if(Q instanceof Ue||we instanceof Ue)throw new Error("Cannot perform operation on null values");if(Q instanceof Xe&&we instanceof Xe)switch(O.operator.value){case"+":return new Xe(Q.value+we.value);case"-":return new Xe(Q.value-we.value);case"*":return new Xe(Q.value*we.value);case"/":return new Xe(Q.value/we.value);case"%":return new Xe(Q.value%we.value);case"<":return new Ve(Q.value":return new Ve(Q.value>we.value);case">=":return new Ve(Q.value>=we.value);case"<=":return new Ve(Q.value<=we.value)}else if(Q instanceof ve&&we instanceof ve)switch(O.operator.value){case"+":return new ve(Q.value.concat(we.value))}else if(we instanceof ve){const Se=we.value.find(We=>We.value===Q.value)!==void 0;switch(O.operator.value){case"in":return new Ve(Se);case"not in":return new Ve(!Se)}}if(Q instanceof ee||we instanceof ee)switch(O.operator.value){case"+":return new ee(Q.value.toString()+we.value.toString())}if(Q instanceof ee&&we instanceof ee)switch(O.operator.value){case"in":return new Ve(we.value.includes(Q.value));case"not in":return new Ve(!we.value.includes(Q.value))}if(Q instanceof ee&&we instanceof Re)switch(O.operator.value){case"in":return new Ve(we.value.has(Q.value));case"not in":return new Ve(!we.value.has(Q.value))}throw new SyntaxError(`Unknown operator "${O.operator.value}" between ${Q.type} and ${we.type}`)}evaluateArguments(O,le){const Q=[],we=new Map;for(const Se of O)if(Se.type==="KeywordArgumentExpression"){const We=Se;we.set(We.key.value,this.evaluate(We.value,le))}else{if(we.size>0)throw new Error("Positional arguments must come before keyword arguments");Q.push(this.evaluate(Se,le))}return[Q,we]}evaluateFilterExpression(O,le){const Q=this.evaluate(O.operand,le);if(O.filter.type==="Identifier"){const we=O.filter;if(we.value==="tojson")return new ee(lt(Q));if(Q instanceof ve)switch(we.value){case"list":return Q;case"first":return Q.value[0];case"last":return Q.value[Q.value.length-1];case"length":return new Xe(Q.value.length);case"reverse":return new ve(Q.value.reverse());case"sort":return new ve(Q.value.sort((Se,We)=>{if(Se.type!==We.type)throw new Error(`Cannot compare different types: ${Se.type} and ${We.type}`);switch(Se.type){case"NumericValue":return Se.value-We.value;case"StringValue":return Se.value.localeCompare(We.value);default:throw new Error(`Cannot compare type: ${Se.type}`)}}));default:throw new Error(`Unknown ArrayValue filter: ${we.value}`)}else if(Q instanceof ee)switch(we.value){case"length":return new Xe(Q.value.length);case"upper":return new ee(Q.value.toUpperCase());case"lower":return new ee(Q.value.toLowerCase());case"title":return new ee(Ee(Q.value));case"capitalize":return new ee(Q.value.charAt(0).toUpperCase()+Q.value.slice(1));case"trim":return new ee(Q.value.trim());case"indent":return new ee(Q.value.split(` +`).map((Se,We)=>We===0||Se.length===0?Se:" "+Se).join(` +`));case"string":return Q;default:throw new Error(`Unknown StringValue filter: ${we.value}`)}else if(Q instanceof Xe)switch(we.value){case"abs":return new Xe(Math.abs(Q.value));default:throw new Error(`Unknown NumericValue filter: ${we.value}`)}else if(Q instanceof Re)switch(we.value){case"items":return new ve(Array.from(Q.value.entries()).map(([Se,We])=>new ve([new ee(Se),We])));case"length":return new Xe(Q.value.size);default:throw new Error(`Unknown ObjectValue filter: ${we.value}`)}throw new Error(`Cannot apply filter "${we.value}" to type: ${Q.type}`)}else if(O.filter.type==="CallExpression"){const we=O.filter;if(we.callee.type!=="Identifier")throw new Error(`Unknown filter: ${we.callee.type}`);const Se=we.callee.value;if(Se==="tojson"){const[,We]=this.evaluateArguments(we.args,le),qe=We.get("indent")??new Ue;if(!(qe instanceof Xe||qe instanceof Ue))throw new Error("If set, indent must be a number");return new ee(lt(Q,qe.value))}if(Q instanceof ve){switch(Se){case"selectattr":case"rejectattr":{const We=Se==="selectattr";if(Q.value.some(ss=>!(ss instanceof Re)))throw new Error(`\`${Se}\` can only be applied to array of objects`);if(we.args.some(ss=>ss.type!=="StringLiteral"))throw new Error(`arguments of \`${Se}\` must be strings`);const[qe,tt,st]=we.args.map(ss=>this.evaluate(ss,le));let ft;if(tt){const ss=le.tests.get(tt.value);if(!ss)throw new Error(`Unknown test: ${tt.value}`);ft=ss}else ft=(...ss)=>ss[0].__bool__().value;const Nt=Q.value.filter(ss=>{const Ts=ss.value.get(qe.value),ms=Ts?ft(Ts,st):!1;return We?ms:!ms});return new ve(Nt)}case"map":{const[,We]=this.evaluateArguments(we.args,le);if(We.has("attribute")){const qe=We.get("attribute");if(!(qe instanceof ee))throw new Error("attribute must be a string");const tt=We.get("default"),st=Q.value.map(ft=>{if(!(ft instanceof Re))throw new Error("items in map must be an object");return ft.value.get(qe.value)??tt??new ze});return new ve(st)}else throw new Error("`map` expressions without `attribute` set are not currently supported.")}}throw new Error(`Unknown ArrayValue filter: ${Se}`)}else if(Q instanceof ee){switch(Se){case"indent":{const[We,qe]=this.evaluateArguments(we.args,le),tt=We.at(0)??qe.get("width")??new Xe(4);if(!(tt instanceof Xe))throw new Error("width must be a number");const st=We.at(1)??qe.get("first")??new Ve(!1),ft=We.at(2)??qe.get("blank")??new Ve(!1),Nt=Q.value.split(` +`),ss=" ".repeat(tt.value),Ts=Nt.map((ms,Ps)=>!st.value&&Ps===0||!ft.value&&ms.length===0?ms:ss+ms);return new ee(Ts.join(` +`))}}throw new Error(`Unknown StringValue filter: ${Se}`)}else throw new Error(`Cannot apply filter "${Se}" to type: ${Q.type}`)}throw new Error(`Unknown filter: ${O.filter.type}`)}evaluateTestExpression(O,le){const Q=this.evaluate(O.operand,le),we=le.tests.get(O.test.value);if(!we)throw new Error(`Unknown test: ${O.test.value}`);const Se=we(Q);return new Ve(O.negate?!Se:Se)}evaluateUnaryExpression(O,le){const Q=this.evaluate(O.argument,le);switch(O.operator.value){case"not":return new Ve(!Q.value);default:throw new SyntaxError(`Unknown operator: ${O.operator.value}`)}}evalProgram(O,le){return this.evaluateBlock(O.body,le)}evaluateBlock(O,le){let Q="";for(const we of O){const Se=this.evaluate(we,le);Se.type!=="NullValue"&&Se.type!=="UndefinedValue"&&(Q+=Se.value)}return new ee(Q)}evaluateIdentifier(O,le){return le.lookupVariable(O.value)}evaluateCallExpression(O,le){const[Q,we]=this.evaluateArguments(O.args,le);we.size>0&&Q.push(new te(we));const Se=this.evaluate(O.callee,le);if(Se.type!=="FunctionValue")throw new Error(`Cannot call something that is not a function: got ${Se.type}`);return Se.value(Q,le)}evaluateSliceExpression(O,le,Q){if(!(O instanceof ve||O instanceof ee))throw new Error("Slice object must be an array or string");const we=this.evaluate(le.start,Q),Se=this.evaluate(le.stop,Q),We=this.evaluate(le.step,Q);if(!(we instanceof Xe||we instanceof ze))throw new Error("Slice start must be numeric or undefined");if(!(Se instanceof Xe||Se instanceof ze))throw new Error("Slice stop must be numeric or undefined");if(!(We instanceof Xe||We instanceof ze))throw new Error("Slice step must be numeric or undefined");return O instanceof ve?new ve(de(O.value,we.value,Se.value,We.value)):new ee(de(Array.from(O.value),we.value,Se.value,We.value).join(""))}evaluateMemberExpression(O,le){const Q=this.evaluate(O.object,le);let we;if(O.computed){if(O.property.type==="SliceExpression")return this.evaluateSliceExpression(Q,O.property,le);we=this.evaluate(O.property,le)}else we=new ee(O.property.value);let Se;if(Q instanceof Re){if(!(we instanceof ee))throw new Error(`Cannot access property with non-string: got ${we.type}`);Se=Q.value.get(we.value)??Q.builtins.get(we.value)}else if(Q instanceof ve||Q instanceof ee)if(we instanceof Xe)Se=Q.value.at(we.value),Q instanceof ee&&(Se=new ee(Q.value.at(we.value)));else if(we instanceof ee)Se=Q.builtins.get(we.value);else throw new Error(`Cannot access property with non-string/non-number: got ${we.type}`);else{if(!(we instanceof ee))throw new Error(`Cannot access property with non-string: got ${we.type}`);Se=Q.builtins.get(we.value)}return Se instanceof Oe?Se:new ze}evaluateSet(O,le){const Q=this.evaluate(O.value,le);if(O.assignee.type==="Identifier"){const we=O.assignee.value;le.setVariable(we,Q)}else if(O.assignee.type==="MemberExpression"){const we=O.assignee,Se=this.evaluate(we.object,le);if(!(Se instanceof Re))throw new Error("Cannot assign to member of non-object");if(we.property.type!=="Identifier")throw new Error("Cannot assign to member with non-identifier property");Se.value.set(we.property.value,Q)}else throw new Error(`Invalid LHS inside assignment expression: ${JSON.stringify(O.assignee)}`);return new Ue}evaluateIf(O,le){const Q=this.evaluate(O.test,le);return this.evaluateBlock(Q.__bool__().value?O.body:O.alternate,le)}evaluateFor(O,le){const Q=new Ze(le);let we,Se;if(O.iterable.type==="SelectExpression"){const ft=O.iterable;Se=this.evaluate(ft.iterable,Q),we=ft.test}else Se=this.evaluate(O.iterable,Q);if(!(Se instanceof ve))throw new Error(`Expected iterable type in for loop: got ${Se.type}`);const We=[],qe=[];for(let ft=0;ftms.setVariable(O.loopvar.value,ss);else if(O.loopvar.type==="TupleLiteral"){const ms=O.loopvar;if(ss.type!=="ArrayValue")throw new Error(`Cannot unpack non-iterable type: ${ss.type}`);const Ps=ss;if(ms.value.length!==Ps.value.length)throw new Error(`Too ${ms.value.length>Ps.value.length?"few":"many"} items to unpack`);Ts=As=>{for(let tr=0;tr0?We[ft-1]:new ze],["nextitem",ft{const Se=new Ze(we);Q=Q.slice();let We;Q.at(-1)?.type==="KeywordArgumentsValue"&&(We=Q.pop());for(let qe=0;qethis.evaluate(Q,le)));case"TupleLiteral":return new Ke(O.value.map(Q=>this.evaluate(Q,le)));case"ObjectLiteral":{const Q=new Map;for(const[we,Se]of O.value){const We=this.evaluate(we,le);if(!(We instanceof ee))throw new Error(`Object keys must be strings: got ${We.type}`);Q.set(We.value,this.evaluate(Se,le))}return new Re(Q)}case"Identifier":return this.evaluateIdentifier(O,le);case"CallExpression":return this.evaluateCallExpression(O,le);case"MemberExpression":return this.evaluateMemberExpression(O,le);case"UnaryExpression":return this.evaluateUnaryExpression(O,le);case"BinaryExpression":return this.evaluateBinaryExpression(O,le);case"FilterExpression":return this.evaluateFilterExpression(O,le);case"TestExpression":return this.evaluateTestExpression(O,le);default:throw new SyntaxError(`Unknown node type: ${O.type}`)}}};function mt(O){switch(typeof O){case"number":return new Xe(O);case"string":return new ee(O);case"boolean":return new Ve(O);case"undefined":return new ze;case"object":return O===null?new Ue:Array.isArray(O)?new ve(O.map(mt)):new Re(new Map(Object.entries(O).map(([le,Q])=>[le,mt(Q)])));case"function":return new Ne((le,Q)=>{const we=O(...le.map(Se=>Se.value))??null;return mt(we)});default:throw new Error(`Cannot convert to runtime value: ${O}`)}}function lt(O,le,Q){const we=Q??0;switch(O.type){case"NullValue":case"UndefinedValue":return"null";case"NumericValue":case"StringValue":case"BooleanValue":return JSON.stringify(O.value);case"ArrayValue":case"ObjectValue":{const Se=le?" ".repeat(le):"",We=` +`+Se.repeat(we),qe=We+Se;if(O.type==="ArrayValue"){const tt=O.value.map(st=>lt(st,le,we+1));return le?`[${qe}${tt.join(`,${qe}`)}${We}]`:`[${tt.join(", ")}]`}else{const tt=Array.from(O.value.entries()).map(([st,ft])=>{const Nt=`"${st}": ${lt(ft,le,we+1)}`;return le?`${qe}${Nt}`:Nt});return le?`{${tt.join(",")}${We}}`:`{${tt.join(", ")}}`}}default:throw new Error(`Cannot convert to JSON: ${O.type}`)}}var ct=class{parsed;constructor(O){const le=x(O,{lstrip_blocks:!0,trim_blocks:!0});this.parsed=_e(le)}render(O){const le=new Ze;le.set("false",!1),le.set("true",!0),le.set("raise_exception",Se=>{throw new Error(Se)}),le.set("range",X);for(const[Se,We]of Object.entries(O))le.set(Se,We);return new at(le).run(this.parsed).value}}},"./node_modules/onnxruntime-common/dist/esm/backend-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{registerBackend:()=>N,resolveBackendAndExecutionProviders:()=>j});const g=new Map,$=[],N=(y,T,b)=>{if(T&&typeof T.init=="function"&&typeof T.createInferenceSessionHandler=="function"){const x=g.get(y);if(x===void 0)g.set(y,{backend:T,priority:b});else{if(x.priority>b)return;if(x.priority===b&&x.backend!==T)throw new Error(`cannot register backend "${y}" using priority ${b}`)}if(b>=0){const v=$.indexOf(y);v!==-1&&$.splice(v,1);for(let L=0;L<$.length;L++)if(g.get($[L]).priority<=b){$.splice(L,0,y);return}$.push(y)}return}throw new TypeError("not a valid backend")},Z=async y=>{const T=g.get(y);if(!T)return"backend not found.";if(T.initialized)return T.backend;if(T.aborted)return T.error;{const b=!!T.initPromise;try{return b||(T.initPromise=T.backend.init(y)),await T.initPromise,T.initialized=!0,T.backend}catch(x){return b||(T.error=`${x}`,T.aborted=!0),T.error}finally{delete T.initPromise}}},j=async y=>{const T=y.executionProviders||[],b=T.map(oe=>typeof oe=="string"?oe:oe.name),x=b.length===0?$:b;let v;const L=[],K=new Set;for(const oe of x){const V=await Z(oe);typeof V=="string"?L.push({name:oe,err:V}):(v||(v=V),v===V&&K.add(oe))}if(!v)throw new Error(`no available backend found. ERR: ${L.map(oe=>`[${oe.name}] ${oe.err}`).join(", ")}`);for(const{name:oe,err:V}of L)b.includes(oe)&&console.warn(`removing requested execution provider "${oe}" from session options because it is not available: ${V}`);const se=T.filter(oe=>K.has(typeof oe=="string"?oe:oe.name));return[v,new Proxy(y,{get:(oe,V)=>V==="executionProviders"?se:Reflect.get(oe,V)})]}},"./node_modules/onnxruntime-common/dist/esm/backend.js":(ke,A,r)=>{r.r(A),r.d(A,{registerBackend:()=>g.registerBackend});var g=r("./node_modules/onnxruntime-common/dist/esm/backend-impl.js")},"./node_modules/onnxruntime-common/dist/esm/env-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{env:()=>N});var g=r("./node_modules/onnxruntime-common/dist/esm/version.js");let $="warning";const N={wasm:{},webgl:{},webgpu:{},versions:{common:g.version},set logLevel(Z){if(Z!==void 0){if(typeof Z!="string"||["verbose","info","warning","error","fatal"].indexOf(Z)===-1)throw new Error(`Unsupported logging level: ${Z}`);$=Z}},get logLevel(){return $}};Object.defineProperty(N,"logLevel",{enumerable:!0})},"./node_modules/onnxruntime-common/dist/esm/env.js":(ke,A,r)=>{r.r(A),r.d(A,{env:()=>$});var g=r("./node_modules/onnxruntime-common/dist/esm/env-impl.js");const $=g.env},"./node_modules/onnxruntime-common/dist/esm/index.js":(ke,A,r)=>{r.r(A),r.d(A,{InferenceSession:()=>N.InferenceSession,TRACE:()=>j.TRACE,TRACE_FUNC_BEGIN:()=>j.TRACE_FUNC_BEGIN,TRACE_FUNC_END:()=>j.TRACE_FUNC_END,Tensor:()=>Z.Tensor,TrainingSession:()=>y.TrainingSession,env:()=>$.env,registerBackend:()=>g.registerBackend});var g=r("./node_modules/onnxruntime-common/dist/esm/backend.js"),$=r("./node_modules/onnxruntime-common/dist/esm/env.js"),N=r("./node_modules/onnxruntime-common/dist/esm/inference-session.js"),Z=r("./node_modules/onnxruntime-common/dist/esm/tensor.js");r("./node_modules/onnxruntime-common/dist/esm/tensor-conversion.js"),r("./node_modules/onnxruntime-common/dist/esm/tensor-factory.js");var j=r("./node_modules/onnxruntime-common/dist/esm/trace.js");r("./node_modules/onnxruntime-common/dist/esm/onnx-model.js"),r("./node_modules/onnxruntime-common/dist/esm/onnx-value.js");var y=r("./node_modules/onnxruntime-common/dist/esm/training-session.js")},"./node_modules/onnxruntime-common/dist/esm/inference-session-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{InferenceSession:()=>Z});var g=r("./node_modules/onnxruntime-common/dist/esm/backend-impl.js"),$=r("./node_modules/onnxruntime-common/dist/esm/tensor.js"),N=r("./node_modules/onnxruntime-common/dist/esm/trace.js");class Z{constructor(y){this.handler=y}async run(y,T,b){(0,N.TRACE_FUNC_BEGIN)();const x={};let v={};if(typeof y!="object"||y===null||y instanceof $.Tensor||Array.isArray(y))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let L=!0;if(typeof T=="object"){if(T===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(T instanceof $.Tensor)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(T)){if(T.length===0)throw new TypeError("'fetches' cannot be an empty array.");L=!1;for(const oe of T){if(typeof oe!="string")throw new TypeError("'fetches' must be a string array or an object.");if(this.outputNames.indexOf(oe)===-1)throw new RangeError(`'fetches' contains invalid output name: ${oe}.`);x[oe]=null}if(typeof b=="object"&&b!==null)v=b;else if(typeof b<"u")throw new TypeError("'options' must be an object.")}else{let oe=!1;const V=Object.getOwnPropertyNames(T);for(const U of this.outputNames)if(V.indexOf(U)!==-1){const H=T[U];(H===null||H instanceof $.Tensor)&&(oe=!0,L=!1,x[U]=H)}if(oe){if(typeof b=="object"&&b!==null)v=b;else if(typeof b<"u")throw new TypeError("'options' must be an object.")}else v=T}}else if(typeof T<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(const oe of this.inputNames)if(typeof y[oe]>"u")throw new Error(`input '${oe}' is missing in 'feeds'.`);if(L)for(const oe of this.outputNames)x[oe]=null;const K=await this.handler.run(y,x,v),se={};for(const oe in K)if(Object.hasOwnProperty.call(K,oe)){const V=K[oe];V instanceof $.Tensor?se[oe]=V:se[oe]=new $.Tensor(V.type,V.data,V.dims)}return(0,N.TRACE_FUNC_END)(),se}async release(){return this.handler.dispose()}static async create(y,T,b,x){(0,N.TRACE_FUNC_BEGIN)();let v,L={};if(typeof y=="string"){if(v=y,typeof T=="object"&&T!==null)L=T;else if(typeof T<"u")throw new TypeError("'options' must be an object.")}else if(y instanceof Uint8Array){if(v=y,typeof T=="object"&&T!==null)L=T;else if(typeof T<"u")throw new TypeError("'options' must be an object.")}else if(y instanceof ArrayBuffer||typeof SharedArrayBuffer<"u"&&y instanceof SharedArrayBuffer){const V=y;let U=0,H=y.byteLength;if(typeof T=="object"&&T!==null)L=T;else if(typeof T=="number"){if(U=T,!Number.isSafeInteger(U))throw new RangeError("'byteOffset' must be an integer.");if(U<0||U>=V.byteLength)throw new RangeError(`'byteOffset' is out of range [0, ${V.byteLength}).`);if(H=y.byteLength-U,typeof b=="number"){if(H=b,!Number.isSafeInteger(H))throw new RangeError("'byteLength' must be an integer.");if(H<=0||U+H>V.byteLength)throw new RangeError(`'byteLength' is out of range (0, ${V.byteLength-U}].`);if(typeof x=="object"&&x!==null)L=x;else if(typeof x<"u")throw new TypeError("'options' must be an object.")}else if(typeof b<"u")throw new TypeError("'byteLength' must be a number.")}else if(typeof T<"u")throw new TypeError("'options' must be an object.");v=new Uint8Array(V,U,H)}else throw new TypeError("Unexpected argument[0]: must be 'path' or 'buffer'.");const[K,se]=await(0,g.resolveBackendAndExecutionProviders)(L),oe=await K.createInferenceSessionHandler(v,se);return(0,N.TRACE_FUNC_END)(),new Z(oe)}startProfiling(){this.handler.startProfiling()}endProfiling(){this.handler.endProfiling()}get inputNames(){return this.handler.inputNames}get outputNames(){return this.handler.outputNames}}},"./node_modules/onnxruntime-common/dist/esm/inference-session.js":(ke,A,r)=>{r.r(A),r.d(A,{InferenceSession:()=>$});var g=r("./node_modules/onnxruntime-common/dist/esm/inference-session-impl.js");const $=g.InferenceSession},"./node_modules/onnxruntime-common/dist/esm/onnx-model.js":(ke,A,r)=>{r.r(A)},"./node_modules/onnxruntime-common/dist/esm/onnx-value.js":(ke,A,r)=>{r.r(A)},"./node_modules/onnxruntime-common/dist/esm/tensor-conversion-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{tensorToDataURL:()=>g,tensorToImageData:()=>$});const g=(N,Z)=>{const j=typeof document<"u"?document.createElement("canvas"):new OffscreenCanvas(1,1);j.width=N.dims[3],j.height=N.dims[2];const y=j.getContext("2d");if(y!=null){let T,b;Z?.tensorLayout!==void 0&&Z.tensorLayout==="NHWC"?(T=N.dims[2],b=N.dims[3]):(T=N.dims[3],b=N.dims[2]);const x=Z?.format!==void 0?Z.format:"RGB",v=Z?.norm;let L,K;v===void 0||v.mean===void 0?L=[255,255,255,255]:typeof v.mean=="number"?L=[v.mean,v.mean,v.mean,v.mean]:(L=[v.mean[0],v.mean[1],v.mean[2],0],v.mean[3]!==void 0&&(L[3]=v.mean[3])),v===void 0||v.bias===void 0?K=[0,0,0,0]:typeof v.bias=="number"?K=[v.bias,v.bias,v.bias,v.bias]:(K=[v.bias[0],v.bias[1],v.bias[2],0],v.bias[3]!==void 0&&(K[3]=v.bias[3]));const se=b*T;let oe=0,V=se,U=se*2,H=-1;x==="RGBA"?(oe=0,V=se,U=se*2,H=se*3):x==="RGB"?(oe=0,V=se,U=se*2):x==="RBG"&&(oe=0,U=se,V=se*2);for(let I=0;I{const j=typeof document<"u"?document.createElement("canvas").getContext("2d"):new OffscreenCanvas(1,1).getContext("2d");let y;if(j!=null){let T,b,x;Z?.tensorLayout!==void 0&&Z.tensorLayout==="NHWC"?(T=N.dims[2],b=N.dims[1],x=N.dims[3]):(T=N.dims[3],b=N.dims[2],x=N.dims[1]);const v=Z!==void 0&&Z.format!==void 0?Z.format:"RGB",L=Z?.norm;let K,se;L===void 0||L.mean===void 0?K=[255,255,255,255]:typeof L.mean=="number"?K=[L.mean,L.mean,L.mean,L.mean]:(K=[L.mean[0],L.mean[1],L.mean[2],255],L.mean[3]!==void 0&&(K[3]=L.mean[3])),L===void 0||L.bias===void 0?se=[0,0,0,0]:typeof L.bias=="number"?se=[L.bias,L.bias,L.bias,L.bias]:(se=[L.bias[0],L.bias[1],L.bias[2],0],L.bias[3]!==void 0&&(se[3]=L.bias[3]));const oe=b*T;if(Z!==void 0&&(Z.format!==void 0&&x===4&&Z.format!=="RGBA"||x===3&&Z.format!=="RGB"&&Z.format!=="BGR"))throw new Error("Tensor format doesn't match input tensor dims");const V=4;let U=0,H=1,I=2,S=3,w=0,P=oe,F=oe*2,ae=-1;v==="RGBA"?(w=0,P=oe,F=oe*2,ae=oe*3):v==="RGB"?(w=0,P=oe,F=oe*2):v==="RBG"&&(w=0,F=oe,P=oe*2),y=j.createImageData(T,b);for(let ie=0;ie{r.r(A)},"./node_modules/onnxruntime-common/dist/esm/tensor-factory-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{bufferToTensor:()=>$,tensorFromGpuBuffer:()=>j,tensorFromImage:()=>N,tensorFromMLTensor:()=>y,tensorFromPinnedBuffer:()=>T,tensorFromTexture:()=>Z});var g=r("./node_modules/onnxruntime-common/dist/esm/tensor-impl.js");const $=(b,x)=>{if(b===void 0)throw new Error("Image buffer must be defined");if(x.height===void 0||x.width===void 0)throw new Error("Image height and width must be defined");if(x.tensorLayout==="NHWC")throw new Error("NHWC Tensor layout is not supported yet");const{height:v,width:L}=x,K=x.norm??{mean:255,bias:0};let se,oe;typeof K.mean=="number"?se=[K.mean,K.mean,K.mean,K.mean]:se=[K.mean[0],K.mean[1],K.mean[2],K.mean[3]??255],typeof K.bias=="number"?oe=[K.bias,K.bias,K.bias,K.bias]:oe=[K.bias[0],K.bias[1],K.bias[2],K.bias[3]??0];const V=x.format!==void 0?x.format:"RGBA",U=x.tensorFormat!==void 0&&x.tensorFormat!==void 0?x.tensorFormat:"RGB",H=v*L,I=U==="RGBA"?new Float32Array(H*4):new Float32Array(H*3);let S=4,w=0,P=1,F=2,ae=3,ie=0,ye=H,ge=H*2,re=-1;V==="RGB"&&(S=3,w=0,P=1,F=2,ae=-1),U==="RGBA"?re=H*3:U==="RBG"?(ie=0,ge=H,ye=H*2):U==="BGR"&&(ge=0,ye=H,ie=H*2);for(let pe=0;pe{const v=typeof HTMLImageElement<"u"&&b instanceof HTMLImageElement,L=typeof ImageData<"u"&&b instanceof ImageData,K=typeof ImageBitmap<"u"&&b instanceof ImageBitmap,se=typeof b=="string";let oe,V=x??{};const U=()=>{if(typeof document<"u")return document.createElement("canvas");if(typeof OffscreenCanvas<"u")return new OffscreenCanvas(1,1);throw new Error("Canvas is not supported")},H=I=>typeof HTMLCanvasElement<"u"&&I instanceof HTMLCanvasElement||I instanceof OffscreenCanvas?I.getContext("2d"):null;if(v){const I=U();I.width=b.width,I.height=b.height;const S=H(I);if(S!=null){let w=b.height,P=b.width;if(x!==void 0&&x.resizedHeight!==void 0&&x.resizedWidth!==void 0&&(w=x.resizedHeight,P=x.resizedWidth),x!==void 0){if(V=x,x.tensorFormat!==void 0)throw new Error("Image input config format must be RGBA for HTMLImageElement");V.tensorFormat="RGBA",V.height=w,V.width=P}else V.tensorFormat="RGBA",V.height=w,V.width=P;S.drawImage(b,0,0),oe=S.getImageData(0,0,P,w).data}else throw new Error("Can not access image data")}else if(L){let I,S;if(x!==void 0&&x.resizedWidth!==void 0&&x.resizedHeight!==void 0?(I=x.resizedHeight,S=x.resizedWidth):(I=b.height,S=b.width),x!==void 0&&(V=x),V.format="RGBA",V.height=I,V.width=S,x!==void 0){const w=U();w.width=S,w.height=I;const P=H(w);if(P!=null)P.putImageData(b,0,0),oe=P.getImageData(0,0,S,I).data;else throw new Error("Can not access image data")}else oe=b.data}else if(K){if(x===void 0)throw new Error("Please provide image config with format for Imagebitmap");const I=U();I.width=b.width,I.height=b.height;const S=H(I);if(S!=null){const w=b.height,P=b.width;return S.drawImage(b,0,0,P,w),oe=S.getImageData(0,0,P,w).data,V.height=w,V.width=P,$(oe,V)}else throw new Error("Can not access image data")}else{if(se)return new Promise((I,S)=>{const w=U(),P=H(w);if(!b||!P)return S();const F=new Image;F.crossOrigin="Anonymous",F.src=b,F.onload=()=>{w.width=F.width,w.height=F.height,P.drawImage(F,0,0,w.width,w.height);const ae=P.getImageData(0,0,w.width,w.height);V.height=w.height,V.width=w.width,I($(ae.data,V))}});throw new Error("Input data provided is not supported - aborted tensor creation")}if(oe!==void 0)return $(oe,V);throw new Error("Input data provided is not supported - aborted tensor creation")},Z=(b,x)=>{const{width:v,height:L,download:K,dispose:se}=x,oe=[1,L,v,4];return new g.Tensor({location:"texture",type:"float32",texture:b,dims:oe,download:K,dispose:se})},j=(b,x)=>{const{dataType:v,dims:L,download:K,dispose:se}=x;return new g.Tensor({location:"gpu-buffer",type:v??"float32",gpuBuffer:b,dims:L,download:K,dispose:se})},y=(b,x)=>{const{dataType:v,dims:L,download:K,dispose:se}=x;return new g.Tensor({location:"ml-tensor",type:v??"float32",mlTensor:b,dims:L,download:K,dispose:se})},T=(b,x,v)=>new g.Tensor({location:"cpu-pinned",type:b,data:x,dims:v??[x.length]})},"./node_modules/onnxruntime-common/dist/esm/tensor-factory.js":(ke,A,r)=>{r.r(A)},"./node_modules/onnxruntime-common/dist/esm/tensor-impl-type-mapping.js":(ke,A,r)=>{r.r(A),r.d(A,{NUMERIC_TENSOR_TYPEDARRAY_TO_TYPE_MAP:()=>$,NUMERIC_TENSOR_TYPE_TO_TYPEDARRAY_MAP:()=>g,checkTypedArray:()=>Z});const g=new Map([["float32",Float32Array],["uint8",Uint8Array],["int8",Int8Array],["uint16",Uint16Array],["int16",Int16Array],["int32",Int32Array],["bool",Uint8Array],["float64",Float64Array],["uint32",Uint32Array],["int4",Uint8Array],["uint4",Uint8Array]]),$=new Map([[Float32Array,"float32"],[Uint8Array,"uint8"],[Int8Array,"int8"],[Uint16Array,"uint16"],[Int16Array,"int16"],[Int32Array,"int32"],[Float64Array,"float64"],[Uint32Array,"uint32"]]);let N=!1;const Z=()=>{if(!N){N=!0;const j=typeof BigInt64Array<"u"&&BigInt64Array.from,y=typeof BigUint64Array<"u"&&BigUint64Array.from,T=typeof Float16Array<"u"&&Float16Array.from;j&&(g.set("int64",BigInt64Array),$.set(BigInt64Array,"int64")),y&&(g.set("uint64",BigUint64Array),$.set(BigUint64Array,"uint64")),T?(g.set("float16",Float16Array),$.set(Float16Array,"float16")):g.set("float16",Uint16Array)}}},"./node_modules/onnxruntime-common/dist/esm/tensor-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{Tensor:()=>j});var g=r("./node_modules/onnxruntime-common/dist/esm/tensor-conversion-impl.js"),$=r("./node_modules/onnxruntime-common/dist/esm/tensor-factory-impl.js"),N=r("./node_modules/onnxruntime-common/dist/esm/tensor-impl-type-mapping.js"),Z=r("./node_modules/onnxruntime-common/dist/esm/tensor-utils-impl.js");class j{constructor(T,b,x){(0,N.checkTypedArray)();let v,L;if(typeof T=="object"&&"location"in T)switch(this.dataLocation=T.location,v=T.type,L=T.dims,T.location){case"cpu-pinned":{const se=N.NUMERIC_TENSOR_TYPE_TO_TYPEDARRAY_MAP.get(v);if(!se)throw new TypeError(`unsupported type "${v}" to create tensor from pinned buffer`);if(!(T.data instanceof se))throw new TypeError(`buffer should be of type ${se.name}`);this.cpuData=T.data;break}case"texture":{if(v!=="float32")throw new TypeError(`unsupported type "${v}" to create tensor from texture`);this.gpuTextureData=T.texture,this.downloader=T.download,this.disposer=T.dispose;break}case"gpu-buffer":{if(v!=="float32"&&v!=="float16"&&v!=="int32"&&v!=="int64"&&v!=="uint32"&&v!=="uint8"&&v!=="bool"&&v!=="uint4"&&v!=="int4")throw new TypeError(`unsupported type "${v}" to create tensor from gpu buffer`);this.gpuBufferData=T.gpuBuffer,this.downloader=T.download,this.disposer=T.dispose;break}case"ml-tensor":{if(v!=="float32"&&v!=="float16"&&v!=="int32"&&v!=="int64"&&v!=="uint32"&&v!=="uint64"&&v!=="int8"&&v!=="uint8"&&v!=="bool")throw new TypeError(`unsupported type "${v}" to create tensor from MLTensor`);this.mlTensorData=T.mlTensor,this.downloader=T.download,this.disposer=T.dispose;break}default:throw new Error(`Tensor constructor: unsupported location '${this.dataLocation}'`)}else{let se,oe;if(typeof T=="string")if(v=T,oe=x,T==="string"){if(!Array.isArray(b))throw new TypeError("A string tensor's data must be a string array.");se=b}else{const V=N.NUMERIC_TENSOR_TYPE_TO_TYPEDARRAY_MAP.get(T);if(V===void 0)throw new TypeError(`Unsupported tensor type: ${T}.`);if(Array.isArray(b)){if(T==="float16"&&V===Uint16Array||T==="uint4"||T==="int4")throw new TypeError(`Creating a ${T} tensor from number array is not supported. Please use ${V.name} as data.`);T==="uint64"||T==="int64"?se=V.from(b,BigInt):se=V.from(b)}else if(b instanceof V)se=b;else if(b instanceof Uint8ClampedArray)if(T==="uint8")se=Uint8Array.from(b);else throw new TypeError("A Uint8ClampedArray tensor's data must be type of uint8");else throw new TypeError(`A ${v} tensor's data must be type of ${V}`)}else if(oe=b,Array.isArray(T)){if(T.length===0)throw new TypeError("Tensor type cannot be inferred from an empty array.");const V=typeof T[0];if(V==="string")v="string",se=T;else if(V==="boolean")v="bool",se=Uint8Array.from(T);else throw new TypeError(`Invalid element type of data array: ${V}.`)}else if(T instanceof Uint8ClampedArray)v="uint8",se=Uint8Array.from(T);else{const V=N.NUMERIC_TENSOR_TYPEDARRAY_TO_TYPE_MAP.get(T.constructor);if(V===void 0)throw new TypeError(`Unsupported type for tensor data: ${T.constructor}.`);v=V,se=T}if(oe===void 0)oe=[se.length];else if(!Array.isArray(oe))throw new TypeError("A tensor's dims must be a number array");L=oe,this.cpuData=se,this.dataLocation="cpu"}const K=(0,Z.calculateSize)(L);if(this.cpuData&&K!==this.cpuData.length&&!((v==="uint4"||v==="int4")&&Math.ceil(K/2)===this.cpuData.length))throw new Error(`Tensor's size(${K}) does not match data length(${this.cpuData.length}).`);this.type=v,this.dims=L,this.size=K}static async fromImage(T,b){return(0,$.tensorFromImage)(T,b)}static fromTexture(T,b){return(0,$.tensorFromTexture)(T,b)}static fromGpuBuffer(T,b){return(0,$.tensorFromGpuBuffer)(T,b)}static fromMLTensor(T,b){return(0,$.tensorFromMLTensor)(T,b)}static fromPinnedBuffer(T,b,x){return(0,$.tensorFromPinnedBuffer)(T,b,x)}toDataURL(T){return(0,g.tensorToDataURL)(this,T)}toImageData(T){return(0,g.tensorToImageData)(this,T)}get data(){if(this.ensureValid(),!this.cpuData)throw new Error("The data is not on CPU. Use `getData()` to download GPU data to CPU, or use `texture` or `gpuBuffer` property to access the GPU data directly.");return this.cpuData}get location(){return this.dataLocation}get texture(){if(this.ensureValid(),!this.gpuTextureData)throw new Error("The data is not stored as a WebGL texture.");return this.gpuTextureData}get gpuBuffer(){if(this.ensureValid(),!this.gpuBufferData)throw new Error("The data is not stored as a WebGPU buffer.");return this.gpuBufferData}get mlTensor(){if(this.ensureValid(),!this.mlTensorData)throw new Error("The data is not stored as a WebNN MLTensor.");return this.mlTensorData}async getData(T){switch(this.ensureValid(),this.dataLocation){case"cpu":case"cpu-pinned":return this.data;case"texture":case"gpu-buffer":case"ml-tensor":{if(!this.downloader)throw new Error("The current tensor is not created with a specified data downloader.");if(this.isDownloading)throw new Error("The current tensor is being downloaded.");try{this.isDownloading=!0;const b=await this.downloader();return this.downloader=void 0,this.dataLocation="cpu",this.cpuData=b,T&&this.disposer&&(this.disposer(),this.disposer=void 0),b}finally{this.isDownloading=!1}}default:throw new Error(`cannot get data from location: ${this.dataLocation}`)}}dispose(){if(this.isDownloading)throw new Error("The current tensor is being downloaded.");this.disposer&&(this.disposer(),this.disposer=void 0),this.cpuData=void 0,this.gpuTextureData=void 0,this.gpuBufferData=void 0,this.mlTensorData=void 0,this.downloader=void 0,this.isDownloading=void 0,this.dataLocation="none"}ensureValid(){if(this.dataLocation==="none")throw new Error("The tensor is disposed.")}reshape(T){if(this.ensureValid(),this.downloader||this.disposer)throw new Error("Cannot reshape a tensor that owns GPU resource.");return(0,Z.tensorReshape)(this,T)}}},"./node_modules/onnxruntime-common/dist/esm/tensor-utils-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{calculateSize:()=>$,tensorReshape:()=>N});var g=r("./node_modules/onnxruntime-common/dist/esm/tensor-impl.js");const $=Z=>{let j=1;for(let y=0;y{switch(Z.location){case"cpu":return new g.Tensor(Z.type,Z.data,j);case"cpu-pinned":return new g.Tensor({location:"cpu-pinned",data:Z.data,type:Z.type,dims:j});case"texture":return new g.Tensor({location:"texture",texture:Z.texture,type:Z.type,dims:j});case"gpu-buffer":return new g.Tensor({location:"gpu-buffer",gpuBuffer:Z.gpuBuffer,type:Z.type,dims:j});case"ml-tensor":return new g.Tensor({location:"ml-tensor",mlTensor:Z.mlTensor,type:Z.type,dims:j});default:throw new Error(`tensorReshape: tensor location ${Z.location} is not supported`)}}},"./node_modules/onnxruntime-common/dist/esm/tensor.js":(ke,A,r)=>{r.r(A),r.d(A,{Tensor:()=>$});var g=r("./node_modules/onnxruntime-common/dist/esm/tensor-impl.js");const $=g.Tensor},"./node_modules/onnxruntime-common/dist/esm/trace.js":(ke,A,r)=>{r.r(A),r.d(A,{TRACE:()=>$,TRACE_FUNC_BEGIN:()=>Z,TRACE_FUNC_END:()=>j});var g=r("./node_modules/onnxruntime-common/dist/esm/env-impl.js");const $=(y,T)=>{(typeof g.env.trace>"u"?!g.env.wasm.trace:!g.env.trace)||console.timeStamp(`${y}::ORT::${T}`)},N=(y,T)=>{const b=new Error().stack?.split(/\r\n|\r|\n/g)||[];let x=!1;for(let v=0;v{(typeof g.env.trace>"u"?!g.env.wasm.trace:!g.env.trace)||N("BEGIN",y)},j=y=>{(typeof g.env.trace>"u"?!g.env.wasm.trace:!g.env.trace)||N("END",y)}},"./node_modules/onnxruntime-common/dist/esm/training-session-impl.js":(ke,A,r)=>{r.r(A),r.d(A,{TrainingSession:()=>Z});var g=r("./node_modules/onnxruntime-common/dist/esm/backend-impl.js"),$=r("./node_modules/onnxruntime-common/dist/esm/tensor.js");const N="Training backend could not be resolved. Make sure you're using the correct configuration & WebAssembly files.";class Z{constructor(y,T,b){this.handler=y,this.hasOptimizerModel=T,this.hasEvalModel=b}get trainingInputNames(){return this.handler.inputNames}get trainingOutputNames(){return this.handler.outputNames}get evalInputNames(){if(this.hasEvalModel)return this.handler.evalInputNames;throw new Error("This training session has no evalModel loaded.")}get evalOutputNames(){if(this.hasEvalModel)return this.handler.evalOutputNames;throw new Error("This training session has no evalModel loaded.")}static async create(y,T){const b=y.evalModel||"",x=y.optimizerModel||"",v=T||{},[L,K]=await(0,g.resolveBackendAndExecutionProviders)(v);if(L.createTrainingSessionHandler){const se=await L.createTrainingSessionHandler(y.checkpointState,y.trainModel,b,x,K);return new Z(se,!!y.optimizerModel,!!y.evalModel)}else throw new Error(N)}typeNarrowingForRunStep(y,T,b,x,v){const L={};let K={};if(typeof b!="object"||b===null||b instanceof $.Tensor||Array.isArray(b))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let se=!0;if(typeof x=="object"){if(x===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(x instanceof $.Tensor)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(x)){if(x.length===0)throw new TypeError("'fetches' cannot be an empty array.");se=!1;for(const oe of x){if(typeof oe!="string")throw new TypeError("'fetches' must be a string array or an object.");if(T.indexOf(oe)===-1)throw new RangeError(`'fetches' contains invalid output name: ${oe}.`);L[oe]=null}if(typeof v=="object"&&v!==null)K=v;else if(typeof v<"u")throw new TypeError("'options' must be an object.")}else{let oe=!1;const V=Object.getOwnPropertyNames(x);for(const U of T)if(V.indexOf(U)!==-1){const H=x[U];(H===null||H instanceof $.Tensor)&&(oe=!0,se=!1,L[U]=H)}if(oe){if(typeof v=="object"&&v!==null)K=v;else if(typeof v<"u")throw new TypeError("'options' must be an object.")}else K=x}}else if(typeof x<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(const oe of y)if(typeof b[oe]>"u")throw new Error(`input '${oe}' is missing in 'feeds'.`);if(se)for(const oe of T)L[oe]=null;return[L,K]}convertHandlerReturnTypeToMapOfTensors(y){const T={};for(const b in y)if(Object.hasOwnProperty.call(y,b)){const x=y[b];x instanceof $.Tensor?T[b]=x:T[b]=new $.Tensor(x.type,x.data,x.dims)}return T}async lazyResetGrad(){await this.handler.lazyResetGrad()}async runTrainStep(y,T,b){const[x,v]=this.typeNarrowingForRunStep(this.trainingInputNames,this.trainingOutputNames,y,T,b),L=await this.handler.runTrainStep(y,x,v);return this.convertHandlerReturnTypeToMapOfTensors(L)}async runOptimizerStep(y){if(this.hasOptimizerModel)await this.handler.runOptimizerStep(y||{});else throw new Error("This TrainingSession has no OptimizerModel loaded.")}async runEvalStep(y,T,b){if(this.hasEvalModel){const[x,v]=this.typeNarrowingForRunStep(this.evalInputNames,this.evalOutputNames,y,T,b),L=await this.handler.runEvalStep(y,x,v);return this.convertHandlerReturnTypeToMapOfTensors(L)}else throw new Error("This TrainingSession has no EvalModel loaded.")}async getParametersSize(y=!0){return this.handler.getParametersSize(y)}async loadParametersBuffer(y,T=!0){const b=await this.getParametersSize(T);if(y.length!==4*b)throw new Error("Size of the buffer passed into loadParametersBuffer must match the number of parameters in the model. Please use getParametersSize method to check.");return this.handler.loadParametersBuffer(y,T)}async getContiguousParameters(y=!0){return this.handler.getContiguousParameters(y)}async release(){return this.handler.dispose()}}},"./node_modules/onnxruntime-common/dist/esm/training-session.js":(ke,A,r)=>{r.r(A),r.d(A,{TrainingSession:()=>$});var g=r("./node_modules/onnxruntime-common/dist/esm/training-session-impl.js");const $=g.TrainingSession},"./node_modules/onnxruntime-common/dist/esm/version.js":(ke,A,r)=>{r.r(A),r.d(A,{version:()=>g});const g="1.20.1"},"./node_modules/onnxruntime-web/dist/ort.bundle.min.mjs?3a96":(ke,A,r)=>{r.r(A),r.d(A,{InferenceSession:()=>lt,TRACE:()=>Ke,TRACE_FUNC_BEGIN:()=>Ue,TRACE_FUNC_END:()=>ze,Tensor:()=>te,default:()=>xf,env:()=>F,registerBackend:()=>K});/*! + * ONNX Runtime Web v1.21.0-dev.20250114-228dd16893 + * Copyright (c) Microsoft Corporation. All rights reserved. + * Licensed under the MIT License. + */var g=Object.defineProperty,$=Object.getOwnPropertyDescriptor,N=Object.getOwnPropertyNames,Z=Object.prototype.hasOwnProperty,j=(e=>typeof require<"u"?require:typeof Proxy<"u"?new Proxy(e,{get:(t,s)=>(typeof require<"u"?require:t)[s]}):e)(function(e){if(typeof require<"u")return require.apply(this,arguments);throw Error('Dynamic require of "'+e+'" is not supported')}),y=(e,t)=>()=>(e&&(t=e(e=0)),t),T=(e,t)=>{for(var s in t)g(e,s,{get:t[s],enumerable:!0})},b=(e,t,s,n)=>{if(t&&typeof t=="object"||typeof t=="function")for(let i of N(t))!Z.call(e,i)&&i!==s&&g(e,i,{get:()=>t[i],enumerable:!(n=$(t,i))||n.enumerable});return e},x=e=>b(g({},"__esModule",{value:!0}),e),v,L,K,se,oe,V=y(()=>{v=new Map,L=[],K=(e,t,s)=>{if(t&&typeof t.init=="function"&&typeof t.createInferenceSessionHandler=="function"){let n=v.get(e);if(n===void 0)v.set(e,{backend:t,priority:s});else{if(n.priority>s)return;if(n.priority===s&&n.backend!==t)throw new Error(`cannot register backend "${e}" using priority ${s}`)}if(s>=0){let i=L.indexOf(e);i!==-1&&L.splice(i,1);for(let o=0;o{let t=v.get(e);if(!t)return"backend not found.";if(t.initialized)return t.backend;if(t.aborted)return t.error;{let s=!!t.initPromise;try{return s||(t.initPromise=t.backend.init(e)),await t.initPromise,t.initialized=!0,t.backend}catch(n){return s||(t.error=`${n}`,t.aborted=!0),t.error}finally{delete t.initPromise}}},oe=async e=>{let t=e.executionProviders||[],s=t.map(p=>typeof p=="string"?p:p.name),n=s.length===0?L:s,i,o=[],a=new Set;for(let p of n){let h=await se(p);typeof h=="string"?o.push({name:p,err:h}):(i||(i=h),i===h&&a.add(p))}if(!i)throw new Error(`no available backend found. ERR: ${o.map(p=>`[${p.name}] ${p.err}`).join(", ")}`);for(let{name:p,err:h}of o)s.includes(p)&&console.warn(`removing requested execution provider "${p}" from session options because it is not available: ${h}`);let c=t.filter(p=>a.has(typeof p=="string"?p:p.name));return[i,new Proxy(e,{get:(p,h)=>h==="executionProviders"?c:Reflect.get(p,h)})]}}),U=y(()=>{V()}),H,I=y(()=>{H="1.21.0-dev.20241212-1f88284f96"}),S,w,P=y(()=>{I(),S="warning",w={wasm:{},webgl:{},webgpu:{},versions:{common:H},set logLevel(e){if(e!==void 0){if(typeof e!="string"||["verbose","info","warning","error","fatal"].indexOf(e)===-1)throw new Error(`Unsupported logging level: ${e}`);S=e}},get logLevel(){return S}},Object.defineProperty(w,"logLevel",{enumerable:!0})}),F,ae=y(()=>{P(),F=w}),ie,ye,ge=y(()=>{ie=(e,t)=>{let s=typeof document<"u"?document.createElement("canvas"):new OffscreenCanvas(1,1);s.width=e.dims[3],s.height=e.dims[2];let n=s.getContext("2d");if(n!=null){let i,o;t?.tensorLayout!==void 0&&t.tensorLayout==="NHWC"?(i=e.dims[2],o=e.dims[3]):(i=e.dims[3],o=e.dims[2]);let a=t?.format!==void 0?t.format:"RGB",c=t?.norm,p,h;c===void 0||c.mean===void 0?p=[255,255,255,255]:typeof c.mean=="number"?p=[c.mean,c.mean,c.mean,c.mean]:(p=[c.mean[0],c.mean[1],c.mean[2],0],c.mean[3]!==void 0&&(p[3]=c.mean[3])),c===void 0||c.bias===void 0?h=[0,0,0,0]:typeof c.bias=="number"?h=[c.bias,c.bias,c.bias,c.bias]:(h=[c.bias[0],c.bias[1],c.bias[2],0],c.bias[3]!==void 0&&(h[3]=c.bias[3]));let C=o*i,u=0,k=C,B=C*2,R=-1;a==="RGBA"?(u=0,k=C,B=C*2,R=C*3):a==="RGB"?(u=0,k=C,B=C*2):a==="RBG"&&(u=0,B=C,k=C*2);for(let z=0;z{let s=typeof document<"u"?document.createElement("canvas").getContext("2d"):new OffscreenCanvas(1,1).getContext("2d"),n;if(s!=null){let i,o,a;t?.tensorLayout!==void 0&&t.tensorLayout==="NHWC"?(i=e.dims[2],o=e.dims[1],a=e.dims[3]):(i=e.dims[3],o=e.dims[2],a=e.dims[1]);let c=t!==void 0&&t.format!==void 0?t.format:"RGB",p=t?.norm,h,C;p===void 0||p.mean===void 0?h=[255,255,255,255]:typeof p.mean=="number"?h=[p.mean,p.mean,p.mean,p.mean]:(h=[p.mean[0],p.mean[1],p.mean[2],255],p.mean[3]!==void 0&&(h[3]=p.mean[3])),p===void 0||p.bias===void 0?C=[0,0,0,0]:typeof p.bias=="number"?C=[p.bias,p.bias,p.bias,p.bias]:(C=[p.bias[0],p.bias[1],p.bias[2],0],p.bias[3]!==void 0&&(C[3]=p.bias[3]));let u=o*i;if(t!==void 0&&(t.format!==void 0&&a===4&&t.format!=="RGBA"||a===3&&t.format!=="RGB"&&t.format!=="BGR"))throw new Error("Tensor format doesn't match input tensor dims");let k=4,B=0,R=1,z=2,ne=3,J=0,W=u,ue=u*2,he=-1;c==="RGBA"?(J=0,W=u,ue=u*2,he=u*3):c==="RGB"?(J=0,W=u,ue=u*2):c==="RBG"&&(J=0,ue=u,W=u*2),n=s.createImageData(i,o);for(let be=0;be{Re(),re=(e,t)=>{if(e===void 0)throw new Error("Image buffer must be defined");if(t.height===void 0||t.width===void 0)throw new Error("Image height and width must be defined");if(t.tensorLayout==="NHWC")throw new Error("NHWC Tensor layout is not supported yet");let{height:s,width:n}=t,i=t.norm??{mean:255,bias:0},o,a;typeof i.mean=="number"?o=[i.mean,i.mean,i.mean,i.mean]:o=[i.mean[0],i.mean[1],i.mean[2],i.mean[3]??255],typeof i.bias=="number"?a=[i.bias,i.bias,i.bias,i.bias]:a=[i.bias[0],i.bias[1],i.bias[2],i.bias[3]??0];let c=t.format!==void 0?t.format:"RGBA",p=t.tensorFormat!==void 0&&t.tensorFormat!==void 0?t.tensorFormat:"RGB",h=s*n,C=p==="RGBA"?new Float32Array(h*4):new Float32Array(h*3),u=4,k=0,B=1,R=2,z=3,ne=0,J=h,W=h*2,ue=-1;c==="RGB"&&(u=3,k=0,B=1,R=2,z=-1),p==="RGBA"?ue=h*3:p==="RBG"?(ne=0,W=h,J=h*2):p==="BGR"&&(W=0,J=h,ne=h*2);for(let he=0;he{let s=typeof HTMLImageElement<"u"&&e instanceof HTMLImageElement,n=typeof ImageData<"u"&&e instanceof ImageData,i=typeof ImageBitmap<"u"&&e instanceof ImageBitmap,o=typeof e=="string",a,c=t??{},p=()=>{if(typeof document<"u")return document.createElement("canvas");if(typeof OffscreenCanvas<"u")return new OffscreenCanvas(1,1);throw new Error("Canvas is not supported")},h=C=>typeof HTMLCanvasElement<"u"&&C instanceof HTMLCanvasElement||C instanceof OffscreenCanvas?C.getContext("2d"):null;if(s){let C=p();C.width=e.width,C.height=e.height;let u=h(C);if(u!=null){let k=e.height,B=e.width;if(t!==void 0&&t.resizedHeight!==void 0&&t.resizedWidth!==void 0&&(k=t.resizedHeight,B=t.resizedWidth),t!==void 0){if(c=t,t.tensorFormat!==void 0)throw new Error("Image input config format must be RGBA for HTMLImageElement");c.tensorFormat="RGBA",c.height=k,c.width=B}else c.tensorFormat="RGBA",c.height=k,c.width=B;u.drawImage(e,0,0),a=u.getImageData(0,0,B,k).data}else throw new Error("Can not access image data")}else if(n){let C,u;if(t!==void 0&&t.resizedWidth!==void 0&&t.resizedHeight!==void 0?(C=t.resizedHeight,u=t.resizedWidth):(C=e.height,u=e.width),t!==void 0&&(c=t),c.format="RGBA",c.height=C,c.width=u,t!==void 0){let k=p();k.width=u,k.height=C;let B=h(k);if(B!=null)B.putImageData(e,0,0),a=B.getImageData(0,0,u,C).data;else throw new Error("Can not access image data")}else a=e.data}else if(i){if(t===void 0)throw new Error("Please provide image config with format for Imagebitmap");let C=p();C.width=e.width,C.height=e.height;let u=h(C);if(u!=null){let k=e.height,B=e.width;return u.drawImage(e,0,0,B,k),a=u.getImageData(0,0,B,k).data,c.height=k,c.width=B,re(a,c)}else throw new Error("Can not access image data")}else{if(o)return new Promise((C,u)=>{let k=p(),B=h(k);if(!e||!B)return u();let R=new Image;R.crossOrigin="Anonymous",R.src=e,R.onload=()=>{k.width=R.width,k.height=R.height,B.drawImage(R,0,0,k.width,k.height);let z=B.getImageData(0,0,k.width,k.height);c.height=k.height,c.width=k.width,C(re(z.data,c))}});throw new Error("Input data provided is not supported - aborted tensor creation")}if(a!==void 0)return re(a,c);throw new Error("Input data provided is not supported - aborted tensor creation")},pe=(e,t)=>{let{width:s,height:n,download:i,dispose:o}=t,a=[1,n,s,4];return new Ve({location:"texture",type:"float32",texture:e,dims:a,download:i,dispose:o})},Ce=(e,t)=>{let{dataType:s,dims:n,download:i,dispose:o}=t;return new Ve({location:"gpu-buffer",type:s??"float32",gpuBuffer:e,dims:n,download:i,dispose:o})},Ae=(e,t)=>{let{dataType:s,dims:n,download:i,dispose:o}=t;return new Ve({location:"ml-tensor",type:s??"float32",mlTensor:e,dims:n,download:i,dispose:o})},Pe=(e,t,s)=>new Ve({location:"cpu-pinned",type:e,data:t,dims:s??[t.length]})}),je,_e,X,de,Ee=y(()=>{je=new Map([["float32",Float32Array],["uint8",Uint8Array],["int8",Int8Array],["uint16",Uint16Array],["int16",Int16Array],["int32",Int32Array],["bool",Uint8Array],["float64",Float64Array],["uint32",Uint32Array],["int4",Uint8Array],["uint4",Uint8Array]]),_e=new Map([[Float32Array,"float32"],[Uint8Array,"uint8"],[Int8Array,"int8"],[Uint16Array,"uint16"],[Int16Array,"int16"],[Int32Array,"int32"],[Float64Array,"float64"],[Uint32Array,"uint32"]]),X=!1,de=()=>{if(!X){X=!0;let e=typeof BigInt64Array<"u"&&BigInt64Array.from,t=typeof BigUint64Array<"u"&&BigUint64Array.from,s=typeof Float16Array<"u"&&Float16Array.from;e&&(je.set("int64",BigInt64Array),_e.set(BigInt64Array,"int64")),t&&(je.set("uint64",BigUint64Array),_e.set(BigUint64Array,"uint64")),s?(je.set("float16",Float16Array),_e.set(Float16Array,"float16")):je.set("float16",Uint16Array)}}}),Oe,Xe,ee=y(()=>{Re(),Oe=e=>{let t=1;for(let s=0;s{switch(e.location){case"cpu":return new Ve(e.type,e.data,t);case"cpu-pinned":return new Ve({location:"cpu-pinned",data:e.data,type:e.type,dims:t});case"texture":return new Ve({location:"texture",texture:e.texture,type:e.type,dims:t});case"gpu-buffer":return new Ve({location:"gpu-buffer",gpuBuffer:e.gpuBuffer,type:e.type,dims:t});case"ml-tensor":return new Ve({location:"ml-tensor",mlTensor:e.mlTensor,type:e.type,dims:t});default:throw new Error(`tensorReshape: tensor location ${e.location} is not supported`)}}}),Ve,Re=y(()=>{ge(),Je(),Ee(),ee(),Ve=class{constructor(e,t,s){de();let n,i;if(typeof e=="object"&&"location"in e)switch(this.dataLocation=e.location,n=e.type,i=e.dims,e.location){case"cpu-pinned":{let a=je.get(n);if(!a)throw new TypeError(`unsupported type "${n}" to create tensor from pinned buffer`);if(!(e.data instanceof a))throw new TypeError(`buffer should be of type ${a.name}`);this.cpuData=e.data;break}case"texture":{if(n!=="float32")throw new TypeError(`unsupported type "${n}" to create tensor from texture`);this.gpuTextureData=e.texture,this.downloader=e.download,this.disposer=e.dispose;break}case"gpu-buffer":{if(n!=="float32"&&n!=="float16"&&n!=="int32"&&n!=="int64"&&n!=="uint32"&&n!=="uint8"&&n!=="bool"&&n!=="uint4"&&n!=="int4")throw new TypeError(`unsupported type "${n}" to create tensor from gpu buffer`);this.gpuBufferData=e.gpuBuffer,this.downloader=e.download,this.disposer=e.dispose;break}case"ml-tensor":{if(n!=="float32"&&n!=="float16"&&n!=="int32"&&n!=="int64"&&n!=="uint32"&&n!=="uint64"&&n!=="int8"&&n!=="uint8"&&n!=="bool"&&n!=="uint4"&&n!=="int4")throw new TypeError(`unsupported type "${n}" to create tensor from MLTensor`);this.mlTensorData=e.mlTensor,this.downloader=e.download,this.disposer=e.dispose;break}default:throw new Error(`Tensor constructor: unsupported location '${this.dataLocation}'`)}else{let a,c;if(typeof e=="string")if(n=e,c=s,e==="string"){if(!Array.isArray(t))throw new TypeError("A string tensor's data must be a string array.");a=t}else{let p=je.get(e);if(p===void 0)throw new TypeError(`Unsupported tensor type: ${e}.`);if(Array.isArray(t)){if(e==="float16"&&p===Uint16Array||e==="uint4"||e==="int4")throw new TypeError(`Creating a ${e} tensor from number array is not supported. Please use ${p.name} as data.`);e==="uint64"||e==="int64"?a=p.from(t,BigInt):a=p.from(t)}else if(t instanceof p)a=t;else if(t instanceof Uint8ClampedArray)if(e==="uint8")a=Uint8Array.from(t);else throw new TypeError("A Uint8ClampedArray tensor's data must be type of uint8");else throw new TypeError(`A ${n} tensor's data must be type of ${p}`)}else if(c=t,Array.isArray(e)){if(e.length===0)throw new TypeError("Tensor type cannot be inferred from an empty array.");let p=typeof e[0];if(p==="string")n="string",a=e;else if(p==="boolean")n="bool",a=Uint8Array.from(e);else throw new TypeError(`Invalid element type of data array: ${p}.`)}else if(e instanceof Uint8ClampedArray)n="uint8",a=Uint8Array.from(e);else{let p=_e.get(e.constructor);if(p===void 0)throw new TypeError(`Unsupported type for tensor data: ${e.constructor}.`);n=p,a=e}if(c===void 0)c=[a.length];else if(!Array.isArray(c))throw new TypeError("A tensor's dims must be a number array");i=c,this.cpuData=a,this.dataLocation="cpu"}let o=Oe(i);if(this.cpuData&&o!==this.cpuData.length&&!((n==="uint4"||n==="int4")&&Math.ceil(o/2)===this.cpuData.length))throw new Error(`Tensor's size(${o}) does not match data length(${this.cpuData.length}).`);this.type=n,this.dims=i,this.size=o}static async fromImage(e,t){return Me(e,t)}static fromTexture(e,t){return pe(e,t)}static fromGpuBuffer(e,t){return Ce(e,t)}static fromMLTensor(e,t){return Ae(e,t)}static fromPinnedBuffer(e,t,s){return Pe(e,t,s)}toDataURL(e){return ie(this,e)}toImageData(e){return ye(this,e)}get data(){if(this.ensureValid(),!this.cpuData)throw new Error("The data is not on CPU. Use `getData()` to download GPU data to CPU, or use `texture` or `gpuBuffer` property to access the GPU data directly.");return this.cpuData}get location(){return this.dataLocation}get texture(){if(this.ensureValid(),!this.gpuTextureData)throw new Error("The data is not stored as a WebGL texture.");return this.gpuTextureData}get gpuBuffer(){if(this.ensureValid(),!this.gpuBufferData)throw new Error("The data is not stored as a WebGPU buffer.");return this.gpuBufferData}get mlTensor(){if(this.ensureValid(),!this.mlTensorData)throw new Error("The data is not stored as a WebNN MLTensor.");return this.mlTensorData}async getData(e){switch(this.ensureValid(),this.dataLocation){case"cpu":case"cpu-pinned":return this.data;case"texture":case"gpu-buffer":case"ml-tensor":{if(!this.downloader)throw new Error("The current tensor is not created with a specified data downloader.");if(this.isDownloading)throw new Error("The current tensor is being downloaded.");try{this.isDownloading=!0;let t=await this.downloader();return this.downloader=void 0,this.dataLocation="cpu",this.cpuData=t,e&&this.disposer&&(this.disposer(),this.disposer=void 0),t}finally{this.isDownloading=!1}}default:throw new Error(`cannot get data from location: ${this.dataLocation}`)}}dispose(){if(this.isDownloading)throw new Error("The current tensor is being downloaded.");this.disposer&&(this.disposer(),this.disposer=void 0),this.cpuData=void 0,this.gpuTextureData=void 0,this.gpuBufferData=void 0,this.mlTensorData=void 0,this.downloader=void 0,this.isDownloading=void 0,this.dataLocation="none"}ensureValid(){if(this.dataLocation==="none")throw new Error("The tensor is disposed.")}reshape(e){if(this.ensureValid(),this.downloader||this.disposer)throw new Error("Cannot reshape a tensor that owns GPU resource.");return Xe(this,e)}}}),te,ve=y(()=>{Re(),te=Ve}),Ke,Ne,Ue,ze,Ze=y(()=>{P(),Ke=(e,t)=>{(typeof w.trace>"u"?!w.wasm.trace:!w.trace)||console.timeStamp(`${e}::ORT::${t}`)},Ne=(e,t)=>{let s=new Error().stack?.split(/\r\n|\r|\n/g)||[],n=!1;for(let i=0;i{(typeof w.trace>"u"?!w.wasm.trace:!w.trace)||Ne("BEGIN",e)},ze=e=>{(typeof w.trace>"u"?!w.wasm.trace:!w.trace)||Ne("END",e)}}),at,mt=y(()=>{V(),ve(),Ze(),at=class hf{constructor(t){this.handler=t}async run(t,s,n){Ue();let i={},o={};if(typeof t!="object"||t===null||t instanceof te||Array.isArray(t))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let a=!0;if(typeof s=="object"){if(s===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(s instanceof te)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(s)){if(s.length===0)throw new TypeError("'fetches' cannot be an empty array.");a=!1;for(let h of s){if(typeof h!="string")throw new TypeError("'fetches' must be a string array or an object.");if(this.outputNames.indexOf(h)===-1)throw new RangeError(`'fetches' contains invalid output name: ${h}.`);i[h]=null}if(typeof n=="object"&&n!==null)o=n;else if(typeof n<"u")throw new TypeError("'options' must be an object.")}else{let h=!1,C=Object.getOwnPropertyNames(s);for(let u of this.outputNames)if(C.indexOf(u)!==-1){let k=s[u];(k===null||k instanceof te)&&(h=!0,a=!1,i[u]=k)}if(h){if(typeof n=="object"&&n!==null)o=n;else if(typeof n<"u")throw new TypeError("'options' must be an object.")}else o=s}}else if(typeof s<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(let h of this.inputNames)if(typeof t[h]>"u")throw new Error(`input '${h}' is missing in 'feeds'.`);if(a)for(let h of this.outputNames)i[h]=null;let c=await this.handler.run(t,i,o),p={};for(let h in c)if(Object.hasOwnProperty.call(c,h)){let C=c[h];C instanceof te?p[h]=C:p[h]=new te(C.type,C.data,C.dims)}return ze(),p}async release(){return this.handler.dispose()}static async create(t,s,n,i){Ue();let o,a={};if(typeof t=="string"){if(o=t,typeof s=="object"&&s!==null)a=s;else if(typeof s<"u")throw new TypeError("'options' must be an object.")}else if(t instanceof Uint8Array){if(o=t,typeof s=="object"&&s!==null)a=s;else if(typeof s<"u")throw new TypeError("'options' must be an object.")}else if(t instanceof ArrayBuffer||typeof SharedArrayBuffer<"u"&&t instanceof SharedArrayBuffer){let C=t,u=0,k=t.byteLength;if(typeof s=="object"&&s!==null)a=s;else if(typeof s=="number"){if(u=s,!Number.isSafeInteger(u))throw new RangeError("'byteOffset' must be an integer.");if(u<0||u>=C.byteLength)throw new RangeError(`'byteOffset' is out of range [0, ${C.byteLength}).`);if(k=t.byteLength-u,typeof n=="number"){if(k=n,!Number.isSafeInteger(k))throw new RangeError("'byteLength' must be an integer.");if(k<=0||u+k>C.byteLength)throw new RangeError(`'byteLength' is out of range (0, ${C.byteLength-u}].`);if(typeof i=="object"&&i!==null)a=i;else if(typeof i<"u")throw new TypeError("'options' must be an object.")}else if(typeof n<"u")throw new TypeError("'byteLength' must be a number.")}else if(typeof s<"u")throw new TypeError("'options' must be an object.");o=new Uint8Array(C,u,k)}else throw new TypeError("Unexpected argument[0]: must be 'path' or 'buffer'.");let[c,p]=await oe(a),h=await c.createInferenceSessionHandler(o,p);return ze(),new hf(h)}startProfiling(){this.handler.startProfiling()}endProfiling(){this.handler.endProfiling()}get inputNames(){return this.handler.inputNames}get outputNames(){return this.handler.outputNames}}}),lt,ct=y(()=>{mt(),lt=at}),O=y(()=>{}),le=y(()=>{}),Q=y(()=>{}),we=y(()=>{}),Se={};T(Se,{InferenceSession:()=>lt,TRACE:()=>Ke,TRACE_FUNC_BEGIN:()=>Ue,TRACE_FUNC_END:()=>ze,Tensor:()=>te,env:()=>F,registerBackend:()=>K});var We=y(()=>{U(),ae(),ct(),ve(),O(),le(),Ze(),Q(),we()}),qe=y(()=>{}),tt={};T(tt,{default:()=>Nt});var st,ft,Nt,ss=y(()=>{Ch(),br(),Lr(),st="ort-wasm-proxy-worker",ft=globalThis.self?.name===st,ft&&(self.onmessage=e=>{let{type:t,in:s}=e.data;try{switch(t){case"init-wasm":dn(s.wasm).then(()=>{Zd(s).then(()=>{postMessage({type:t})},n=>{postMessage({type:t,err:n})})},n=>{postMessage({type:t,err:n})});break;case"init-ep":{let{epName:n,env:i}=s;ec(i,n).then(()=>{postMessage({type:t})},o=>{postMessage({type:t,err:o})});break}case"copy-from":{let{buffer:n}=s,i=ur(n);postMessage({type:t,out:i});break}case"create":{let{model:n,options:i}=s;Up(n,i).then(o=>{postMessage({type:t,out:o})},o=>{postMessage({type:t,err:o})});break}case"release":Wp(s),postMessage({type:t});break;case"run":{let{sessionId:n,inputIndices:i,inputs:o,outputIndices:a,options:c}=s;Kp(n,i,o,a,new Array(a.length).fill(null),c).then(p=>{p.some(h=>h[3]!=="cpu")?postMessage({type:t,err:"Proxy does not support non-cpu tensor location."}):postMessage({type:t,out:p},qp([...o,...p]))},p=>{postMessage({type:t,err:p})});break}case"end-profiling":Hp(s),postMessage({type:t});break;default:}}catch(n){postMessage({type:t,err:n})}}),Nt=ft?null:e=>new Worker(e??Ns,{type:"module",name:st})}),Ts={};T(Ts,{default:()=>As});var ms,Ps,As,tr=y(()=>{Ps=(ms=import.meta.url,async function(e={}){function t(){return Vt.buffer!=Xt.buffer&&ir(),Xt}function s(){return Vt.buffer!=Xt.buffer&&ir(),Ut}function n(){return Vt.buffer!=Xt.buffer&&ir(),$s}function i(){return Vt.buffer!=Xt.buffer&&ir(),ut}function o(){return Vt.buffer!=Xt.buffer&&ir(),xt}function a(){return Vt.buffer!=Xt.buffer&&ir(),hs}function c(){return Vt.buffer!=Xt.buffer&&ir(),vs}function p(){return Vt.buffer!=Xt.buffer&&ir(),er}var h,C,u=Object.assign({},e),k=new Promise((l,m)=>{h=l,C=m}),B=typeof window=="object",R=typeof importScripts=="function",z=R&&self.name=="em-pthread";u.mountExternalData=(l,m)=>{l.startsWith("./")&&(l=l.substring(2)),(u.Fb||(u.Fb=new Map)).set(l,m)},u.unmountExternalData=()=>{delete u.Fb};var ne=globalThis.SharedArrayBuffer??new WebAssembly.Memory({initial:0,maximum:0,shared:!0}).buffer.constructor;let J=()=>{let l=(E,D,G)=>(...fe)=>{let Qe=ln,et=D?.();fe=E(...fe);let bt=D?.();return et!==bt&&(E=bt,G(et),D=G=null),ln!=Qe?new Promise((Pt,Rt)=>{hh={resolve:Pt,reject:Rt}}):fe},m=E=>async(...D)=>{try{if(u.Gb)throw Error("Session already started");let G=u.Gb={hc:D[0],errors:[]},fe=await E(...D);if(u.Gb!==G)throw Error("Session mismatch");u.Hb?.flush();let Qe=G.errors;if(0bt),0u._OrtCreateSession,E=>u._OrtCreateSession=E),u._OrtRun=m(l(u._OrtRun,()=>u._OrtRun,E=>u._OrtRun=E)),u._OrtRunWithBinding=m(l(u._OrtRunWithBinding,()=>u._OrtRunWithBinding,E=>u._OrtRunWithBinding=E)),u._OrtBindInput=l(u._OrtBindInput,()=>u._OrtBindInput,E=>u._OrtBindInput=E),J=void 0};u.jsepInit=(l,m)=>{if(J?.(),l==="webgpu"){[u.Hb,u.Vb,u.Zb,u.Ob,u.Yb,u.kb,u.$b,u.cc,u.Wb,u.Xb,u.ac]=m;let E=u.Hb;u.jsepRegisterBuffer=(D,G,fe,Qe)=>E.registerBuffer(D,G,fe,Qe),u.jsepGetBuffer=D=>E.getBuffer(D),u.jsepCreateDownloader=(D,G,fe)=>E.createDownloader(D,G,fe),u.jsepOnCreateSession=D=>{E.onCreateSession(D)},u.jsepOnReleaseSession=D=>{E.onReleaseSession(D)},u.jsepOnRunStart=D=>E.onRunStart(D),u.dc=(D,G)=>{E.upload(D,G)}}else if(l==="webnn"){[u.Hb,u.bc,u.Pb,u.jsepEnsureTensor,u.ec,u.jsepDownloadTensor]=m,u.jsepReleaseTensorId=u.Pb;let E=u.Hb;u.jsepOnRunStart=D=>E.onRunStart(D),u.jsepRegisterMLContext=(D,G)=>{E.registerMLContext(D,G)},u.jsepOnReleaseSession=D=>{E.onReleaseSession(D)},u.jsepCreateMLTensorDownloader=(D,G)=>E.createMLTensorDownloader(D,G),u.jsepRegisterMLTensor=(D,G,fe)=>E.registerMLTensor(D,G,fe),u.jsepCreateMLContext=D=>E.createMLContext(D),u.jsepRegisterMLConstant=(D,G,fe,Qe,et)=>E.registerMLConstant(D,G,fe,Qe,et,u.Fb)}};var W,ue,he=Object.assign({},u),be="./this.program",Be=(l,m)=>{throw m},Ie="";(B||R)&&(R?Ie=self.location.href:typeof document<"u"&&document.currentScript&&(Ie=document.currentScript.src),ms&&(Ie=ms),Ie=Ie.startsWith("blob:")?"":Ie.substr(0,Ie.replace(/[?#].*/,"").lastIndexOf("/")+1),R&&(ue=l=>{var m=new XMLHttpRequest;return m.open("GET",l,!1),m.responseType="arraybuffer",m.send(null),new Uint8Array(m.response)}),W=(l,m,E)=>{var D=new XMLHttpRequest;D.open("GET",l,!0),D.responseType="arraybuffer",D.onload=()=>{D.status==200||D.status==0&&D.response?m(D.response):E()},D.onerror=E,D.send(null)});var nt,dt=console.log.bind(console),Et=console.error.bind(console),zt=dt,It=Et;if(Object.assign(u,he),he=null,z){let l=function(m){try{var E=m.data,D=E.cmd;if(D==="load"){let G=[];self.onmessage=fe=>G.push(fe),self.startWorker=()=>{postMessage({cmd:"loaded"});for(let fe of G)l(fe);self.onmessage=l};for(let fe of E.handlers)u[fe]&&!u[fe].proxy||(u[fe]=(...Qe)=>{postMessage({Nb:"callHandler",pc:fe,args:Qe})},fe=="print"&&(zt=u[fe]),fe=="printErr"&&(It=u[fe]));Vt=E.wasmMemory,ir(),ht(E.wasmModule)}else if(D==="run"){gh(E.pthread_ptr,0,0,1,0,0),ch(E.pthread_ptr),Cf(),Yh(),Jt||(qm(),Jt=!0);try{kf(E.start_routine,E.arg)}catch(G){if(G!="unwind")throw G}}else D==="cancel"?Pa()&&Ap(-1):E.target!=="setimmediate"&&(D==="checkMailbox"?Jt&&bp():D&&(It(`worker: received unknown command ${D}`),It(E)))}catch(G){throw Qm(),G}};var ht,Jt=!1;It=function(...m){m=m.join(" "),console.error(m)},self.alert=function(...m){postMessage({Nb:"alert",text:m.join(" "),rc:Pa()})},u.instantiateWasm=(m,E)=>new Promise(D=>{ht=G=>{G=new WebAssembly.Instance(G,Kh()),E(G),D()}}),self.onunhandledrejection=m=>{throw m.reason||m},self.onmessage=l}u.wasmBinary&&(nt=u.wasmBinary);var Vt,St,ts,Xt,Ut,$s,ut,xt,hs,vs,xs,xn,er,Ss=!1;function ir(){var l=Vt.buffer;u.HEAP8=Xt=new Int8Array(l),u.HEAP16=$s=new Int16Array(l),u.HEAPU8=Ut=new Uint8Array(l),u.HEAPU16=ut=new Uint16Array(l),u.HEAP32=xt=new Int32Array(l),u.HEAPU32=hs=new Uint32Array(l),u.HEAPF32=vs=new Float32Array(l),u.HEAPF64=er=new Float64Array(l),u.HEAP64=xs=new BigInt64Array(l),u.HEAPU64=xn=new BigUint64Array(l)}if(!z){if(!((Vt=new WebAssembly.Memory({initial:256,maximum:65536,shared:!0})).buffer instanceof ne))throw It("requested a shared WebAssembly.Memory but the returned buffer is not a SharedArrayBuffer, indicating that while the browser has SharedArrayBuffer it does not have WebAssembly threads support - you may need to set a flag"),Error("bad memory");ir()}var yp=[],rc=[],Tf=[],nc=0,ic=null;function jh(){if(--nc==0&&ic){var l=ic;ic=null,l()}}function Hn(l){throw It(l="Aborted("+l+")"),Ss=!0,ts=1,l=new WebAssembly.RuntimeError(l+". Build with -sASSERTIONS for more info."),C(l),l}var Zp,Vh=l=>l.startsWith("data:application/octet-stream;base64,"),Uh=l=>l.startsWith("file://");function Wh(l){if(l==Zp&&nt)return new Uint8Array(nt);if(ue)return ue(l);throw"both async and sync fetching of the wasm failed"}function Gh(l,m,E){return function(D){if(!nt&&(B||R)){if(typeof fetch=="function"&&!Uh(D))return fetch(D,{credentials:"same-origin"}).then(G=>{if(!G.ok)throw`failed to load wasm binary file at '${D}'`;return G.arrayBuffer()}).catch(()=>Wh(D));if(W)return new Promise((G,fe)=>{W(D,Qe=>G(new Uint8Array(Qe)),fe)})}return Promise.resolve().then(()=>Wh(D))}(l).then(D=>WebAssembly.instantiate(D,m)).then(E,D=>{It(`failed to asynchronously prepare wasm: ${D}`),Hn(D)})}function Kh(){return{a:{O:Ef,Aa:Pf,b:$f,aa:tm,B:nm,qa:im,Y:am,_:lm,ra:um,oa:dm,ha:cm,na:pm,L:hm,Z:mm,W:fm,pa:_m,X:gm,va:Af,F:If,Q:Ff,P:Df,E:zf,u:Bf,q:Rf,G:Nf,A:Hf,R:qf,ua:Qf,ka:Xf,U:Yf,ba:Jf,H:Zf,ja:ch,ta:e_,t:t_,Ba:s_,x:i_,n:o_,l:l_,c:uh,o:u_,j:p_,w:h_,p:m_,f:f_,s:__,m:g_,e:w_,k:y_,i:M_,h:b_,d:v_,ea:x_,fa:T_,ga:P_,ca:Am,da:Im,T:E_,g:C_,D:k_,I:S_,M:$_,y:A_,sa:I_,V:F_,v:Om,z:O_,N:D_,S:L_,za:z_,ya:B_,la:zm,ma:Bm,$:nh,C:Rm,K:Nm,ia:jm,J:Vm,a:Vt,xa:rh,wa:Gm,r:j_}}}var eh={913700:(l,m,E,D,G)=>{if(u===void 0||!u.Fb)return 1;if((l=Ws(Number(l>>>0))).startsWith("./")&&(l=l.substring(2)),!(l=u.Fb.get(l)))return 2;if(m=Number(m>>>0),E=Number(E>>>0),D=Number(D>>>0),m+E>l.byteLength)return 3;try{let fe=l.subarray(m,m+E);switch(G){case 0:s().set(fe,D>>>0);break;case 1:u.dc(D,fe);break;default:return 4}return 0}catch{return 4}},914415:(l,m,E)=>{u.ec(l,s().subarray(m>>>0,m+E>>>0))},914478:()=>u.bc(),914519:l=>{u.Pb(l)},914555:()=>{u.Wb()},914586:()=>{u.Xb()},914615:()=>{u.ac()},914640:l=>u.Vb(l),914673:l=>u.Zb(l),914705:(l,m,E)=>{u.Ob(Number(l),Number(m),Number(E),!0)},914768:(l,m,E)=>{u.Ob(Number(l),Number(m),Number(E))},914825:()=>typeof wasmOffsetConverter<"u",914882:l=>{u.kb("Abs",l,void 0)},914933:l=>{u.kb("Neg",l,void 0)},914984:l=>{u.kb("Floor",l,void 0)},915037:l=>{u.kb("Ceil",l,void 0)},915089:l=>{u.kb("Reciprocal",l,void 0)},915147:l=>{u.kb("Sqrt",l,void 0)},915199:l=>{u.kb("Exp",l,void 0)},915250:l=>{u.kb("Erf",l,void 0)},915301:l=>{u.kb("Sigmoid",l,void 0)},915356:(l,m,E)=>{u.kb("HardSigmoid",l,{alpha:m,beta:E})},915435:l=>{u.kb("Log",l,void 0)},915486:l=>{u.kb("Sin",l,void 0)},915537:l=>{u.kb("Cos",l,void 0)},915588:l=>{u.kb("Tan",l,void 0)},915639:l=>{u.kb("Asin",l,void 0)},915691:l=>{u.kb("Acos",l,void 0)},915743:l=>{u.kb("Atan",l,void 0)},915795:l=>{u.kb("Sinh",l,void 0)},915847:l=>{u.kb("Cosh",l,void 0)},915899:l=>{u.kb("Asinh",l,void 0)},915952:l=>{u.kb("Acosh",l,void 0)},916005:l=>{u.kb("Atanh",l,void 0)},916058:l=>{u.kb("Tanh",l,void 0)},916110:l=>{u.kb("Not",l,void 0)},916161:(l,m,E)=>{u.kb("Clip",l,{min:m,max:E})},916230:l=>{u.kb("Clip",l,void 0)},916282:(l,m)=>{u.kb("Elu",l,{alpha:m})},916340:l=>{u.kb("Gelu",l,void 0)},916392:l=>{u.kb("Relu",l,void 0)},916444:(l,m)=>{u.kb("LeakyRelu",l,{alpha:m})},916508:(l,m)=>{u.kb("ThresholdedRelu",l,{alpha:m})},916578:(l,m)=>{u.kb("Cast",l,{to:m})},916636:l=>{u.kb("Add",l,void 0)},916687:l=>{u.kb("Sub",l,void 0)},916738:l=>{u.kb("Mul",l,void 0)},916789:l=>{u.kb("Div",l,void 0)},916840:l=>{u.kb("Pow",l,void 0)},916891:l=>{u.kb("Equal",l,void 0)},916944:l=>{u.kb("Greater",l,void 0)},916999:l=>{u.kb("GreaterOrEqual",l,void 0)},917061:l=>{u.kb("Less",l,void 0)},917113:l=>{u.kb("LessOrEqual",l,void 0)},917172:(l,m,E,D,G)=>{u.kb("ReduceMean",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},917347:(l,m,E,D,G)=>{u.kb("ReduceMax",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},917521:(l,m,E,D,G)=>{u.kb("ReduceMin",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},917695:(l,m,E,D,G)=>{u.kb("ReduceProd",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},917870:(l,m,E,D,G)=>{u.kb("ReduceSum",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918044:(l,m,E,D,G)=>{u.kb("ReduceL1",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918217:(l,m,E,D,G)=>{u.kb("ReduceL2",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918390:(l,m,E,D,G)=>{u.kb("ReduceLogSum",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918567:(l,m,E,D,G)=>{u.kb("ReduceSumSquare",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918747:(l,m,E,D,G)=>{u.kb("ReduceLogSumExp",l,{keepDims:!!m,noopWithEmptyAxes:!!E,axes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},918927:l=>{u.kb("Where",l,void 0)},918980:(l,m,E)=>{u.kb("Transpose",l,{perm:m?Array.from(o().subarray(Number(m)>>>0,Number(E)>>>0)):[]})},919104:(l,m,E,D)=>{u.kb("DepthToSpace",l,{blocksize:m,mode:Ws(E),format:D?"NHWC":"NCHW"})},919237:(l,m,E,D)=>{u.kb("DepthToSpace",l,{blocksize:m,mode:Ws(E),format:D?"NHWC":"NCHW"})},919370:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge,os)=>{u.kb("ConvTranspose",l,{format:bt?"NHWC":"NCHW",autoPad:m,dilations:[E],group:D,kernelShape:[G],pads:[fe,Qe],strides:[et],wIsConst:()=>!!t()[Pt>>>0],outputPadding:Rt?Array.from(o().subarray(Number(Rt)>>>0,Number(us)>>>0)):[],outputShape:_s?Array.from(o().subarray(Number(_s)>>>0,Number(Ge)>>>0)):[],activation:Ws(os)})},919803:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("ConvTranspose",l,{format:et?"NHWC":"NCHW",autoPad:m,dilations:Array.from(o().subarray(Number(E)>>>0,2+(Number(E)>>>0)>>>0)),group:D,kernelShape:Array.from(o().subarray(Number(G)>>>0,2+(Number(G)>>>0)>>>0)),pads:Array.from(o().subarray(Number(fe)>>>0,4+(Number(fe)>>>0)>>>0)),strides:Array.from(o().subarray(Number(Qe)>>>0,2+(Number(Qe)>>>0)>>>0)),wIsConst:()=>!!t()[bt>>>0],outputPadding:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],outputShape:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[],activation:Ws(Ge)})},920464:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge,os)=>{u.kb("ConvTranspose",l,{format:bt?"NHWC":"NCHW",autoPad:m,dilations:[E],group:D,kernelShape:[G],pads:[fe,Qe],strides:[et],wIsConst:()=>!!t()[Pt>>>0],outputPadding:Rt?Array.from(o().subarray(Number(Rt)>>>0,Number(us)>>>0)):[],outputShape:_s?Array.from(o().subarray(Number(_s)>>>0,Number(Ge)>>>0)):[],activation:Ws(os)})},920897:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("ConvTranspose",l,{format:et?"NHWC":"NCHW",autoPad:m,dilations:Array.from(o().subarray(Number(E)>>>0,2+(Number(E)>>>0)>>>0)),group:D,kernelShape:Array.from(o().subarray(Number(G)>>>0,2+(Number(G)>>>0)>>>0)),pads:Array.from(o().subarray(Number(fe)>>>0,4+(Number(fe)>>>0)>>>0)),strides:Array.from(o().subarray(Number(Qe)>>>0,2+(Number(Qe)>>>0)>>>0)),wIsConst:()=>!!t()[bt>>>0],outputPadding:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],outputShape:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[],activation:Ws(Ge)})},921558:(l,m)=>{u.kb("GlobalAveragePool",l,{format:m?"NHWC":"NCHW"})},921649:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("AveragePool",l,{format:Ge?"NHWC":"NCHW",auto_pad:m,ceil_mode:E,count_include_pad:D,storage_order:G,dilations:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[],kernel_shape:et?Array.from(o().subarray(Number(et)>>>0,Number(bt)>>>0)):[],pads:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],strides:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[]})},922128:(l,m)=>{u.kb("GlobalAveragePool",l,{format:m?"NHWC":"NCHW"})},922219:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("AveragePool",l,{format:Ge?"NHWC":"NCHW",auto_pad:m,ceil_mode:E,count_include_pad:D,storage_order:G,dilations:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[],kernel_shape:et?Array.from(o().subarray(Number(et)>>>0,Number(bt)>>>0)):[],pads:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],strides:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[]})},922698:(l,m)=>{u.kb("GlobalMaxPool",l,{format:m?"NHWC":"NCHW"})},922785:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("MaxPool",l,{format:Ge?"NHWC":"NCHW",auto_pad:m,ceil_mode:E,count_include_pad:D,storage_order:G,dilations:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[],kernel_shape:et?Array.from(o().subarray(Number(et)>>>0,Number(bt)>>>0)):[],pads:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],strides:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[]})},923260:(l,m)=>{u.kb("GlobalMaxPool",l,{format:m?"NHWC":"NCHW"})},923347:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge)=>{u.kb("MaxPool",l,{format:Ge?"NHWC":"NCHW",auto_pad:m,ceil_mode:E,count_include_pad:D,storage_order:G,dilations:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[],kernel_shape:et?Array.from(o().subarray(Number(et)>>>0,Number(bt)>>>0)):[],pads:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],strides:us?Array.from(o().subarray(Number(us)>>>0,Number(_s)>>>0)):[]})},923822:(l,m,E,D,G)=>{u.kb("Gemm",l,{alpha:m,beta:E,transA:D,transB:G})},923926:l=>{u.kb("MatMul",l,void 0)},923980:(l,m,E,D)=>{u.kb("ArgMax",l,{keepDims:!!m,selectLastIndex:!!E,axis:D})},924088:(l,m,E,D)=>{u.kb("ArgMin",l,{keepDims:!!m,selectLastIndex:!!E,axis:D})},924196:(l,m)=>{u.kb("Softmax",l,{axis:m})},924259:(l,m)=>{u.kb("Concat",l,{axis:m})},924319:(l,m,E,D,G)=>{u.kb("Split",l,{axis:m,numOutputs:E,splitSizes:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},924475:l=>{u.kb("Expand",l,void 0)},924529:(l,m)=>{u.kb("Gather",l,{axis:Number(m)})},924600:(l,m)=>{u.kb("GatherElements",l,{axis:Number(m)})},924679:(l,m)=>{u.kb("GatherND",l,{batch_dims:Number(m)})},924758:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt)=>{u.kb("Resize",l,{antialias:m,axes:E?Array.from(o().subarray(Number(E)>>>0,Number(D)>>>0)):[],coordinateTransformMode:Ws(G),cubicCoeffA:fe,excludeOutside:Qe,extrapolationValue:et,keepAspectRatioPolicy:Ws(bt),mode:Ws(Pt),nearestMode:Ws(Rt)})},925120:(l,m,E,D,G,fe,Qe)=>{u.kb("Slice",l,{starts:m?Array.from(o().subarray(Number(m)>>>0,Number(E)>>>0)):[],ends:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[],axes:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[]})},925384:l=>{u.kb("Tile",l,void 0)},925436:(l,m,E)=>{u.kb("InstanceNormalization",l,{epsilon:m,format:E?"NHWC":"NCHW"})},925550:(l,m,E)=>{u.kb("InstanceNormalization",l,{epsilon:m,format:E?"NHWC":"NCHW"})},925664:l=>{u.kb("Range",l,void 0)},925717:(l,m)=>{u.kb("Einsum",l,{equation:Ws(m)})},925798:(l,m,E,D,G)=>{u.kb("Pad",l,{mode:m,value:E,pads:D?Array.from(o().subarray(Number(D)>>>0,Number(G)>>>0)):[]})},925941:(l,m,E,D,G,fe)=>{u.kb("BatchNormalization",l,{epsilon:m,momentum:E,spatial:!!G,trainingMode:!!D,format:fe?"NHWC":"NCHW"})},926110:(l,m,E,D,G,fe)=>{u.kb("BatchNormalization",l,{epsilon:m,momentum:E,spatial:!!G,trainingMode:!!D,format:fe?"NHWC":"NCHW"})},926279:(l,m,E)=>{u.kb("CumSum",l,{exclusive:Number(m),reverse:Number(E)})},926376:(l,m,E)=>{u.kb("DequantizeLinear",l,{axis:m,blockSize:E})},926466:(l,m,E,D,G)=>{u.kb("GridSample",l,{align_corners:m,mode:Ws(E),padding_mode:Ws(D),format:G?"NHWC":"NCHW"})},926636:(l,m,E,D,G)=>{u.kb("GridSample",l,{align_corners:m,mode:Ws(E),padding_mode:Ws(D),format:G?"NHWC":"NCHW"})},926806:(l,m,E,D,G,fe,Qe,et,bt)=>{u.kb("Attention",l,{numHeads:m,isUnidirectional:E,maskFilterValue:D,scale:G,doRotary:fe,qkvHiddenSizes:Qe?Array.from(o().subarray(Number(et)>>>0,Number(et)+Qe>>>0)):[],pastPresentShareBuffer:!!bt})},927078:l=>{u.kb("BiasAdd",l,void 0)},927133:l=>{u.kb("BiasSplitGelu",l,void 0)},927194:l=>{u.kb("FastGelu",l,void 0)},927250:(l,m,E,D,G,fe,Qe,et,bt,Pt,Rt,us,_s,Ge,os,Rs)=>{u.kb("Conv",l,{format:us?"NHWC":"NCHW",auto_pad:m,dilations:E?Array.from(o().subarray(Number(E)>>>0,Number(D)>>>0)):[],group:G,kernel_shape:fe?Array.from(o().subarray(Number(fe)>>>0,Number(Qe)>>>0)):[],pads:et?Array.from(o().subarray(Number(et)>>>0,Number(bt)>>>0)):[],strides:Pt?Array.from(o().subarray(Number(Pt)>>>0,Number(Rt)>>>0)):[],w_is_const:()=>!!t()[Number(_s)>>>0],activation:Ws(Ge),activation_params:os?Array.from(c().subarray(Number(os)>>>0,Number(Rs)>>>0)):[]})},927834:l=>{u.kb("Gelu",l,void 0)},927886:(l,m,E,D,G,fe,Qe,et,bt)=>{u.kb("GroupQueryAttention",l,{numHeads:m,kvNumHeads:E,scale:D,softcap:G,doRotary:fe,rotaryInterleaved:Qe,smoothSoftmax:et,localWindowSize:bt})},928103:(l,m,E,D)=>{u.kb("LayerNormalization",l,{axis:m,epsilon:E,simplified:!!D})},928214:(l,m,E,D)=>{u.kb("LayerNormalization",l,{axis:m,epsilon:E,simplified:!!D})},928325:(l,m,E,D,G,fe)=>{u.kb("MatMulNBits",l,{k:m,n:E,accuracyLevel:D,bits:G,blockSize:fe})},928452:(l,m,E,D,G,fe)=>{u.kb("MultiHeadAttention",l,{numHeads:m,isUnidirectional:E,maskFilterValue:D,scale:G,doRotary:fe})},928611:(l,m)=>{u.kb("QuickGelu",l,{alpha:m})},928675:(l,m,E,D,G)=>{u.kb("RotaryEmbedding",l,{interleaved:!!m,numHeads:E,rotaryEmbeddingDim:D,scale:G})},928814:(l,m,E)=>{u.kb("SkipLayerNormalization",l,{epsilon:m,simplified:!!E})},928916:(l,m,E)=>{u.kb("SkipLayerNormalization",l,{epsilon:m,simplified:!!E})},929018:(l,m,E,D)=>{u.kb("GatherBlockQuantized",l,{gatherAxis:m,quantizeAxis:E,blockSize:D})},929139:l=>{u.$b(l)},929173:(l,m)=>u.cc(Number(l),Number(m),u.Gb.hc,u.Gb.errors)};function Pf(l,m,E){return Em(async()=>{await u.Yb(Number(l),Number(m),Number(E))})}function Ef(){return typeof wasmOffsetConverter<"u"}function th(l){this.name="ExitStatus",this.message=`Program terminated with exit(${l})`,this.status=l}var sh=l=>{l.terminate(),l.onmessage=()=>{}},Hh=l=>{qn.length==0&&(Zh(),Jh(qn[0]));var m=qn.pop();if(!m)return 6;Si.push(m),on[l.Bb]=m,m.Bb=l.Bb;var E={cmd:"run",start_routine:l.ic,arg:l.Rb,pthread_ptr:l.Bb};return m.postMessage(E,l.nc),0},ki=0,Ds=(l,m,...E)=>{for(var D=2*E.length,G=Mh(),fe=yh(8*D),Qe=fe>>>3,et=0;et>>0]=bt)}return l=Xm(l,0,D,fe,m),Ip(G),l};function rh(l){if(z)return Ds(0,1,l);if(ts=l,!(0{if(ts=l,z)throw qh(l),"unwind";rh(l)},qn=[],Si=[],Qh=[],on={},Xh=l=>{var m=l.Bb;delete on[m],qn.push(l),Si.splice(Si.indexOf(l),1),l.Bb=0,wh(m)};function Yh(){Qh.forEach(l=>l())}var Jh=l=>new Promise(m=>{l.onmessage=G=>{var fe=(G=G.data).cmd;if(G.targetThread&&G.targetThread!=Pa()){var Qe=on[G.targetThread];Qe?Qe.postMessage(G,G.transferList):It(`Internal error! Worker sent a message "${fe}" to target pthread ${G.targetThread}, but that thread no longer exists!`)}else fe==="checkMailbox"?bp():fe==="spawnThread"?Hh(G):fe==="cleanupThread"?Xh(on[G.thread]):fe==="killThread"?(G=G.thread,fe=on[G],delete on[G],sh(fe),wh(G),Si.splice(Si.indexOf(fe),1),fe.Bb=0):fe==="cancelThread"?on[G.thread].postMessage({cmd:"cancel"}):fe==="loaded"?(l.loaded=!0,m(l)):fe==="alert"?alert(`Thread ${G.threadId}: ${G.text}`):G.target==="setimmediate"?l.postMessage(G):fe==="callHandler"?u[G.handler](...G.args):fe&&It(`worker sent an unknown command ${fe}`)},l.onerror=G=>{throw It(`worker sent an error! ${G.filename}:${G.lineno}: ${G.message}`),G};var E,D=[];for(E of[])u.hasOwnProperty(E)&&D.push(E);l.postMessage({cmd:"load",handlers:D,wasmMemory:Vt,wasmModule:St})});function Zh(){var l=new Worker(import.meta.url.startsWith("file:")?new URL(r("./node_modules/onnxruntime-web/dist/ort.bundle.min.mjs?46eb"),r.b):new URL(import.meta.url),{type:"module",workerData:"em-pthread",name:"em-pthread"});qn.push(l)}var Mp=l=>{for(;0{var l=Pa(),m=a()[l+52>>>2>>>0];l=a()[l+56>>>2>>>0],Jm(m,m-l),Ip(m)},kf=(l,m)=>{ki=0,l=Zm(l,m),0>>=0);throw m>>>=0,E>>>=0,a()[D.Kb+16>>>2>>>0]=0,a()[D.Kb+4>>>2>>>0]=m,a()[D.Kb+8>>>2>>>0]=E,l}function em(l,m,E,D){return z?Ds(2,1,l,m,E,D):tm(l,m,E,D)}function tm(l,m,E,D){if(l>>>=0,m>>>=0,E>>>=0,D>>>=0,ne===void 0)return It("Current environment does not support SharedArrayBuffer, pthreads are not available!"),6;var G=[];return z&&G.length===0?em(l,m,E,D):(l={ic:E,Bb:l,Rb:D,nc:G},z?(l.Nb="spawnThread",postMessage(l,G),0):Hh(l))}var sm=typeof TextDecoder<"u"?new TextDecoder("utf8"):void 0,rm=(l,m,E)=>{var D=(m>>>=0)+E;for(E=m;l[E]&&!(E>=D);)++E;if(16(G=(240&G)==224?(15&G)<<12|fe<<6|Qe:(7&G)<<18|fe<<12|Qe<<6|63&l[m++])?D+=String.fromCharCode(G):(G-=65536,D+=String.fromCharCode(55296|G>>10,56320|1023&G))}}else D+=String.fromCharCode(G)}return D},Ws=(l,m)=>(l>>>=0)?rm(s(),l,m):"";function nm(l,m,E){return z?Ds(3,1,l,m,E):0}function im(l,m){if(z)return Ds(4,1,l,m)}var ih=l=>{for(var m=0,E=0;E=D?m++:2047>=D?m+=2:55296<=D&&57343>=D?(m+=4,++E):m+=3}return m},om=(l,m,E,D)=>{if(!(0>>=0;D=E+D-1;for(var fe=0;fe=Qe&&(Qe=65536+((1023&Qe)<<10)|1023&l.charCodeAt(++fe)),127>=Qe){if(E>=D)break;m[E++>>>0]=Qe}else{if(2047>=Qe){if(E+1>=D)break;m[E++>>>0]=192|Qe>>6}else{if(65535>=Qe){if(E+2>=D)break;m[E++>>>0]=224|Qe>>12}else{if(E+3>=D)break;m[E++>>>0]=240|Qe>>18,m[E++>>>0]=128|Qe>>12&63}m[E++>>>0]=128|Qe>>6&63}m[E++>>>0]=128|63&Qe}}return m[E>>>0]=0,E-G},xa=(l,m,E)=>om(l,s(),m,E);function am(l,m){if(z)return Ds(5,1,l,m)}function lm(l,m,E){if(z)return Ds(6,1,l,m,E)}function um(l,m,E){return z?Ds(7,1,l,m,E):0}function dm(l,m){if(z)return Ds(8,1,l,m)}function cm(l,m,E){if(z)return Ds(9,1,l,m,E)}function pm(l,m,E,D){if(z)return Ds(10,1,l,m,E,D)}function hm(l,m,E,D){if(z)return Ds(11,1,l,m,E,D)}function mm(l,m,E,D){if(z)return Ds(12,1,l,m,E,D)}function fm(l){if(z)return Ds(13,1,l)}function _m(l,m){if(z)return Ds(14,1,l,m)}function gm(l,m,E){if(z)return Ds(15,1,l,m,E)}var wm,Qn,Af=()=>{Hn("")},an=l=>{for(var m="";s()[l>>>0];)m+=wm[s()[l++>>>0]];return m},oh={},ah={};function Tn(l,m,E={}){if(!("argPackAdvance"in m))throw new TypeError("registerType registeredInstance requires argPackAdvance");return function(D,G,fe={}){var Qe=G.name;if(!D)throw new Qn(`type "${Qe}" must have a positive integer typeid pointer`);if(ah.hasOwnProperty(D)){if(fe.Tb)return;throw new Qn(`Cannot register type '${Qe}' twice`)}ah[D]=G,oh.hasOwnProperty(D)&&(G=oh[D],delete oh[D],G.forEach(et=>et()))}(l,m,E)}var ym=(l,m,E)=>{switch(m){case 1:return E?D=>t()[D>>>0]:D=>s()[D>>>0];case 2:return E?D=>n()[D>>>1>>>0]:D=>i()[D>>>1>>>0];case 4:return E?D=>o()[D>>>2>>>0]:D=>a()[D>>>2>>>0];case 8:return E?D=>xs[D>>>3]:D=>xn[D>>>3];default:throw new TypeError(`invalid integer width (${m}): ${l}`)}};function If(l,m,E){E>>>=0,Tn(l>>>=0,{name:m=an(m>>>0),fromWireType:D=>D,toWireType:function(D,G){if(typeof G!="bigint"&&typeof G!="number")throw G=G===null?"null":(D=typeof G)=="object"||D==="array"||D==="function"?G.toString():""+G,new TypeError(`Cannot convert "${G}" to ${this.name}`);return typeof G=="number"&&(G=BigInt(G)),G},argPackAdvance:Xn,readValueFromPointer:ym(m,E,m.indexOf("u")==-1),Eb:null})}var Xn=8;function Ff(l,m,E,D){Tn(l>>>=0,{name:m=an(m>>>0),fromWireType:function(G){return!!G},toWireType:function(G,fe){return fe?E:D},argPackAdvance:Xn,readValueFromPointer:function(G){return this.fromWireType(s()[G>>>0])},Eb:null})}var lh=[],Pn=[];function uh(l){9<(l>>>=0)&&--Pn[l+1]==0&&(Pn[l]=void 0,lh.push(l))}var xr=l=>{if(!l)throw new Qn("Cannot use deleted val. handle = "+l);return Pn[l]},Or=l=>{switch(l){case void 0:return 2;case null:return 4;case!0:return 6;case!1:return 8;default:let m=lh.pop()||Pn.length;return Pn[m]=l,Pn[m+1]=1,m}};function dh(l){return this.fromWireType(a()[l>>>2>>>0])}var Of={name:"emscripten::val",fromWireType:l=>{var m=xr(l);return uh(l),m},toWireType:(l,m)=>Or(m),argPackAdvance:Xn,readValueFromPointer:dh,Eb:null};function Df(l){return Tn(l>>>0,Of)}var Lf=(l,m)=>{switch(m){case 4:return function(E){return this.fromWireType(c()[E>>>2>>>0])};case 8:return function(E){return this.fromWireType(p()[E>>>3>>>0])};default:throw new TypeError(`invalid float width (${m}): ${l}`)}};function zf(l,m,E){E>>>=0,Tn(l>>>=0,{name:m=an(m>>>0),fromWireType:D=>D,toWireType:(D,G)=>G,argPackAdvance:Xn,readValueFromPointer:Lf(m,E),Eb:null})}function Bf(l,m,E,D,G){if(l>>>=0,E>>>=0,m=an(m>>>0),G===-1&&(G=4294967295),G=et=>et,D===0){var fe=32-8*E;G=et=>et<>>fe}var Qe=m.includes("unsigned")?function(et,bt){return bt>>>0}:function(et,bt){return bt};Tn(l,{name:m,fromWireType:G,toWireType:Qe,argPackAdvance:Xn,readValueFromPointer:ym(m,E,D!==0),Eb:null})}function Rf(l,m,E){function D(fe){var Qe=a()[fe>>>2>>>0];return fe=a()[fe+4>>>2>>>0],new G(t().buffer,fe,Qe)}var G=[Int8Array,Uint8Array,Int16Array,Uint16Array,Int32Array,Uint32Array,Float32Array,Float64Array,BigInt64Array,BigUint64Array][m];Tn(l>>>=0,{name:E=an(E>>>0),fromWireType:D,argPackAdvance:Xn,readValueFromPointer:D},{Tb:!0})}function Nf(l,m){l>>>=0;var E=(m=an(m>>>0))==="std::string";Tn(l,{name:m,fromWireType:function(D){var G=a()[D>>>2>>>0],fe=D+4;if(E)for(var Qe=fe,et=0;et<=G;++et){var bt=fe+et;if(et==G||s()[bt>>>0]==0){if(Qe=Ws(Qe,bt-Qe),Pt===void 0)var Pt=Qe;else Pt+="\0",Pt+=Qe;Qe=bt+1}}else{for(Pt=Array(G),et=0;et>>0]);Pt=Pt.join("")}return un(D),Pt},toWireType:function(D,G){G instanceof ArrayBuffer&&(G=new Uint8Array(G));var fe=typeof G=="string";if(!(fe||G instanceof Uint8Array||G instanceof Uint8ClampedArray||G instanceof Int8Array))throw new Qn("Cannot pass non-string to std::string");var Qe=E&&fe?ih(G):G.length,et=$p(4+Qe+1),bt=et+4;if(a()[et>>>2>>>0]=Qe,E&&fe)xa(G,bt,Qe+1);else if(fe)for(fe=0;fe>>0]=Pt}else for(fe=0;fe>>0]=G[fe];return D!==null&&D.push(un,et),et},argPackAdvance:Xn,readValueFromPointer:dh,Eb(D){un(D)}})}var Mm=typeof TextDecoder<"u"?new TextDecoder("utf-16le"):void 0,jf=(l,m)=>{for(var E=l>>1,D=E+m/2;!(E>=D)&&i()[E>>>0];)++E;if(32<(E<<=1)-l&&Mm)return Mm.decode(s().slice(l,E));for(E="",D=0;!(D>=m/2);++D){var G=n()[l+2*D>>>1>>>0];if(G==0)break;E+=String.fromCharCode(G)}return E},Vf=(l,m,E)=>{if(E??=2147483647,2>E)return 0;var D=m;E=(E-=2)<2*l.length?E/2:l.length;for(var G=0;G>>1>>>0]=fe,m+=2}return n()[m>>>1>>>0]=0,m-D},Uf=l=>2*l.length,Wf=(l,m)=>{for(var E=0,D="";!(E>=m/4);){var G=o()[l+4*E>>>2>>>0];if(G==0)break;++E,65536<=G?(G-=65536,D+=String.fromCharCode(55296|G>>10,56320|1023&G)):D+=String.fromCharCode(G)}return D},Gf=(l,m,E)=>{if(m>>>=0,E??=2147483647,4>E)return 0;var D=m;E=D+E-4;for(var G=0;G=fe&&(fe=65536+((1023&fe)<<10)|1023&l.charCodeAt(++G)),o()[m>>>2>>>0]=fe,(m+=4)+4>E)break}return o()[m>>>2>>>0]=0,m-D},Kf=l=>{for(var m=0,E=0;E=D&&++E,m+=4}return m};function Hf(l,m,E){if(l>>>=0,m>>>=0,E=an(E>>>=0),m===2)var D=jf,G=Vf,fe=Uf,Qe=et=>i()[et>>>1>>>0];else m===4&&(D=Wf,G=Gf,fe=Kf,Qe=et=>a()[et>>>2>>>0]);Tn(l,{name:E,fromWireType:et=>{for(var bt,Pt=a()[et>>>2>>>0],Rt=et+4,us=0;us<=Pt;++us){var _s=et+4+us*m;us!=Pt&&Qe(_s)!=0||(Rt=D(Rt,_s-Rt),bt===void 0?bt=Rt:(bt+="\0",bt+=Rt),Rt=_s+m)}return un(et),bt},toWireType:(et,bt)=>{if(typeof bt!="string")throw new Qn(`Cannot pass non-string to C++ string type ${E}`);var Pt=fe(bt),Rt=$p(4+Pt+m);return a()[Rt>>>2>>>0]=Pt/m,G(bt,Rt+4,Pt+m),et!==null&&et.push(un,Rt),Rt},argPackAdvance:Xn,readValueFromPointer:dh,Eb(et){un(et)}})}function qf(l,m){Tn(l>>>=0,{Ub:!0,name:m=an(m>>>0),argPackAdvance:0,fromWireType:()=>{},toWireType:()=>{}})}var Qf=()=>1;function Xf(l){gh(l>>>0,!R,1,!B,131072,!1),Yh()}var bm=l=>{if(!Ss)try{if(l(),!(0>>=0,typeof Atomics.oc=="function"&&(Atomics.oc(o(),l>>>2,l).value.then(bp),l+=128,Atomics.store(o(),l>>>2,1))}var bp=()=>{var l=Pa();l&&(ch(l),bm(Ym))};function Yf(l,m){(l>>>=0)==m>>>0?setTimeout(bp):z?postMessage({targetThread:l,cmd:"checkMailbox"}):(l=on[l])&&l.postMessage({cmd:"checkMailbox"})}var ph=[];function Jf(l,m,E,D,G){for(m>>>=0,D/=2,ph.length=D,E=G>>>0>>>3,G=0;G>>0];return(m?eh[m]:V_[l])(...ph)}function Zf(l){l>>>=0,z?postMessage({cmd:"cleanupThread",thread:l}):Xh(on[l])}function e_(l){}var vp=(l,m)=>{var E=ah[l];if(E===void 0)throw l=Hm(l),E=an(l),un(l),new Qn(`${m} has unknown type ${E}`);return E},vm=(l,m,E)=>{var D=[];return l=l.toWireType(D,E),D.length&&(a()[m>>>2>>>0]=Or(D)),l};function t_(l,m,E){return m>>>=0,E>>>=0,l=xr(l>>>0),m=vp(m,"emval::as"),vm(m,E,l)}function s_(l,m){return m>>>=0,l=xr(l>>>0),(m=vp(m,"emval::as")).toWireType(null,l)}var xp=l=>{try{l()}catch(m){Hn(m)}},Yn=0,ln=null,xm=0,Tp=[],Tm={},Pm={},r_=0,hh=null,n_=[];function Em(l){return function(m){if(!Ss){if(Yn===0){var E=!1,D=!1;m((G=0)=>{if(!Ss&&(xm=G,E=!0,D)){Yn=2,xp(()=>sf(ln)),typeof Browser<"u"&&Browser.Lb.Sb&&Browser.Lb.resume(),G=!1;try{var fe=function(){var bt=o()[ln+8>>>2>>>0];return bt=Bt[Pm[bt]],--ki,bt()}()}catch(bt){fe=bt,G=!0}var Qe=!1;if(!ln){var et=hh;et&&(hh=null,(G?et.reject:et.resolve)(fe),Qe=!0)}if(G&&!Qe)throw fe}}),D=!0,E||(Yn=1,ln=function(){var G=$p(65548),fe=G+12;a()[G>>>2>>>0]=fe,a()[G+4>>>2>>>0]=fe+65536,fe=Tp[0];var Qe=Tm[fe];return Qe===void 0&&(Qe=r_++,Tm[fe]=Qe,Pm[Qe]=fe),fe=Qe,o()[G+8>>>2>>>0]=fe,G}(),typeof Browser<"u"&&Browser.Lb.Sb&&Browser.Lb.pause(),xp(()=>ef(ln)))}else Yn===2?(Yn=0,xp(rf),un(ln),ln=null,n_.forEach(bm)):Hn(`invalid state: ${Yn}`);return xm}}(m=>{l().then(m)})}function i_(l){return l>>>=0,Em(()=>(l=xr(l)).then(Or))}var Pp=[];function o_(l,m,E,D){return E>>>=0,D>>>=0,(l=Pp[l>>>0])(null,m=xr(m>>>0),E,D)}var a_={},Ep=l=>{var m=a_[l];return m===void 0?an(l):m};function l_(l,m,E,D,G){return E>>>=0,D>>>=0,G>>>=0,(l=Pp[l>>>0])(m=xr(m>>>0),m[E=Ep(E)],D,G)}var Cm=()=>typeof globalThis=="object"?globalThis:Function("return this")();function u_(l){return(l>>>=0)==0?Or(Cm()):(l=Ep(l),Or(Cm()[l]))}var d_=l=>{var m=Pp.length;return Pp.push(l),m},c_=(l,m)=>{for(var E=Array(l),D=0;D>>2>>>0],"parameter "+D);return E},km=(l,m)=>Object.defineProperty(m,"name",{value:l});function p_(l,m,E){var D=(m=c_(l,m>>>0)).shift();l--;var G=`return function (obj, func, destructorsRef, args) { +`,fe=0,Qe=[];E===0&&Qe.push("obj");for(var et=["retType"],bt=[D],Pt=0;PtRt.name).join(", ")}) => ${D.name}>`,d_(km(E,l))}function h_(l){return l=Ep(l>>>0),Or(u[l])}function m_(l,m){return m>>>=0,l=xr(l>>>0),m=xr(m),Or(l[m])}function f_(l){9<(l>>>=0)&&(Pn[l+1]+=1)}function __(){return Or([])}function g_(l){l=xr(l>>>0);for(var m=Array(l.length),E=0;E>>0))}function y_(){return Or({})}function M_(l){for(var m=xr(l>>>=0);m.length;){var E=m.pop();m.pop()(E)}uh(l)}function b_(l,m,E){m>>>=0,E>>>=0,l=xr(l>>>0),m=xr(m),E=xr(E),l[m]=E}function v_(l,m){return m>>>=0,l=(l=vp(l>>>0,"_emval_take_value")).readValueFromPointer(m),Or(l)}function x_(l,m){l=-9007199254740992>l||9007199254740992>>=0,l=new Date(1e3*l),o()[m>>>2>>>0]=l.getUTCSeconds(),o()[m+4>>>2>>>0]=l.getUTCMinutes(),o()[m+8>>>2>>>0]=l.getUTCHours(),o()[m+12>>>2>>>0]=l.getUTCDate(),o()[m+16>>>2>>>0]=l.getUTCMonth(),o()[m+20>>>2>>>0]=l.getUTCFullYear()-1900,o()[m+24>>>2>>>0]=l.getUTCDay(),l=(l.getTime()-Date.UTC(l.getUTCFullYear(),0,1,0,0,0,0))/864e5|0,o()[m+28>>>2>>>0]=l}var Ta=l=>l%4==0&&(l%100!=0||l%400==0),Sm=[0,31,60,91,121,152,182,213,244,274,305,335],$m=[0,31,59,90,120,151,181,212,243,273,304,334];function T_(l,m){l=-9007199254740992>l||9007199254740992>>=0,l=new Date(1e3*l),o()[m>>>2>>>0]=l.getSeconds(),o()[m+4>>>2>>>0]=l.getMinutes(),o()[m+8>>>2>>>0]=l.getHours(),o()[m+12>>>2>>>0]=l.getDate(),o()[m+16>>>2>>>0]=l.getMonth(),o()[m+20>>>2>>>0]=l.getFullYear()-1900,o()[m+24>>>2>>>0]=l.getDay();var E=(Ta(l.getFullYear())?Sm:$m)[l.getMonth()]+l.getDate()-1|0;o()[m+28>>>2>>>0]=E,o()[m+36>>>2>>>0]=-60*l.getTimezoneOffset(),E=new Date(l.getFullYear(),6,1).getTimezoneOffset();var D=new Date(l.getFullYear(),0,1).getTimezoneOffset();l=0|(E!=D&&l.getTimezoneOffset()==Math.min(D,E)),o()[m+32>>>2>>>0]=l}function P_(l){l>>>=0;var m=new Date(o()[l+20>>>2>>>0]+1900,o()[l+16>>>2>>>0],o()[l+12>>>2>>>0],o()[l+8>>>2>>>0],o()[l+4>>>2>>>0],o()[l>>>2>>>0],0),E=o()[l+32>>>2>>>0],D=m.getTimezoneOffset(),G=new Date(m.getFullYear(),6,1).getTimezoneOffset(),fe=new Date(m.getFullYear(),0,1).getTimezoneOffset(),Qe=Math.min(fe,G);return 0>E?o()[l+32>>>2>>>0]=+(G!=fe&&Qe==D):0>>2>>>0]=m.getDay(),E=(Ta(m.getFullYear())?Sm:$m)[m.getMonth()]+m.getDate()-1|0,o()[l+28>>>2>>>0]=E,o()[l>>>2>>>0]=m.getSeconds(),o()[l+4>>>2>>>0]=m.getMinutes(),o()[l+8>>>2>>>0]=m.getHours(),o()[l+12>>>2>>>0]=m.getDate(),o()[l+16>>>2>>>0]=m.getMonth(),o()[l+20>>>2>>>0]=m.getYear(),l=m.getTime(),BigInt(isNaN(l)?-1:l/1e3)}function Am(l,m,E,D,G,fe,Qe){return z?Ds(16,1,l,m,E,D,G,fe,Qe):-52}function Im(l,m,E,D,G,fe){if(z)return Ds(17,1,l,m,E,D,G,fe)}function E_(l,m,E,D){l>>>=0,m>>>=0,E>>>=0,D>>>=0;var G=new Date().getFullYear(),fe=new Date(G,0,1),Qe=new Date(G,6,1);G=fe.getTimezoneOffset();var et=Qe.getTimezoneOffset(),bt=Math.max(G,et);a()[l>>>2>>>0]=60*bt,o()[m>>>2>>>0]=+(G!=et),fe=(l=Pt=>Pt.toLocaleTimeString(void 0,{hour12:!1,timeZoneName:"short"}).split(" ")[1])(fe),Qe=l(Qe),et{mh.length=0;for(var E;E=s()[l++>>>0];){var D=E!=105;m+=(D&=E!=112)&&m%8?4:0,mh.push(E==112?a()[m>>>2>>>0]:E==106?xs[m>>>3]:E==105?o()[m>>>2>>>0]:p()[m>>>3>>>0]),m+=D?8:4}return mh};function C_(l,m,E){return l>>>=0,m=Fm(m>>>0,E>>>0),eh[l](...m)}function k_(l,m,E){return l>>>=0,m=Fm(m>>>0,E>>>0),eh[l](...m)}var S_=()=>{},$_=()=>Date.now();function A_(l,m){return It(Ws(l>>>0,m>>>0))}var Om,I_=()=>{throw ki+=1,"unwind"};function F_(){return 4294901760}Om=()=>performance.timeOrigin+performance.now();var O_=()=>navigator.hardwareConcurrency;function D_(){return Hn("Cannot use emscripten_pc_get_function without -sUSE_OFFSET_CONVERTER"),0}function L_(l){l>>>=0;var m=s().length;if(l<=m||4294901760=E;E*=2){var D=m*(1+.2/E);D=Math.min(D,l+100663296);var G=Math;D=Math.max(l,D);e:{G=(G.min.call(G,4294901760,D+(65536-D%65536)%65536)-Vt.buffer.byteLength+65535)/65536;try{Vt.grow(G),ir();var fe=1;break e}catch{}fe=void 0}if(fe)return!0}return!1}var Cp=()=>(Hn("Cannot use convertFrameToPC (needed by __builtin_return_address) without -sUSE_OFFSET_CONVERTER"),0),oc={},Dm=l=>{l.forEach(m=>{Cp()})};function z_(){var l=Error().stack.toString().split(` +`);return l[0]=="Error"&&l.shift(),Dm(l),oc.Qb=Cp(),oc.fc=l,oc.Qb}function B_(l,m,E){if(l>>>=0,m>>>=0,oc.Qb==l)var D=oc.fc;else(D=Error().stack.toString().split(` +`))[0]=="Error"&&D.shift(),Dm(D);for(var G=3;D[G]&&Cp()!=l;)++G;for(l=0;l>>2>>>0]=Cp();return l}var fh,_h={},Lm=()=>{if(!fh){var l,m={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(typeof navigator=="object"&&navigator.languages&&navigator.languages[0]||"C").replace("-","_")+".UTF-8",_:be};for(l in _h)_h[l]===void 0?delete m[l]:m[l]=_h[l];var E=[];for(l in m)E.push(`${l}=${m[l]}`);fh=E}return fh};function zm(l,m){if(z)return Ds(18,1,l,m);l>>>=0,m>>>=0;var E=0;return Lm().forEach((D,G)=>{var fe=m+E;for(G=a()[l+4*G>>>2>>>0]=fe,fe=0;fe>>0]=D.charCodeAt(fe);t()[G>>>0]=0,E+=D.length+1}),0}function Bm(l,m){if(z)return Ds(19,1,l,m);l>>>=0,m>>>=0;var E=Lm();a()[l>>>2>>>0]=E.length;var D=0;return E.forEach(G=>D+=G.length+1),a()[m>>>2>>>0]=D,0}function Rm(l){return z?Ds(20,1,l):52}function Nm(l,m,E,D){return z?Ds(21,1,l,m,E,D):52}function jm(l,m,E,D){return z?Ds(22,1,l,m,E,D):70}var R_=[null,[],[]];function Vm(l,m,E,D){if(z)return Ds(23,1,l,m,E,D);m>>>=0,E>>>=0,D>>>=0;for(var G=0,fe=0;fe>>2>>>0],et=a()[m+4>>>2>>>0];m+=8;for(var bt=0;bt>>0],Rt=R_[l];Pt===0||Pt===10?((l===1?zt:It)(rm(Rt,0)),Rt.length=0):Rt.push(Pt)}G+=et}return a()[D>>>2>>>0]=G,0}var Um=[31,29,31,30,31,30,31,31,30,31,30,31],Wm=[31,28,31,30,31,30,31,31,30,31,30,31],N_=(l,m)=>{t().set(l,m>>>0)};function Gm(l,m,E,D){function G(Ge,os,Rs){for(Ge=typeof Ge=="number"?Ge.toString():Ge||"";Ge.lengthof?-1:0$i-Ge.getDate())){Ge.setDate(Ge.getDate()+os);break}os-=$i-Ge.getDate()+1,Ge.setDate(1),11>Rs?Ge.setMonth(Rs+1):(Ge.setMonth(0),Ge.setFullYear(Ge.getFullYear()+1))}return Rs=new Date(Ge.getFullYear()+1,0,4),os=et(new Date(Ge.getFullYear(),0,4)),Rs=et(Rs),0>=Qe(os,Ge)?0>=Qe(Rs,Ge)?Ge.getFullYear()+1:Ge.getFullYear():Ge.getFullYear()-1}l>>>=0,m>>>=0,E>>>=0,D>>>=0;var Pt=a()[D+40>>>2>>>0];for(var Rt in D={lc:o()[D>>>2>>>0],kc:o()[D+4>>>2>>>0],Ib:o()[D+8>>>2>>>0],Mb:o()[D+12>>>2>>>0],Jb:o()[D+16>>>2>>>0],Db:o()[D+20>>>2>>>0],vb:o()[D+24>>>2>>>0],Cb:o()[D+28>>>2>>>0],sc:o()[D+32>>>2>>>0],jc:o()[D+36>>>2>>>0],mc:Pt?Ws(Pt):""},E=Ws(E),Pt={"%c":"%a %b %d %H:%M:%S %Y","%D":"%m/%d/%y","%F":"%Y-%m-%d","%h":"%b","%r":"%I:%M:%S %p","%R":"%H:%M","%T":"%H:%M:%S","%x":"%m/%d/%y","%X":"%H:%M:%S","%Ec":"%c","%EC":"%C","%Ex":"%m/%d/%y","%EX":"%H:%M:%S","%Ey":"%y","%EY":"%Y","%Od":"%d","%Oe":"%e","%OH":"%H","%OI":"%I","%Om":"%m","%OM":"%M","%OS":"%S","%Ou":"%u","%OU":"%U","%OV":"%V","%Ow":"%w","%OW":"%W","%Oy":"%y"})E=E.replace(new RegExp(Rt,"g"),Pt[Rt]);var us="Sunday Monday Tuesday Wednesday Thursday Friday Saturday".split(" "),_s="January February March April May June July August September October November December".split(" ");for(Rt in Pt={"%a":Ge=>us[Ge.vb].substring(0,3),"%A":Ge=>us[Ge.vb],"%b":Ge=>_s[Ge.Jb].substring(0,3),"%B":Ge=>_s[Ge.Jb],"%C":Ge=>fe((Ge.Db+1900)/100|0,2),"%d":Ge=>fe(Ge.Mb,2),"%e":Ge=>G(Ge.Mb,2," "),"%g":Ge=>bt(Ge).toString().substring(2),"%G":bt,"%H":Ge=>fe(Ge.Ib,2),"%I":Ge=>((Ge=Ge.Ib)==0?Ge=12:12{for(var os=0,Rs=0;Rs<=Ge.Jb-1;os+=(Ta(Ge.Db+1900)?Um:Wm)[Rs++]);return fe(Ge.Mb+os,3)},"%m":Ge=>fe(Ge.Jb+1,2),"%M":Ge=>fe(Ge.kc,2),"%n":()=>` +`,"%p":Ge=>0<=Ge.Ib&&12>Ge.Ib?"AM":"PM","%S":Ge=>fe(Ge.lc,2),"%t":()=>" ","%u":Ge=>Ge.vb||7,"%U":Ge=>fe(Math.floor((Ge.Cb+7-Ge.vb)/7),2),"%V":Ge=>{var os=Math.floor((Ge.Cb+7-(Ge.vb+6)%7)/7);if(2>=(Ge.vb+371-Ge.Cb-2)%7&&os++,os)os==53&&((Rs=(Ge.vb+371-Ge.Cb)%7)==4||Rs==3&&Ta(Ge.Db)||(os=1));else{os=52;var Rs=(Ge.vb+7-Ge.Cb-1)%7;(Rs==4||Rs==5&&Ta(Ge.Db%400-1))&&os++}return fe(os,2)},"%w":Ge=>Ge.vb,"%W":Ge=>fe(Math.floor((Ge.Cb+7-(Ge.vb+6)%7)/7),2),"%y":Ge=>(Ge.Db+1900).toString().substring(2),"%Y":Ge=>Ge.Db+1900,"%z":Ge=>{var os=0<=(Ge=Ge.jc);return Ge=Math.abs(Ge)/60,(os?"+":"-")+("0000"+(Ge/60*100+Ge%60)).slice(-4)},"%Z":Ge=>Ge.mc,"%%":()=>"%"},E=E.replace(/%%/g,"\0\0"),Pt)E.includes(Rt)&&(E=E.replace(new RegExp(Rt,"g"),Pt[Rt](D)));return Rt=function(Ge){var os=Array(ih(Ge)+1);return om(Ge,os,0,os.length),os}(E=E.replace(/\0\0/g,"%")),Rt.length>m?0:(N_(Rt,l),Rt.length-1)}function j_(l,m,E,D){return Gm(l>>>0,m>>>0,E>>>0,D>>>0)}z||function(){for(var l=u.numThreads-1;l--;)Zh();yp.unshift(()=>{nc++,function(m){z?m():Promise.all(qn.map(Jh)).then(m)}(()=>jh())})}();for(var Km=Array(256),kp=0;256>kp;++kp)Km[kp]=String.fromCharCode(kp);wm=Km,Qn=u.BindingError=class extends Error{constructor(l){super(l),this.name="BindingError"}},u.InternalError=class extends Error{constructor(l){super(l),this.name="InternalError"}},Pn.push(0,1,void 0,1,null,1,!0,1,!1,1),u.count_emval_handles=()=>Pn.length/2-5-lh.length;var V_=[rh,qh,em,nm,im,am,lm,um,dm,cm,pm,hm,mm,fm,_m,gm,Am,Im,zm,Bm,Rm,Nm,jm,Vm],Bt=function(){function l(E,D){return Bt=E.exports,Bt=function(){var G=Bt,fe={};for(let[Qe,et]of Object.entries(G))fe[Qe]=typeof et=="function"?(...bt)=>{Tp.push(Qe);try{return et(...bt)}finally{Ss||(Tp.pop(),ln&&Yn===1&&Tp.length===0&&(Yn=0,ki+=1,xp(tf),typeof Fibers<"u"&&Fibers.tc()))}}:et;return fe}(),Bt=function(){var G=Bt,fe=et=>bt=>et(bt)>>>0,Qe=et=>()=>et()>>>0;return(G=Object.assign({},G)).Da=fe(G.Da),G.gb=Qe(G.gb),G.ib=fe(G.ib),G.emscripten_main_runtime_thread_id=Qe(G.emscripten_main_runtime_thread_id),G.tb=fe(G.tb),G.ub=Qe(G.ub),G}(),Qh.push(Bt.jb),rc.unshift(Bt.Ca),St=D,jh(),Bt}var m=Kh();if(nc++,u.instantiateWasm)try{return u.instantiateWasm(m,l)}catch(E){It(`Module.instantiateWasm callback failed with error: ${E}`),C(E)}return Zp||=u.locateFile?Vh("ort-wasm-simd-threaded.jsep.wasm")?"ort-wasm-simd-threaded.jsep.wasm":u.locateFile?u.locateFile("ort-wasm-simd-threaded.jsep.wasm",Ie):Ie+"ort-wasm-simd-threaded.jsep.wasm":new URL(r("./node_modules/onnxruntime-web/dist/ort-wasm-simd-threaded.jsep.wasm"),r.b).href,function(E,D){var G=Zp;return nt||typeof WebAssembly.instantiateStreaming!="function"||Vh(G)||Uh(G)||typeof fetch!="function"?Gh(G,E,D):fetch(G,{credentials:"same-origin"}).then(fe=>WebAssembly.instantiateStreaming(fe,E).then(D,function(Qe){return It(`wasm streaming compile failed: ${Qe}`),It("falling back to ArrayBuffer instantiation"),Gh(G,E,D)}))}(m,function(E){l(E.instance,E.module)}).catch(C),{}}(),Hm=l=>(Hm=Bt.Da)(l),qm=()=>(qm=Bt.Ea)();u._OrtInit=(l,m)=>(u._OrtInit=Bt.Fa)(l,m),u._OrtGetLastError=(l,m)=>(u._OrtGetLastError=Bt.Ga)(l,m),u._OrtCreateSessionOptions=(l,m,E,D,G,fe,Qe,et,bt,Pt)=>(u._OrtCreateSessionOptions=Bt.Ha)(l,m,E,D,G,fe,Qe,et,bt,Pt),u._OrtAppendExecutionProvider=(l,m)=>(u._OrtAppendExecutionProvider=Bt.Ia)(l,m),u._OrtAddFreeDimensionOverride=(l,m,E)=>(u._OrtAddFreeDimensionOverride=Bt.Ja)(l,m,E),u._OrtAddSessionConfigEntry=(l,m,E)=>(u._OrtAddSessionConfigEntry=Bt.Ka)(l,m,E),u._OrtReleaseSessionOptions=l=>(u._OrtReleaseSessionOptions=Bt.La)(l),u._OrtCreateSession=(l,m,E)=>(u._OrtCreateSession=Bt.Ma)(l,m,E),u._OrtReleaseSession=l=>(u._OrtReleaseSession=Bt.Na)(l),u._OrtGetInputOutputCount=(l,m,E)=>(u._OrtGetInputOutputCount=Bt.Oa)(l,m,E),u._OrtGetInputName=(l,m)=>(u._OrtGetInputName=Bt.Pa)(l,m),u._OrtGetOutputName=(l,m)=>(u._OrtGetOutputName=Bt.Qa)(l,m),u._OrtFree=l=>(u._OrtFree=Bt.Ra)(l),u._OrtCreateTensor=(l,m,E,D,G,fe)=>(u._OrtCreateTensor=Bt.Sa)(l,m,E,D,G,fe),u._OrtGetTensorData=(l,m,E,D,G)=>(u._OrtGetTensorData=Bt.Ta)(l,m,E,D,G),u._OrtReleaseTensor=l=>(u._OrtReleaseTensor=Bt.Ua)(l),u._OrtCreateRunOptions=(l,m,E,D)=>(u._OrtCreateRunOptions=Bt.Va)(l,m,E,D),u._OrtAddRunConfigEntry=(l,m,E)=>(u._OrtAddRunConfigEntry=Bt.Wa)(l,m,E),u._OrtReleaseRunOptions=l=>(u._OrtReleaseRunOptions=Bt.Xa)(l),u._OrtCreateBinding=l=>(u._OrtCreateBinding=Bt.Ya)(l),u._OrtBindInput=(l,m,E)=>(u._OrtBindInput=Bt.Za)(l,m,E),u._OrtBindOutput=(l,m,E,D)=>(u._OrtBindOutput=Bt._a)(l,m,E,D),u._OrtClearBoundOutputs=l=>(u._OrtClearBoundOutputs=Bt.$a)(l),u._OrtReleaseBinding=l=>(u._OrtReleaseBinding=Bt.ab)(l),u._OrtRunWithBinding=(l,m,E,D,G)=>(u._OrtRunWithBinding=Bt.bb)(l,m,E,D,G),u._OrtRun=(l,m,E,D,G,fe,Qe,et)=>(u._OrtRun=Bt.cb)(l,m,E,D,G,fe,Qe,et),u._OrtEndProfiling=l=>(u._OrtEndProfiling=Bt.db)(l),u._JsepOutput=(l,m,E)=>(u._JsepOutput=Bt.eb)(l,m,E),u._JsepGetNodeName=l=>(u._JsepGetNodeName=Bt.fb)(l);var Sp,Pa=()=>(Pa=Bt.gb)(),un=u._free=l=>(un=u._free=Bt.hb)(l),$p=u._malloc=l=>($p=u._malloc=Bt.ib)(l),gh=(l,m,E,D,G,fe)=>(gh=Bt.lb)(l,m,E,D,G,fe),Qm=()=>(Qm=Bt.mb)(),Xm=(l,m,E,D,G)=>(Xm=Bt.nb)(l,m,E,D,G),wh=l=>(wh=Bt.ob)(l),Ap=l=>(Ap=Bt.pb)(l),Ym=()=>(Ym=Bt.qb)(),Jm=(l,m)=>(Jm=Bt.rb)(l,m),Ip=l=>(Ip=Bt.sb)(l),yh=l=>(yh=Bt.tb)(l),Mh=()=>(Mh=Bt.ub)(),Zm=u.dynCall_ii=(l,m)=>(Zm=u.dynCall_ii=Bt.wb)(l,m),ef=l=>(ef=Bt.xb)(l),tf=()=>(tf=Bt.yb)(),sf=l=>(sf=Bt.zb)(l),rf=()=>(rf=Bt.Ab)();function nf(){0Mh(),u.stackRestore=l=>Ip(l),u.stackAlloc=l=>yh(l),u.setValue=function(l,m,E="i8"){switch(E.endsWith("*")&&(E="*"),E){case"i1":case"i8":t()[l>>>0]=m;break;case"i16":n()[l>>>1>>>0]=m;break;case"i32":o()[l>>>2>>>0]=m;break;case"i64":xs[l>>>3]=BigInt(m);break;case"float":c()[l>>>2>>>0]=m;break;case"double":p()[l>>>3>>>0]=m;break;case"*":a()[l>>>2>>>0]=m;break;default:Hn(`invalid type for setValue: ${E}`)}},u.getValue=function(l,m="i8"){switch(m.endsWith("*")&&(m="*"),m){case"i1":case"i8":return t()[l>>>0];case"i16":return n()[l>>>1>>>0];case"i32":return o()[l>>>2>>>0];case"i64":return xs[l>>>3];case"float":return c()[l>>>2>>>0];case"double":return p()[l>>>3>>>0];case"*":return a()[l>>>2>>>0];default:Hn(`invalid type for getValue: ${m}`)}},u.UTF8ToString=Ws,u.stringToUTF8=xa,u.lengthBytesUTF8=ih,ic=function l(){Sp||nf(),Sp||(ic=l)},nf(),u.PTR_SIZE=4,k}),As=Ps,globalThis.self?.name==="em-pthread"&&Ps()}),Tr,Gr,Ns,Mr,Lt,Kr,Pr,Er,Hr,dr,qr,Cr,Dr,Lr=y(()=>{qe(),Tr=typeof location>"u"?void 0:location.origin,Gr=()=>import.meta.url?.startsWith("file:")?new URL(new URL(r("./node_modules/onnxruntime-web/dist/ort.bundle.min.mjs?46eb"),r.b).href,Tr).href:import.meta.url,Ns=Gr(),Mr=()=>{if(Ns&&!Ns.startsWith("blob:"))return Ns.substring(0,Ns.lastIndexOf("/")+1)},Lt=(e,t)=>{try{let s=t??Ns;return(s?new URL(e,s):new URL(e)).origin===Tr}catch{return!1}},Kr=(e,t)=>{let s=t??Ns;try{return(s?new URL(e,s):new URL(e)).href}catch{return}},Pr=(e,t)=>`${t??"./"}${e}`,Er=async e=>{let t=await(await fetch(e,{credentials:"same-origin"})).blob();return URL.createObjectURL(t)},Hr=async e=>(await import(e)).default,dr=(ss(),x(tt)).default,qr=async()=>{if(!Ns)throw new Error("Failed to load proxy worker: cannot determine the script source URL.");if(Lt(Ns))return[void 0,dr()];let e=await Er(Ns);return[e,dr(e)]},Cr=(tr(),x(Ts)).default,Dr=async(e,t,s)=>{if(!e&&!t&&Cr&&Ns&&Lt(Ns))return[void 0,Cr];{let n="ort-wasm-simd-threaded.jsep.mjs",i=e??Kr(n,t),o=s&&i&&!Lt(i,t),a=o?await Er(i):i??Pr(n,t);return[o?a:void 0,await Hr(a)]}}}),or,it,vt,Ft,Ys,Cn,dn,gs,br=y(()=>{Lr(),it=!1,vt=!1,Ft=!1,Ys=()=>{if(typeof SharedArrayBuffer>"u")return!1;try{return typeof MessageChannel<"u"&&new MessageChannel().port1.postMessage(new SharedArrayBuffer(1)),WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,5,4,1,3,1,1,10,11,1,9,0,65,0,254,16,2,0,26,11]))}catch{return!1}},Cn=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,10,30,1,28,0,65,0,253,15,253,12,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,253,186,1,26,11]))}catch{return!1}},dn=async e=>{if(it)return Promise.resolve();if(vt)throw new Error("multiple calls to 'initializeWebAssembly()' detected.");if(Ft)throw new Error("previous call to 'initializeWebAssembly()' failed.");vt=!0;let t=e.initTimeout,s=e.numThreads;if(!Cn())throw new Error("WebAssembly SIMD is not supported in the current environment.");let n=Ys();s>1&&!n&&(typeof self<"u"&&!self.crossOriginIsolated&&console.warn("env.wasm.numThreads is set to "+s+", but this will not work unless you enable crossOriginIsolated mode. See https://web.dev/cross-origin-isolation-guide/ for more info."),console.warn("WebAssembly multi-threading is not supported in the current environment. Falling back to single-threading."),e.numThreads=s=1);let i=e.wasmPaths,o=typeof i=="string"?i:void 0,a=i?.mjs,c=a?.href??a,p=i?.wasm,h=p?.href??p,C=e.wasmBinary,[u,k]=await Dr(c,o,s>1),B=!1,R=[];if(t>0&&R.push(new Promise(z=>{setTimeout(()=>{B=!0,z()},t)})),R.push(new Promise((z,ne)=>{let J={numThreads:s};if(C)J.wasmBinary=C;else if(h||o)J.locateFile=W=>h??o+W;else if(c&&c.indexOf("blob:")!==0)J.locateFile=W=>new URL(W,c).href;else if(u){let W=Mr();W&&(J.locateFile=ue=>W+ue)}k(J).then(W=>{vt=!1,it=!0,or=W,z(),u&&URL.revokeObjectURL(u)},W=>{vt=!1,Ft=!0,ne(W)})})),await Promise.race(R),B)throw new Error(`WebAssembly backend initializing failed due to timeout: ${t}ms`)},gs=()=>{if(it&&or)return or;throw new Error("WebAssembly is not initialized yet.")}}),Ls,Qr,ns,cn=y(()=>{br(),Ls=(e,t)=>{let s=gs(),n=s.lengthBytesUTF8(e)+1,i=s._malloc(n);return s.stringToUTF8(e,i,n),t.push(i),i},Qr=(e,t,s,n)=>{if(typeof e=="object"&&e!==null){if(s.has(e))throw new Error("Circular reference in options");s.add(e)}Object.entries(e).forEach(([i,o])=>{let a=t?t+i:i;if(typeof o=="object")Qr(o,a+".",s,n);else if(typeof o=="string"||typeof o=="number")n(a,o.toString());else if(typeof o=="boolean")n(a,o?"1":"0");else throw new Error(`Can't handle extra config type: ${typeof o}`)})},ns=e=>{let t=gs(),s=t.stackSave();try{let n=t.PTR_SIZE,i=t.stackAlloc(2*n);t._OrtGetLastError(i,i+n);let o=Number(t.getValue(i,n===4?"i32":"i64")),a=t.getValue(i+n,"*"),c=a?t.UTF8ToString(a):"";throw new Error(`${e} ERROR_CODE: ${o}, ERROR_MESSAGE: ${c}`)}finally{t.stackRestore(s)}}}),zr,Jn=y(()=>{br(),cn(),zr=e=>{let t=gs(),s=0,n=[],i=e||{};try{if(e?.logSeverityLevel===void 0)i.logSeverityLevel=2;else if(typeof e.logSeverityLevel!="number"||!Number.isInteger(e.logSeverityLevel)||e.logSeverityLevel<0||e.logSeverityLevel>4)throw new Error(`log serverity level is not valid: ${e.logSeverityLevel}`);if(e?.logVerbosityLevel===void 0)i.logVerbosityLevel=0;else if(typeof e.logVerbosityLevel!="number"||!Number.isInteger(e.logVerbosityLevel))throw new Error(`log verbosity level is not valid: ${e.logVerbosityLevel}`);e?.terminate===void 0&&(i.terminate=!1);let o=0;return e?.tag!==void 0&&(o=Ls(e.tag,n)),s=t._OrtCreateRunOptions(i.logSeverityLevel,i.logVerbosityLevel,!!i.terminate,o),s===0&&ns("Can't create run options."),e?.extra!==void 0&&Qr(e.extra,"",new WeakSet,(a,c)=>{let p=Ls(a,n),h=Ls(c,n);t._OrtAddRunConfigEntry(s,p,h)!==0&&ns(`Can't set a run config entry: ${a} - ${c}.`)}),[s,n]}catch(o){throw s!==0&&t._OrtReleaseRunOptions(s),n.forEach(a=>t._free(a)),o}}}),kn,Sn,$n,Br,An,Zn=y(()=>{br(),cn(),kn=e=>{switch(e){case"disabled":return 0;case"basic":return 1;case"extended":return 2;case"all":return 99;default:throw new Error(`unsupported graph optimization level: ${e}`)}},Sn=e=>{switch(e){case"sequential":return 0;case"parallel":return 1;default:throw new Error(`unsupported execution mode: ${e}`)}},$n=e=>{e.extra||(e.extra={}),e.extra.session||(e.extra.session={});let t=e.extra.session;t.use_ort_model_bytes_directly||(t.use_ort_model_bytes_directly="1"),e.executionProviders&&e.executionProviders.some(s=>(typeof s=="string"?s:s.name)==="webgpu")&&(e.enableMemPattern=!1)},Br=(e,t,s)=>{for(let n of t){let i=typeof n=="string"?n:n.name;switch(i){case"webnn":if(i="WEBNN",typeof n!="string"){let a=n?.deviceType;if(a){let c=Ls("deviceType",s),p=Ls(a,s);gs()._OrtAddSessionConfigEntry(e,c,p)!==0&&ns(`Can't set a session config entry: 'deviceType' - ${a}.`)}}break;case"webgpu":if(i="JS",typeof n!="string"){let a=n;if(a?.preferredLayout){if(a.preferredLayout!=="NCHW"&&a.preferredLayout!=="NHWC")throw new Error(`preferredLayout must be either 'NCHW' or 'NHWC': ${a.preferredLayout}`);let c=Ls("preferredLayout",s),p=Ls(a.preferredLayout,s);gs()._OrtAddSessionConfigEntry(e,c,p)!==0&&ns(`Can't set a session config entry: 'preferredLayout' - ${a.preferredLayout}.`)}}break;case"wasm":case"cpu":continue;default:throw new Error(`not supported execution provider: ${i}`)}let o=Ls(i,s);gs()._OrtAppendExecutionProvider(e,o)!==0&&ns(`Can't append execution provider: ${i}.`)}},An=e=>{let t=gs(),s=0,n=[],i=e||{};$n(i);try{let o=kn(i.graphOptimizationLevel??"all"),a=Sn(i.executionMode??"sequential"),c=typeof i.logId=="string"?Ls(i.logId,n):0,p=i.logSeverityLevel??2;if(!Number.isInteger(p)||p<0||p>4)throw new Error(`log serverity level is not valid: ${p}`);let h=i.logVerbosityLevel??0;if(!Number.isInteger(h)||h<0||h>4)throw new Error(`log verbosity level is not valid: ${h}`);let C=typeof i.optimizedModelFilePath=="string"?Ls(i.optimizedModelFilePath,n):0;if(s=t._OrtCreateSessionOptions(o,!!i.enableCpuMemArena,!!i.enableMemPattern,a,!!i.enableProfiling,0,c,p,h,C),s===0&&ns("Can't create session options."),i.executionProviders&&Br(s,i.executionProviders,n),i.enableGraphCapture!==void 0){if(typeof i.enableGraphCapture!="boolean")throw new Error(`enableGraphCapture must be a boolean value: ${i.enableGraphCapture}`);let u=Ls("enableGraphCapture",n),k=Ls(i.enableGraphCapture.toString(),n);t._OrtAddSessionConfigEntry(s,u,k)!==0&&ns(`Can't set a session config entry: 'enableGraphCapture' - ${i.enableGraphCapture}.`)}if(i.freeDimensionOverrides)for(let[u,k]of Object.entries(i.freeDimensionOverrides)){if(typeof u!="string")throw new Error(`free dimension override name must be a string: ${u}`);if(typeof k!="number"||!Number.isInteger(k)||k<0)throw new Error(`free dimension override value must be a non-negative integer: ${k}`);let B=Ls(u,n);t._OrtAddFreeDimensionOverride(s,B,k)!==0&&ns(`Can't set a free dimension override: ${u} - ${k}.`)}return i.extra!==void 0&&Qr(i.extra,"",new WeakSet,(u,k)=>{let B=Ls(u,n),R=Ls(k,n);t._OrtAddSessionConfigEntry(s,B,R)!==0&&ns(`Can't set a session config entry: ${u} - ${k}.`)}),[s,n]}catch(o){throw s!==0&&t._OrtReleaseSessionOptions(s)!==0&&ns("Can't release session options."),n.forEach(a=>t._free(a)),o}}}),Rr,fr,ar,pn,Xr,hn,mn,fn,Ot=y(()=>{Rr=e=>{switch(e){case"int8":return 3;case"uint8":return 2;case"bool":return 9;case"int16":return 5;case"uint16":return 4;case"int32":return 6;case"uint32":return 12;case"float16":return 10;case"float32":return 1;case"float64":return 11;case"string":return 8;case"int64":return 7;case"uint64":return 13;case"int4":return 22;case"uint4":return 21;default:throw new Error(`unsupported data type: ${e}`)}},fr=e=>{switch(e){case 3:return"int8";case 2:return"uint8";case 9:return"bool";case 5:return"int16";case 4:return"uint16";case 6:return"int32";case 12:return"uint32";case 10:return"float16";case 1:return"float32";case 11:return"float64";case 8:return"string";case 7:return"int64";case 13:return"uint64";case 22:return"int4";case 21:return"uint4";default:throw new Error(`unsupported data type: ${e}`)}},ar=(e,t)=>{let s=[-1,4,1,1,2,2,4,8,-1,1,2,8,4,8,-1,-1,-1,-1,-1,-1,-1,.5,.5][e],n=typeof t=="number"?t:t.reduce((i,o)=>i*o,1);return s>0?Math.ceil(n*s):void 0},pn=e=>{switch(e){case"float16":return typeof Float16Array<"u"&&Float16Array.from?Float16Array:Uint16Array;case"float32":return Float32Array;case"uint8":return Uint8Array;case"int8":return Int8Array;case"uint16":return Uint16Array;case"int16":return Int16Array;case"int32":return Int32Array;case"bool":return Uint8Array;case"float64":return Float64Array;case"uint32":return Uint32Array;case"int64":return BigInt64Array;case"uint64":return BigUint64Array;default:throw new Error(`unsupported type: ${e}`)}},Xr=e=>{switch(e){case"verbose":return 0;case"info":return 1;case"warning":return 2;case"error":return 3;case"fatal":return 4;default:throw new Error(`unsupported logging level: ${e}`)}},hn=e=>e==="float32"||e==="float16"||e==="int32"||e==="int64"||e==="uint32"||e==="uint8"||e==="bool"||e==="uint4"||e==="int4",mn=e=>e==="float32"||e==="float16"||e==="int32"||e==="int64"||e==="uint32"||e==="uint64"||e==="int8"||e==="uint8"||e==="bool"||e==="uint4"||e==="int4",fn=e=>{switch(e){case"none":return 0;case"cpu":return 1;case"cpu-pinned":return 2;case"texture":return 3;case"gpu-buffer":return 4;case"ml-tensor":return 5;default:throw new Error(`unsupported data location: ${e}`)}}}),_n,In=y(()=>{qe(),_n=async e=>{if(typeof e=="string"){let t=await fetch(e);if(!t.ok)throw new Error(`failed to load external data file: ${e}`);let s=t.headers.get("Content-Length"),n=s?parseInt(s,10):0;if(n<1073741824)return new Uint8Array(await t.arrayBuffer());{if(!t.body)throw new Error(`failed to load external data file: ${e}, no response body.`);let i=t.body.getReader(),o;try{o=new ArrayBuffer(n)}catch(c){if(c instanceof RangeError){let p=Math.ceil(n/65536);o=new WebAssembly.Memory({initial:p,maximum:p}).buffer}else throw c}let a=0;for(;;){let{done:c,value:p}=await i.read();if(c)break;let h=p.byteLength;new Uint8Array(o,a,h).set(p),a+=h}return new Uint8Array(o,0,n)}}else return e instanceof Blob?new Uint8Array(await e.arrayBuffer()):e instanceof Uint8Array?e:new Uint8Array(e)}}),Fn,On,Nr,Dn,gn,Ln,as,Te=y(()=>{Ot(),Fn=["V","I","W","E","F"],On=(e,t)=>{console.log(`[${Fn[e]},${new Date().toISOString()}]${t}`)},gn=(e,t)=>{Nr=e,Dn=t},Ln=(e,t)=>{let s=Xr(e),n=Xr(Nr);s>=n&&On(s,typeof t=="function"?t():t)},as=(...e)=>{Dn&&Ln(...e)}}),M,Y=y(()=>{Ot(),M=(e,t)=>new(pn(t))(e)}),ce=y(()=>{}),me,Fe,Ye,gt,wt,yt,pt,rs,Yt,Ms=y(()=>{Te(),ce(),me=new Map([[64,250],[128,200],[256,200],[512,200],[2048,230],[4096,200],[8192,50],[16384,50],[32768,50],[65536,50],[131072,50],[262144,50],[524288,50],[1048576,50],[2097152,30],[4194304,20],[8388608,10],[12582912,10],[16777216,10],[26214400,15],[33554432,22],[44236800,2],[58982400,6],[67108864,6],[134217728,6],[167772160,6]]),Fe=[],Ye=e=>Math.ceil(Number(e)/16)*16,gt=e=>{for(let t=0;twt++,pt=async(e,t,s,n)=>{let i=Ye(s),o=e.device.createBuffer({size:i,usage:GPUBufferUsage.COPY_DST|GPUBufferUsage.MAP_READ});try{let a=e.getCommandEncoder();e.endComputePass(),a.copyBufferToBuffer(t,0,o,0,i),e.flush(),await o.mapAsync(GPUMapMode.READ);let c=o.getMappedRange();if(n){let p=n();return p.set(new Uint8Array(c,0,s)),p}else return new Uint8Array(c.slice(0,s))}finally{o.destroy()}},rs=class{constructor(e){this.backend=e,this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.buffersPending=[],this.capturedPendingBuffers=new Map;for(let[t]of me)Fe.push(t),this.freeBuffers.set(t,[]),this.freeUniformBuffers.set(t,[]);this.sessionCount=0}upload(e,t){let s=t.buffer,n=t.byteOffset,i=t.byteLength,o=Ye(i),a=this.storageCache.get(e);if(!a)throw new Error("gpu data for uploading does not exist");if(Number(a.originalSize)!==i)throw new Error(`inconsistent data size. gpu data size=${a.originalSize}, data size=${i}`);let c=this.backend.device.createBuffer({mappedAtCreation:!0,size:o,usage:GPUBufferUsage.MAP_WRITE|GPUBufferUsage.COPY_SRC}),p=c.getMappedRange();new Uint8Array(p).set(new Uint8Array(s,n,i)),c.unmap();let h=this.backend.device.createCommandEncoder();h.copyBufferToBuffer(c,0,a.gpuData.buffer,0,o),this.backend.device.queue.submit([h.finish()]),c.destroy(),as("verbose",()=>`[WebGPU] GpuDataManager.upload(id=${e})`)}memcpy(e,t){let s=this.storageCache.get(e);if(!s)throw new Error("source gpu data for memcpy does not exist");let n=this.storageCache.get(t);if(!n)throw new Error("destination gpu data for memcpy does not exist");if(s.originalSize!==n.originalSize)throw new Error("inconsistent source and destination gpu data size");let i=Ye(s.originalSize),o=this.backend.getCommandEncoder();this.backend.endComputePass(),o.copyBufferToBuffer(s.gpuData.buffer,0,n.gpuData.buffer,0,i)}registerExternalBuffer(e,t,s){let n;if(s){if(n=s[0],e===s[1])return as("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${t}) => id=${n}, buffer is the same, skip.`),n;if(this.backend.capturedCommandList.has(this.backend.currentSessionId))throw new Error(`Registering a different external buffer under graph capture mode is not supported yet. + Please use the previous external buffer!`)}else n=yt();return this.storageCache.set(n,{gpuData:{id:n,type:0,buffer:e},originalSize:t}),as("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${t}) => id=${n}, registered.`),n}unregisterExternalBuffer(e){e!==void 0&&(this.storageCache.delete(e),as("verbose",()=>`[WebGPU] GpuDataManager.unregisterExternalBuffer() => id=${e}`))}create(e,t=GPUBufferUsage.STORAGE|GPUBufferUsage.COPY_SRC|GPUBufferUsage.COPY_DST){let s=gt(e),n,i=(t&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE,o=(t&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM;if(i||o){let c=(i?this.freeBuffers:this.freeUniformBuffers).get(s);c?c.length>0?n=c.pop():n=this.backend.device.createBuffer({size:s,usage:t}):n=this.backend.device.createBuffer({size:s,usage:t})}else n=this.backend.device.createBuffer({size:s,usage:t});let a={id:yt(),type:0,buffer:n};return this.storageCache.set(a.id,{gpuData:a,originalSize:Number(e)}),as("verbose",()=>`[WebGPU] GpuDataManager.create(size=${e}) => id=${a.id}`),a}get(e){return this.storageCache.get(e)?.gpuData}release(e){let t=typeof e=="bigint"?Number(e):e,s=this.storageCache.get(t);if(!s){if(this.storageCache.size===0)return 0;throw new Error("releasing data does not exist")}return as("verbose",()=>`[WebGPU] GpuDataManager.release(id=${t}), gpuDataId=${s.gpuData.id}`),this.storageCache.delete(t),this.buffersPending.push(s.gpuData.buffer),s.originalSize}async download(e,t){let s=this.storageCache.get(Number(e));if(!s)throw new Error("data does not exist");await pt(this.backend,s.gpuData.buffer,s.originalSize,t)}refreshPendingBuffers(){if(this.buffersPending.length!==0)if(this.backend.sessionStatus==="default"){for(let e of this.buffersPending){let t=me.get(e.size);if((e.usage&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE){let s=this.freeBuffers.get(e.size)||[];t===void 0||s.length>=t?e.destroy():s.push(e)}else if((e.usage&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM){let s=this.freeUniformBuffers.get(e.size)||[];t===void 0||s.length>=t?e.destroy():s.push(e)}else e.destroy()}this.buffersPending=[]}else{let e=this.capturedPendingBuffers.get(this.backend.currentSessionId);e||(e=[],this.capturedPendingBuffers.set(this.backend.currentSessionId,e));for(let t of this.buffersPending)e.push(t);this.buffersPending=[]}}dispose(){this.freeBuffers.forEach(e=>{e.forEach(t=>{t.destroy()})}),this.freeUniformBuffers.forEach(e=>{e.forEach(t=>{t.destroy()})}),this.storageCache.forEach(e=>{e.gpuData.buffer.destroy()}),this.capturedPendingBuffers.forEach(e=>{e.forEach(t=>{t.destroy()})}),this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.capturedPendingBuffers=new Map}onCreateSession(){this.sessionCount+=1}onReleaseSession(e){let t=this.capturedPendingBuffers.get(e);t&&(t.forEach(s=>{s.destroy()}),this.capturedPendingBuffers.delete(e)),this.sessionCount-=1,this.sessionCount===0&&(as("warning",()=>"[WebGPU] Clearing webgpu buffer cache"),this.storageCache.forEach(s=>{s.gpuData.buffer.destroy()}),this.storageCache=new Map)}},Yt=(...e)=>new rs(...e)}),Gs,jt,is=y(()=>{Gs=class{constructor(e){Object.assign(this,e)}get cacheKey(){return this.key||(this.key=Object.getOwnPropertyNames(this).sort().map(e=>`${this[e]}`).join(";")),this.key}},jt=e=>new Gs(e)}),Ks,Js,De,Xs,kr,Es,Hs,$t=y(()=>{Ks=class{static calcMatMulShape(e,t){return e[1]!==t[0]?void 0:[e[0],t[1]]}},Js=class{static calcShape(e,t,s=!1){let n=e.length,i=t.length;if(n===0)return t;if(i===0)return e;let o=Math.max(e.length,t.length),a=new Array(o);if(s){if(n<2||i<2)return;let c=Ks.calcMatMulShape([e[n-2],e[n-1]],[t[i-2],t[i-1]]);if(c===void 0)return;[a[o-2],a[o-1]]=c}for(let c=s?3:1;c<=o;c++){let p=n-c<0?1:e[n-c],h=i-c<0?1:t[i-c];if(p!==h&&p>1&&h>1)return;let C=Math.max(p,h);if(p&&h)a[o-c]=Math.max(p,h);else{if(C>1)return;a[o-c]=0}}return a}static isValidBroadcast(e,t){let s=e.length,n=t.length;if(s>n)return!1;for(let i=1;i<=s;i++)if(e[s-i]!==1&&e[s-i]!==t[n-i])return!1;return!0}},De=class Dp{static size(t){return Dp.getSizeFromDimensionRange(t,0,t.length)}static convertShape(t,s=4){let n=t.length;if(n===0)return[];let i=new Array(n),o=n-1;for(;o>=0;){if(t[o]%s===0){i[o]=t[o]/s;break}if(s%t[o]!==0)throw new Error("cannot convert shape");i[o]=1,s/=t[o],o--}for(o--;o>=0;o--)i[o]=t[o];return i}static sizeFromDimension(t,s){if(s<0||s>t.length)throw new Error(`invalid dimension of ${s} for sizeFromDimension as Tensor has ${t.length} dimensions.`);return Dp.getSizeFromDimensionRange(t,s,t.length)}static sizeToDimension(t,s){if(s<0||s>t.length)throw new Error(`invalid dimension of ${s} for sizeToDimension as Tensor has ${t.length} dimensions.`);return Dp.getSizeFromDimensionRange(t,0,s)}static getSizeFromDimensionRange(t,s,n){let i=1;for(let o=s;o=0;--i)n[i]=n[i+1]*t[i+1];return n}static normalizeAxis(t,s){if(t<-s&&t>=s)throw new Error("unsupported axis for this operation.");return t<0?t+s:t}static normalizeAxes(t,s){return t.map(n=>this.normalizeAxis(n,s??t.length))}static sortBasedOnPerm(t,s){return s?s.map(n=>t[n]):t.slice().reverse()}static padShape(t,s){let n=t.length;return t.map((i,o)=>i+s[o]+s[o+n])}static areEqual(t,s){return t.length!==s.length?!1:t.every((n,i)=>n===s[i])}},Xs=class ac{static adjustPoolAttributes(t,s,n,i,o,a){if(!t&&n.length!==s.length-2)throw new Error("length of specified kernel shapes should be 2 less than length of input dimensions");if(t)for(let c=0;c=n.length?n.push(s[c+2]):n[c]=s[c+2];for(let c=0;c=n[c]||a[c+n.length]>=n[c])throw new Error("pads should be smaller than kernel")}}static adjustPadsBasedOnAutoPad(t,s,n,i,o,a,c){if(c){if(o.length!==2*(t.length-2))throw new Error("length of pads should be twice the length of data dimensions");if(s.length!==t.length-2)throw new Error("length of strides should be the length of data dimensions");if(i.length!==t.length-2)throw new Error("length of kernel shapes should be the length of data dimensions");for(let p=0;p{Ot(),$t(),sr=64,_r=(e,t)=>{if(t===3)throw new Error("vec3 has same alignment as vec4, use vec4 instead");switch(Number(e)){case 10:return t>1?`vec${t}`:"f16";case 1:return t>1?`vec${t}`:"f32";case 6:return t>1?`vec${t}`:"i32";case 12:return t>1?`vec${t}`:"u32";case 7:if(t>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","i32"];case 13:if(t>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","u32"];case 9:if(t!==4)throw new Error("bool must be vec4");return["u32","vec4"];case 22:return"i32";case 21:return"u32";default:throw new Error(`Unknown data type: ${e}`)}},ds=(e,t=1)=>{let s=_r(e,t);return typeof s=="string"?s:s[0]},Cs=(e,t=1)=>{let s=_r(e,t);return typeof s=="string"?s:s[1]},Mt=(...e)=>{let t=[];return e.forEach(s=>{s.length!==0&&t.push({type:12,data:s},{type:12,data:De.computeStrides(s)})}),t},Gt=e=>e%4===0?4:e%2===0?2:1,Is=(e="f32",t,s="0")=>!t||t===1?`${e}(${s})`:`vec${t}<${e}>(${s})`,ks=(e,t,s)=>e==="f32"?s:t===1?`f32(${s})`:`vec${t}(${s})`,js=(e,t)=>t===4?`(${e}.x + ${e}.y + ${e}.z + ${e}.w)`:t===2?`(${e}.x + ${e}.y)`:t===3?`(${e}.x + ${e}.y + ${e}.z)`:e,Tt=(e,t,s,n)=>e.startsWith("uniforms.")&&s>4?typeof t=="string"?n==="f16"?`${e}[(${t}) / 8][(${t}) % 8 / 4][(${t}) % 8 % 4]`:`${e}[(${t}) / 4][(${t}) % 4]`:n==="f16"?`${e}[${Math.floor(t/8)}][${Math.floor(t%8/4)}][${t%8%4}]`:`${e}[${Math.floor(t/4)}][${t%4}]`:s>1?`${e}[${t}]`:e,Yr=(e,t,s,n,i)=>{let o=typeof s=="number",a=o?s:s.length,c=[...new Array(a).keys()],p=a<2?"u32":a<=4?`vec${a}`:`array`,h=_r(t,i),C=typeof h=="string"?h:h[1],u=typeof h=="string"?h:h[0],k={indices:p,value:C,storage:u,tensor:t},B=ut=>typeof ut=="string"?ut:`${ut}u`,R={offsetToIndices:!1,indicesToOffset:!1,broadcastedIndicesToOffset:!1,set:!1,setByIndices:!1,get:!1,getByIndices:!1},z=o?"uniforms.":"",ne=`${z}${e}_shape`,J=`${z}${e}_strides`,W="";for(let ut=0;ut ${k.indices} { + var indices: ${k.indices}; + var current = offset; + ${W} + return indices; + }`,he=ut=>(R.offsetToIndices=!0,a<2?ut:`o2i_${e}(${ut})`),be=[];if(a>=2)for(let ut=a-1;ut>=0;ut--)be.push(`${Tt(J,ut,a)} * (indices[${ut}])`);let Be=a<2?"":` + fn i2o_${e}(indices: ${k.indices}) -> u32 { + return ${be.join("+")}; + }`,Ie=ut=>(R.indicesToOffset=!0,a<2?ut:`i2o_${e}(${ut})`),nt=(...ut)=>a===0?"0u":`${k.indices}(${ut.map(B).join(",")})`,dt=(ut,xt)=>a<2?`${ut}`:`${Tt(ut,xt,a)}`,Et=(ut,xt,hs)=>a<2?`${ut}=${hs};`:`${Tt(ut,xt,a)}=${hs};`,zt={},It=(ut,xt)=>{R.broadcastedIndicesToOffset=!0;let hs=`${xt.name}broadcastedIndicesTo${e}Offset`;if(hs in zt)return`${hs}(${ut})`;let vs=[];for(let xs=a-1;xs>=0;xs--){let xn=xt.indicesGet("outputIndices",xs+xt.rank-a);vs.push(`${dt(J,xs)} * (${xn} % ${dt(ne,xs)})`)}return zt[hs]=`fn ${hs}(outputIndices: ${xt.type.indices}) -> u32 { + return ${vs.length>0?vs.join("+"):"0u"}; + }`,`${hs}(${ut})`},ht=(ut,xt)=>(()=>{if(k.storage===k.value)return`${e}[${ut}]=${xt};`;if(k.storage==="vec2"&&k.value==="i32")return`${e}[${ut}]=vec2(u32(${xt}), select(0u, 0xFFFFFFFFu, ${xt} < 0));`;if(k.storage==="vec2"&&k.value==="u32")return`${e}[${ut}]=vec2(u32(${xt}), 0u);`;if(k.storage==="u32"&&k.value==="vec4")return`${e}[${ut}]=dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(${xt}));`;throw new Error(`not supported combination of storage type ${k.storage} and value type ${k.value} yet`)})(),Jt=ut=>(()=>{if(k.storage===k.value)return`${e}[${ut}]`;if(k.storage==="vec2"&&k.value==="i32")return`i32(${e}[${ut}].x)`;if(k.storage==="vec2"&&k.value==="u32")return`u32(${e}[${ut}].x)`;if(k.storage==="u32"&&k.value==="vec4")return`vec4(bool(${e}[${ut}] & 0xFFu), bool(${e}[${ut}] & 0xFF00u), bool(${e}[${ut}] & 0xFF0000u), bool(${e}[${ut}] & 0xFF000000u))`;throw new Error(`not supported combination of storage type ${k.storage} and value type ${k.value} yet`)})(),Vt=a<2?"":` + fn get_${e}ByIndices(indices: ${k.indices}) -> ${C} { + return ${Jt(`i2o_${e}(indices)`)}; + }`,St=a<2?"":(()=>{let ut=c.map(hs=>`d${hs}: u32`).join(", "),xt=c.map(hs=>`d${hs}`).join(", ");return` + fn get_${e}(${ut}) -> ${C} { + return get_${e}ByIndices(${nt(xt)}); + }`})(),ts=(...ut)=>{if(ut.length!==a)throw new Error(`indices length must be ${a}`);let xt=ut.map(B).join(",");return a===0?Jt("0u"):a===1?Jt(xt[0]):(R.get=!0,R.getByIndices=!0,R.indicesToOffset=!0,`get_${e}(${xt})`)},Xt=ut=>a<2?Jt(ut):(R.getByIndices=!0,R.indicesToOffset=!0,`get_${e}ByIndices(${ut})`),Ut=a<2?"":` + fn set_${e}ByIndices(indices: ${k.indices}, value: ${C}) { + ${ht(`i2o_${e}(indices)`,"value")} + }`,$s=a<2?"":(()=>{let ut=c.map(hs=>`d${hs}: u32`).join(", "),xt=c.map(hs=>`d${hs}`).join(", ");return` + fn set_${e}(${ut}, value: ${C}) { + set_${e}ByIndices(${nt(xt)}, value); + }`})();return{impl:()=>{let ut=[],xt=!1;return R.offsetToIndices&&(ut.push(ue),xt=!0),R.indicesToOffset&&(ut.push(Be),xt=!0),R.broadcastedIndicesToOffset&&(Object.values(zt).forEach(hs=>ut.push(hs)),xt=!0),R.set&&(ut.push($s),xt=!0),R.setByIndices&&(ut.push(Ut),xt=!0),R.get&&(ut.push(St),xt=!0),R.getByIndices&&(ut.push(Vt),xt=!0),!o&&xt&&ut.unshift(`const ${ne} = ${k.indices}(${s.join(",")});`,`const ${J} = ${k.indices}(${De.computeStrides(s).join(",")});`),ut.join(` +`)},type:k,offsetToIndices:he,indicesToOffset:Ie,broadcastedIndicesToOffset:It,indices:nt,indicesGet:dt,indicesSet:Et,set:(...ut)=>{if(ut.length!==a+1)throw new Error(`indices length must be ${a}`);let xt=ut[a];if(typeof xt!="string")throw new Error("value must be string");let hs=ut.slice(0,a).map(B).join(",");return a===0?ht("0u",xt):a===1?ht(hs[0],xt):(R.set=!0,R.setByIndices=!0,R.indicesToOffset=!0,`set_${e}(${hs}, ${xt})`)},setByOffset:ht,setByIndices:(ut,xt)=>a<2?ht(ut,xt):(R.setByIndices=!0,R.indicesToOffset=!0,`set_${e}ByIndices(${ut}, ${xt});`),get:ts,getByOffset:Jt,getByIndices:Xt,usage:n,name:e,strides:J,shape:ne,rank:a}},He=(e,t,s,n=1)=>Yr(e,t,s,"input",n),Ct=(e,t,s,n=1)=>Yr(e,t,s,"output",n),Ea=(e,t,s)=>Yr(e,t,s,"atomicOutput",1),Ii=(e,t,s,n=1)=>Yr(e,t,s,"internal",n),Ca=class{constructor(e,t){this.normalizedDispatchGroup=e,this.limits=t,this.internalVariables=[],this.variables=[],this.uniforms=[],this.variableIndex=0}guardAgainstOutOfBoundsWorkgroupSizes(e){return`if (global_idx >= ${typeof e=="number"?`${e}u`:e}) { return; }`}mainStart(e=sr){let t=typeof e=="number"?e:e[0],s=typeof e=="number"?1:e[1],n=typeof e=="number"?1:e[2];if(t>this.limits.maxComputeWorkgroupSizeX||s>this.limits.maxComputeWorkgroupSizeY||n>this.limits.maxComputeWorkgroupSizeZ)throw new Error(`workgroup size [${t}, ${s}, ${n}] exceeds the maximum workgroup size [${this.limits.maxComputeWorkgroupSizeX}, ${this.limits.maxComputeWorkgroupSizeY}, ${this.limits.maxComputeWorkgroupSizeZ}].`);if(t*s*n>this.limits.maxComputeInvocationsPerWorkgroup)throw new Error(`workgroup size [${t}, ${s}, ${n}] exceeds the maximum workgroup invocations ${this.limits.maxComputeInvocationsPerWorkgroup}.`);let i=this.normalizedDispatchGroup[1]===1&&this.normalizedDispatchGroup[2]===1,o=i?`@builtin(global_invocation_id) global_id : vec3, + @builtin(workgroup_id) workgroup_id : vec3, + @builtin(local_invocation_index) local_idx : u32, + @builtin(local_invocation_id) local_id : vec3`:`@builtin(global_invocation_id) global_id : vec3, + @builtin(local_invocation_id) local_id : vec3, + @builtin(local_invocation_index) local_idx : u32, + @builtin(workgroup_id) workgroup_id : vec3, + @builtin(num_workgroups) num_workgroups : vec3`,a=i?`let global_idx = global_id.x; + let workgroup_index = workgroup_id.x;`:`let workgroup_index = workgroup_id.z * num_workgroups[0] * num_workgroups[1] + + workgroup_id.y * num_workgroups[0] + workgroup_id.x; + let global_idx = workgroup_index * ${t*s*n}u + local_idx;`;return`@compute @workgroup_size(${t}, ${s}, ${n}) + fn main(${o}) { + ${a} + `}appendVariableUniforms(e){e.rank!==0&&(e.shape.startsWith("uniforms.")&&this.uniforms.push({name:e.shape.replace("uniforms.",""),type:"u32",length:e.rank}),e.strides.startsWith("uniforms.")&&this.uniforms.push({name:e.strides.replace("uniforms.",""),type:"u32",length:e.rank}))}declareVariable(e,t){if(e.usage==="internal")throw new Error("cannot use internal variable with declareVariable(). use registerInternalVariables() instead.");this.variables.push(e),this.appendVariableUniforms(e);let s=e.usage==="input"?"read":"read_write",n=e.usage==="atomicOutput"?"atomic":e.type.storage;return`@group(0) @binding(${t}) var ${e.name}: array<${n}>;`}declareVariables(...e){return e.map(t=>this.declareVariable(t,this.variableIndex++)).join(` +`)}registerInternalVariable(e){if(e.usage!=="internal")throw new Error("cannot use input or output variable with registerInternalVariable(). use declareVariables() instead.");this.internalVariables.push(e),this.appendVariableUniforms(e)}registerInternalVariables(...e){return e.forEach(t=>this.registerInternalVariable(t)),this}registerUniform(e,t,s=1){return this.uniforms.push({name:e,type:t,length:s}),this}registerUniforms(e){return this.uniforms=this.uniforms.concat(e),this}uniformDeclaration(){if(this.uniforms.length===0)return"";let e=[];for(let{name:t,type:s,length:n}of this.uniforms)if(n&&n>4)s==="f16"?e.push(`@align(16) ${t}:array, ${Math.ceil(n/8)}>`):e.push(`${t}:array, ${Math.ceil(n/4)}>`);else{let i=n==null||n===1?s:`vec${n}<${s}>`;e.push(`${t}:${i}`)}return` + struct Uniforms { ${e.join(", ")} }; + @group(0) @binding(${this.variableIndex}) var uniforms: Uniforms;`}get additionalImplementations(){return this.uniformDeclaration()+this.variables.map(e=>e.impl()).join(` +`)+this.internalVariables.map(e=>e.impl()).join(` +`)}get variablesInfo(){if(this.uniforms.length===0)return;let e=t=>[12,10,1,6][["u32","f16","f32","i32"].indexOf(t)];return this.uniforms.map(t=>[e(t.type),t.length??1])}},ka=(e,t)=>new Ca(e,t)}),Sa,Fi,Oi,$a,Aa,Di,cr,Ia,Li,jr=y(()=>{Ot(),$t(),is(),qt(),Sa=(e,t)=>{if(!e||e.length!==1)throw new Error("Transpose requires 1 input.");if(t.length!==0&&t.length!==e[0].dims.length)throw new Error(`perm size ${t.length} does not match input rank ${e[0].dims.length}`)},Fi=(e,t)=>t.length!==0?t:[...new Array(e).keys()].reverse(),Oi=(e,t)=>De.sortBasedOnPerm(e,Fi(e.length,t)),$a=(e,t,s,n)=>{let i=`fn perm(i: ${n.type.indices}) -> ${s.type.indices} { + var a: ${s.type.indices};`;for(let o=0;o{let s=[],n=[];for(let i=0;i{let s=0;for(let n=0;n{let s=e.dataType,n=e.dims.length,i=Fi(n,t),o=Oi(e.dims,i),a=e.dims,c=o,p=n<2||Di(i,e.dims),h;if(p)return h=R=>{let z=He("input",s,a,4),ne=Ct("output",s,c,4);return` + ${R.registerUniform("output_size","u32").declareVariables(z,ne)} + ${R.mainStart()} + ${R.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + output[global_idx] = input[global_idx]; + }`},{name:"TransposeCopy",shaderCache:{inputDependencies:["type"]},getRunData:()=>{let R=De.size(o);return{outputs:[{dims:o,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(R/64/4)},programUniforms:[{type:12,data:Math.ceil(R/4)}]}},getShaderSource:h};let{newShape:C,newPerm:u}=Aa(e.dims,i),k=De.areEqual(u,[2,3,1]),B=De.areEqual(u,[3,1,2]);if(C.length===2||k||B){a=k?[C[0],C[1]*C[2]]:B?[C[0]*C[1],C[2]]:C,c=[a[1],a[0]];let R=16;return h=z=>{let ne=He("a",s,a.length),J=Ct("output",s,c.length);return` + ${z.registerUniform("output_size","u32").declareVariables(ne,J)} + var tile : array, ${R}>; + ${z.mainStart([R,R,1])} + let stride = (uniforms.output_shape[1] - 1) / ${R} + 1; + let workgroup_id_x = workgroup_index % stride; + let workgroup_id_y = workgroup_index / stride; + let input_col = workgroup_id_y * ${R}u + local_id.x; + let input_row = workgroup_id_x * ${R}u + local_id.y; + if (input_row < uniforms.a_shape[0] && input_col < uniforms.a_shape[1]) { + tile[local_id.y][local_id.x] = ${ne.getByIndices(`${ne.type.indices}(input_row, input_col)`)}; + } + workgroupBarrier(); + + let output_col = workgroup_id_x * ${R}u + local_id.x; + let output_row = workgroup_id_y * ${R}u + local_id.y; + if (output_row < uniforms.output_shape[0] && output_col < uniforms.output_shape[1]) { + ${J.setByIndices(`${J.type.indices}(output_row, output_col)`,"tile[local_id.x][local_id.y]")} + } + }`},{name:"TransposeShared",shaderCache:{inputDependencies:["type"]},getRunData:()=>{let z=De.size(o);return{outputs:[{dims:o,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(c[1]/R),y:Math.ceil(c[0]/R)},programUniforms:[{type:12,data:z},...Mt(a,c)]}},getShaderSource:h}}return h=R=>{let z=He("a",s,a.length),ne=Ct("output",s,c.length);return` + ${R.registerUniform("output_size","u32").declareVariables(z,ne)} + + ${$a(i,n,z,ne)} + + ${R.mainStart()} + ${R.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + + let indices = ${ne.offsetToIndices("global_idx")}; + let aIndices = perm(indices); + + ${ne.setByOffset("global_idx",z.getByIndices("aIndices"))} + }`},{name:"Transpose",shaderCache:{hint:`${t}`,inputDependencies:["rank"]},getRunData:()=>{let R=De.size(o);return{outputs:[{dims:o,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(R/64)},programUniforms:[{type:12,data:R},...Mt(a,c)]}},getShaderSource:h}},Ia=(e,t)=>{Sa(e.inputs,t.perm),e.compute(cr(e.inputs[0],t.perm))},Li=e=>jt({perm:e.perm})}),ei,Fa,Oa,Da,La,za,Ba,Ra,zi,Na,pr,Jr,ja,uc,Va,dc,Ua,Bi,Wa,Ga,Ka,cc=y(()=>{Ot(),$t(),qt(),ri(),jr(),ei={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate * candidate",logSumExp:"bestValue + exp(candidate)",l1:"bestValue + abs(candidate)",l2:"bestValue + candidate * candidate",logSum:"bestValue + candidate"},Fa={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate",logSumExp:"bestValue + candidate",l1:"bestValue + candidate",l2:"bestValue + candidate",logSum:"bestValue + candidate"},Oa={max:"_A[offset]",min:"_A[offset]",mean:"0",sum:"0",prod:"1",sumSquare:"0",logSumExp:"0",l1:"0",l2:"0",logSum:"0"},Da={max:"bestValue",min:"bestValue",sum:"bestValue",prod:"bestValue",sumSquare:"bestValue",logSumExp:"log(bestValue)",l1:"bestValue",l2:"sqrt(bestValue)",logSum:"log(bestValue)"},La=(e,t)=>{let s=[];for(let n=t-e;n{let s=[],n=e.length;for(let o=0;oe[o]);return[s,i]},Ba=(e,t)=>{let s=e.length+t.length,n=[],i=0;for(let o=0;o{for(let s=0;s{let s=[];if(!Ra(e,t)){for(let n=0;ns.push(n))}return s},Na=(e,t,s,n,i,o,a)=>{let c=s[0].dims,p=De.size(o),h=De.size(a),C=He("_A",s[0].dataType,c),u=Ct("output",i,o),k=64;p===1&&(k=256);let B=` + var aBestValues : array; + `,R=z=>` + ${z.registerUniform("reduceSize","u32").declareVariables(C,u)} + ${B} + fn DIV_CEIL(a : u32, b : u32) -> u32 { + return ((a - 1u) / b + 1u); + } + ${z.mainStart(k)} + + let outputIndex = global_idx / ${k}; + let offset = outputIndex * uniforms.reduceSize; + + var bestValue = f32(${Oa[n]}); + let Length = uniforms.reduceSize; + for (var k = local_idx; k < Length; k = k + ${k}) { + let candidate = f32(${C.getByOffset("offset + k")}); + bestValue = ${ei[n]}; + } + aBestValues[local_idx] = bestValue; + workgroupBarrier(); + + var reduceSize = min(Length, ${k}u); + for (var currentSize = reduceSize / 2u; reduceSize > 1u; + currentSize = reduceSize / 2u) { + let interval = DIV_CEIL(reduceSize, 2u); + if (local_idx < currentSize) { + let candidate = aBestValues[local_idx + interval]; + bestValue = ${Fa[n]}; + aBestValues[local_idx] = bestValue; + } + reduceSize = interval; + workgroupBarrier(); + } + + if (local_idx == 0u) { + ${u.setByOffset("outputIndex",`${n==="mean"?`${u.type.storage}(bestValue / f32(uniforms.reduceSize))`:`${u.type.storage}(${Da[n]})`}`)}; + } + }`;return{name:e,shaderCache:{hint:`${t};${k}`,inputDependencies:["type"]},getShaderSource:R,getRunData:()=>({outputs:[{dims:o,dataType:i}],dispatchGroup:{x:p},programUniforms:[{type:12,data:h}]})}},pr=(e,t,s,n)=>{let i=e.inputs.length===1?s:Ri(e.inputs,s),o=i.axes;o.length===0&&!i.noopWithEmptyAxes&&(o=e.inputs[0].dims.map((B,R)=>R));let a=De.normalizeAxes(o,e.inputs[0].dims.length),c=a,p=e.inputs[0],h=zi(c,e.inputs[0].dims.length);h.length>0&&(p=e.compute(cr(e.inputs[0],h),{inputs:[0],outputs:[-1]})[0],c=La(c.length,p.dims.length));let[C,u]=za(p.dims,c),k=C;i.keepDims&&(k=Ba(C,a)),e.compute(Na(t,i.cacheKey,[p],n,e.inputs[0].dataType,k,u),{inputs:[p]})},Jr=(e,t)=>{pr(e,"ReduceMeanShared",t,"mean")},ja=(e,t)=>{pr(e,"ReduceL1Shared",t,"l1")},uc=(e,t)=>{pr(e,"ReduceL2Shared",t,"l2")},Va=(e,t)=>{pr(e,"ReduceLogSumExpShared",t,"logSumExp")},dc=(e,t)=>{pr(e,"ReduceMaxShared",t,"max")},Ua=(e,t)=>{pr(e,"ReduceMinShared",t,"min")},Bi=(e,t)=>{pr(e,"ReduceProdShared",t,"prod")},Wa=(e,t)=>{pr(e,"ReduceSumShared",t,"sum")},Ga=(e,t)=>{pr(e,"ReduceSumSquareShared",t,"sumSquare")},Ka=(e,t)=>{pr(e,"ReduceLogSumShared",t,"logSum")}}),gr,ti,si,Ri,wr,Ni,Ha,qa,ji,Qa,Xa,Vi,Ya,Ja,Ui,yr,Za,Wi,el,tl,Gi,sl,rl,Ki,nl,il,ri=y(()=>{Ot(),$t(),is(),qt(),cc(),gr=e=>{if(!e||e.length===0||e.length>2)throw new Error("Reduce op requires 1 or 2 inputs.");if(e.length===2&&e[1].dims.length!==1)throw new Error("Invalid axes input dims.")},ti=e=>["","",`var value = ${e.getByIndices("input_indices")};`,""],si=(e,t,s,n,i,o,a=!1,c=!1)=>{let p=[],h=s[0].dims,C=h.length,u=De.normalizeAxes(i,C),k=!c&&u.length===0;h.forEach((z,ne)=>{k||u.indexOf(ne)>=0?a&&p.push(1):p.push(z)});let B=p.length,R=De.size(p);return{name:e,shaderCache:t,getShaderSource:z=>{let ne=[],J=He("_A",s[0].dataType,C),W=Ct("output",o,B),ue=n(J,W,u),he=ue[2];for(let be=0,Be=0;be=0?(a&&Be++,he=`for(var j${be}: u32 = 0; j${be} < ${h[be]}; j${be}++) { + ${ue[2].includes("last_index")?`let last_index = j${be};`:""} + ${J.indicesSet("input_indices",be,`j${be}`)} + ${he} + }`):(ne.push(`${J.indicesSet("input_indices",be,W.indicesGet("output_indices",Be))};`),Be++);return` + + ${z.registerUniform("output_size","u32").declareVariables(J,W)} + + ${z.mainStart()} + ${z.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + var input_indices: ${J.type.indices}; + let output_indices = ${W.offsetToIndices("global_idx")}; + + ${ne.join(` +`)} + ${ue[0]} // init ops for reduce max/min + ${ue[1]} + ${he} + ${ue[3]} + ${ue.length===4?W.setByOffset("global_idx","value"):ue.slice(4).join(` +`)} + }`},getRunData:()=>({outputs:[{dims:p,dataType:o}],dispatchGroup:{x:Math.ceil(R/64)},programUniforms:[{type:12,data:R},...Mt(h,p)]})}},Ri=(e,t)=>{let s=[];return e[1].dims[0]>0&&e[1].getBigInt64Array().forEach(n=>s.push(Number(n))),jt({axes:s,keepDims:t.keepDims,noopWithEmptyAxes:t.noopWithEmptyAxes})},wr=(e,t,s,n)=>{let i=e.inputs,o=i.length===1?s:Ri(i,s);e.compute(si(t,{hint:o.cacheKey,inputDependencies:["rank"]},[i[0]],o.noopWithEmptyAxes&&o.axes.length===0?ti:n,o.axes,i[0].dataType,o.keepDims,o.noopWithEmptyAxes),{inputs:[0]})},Ni=(e,t)=>{gr(e.inputs),wr(e,"ReduceLogSum",t,(s,n)=>[`var value = ${n.type.storage}(0);`,"",`value += ${s.getByIndices("input_indices")};`,"value = log(value);"])},Ha=(e,t)=>{gr(e.inputs),wr(e,"ReduceL1",t,(s,n)=>[`var value = ${n.type.storage}(0);`,"",`value += abs(${s.getByIndices("input_indices")});`,""])},qa=(e,t)=>{gr(e.inputs),wr(e,"ReduceL2",t,(s,n)=>[`var t = ${n.type.value}(0); var value = ${n.type.value}(0);`,"",`t = ${s.getByIndices("input_indices")}; value += (t * t);`,"value = sqrt(value);"])},ji=(e,t)=>{gr(e.inputs),wr(e,"ReduceLogSumExp",t,(s,n)=>[`var value = ${n.type.storage}(0);`,"",`value += exp(${s.getByIndices("input_indices")});`,"value = log(value);"])},Qa=(e,t)=>{gr(e.inputs),wr(e,"ReduceMax",t,(s,n,i)=>{let o=[];for(let a=0;a=0||i.length===0)&&o.push(s.indicesSet("input_indices",a,0));return[`${o.join(` +`)}`,`var value = ${s.getByIndices("input_indices")};`,`value = max(value, ${s.getByIndices("input_indices")});`,""]})},Xa=(e,t)=>{gr(e.inputs),wr(e,"ReduceMean",t,(s,n,i)=>{let o=1;for(let a=0;a=0||i.length===0)&&(o*=e.inputs[0].dims[a]);return["var sum = f32(0);","",`sum += f32(${s.getByIndices("input_indices")});`,`let value = ${n.type.value}(sum / ${o});`]})},Vi=(e,t)=>{gr(e.inputs),wr(e,"ReduceMin",t,(s,n,i)=>{let o=[];for(let a=0;a=0||i.length===0)&&o.push(`input_indices[${a}] = 0;`);return[`${o.join(` +`)}`,`var value = ${s.getByIndices("input_indices")};`,`value = min(value, ${s.getByIndices("input_indices")});`,""]})},Ya=(e,t)=>{gr(e.inputs),wr(e,"ReduceProd",t,(s,n)=>[`var value = ${n.type.storage}(1);`,"",`value *= ${s.getByIndices("input_indices")};`,""])},Ja=(e,t)=>{gr(e.inputs),wr(e,"ReduceSum",t,(s,n)=>[`var value = ${n.type.storage}(0);`,"",`value += ${s.getByIndices("input_indices")};`,""])},Ui=(e,t)=>{gr(e.inputs),wr(e,"ReduceSumSquare",t,(s,n)=>[`var t = ${n.type.value}(0); var value = ${n.type.value}(0);`,"",`t = ${s.getByIndices("input_indices")}; value += t * t;`,""])},yr=(e,t,s)=>{if(t.length===0)return s;let n=1,i=1;for(let o=0;o1024},Za=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Xa(e,t):Jr(e,t)},Wi=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ha(e,t):ja(e,t)},el=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?qa(e,t):uc(e,t)},tl=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?ji(e,t):Va(e,t)},Gi=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Qa(e,t):dc(e,t)},sl=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Vi(e,t):Ua(e,t)},rl=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ya(e,t):Bi(e,t)},Ki=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ja(e,t):Wa(e,t)},nl=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ui(e,t):Ga(e,t)},il=(e,t)=>{yr(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ni(e,t):Ka(e,t)}}),Hi,ol,qi,Qi,pc=y(()=>{Ot(),is(),ri(),Hi=e=>{if(!e||e.length===0||e.length>2)throw new Error("ArgMinMaxOp op requires 1 or 2 inputs.");if(e[0].dataType!==1)throw new Error("Invalid input type.")},ol=(e,t)=>{Hi(e.inputs);let s=(n,i,o)=>{let a=[];for(let c=0;c=0||o.length===0)&&a.push(`input_indices[${c}] = 0;`);return[`${a.join(` +`)}`,`var value = ${n.getByIndices("input_indices")}; +var best_index : i32 = 0;`,`if (${n.getByIndices("input_indices")} ${t.selectLastIndex>0?"<=":"<"} value) { + value = ${n.getByIndices("input_indices")}; + best_index = i32(last_index); + }`,"",i.setByOffset("global_idx","best_index")]};e.compute(si("ArgMin",{hint:t.cacheKey,inputDependencies:["rank"]},[e.inputs[0]],s,[t.axis],7,t.keepDims),{inputs:[0]})},qi=(e,t)=>{Hi(e.inputs);let s=(n,i,o)=>{let a=[];for(let c=0;c=0||o.length===0)&&a.push(`input_indices[${c}] = 0;`);return[`${a.join(` +`)}`,`var value = ${n.getByIndices("input_indices")}; +var best_index : i32 = 0;`,`if (${n.getByIndices("input_indices")} ${t.selectLastIndex>0?">=":">"} value) { + value = ${n.getByIndices("input_indices")}; + best_index = i32(last_index); + }`,"",i.setByOffset("global_idx","best_index")]};e.compute(si("argMax",{hint:t.cacheKey,inputDependencies:["rank"]},[e.inputs[0]],s,[t.axis],7,t.keepDims),{inputs:[0]})},Qi=e=>jt(e)}),Xi,ni,al,Yi,ll,zn,Ji,ul,Zi=y(()=>{Ot(),$t(),ce(),qt(),Xi=(e,t)=>{let s=e[0],n=e[1],i=e[2],o=e[3],a=e[4],c=e[5];if(a&&c)throw new Error("Attention cannot have both past and attention_bias");if(s.dims.length!==3)throw new Error('Input "input" must have 3 dimensions');let p=s.dims[0],h=s.dims[1],C=s.dims[2];if(i.dims.length!==1)throw new Error('Input "bias" is expected to have 1 dimensions');if(n.dims.length!==2)throw new Error('Input "weights" is expected to have 2 dimensions');if(n.dims[0]!==C)throw new Error("Input 1 dimension 0 should have same length as dimension 2 of input 0");if(i.dims[0]!==n.dims[1])throw new Error('Input "bias" dimension 0 should have same length as dimension 1 of input "weights"');let u=i.dims[0]/3,k=u,B=k;if(t.qkvHiddenSizes.length>0){if(t.qkvHiddenSizes.length!==3)throw new Error("qkv_hidden_sizes attribute should have 3 elements");for(let ue of t.qkvHiddenSizes)if(ue%t.numHeads!==0)throw new Error("qkv_hidden_sizes should be divisible by num_heads");u=t.qkvHiddenSizes[0],k=t.qkvHiddenSizes[1],B=t.qkvHiddenSizes[2]}let R=h;if(u!==k)throw new Error("qkv_hidden_sizes first element should be same as the second");if(i.dims[0]!==u+k+B)throw new Error('Input "bias" dimension 0 should have same length as sum of Q/K/V hidden sizes');let z=0;if(a){if(k!==B)throw new Error('Input "past" expect k_hidden_size == v_hidden_size');if(a.dims.length!==5)throw new Error('Input "past" must have 5 dimensions');if(a.dims[0]!==2)throw new Error('Input "past" first dimension must be 2');if(a.dims[1]!==p)throw new Error('Input "past" second dimension must be batch_size');if(a.dims[2]!==t.numHeads)throw new Error('Input "past" third dimension must be num_heads');if(a.dims[4]!==k/t.numHeads)throw new Error('Input "past" fifth dimension must be k_hidden_size / num_heads');t.pastPresentShareBuffer||(z=a.dims[3])}let ne=R+z,J=-1,W=0;if(o)throw new Error("Mask not supported");if(a)throw new Error("past is not supported");if(c){if(c.dims.length!==4)throw new Error('Input "attention_bias" must have 4 dimensions');if(c.dims[0]!==p||c.dims[1]!==t.numHeads||c.dims[2]!==h||c.dims[3]!==ne)throw new Error('Expect "attention_bias" shape (batch_size, num_heads, sequence_length, total_sequence_length)')}return{batchSize:p,sequenceLength:h,pastSequenceLength:z,kvSequenceLength:R,totalSequenceLength:ne,maxSequenceLength:J,inputHiddenSize:C,hiddenSize:u,vHiddenSize:B,headSize:Math.floor(u/t.numHeads),vHeadSize:Math.floor(B/t.numHeads),numHeads:t.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:t.maskFilterValue,maskType:W,scale:t.scale,broadcastResPosBias:!1,passPastInKv:!1,qkvFormat:1}},ni=(e,t,s)=>t&&e?` + let total_sequence_length_input = u32(${t.getByOffset("0")}); + let present_sequence_length = max(total_sequence_length_input, uniforms.past_sequence_length); + let is_subsequent_prompt: bool = sequence_length > 1 && sequence_length != total_sequence_length_input; + let is_first_prompt: bool = is_subsequent_prompt == false && sequence_length == total_sequence_length_input; + total_sequence_length = u32(${e?.getByOffset("batchIdx")}) + 1; + var past_sequence_length: u32 = 0; + if (is_first_prompt == false) { + past_sequence_length = total_sequence_length - sequence_length; + } + `:` + ${s?"let past_sequence_length = uniforms.past_sequence_length":""}; + let present_sequence_length = total_sequence_length; + `,al=(e,t,s,n,i,o,a,c)=>{let p=Gt(a?1:o),h=64,C=o/p;C{let W=Ct("x",e.dataType,e.dims,p),ue=[W],he=a?He("seq_lens",a.dataType,a.dims):void 0;he&&ue.push(he);let be=c?He("total_sequence_length_input",c.dataType,c.dims):void 0;be&&ue.push(be);let Be=Cs(e.dataType),Ie=[{name:"batch_size",type:"u32"},{name:"num_heads",type:"u32"},{name:"past_sequence_length",type:"u32"},{name:"sequence_length",type:"u32"},{name:"total_sequence_length",type:"u32"},{name:"elements_per_thread",type:"u32"}];return` + var thread_max: array; + var thread_sum: array; + ${J.registerUniforms(Ie).declareVariables(...ue)} + ${J.mainStart([h,1,1])} + let batchIdx = workgroup_id.z / uniforms.num_heads; + let headIdx = workgroup_id.z % uniforms.num_heads; + let sequence_length = uniforms.sequence_length; + var total_sequence_length = uniforms.total_sequence_length; + ${ni(he,be,!1)} + let local_offset = local_idx * uniforms.elements_per_thread; + let offset = (global_idx / ${h}) * uniforms.total_sequence_length + local_offset; + let seq_causal_length = ${a?"u32(past_sequence_length + workgroup_id.y + 1)":"total_sequence_length"}; + var thread_max_vector = ${R}(-3.402823e+38f); + for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < seq_causal_length; i++) { + thread_max_vector = max(${R}(x[offset + i]), thread_max_vector); + } + thread_max[local_idx] = ${(()=>{switch(p){case 1:return"thread_max_vector";case 2:return"max(thread_max_vector.x, thread_max_vector.y)";case 4:return"max(max(thread_max_vector.x, thread_max_vector.y), max(thread_max_vector.z, thread_max_vector.w))";default:throw new Error(`Unsupported components: ${p}`)}})()}; + workgroupBarrier(); + + var max_value = f32(-3.402823e+38f); + for (var i = 0u; i < ${h}; i++) { + max_value = max(thread_max[i], max_value); + } + + var sum_vector = ${R}(0); + for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < seq_causal_length; i++) { + sum_vector += exp(${R}(x[offset + i]) - max_value); + } + thread_sum[local_idx] = ${(()=>{switch(p){case 1:return"sum_vector";case 2:return"sum_vector.x + sum_vector.y";case 4:return"sum_vector.x + sum_vector.y + sum_vector.z + sum_vector.w";default:throw new Error(`Unsupported components: ${p}`)}})()}; + workgroupBarrier(); + + var sum: f32 = 0; + for (var i = 0u; i < ${h}; i++) { + sum += thread_sum[i]; + } + + if (sum == 0) { + for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < seq_causal_length; i++) { + x[offset + i] = ${W.type.value}(${Be}(1.0) / ${Be}(seq_causal_length)); + } + } else { + for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < seq_causal_length; i++) { + var f32input = ${R}(x[offset + i]); + x[offset + i] = ${W.type.value}(exp(f32input - max_value) / sum); + } + } + ${a?` + for (var total_seq_id: u32 = seq_causal_length; total_seq_id + local_offset < uniforms.total_sequence_length; total_seq_id++) { + x[offset + total_seq_id] = ${W.type.value}(${Be}(0)); + }`:""}; + }`};return{name:"AttentionProbsSoftmax",shaderCache:{hint:`${h};${B};${p}`,inputDependencies:z},getShaderSource:ne,getRunData:()=>({outputs:[],dispatchGroup:{x:Math.ceil(o/h),y:i,z:t*s},programUniforms:k})}},Yi=(e,t,s,n,i,o,a,c,p)=>{let h=a+o.kvSequenceLength,C=[o.batchSize,o.numHeads,o.sequenceLength,h],u=e>1&&n,k=o.kvNumHeads?o.kvNumHeads:o.numHeads,B=u?[o.batchSize,k,h,o.headSize]:void 0,R=o.nReps?o.nReps:1,z=o.scale===0?1/Math.sqrt(o.headSize):o.scale,ne=Gt(o.headSize),J=o.headSize/ne,W=12,ue={x:Math.ceil(h/W),y:Math.ceil(o.sequenceLength/W),z:o.batchSize*o.numHeads},he=[{type:12,data:o.sequenceLength},{type:12,data:J},{type:12,data:h},{type:12,data:o.numHeads},{type:12,data:o.headSize},{type:1,data:z},{type:12,data:a},{type:12,data:o.kvSequenceLength},{type:12,data:R}],be=u&&n&&De.size(n.dims)>0,Be=["type","type"];be&&Be.push("type"),i&&Be.push("type"),c&&Be.push("type"),p&&Be.push("type");let Ie=[{dims:C,dataType:t.dataType,gpuDataType:0}];u&&Ie.push({dims:B,dataType:t.dataType,gpuDataType:0});let nt=dt=>{let Et=He("q",t.dataType,t.dims,ne),zt=He("key",s.dataType,s.dims,ne),It=[Et,zt];if(be){let Ut=He("past_key",n.dataType,n.dims,ne);It.push(Ut)}i&&It.push(He("attention_bias",i.dataType,i.dims));let ht=c?He("seq_lens",c.dataType,c.dims):void 0;ht&&It.push(ht);let Jt=p?He("total_sequence_length_input",p.dataType,p.dims):void 0;Jt&&It.push(Jt);let Vt=Ct("output",t.dataType,C),St=[Vt];u&&St.push(Ct("present_key",t.dataType,B,ne));let ts=Cs(1,ne),Xt=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"head_size",type:"u32"},{name:"alpha",type:"f32"},{name:"past_sequence_length",type:"u32"},{name:"kv_sequence_length",type:"u32"},{name:"n_reps",type:"u32"}];return` + const TILE_SIZE = ${W}u; + + var tileQ: array<${Et.type.storage}, ${W*W}>; + var tileK: array<${Et.type.storage}, ${W*W}>; + ${dt.registerUniforms(Xt).declareVariables(...It,...St)} + ${dt.mainStart([W,W,1])} + // x holds the N and y holds the M + let headIdx = workgroup_id.z % uniforms.num_heads; + let kvHeadIdx = ${R===1?"headIdx":"headIdx / uniforms.n_reps"}; + let kv_num_heads = ${R===1?"uniforms.num_heads":"uniforms.num_heads / uniforms.n_reps"}; + let batchIdx = workgroup_id.z / uniforms.num_heads; + let m = workgroup_id.y * TILE_SIZE; + let n = workgroup_id.x * TILE_SIZE; + let sequence_length = uniforms.M; + var total_sequence_length = uniforms.N; + ${ni(ht,Jt,!0)} + let absKvHeadIdx = batchIdx * kv_num_heads + kvHeadIdx; + let qOffset = workgroup_id.z * uniforms.M * uniforms.K + m * uniforms.K; + ${be&&u?"let pastKeyOffset = absKvHeadIdx * uniforms.past_sequence_length * uniforms.K;":""}; + let kOffset = absKvHeadIdx * uniforms.kv_sequence_length * uniforms.K; + ${u?"let presentKeyOffset = absKvHeadIdx * uniforms.N * uniforms.K;":""} + var value = ${ts}(0); + for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { + if (global_id.y < uniforms.M && w + local_id.x < uniforms.K) { + tileQ[TILE_SIZE * local_id.y + local_id.x] = q[qOffset + local_id.y * uniforms.K + w + local_id.x]; + } + if (n + local_id.y < uniforms.N && w + local_id.x < uniforms.K) { + var idx = TILE_SIZE * local_id.y + local_id.x; + ${be&&u?` + if (n + local_id.y < past_sequence_length) { + tileK[idx] = past_key[pastKeyOffset + (n + local_id.y) * uniforms.K + w + local_id.x]; + } else if (n + local_id.y - past_sequence_length < uniforms.kv_sequence_length) { + tileK[idx] = key[kOffset + (n + local_id.y - past_sequence_length) * uniforms.K + w + local_id.x]; + }`:` + if (n + local_id.y < uniforms.kv_sequence_length) { + tileK[idx] = key[kOffset + (n + local_id.y) * uniforms.K + w + local_id.x]; + }`} + ${u?`if (n + local_id.y < present_sequence_length) { + present_key[presentKeyOffset + (n + local_id.y) * uniforms.K + w + local_id.x] = tileK[idx]; + }`:""} + } + workgroupBarrier(); + + for (var k: u32 = 0u; k < TILE_SIZE && w+k < uniforms.K; k++) { + value += ${ts}(tileQ[TILE_SIZE * local_id.y + k] * tileK[TILE_SIZE * local_id.x + k]); + } + + workgroupBarrier(); + } + + if (global_id.y < uniforms.M && global_id.x < total_sequence_length) { + let headOffset = workgroup_id.z * uniforms.M * uniforms.N; + let outputIdx = headOffset + global_id.y * uniforms.N + global_id.x; + var sum: f32 = ${(()=>{switch(ne){case 1:return"value";case 2:return"value.x + value.y";case 4:return"value.x + value.y + value.z + value.w";default:throw new Error(`Unsupported components: ${ne}`)}})()}; + output[outputIdx] = ${Vt.type.value} (sum * uniforms.alpha) + ${i?"attention_bias[outputIdx]":"0.0"}; + } + }`};return{name:"AttentionProbs",shaderCache:{hint:`${ne};${i!==void 0};${n!==void 0};${e}`,inputDependencies:Be},getRunData:()=>({outputs:Ie,dispatchGroup:ue,programUniforms:he}),getShaderSource:nt}},ll=(e,t,s,n,i,o,a=void 0,c=void 0)=>{let p=o+i.kvSequenceLength,h=i.nReps?i.nReps:1,C=i.vHiddenSize*h,u=e>1&&n,k=i.kvNumHeads?i.kvNumHeads:i.numHeads,B=u?[i.batchSize,k,p,i.headSize]:void 0,R=[i.batchSize,i.sequenceLength,C],z=12,ne={x:Math.ceil(i.vHeadSize/z),y:Math.ceil(i.sequenceLength/z),z:i.batchSize*i.numHeads},J=[{type:12,data:i.sequenceLength},{type:12,data:p},{type:12,data:i.vHeadSize},{type:12,data:i.numHeads},{type:12,data:i.headSize},{type:12,data:C},{type:12,data:o},{type:12,data:i.kvSequenceLength},{type:12,data:h}],W=u&&n&&De.size(n.dims)>0,ue=["type","type"];W&&ue.push("type"),a&&ue.push("type"),c&&ue.push("type");let he=[{dims:R,dataType:t.dataType,gpuDataType:0}];u&&he.push({dims:B,dataType:t.dataType,gpuDataType:0});let be=Be=>{let Ie=He("probs",t.dataType,t.dims),nt=He("v",s.dataType,s.dims),dt=[Ie,nt];W&&dt.push(He("past_value",n.dataType,n.dims));let Et=a?He("seq_lens",a.dataType,a.dims):void 0;a&&dt.push(Et);let zt=c?He("total_sequence_length_input",c.dataType,c.dims):void 0;c&&dt.push(zt);let It=[Ct("output",t.dataType,R)];u&&It.push(Ct("present_value",t.dataType,B));let ht=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"head_size",type:"u32"},{name:"v_hidden_size",type:"u32"},{name:"past_sequence_length",type:"u32"},{name:"kv_sequence_length",type:"u32"},{name:"n_reps",type:"u32"}];return` + const TILE_SIZE = ${z}u; + var tileQ: array<${Ie.type.value}, ${z*z}>; + var tileV: array<${Ie.type.value}, ${z*z}>; + ${Be.registerUniforms(ht).declareVariables(...dt,...It)} + ${Be.mainStart([z,z,1])} + let headIdx = workgroup_id.z % uniforms.num_heads; + let batchIdx = workgroup_id.z / uniforms.num_heads; + let kvHeadIdx = ${h===1?"headIdx":"headIdx / uniforms.n_reps"}; + let kv_num_heads = ${h===1?"uniforms.num_heads":"uniforms.num_heads / uniforms.n_reps"}; + let m = global_id.y; + let n = global_id.x; + let sequence_length = uniforms.M; + var total_sequence_length = uniforms.K; + ${ni(Et,zt,!0)} + let offsetA = workgroup_id.z * uniforms.M * uniforms.K + m * uniforms.K; + let absKvHeadIdx = batchIdx * kv_num_heads + kvHeadIdx; // kvHeadIdx is relative to the batch + ${W&&u?"let pastValueOffset = absKvHeadIdx * uniforms.N * uniforms.past_sequence_length + n;":""}; + let vOffset = absKvHeadIdx * uniforms.N * uniforms.kv_sequence_length + n; + ${u?"let presentValueOffset = absKvHeadIdx * uniforms.N * uniforms.K + n;":""} + var value = ${Ie.type.storage}(0); + for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { + if (m < uniforms.M && w + local_id.x < uniforms.K) { + tileQ[TILE_SIZE * local_id.y + local_id.x] = probs[offsetA + w + local_id.x]; + } + if (n < uniforms.N && w + local_id.y < uniforms.K) { + var idx = TILE_SIZE * local_id.y + local_id.x; + ${W&&u?` + if (w + local_id.y < past_sequence_length) { + tileV[idx] = past_value[pastValueOffset + (w + local_id.y) * uniforms.N]; + } else if (w + local_id.y - past_sequence_length < uniforms.kv_sequence_length) { + tileV[idx] = v[vOffset + (w + local_id.y - past_sequence_length) * uniforms.N]; + } + `:` + if (w + local_id.y < uniforms.kv_sequence_length) { + tileV[idx] = v[vOffset + (w + local_id.y) * uniforms.N]; + }`} + ${u?` + if (w + local_id.y < present_sequence_length) { + present_value[presentValueOffset + (w + local_id.y) * uniforms.N] = tileV[idx]; + }`:""} + } + workgroupBarrier(); + for (var k: u32 = 0u; k < TILE_SIZE && w+k < total_sequence_length; k++) { + value += tileQ[TILE_SIZE * local_id.y + k] * tileV[TILE_SIZE * k + local_id.x]; + } + workgroupBarrier(); + } + + // we need to transpose output from BNSH_v to BSND_v + if (m < uniforms.M && n < uniforms.N) { + let outputIdx = batchIdx * uniforms.M * uniforms.v_hidden_size + m * uniforms.v_hidden_size + + headIdx * uniforms.N + n; + output[outputIdx] = value; + } + }`};return{name:"AttentionScore",shaderCache:{hint:`${n!==void 0};${e}`,inputDependencies:ue},getRunData:()=>({outputs:he,dispatchGroup:ne,programUniforms:J}),getShaderSource:be}},zn=(e,t,s,n,i,o,a,c,p,h,C=void 0,u=void 0)=>{let k=Math.min(e.outputCount,1+(a?1:0)+(c?1:0)),B=k>1?h.pastSequenceLength:0,R=B+h.kvSequenceLength,z=p&&De.size(p.dims)>0?p:void 0,ne=[t,s];k>1&&a&&De.size(a.dims)>0&&ne.push(a),z&&ne.push(z),C&&ne.push(C),u&&ne.push(u);let J=e.compute(Yi(k,t,s,a,z,h,B,C,u),{inputs:ne,outputs:k>1?[-1,1]:[-1]})[0];e.compute(al(J,h.batchSize,h.numHeads,B,h.sequenceLength,R,C,u),{inputs:C&&u?[J,C,u]:[J],outputs:[]});let W=[J,n];k>1&&c&&De.size(c.dims)>0&&W.push(c),C&&W.push(C),u&&W.push(u),e.compute(ll(k,J,n,c,h,B,C,u),{inputs:W,outputs:k>1?[0,2]:[0]})},Ji=(e,t)=>{let s=[t.batchSize,t.numHeads,t.sequenceLength,t.headSize],n=t.sequenceLength,i=t.inputHiddenSize,o=t.headSize,a=12,c={x:Math.ceil(t.headSize/a),y:Math.ceil(t.sequenceLength/a),z:t.batchSize*t.numHeads},p=[e.inputs[0],e.inputs[1],e.inputs[2]],h=[{type:12,data:n},{type:12,data:i},{type:12,data:o},{type:12,data:t.numHeads},{type:12,data:t.headSize},{type:12,data:t.hiddenSize},{type:12,data:t.hiddenSize+t.hiddenSize+t.vHiddenSize}],C=u=>{let k=Ct("output_q",p[0].dataType,s),B=Ct("output_k",p[0].dataType,s),R=Ct("output_v",p[0].dataType,s),z=He("input",p[0].dataType,p[0].dims),ne=He("weight",p[1].dataType,p[1].dims),J=He("bias",p[2].dataType,p[2].dims),W=z.type.storage,ue=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"head_size",type:"u32"},{name:"hidden_size",type:"u32"},{name:"ldb",type:"u32"}];return` + const TILE_SIZE = ${a}u; + var tileInput: array<${W}, ${a*a}>; + var tileWeightQ: array<${W}, ${a*a}>; + var tileWeightK: array<${W}, ${a*a}>; + var tileWeightV: array<${W}, ${a*a}>; + ${u.registerUniforms(ue).declareVariables(z,ne,J,k,B,R)} + ${u.mainStart([a,a,1])} + let batchIndex = workgroup_id.z / uniforms.num_heads; + let headNumber = workgroup_id.z % uniforms.num_heads; + let m = global_id.y; + let n = global_id.x; + + let inputOffset = batchIndex * (uniforms.M * uniforms.K) + m * uniforms.K; + let biasOffsetQ = headNumber * uniforms.head_size; + let biasOffsetK = uniforms.hidden_size + biasOffsetQ; + let biasOffsetV = uniforms.hidden_size + biasOffsetK; + + var valueQ = ${W}(0); + var valueK = ${W}(0); + var valueV = ${W}(0); + for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { + if (m < uniforms.M && w + local_id.x < uniforms.K) { + tileInput[TILE_SIZE * local_id.y + local_id.x] = input[inputOffset + w + local_id.x]; + } + if (n < uniforms.N && w + local_id.y < uniforms.K) { + let offset = n + (w + local_id.y) * uniforms.ldb; + tileWeightQ[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetQ + offset]; + tileWeightK[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetK + offset]; + tileWeightV[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetV + offset]; + } + workgroupBarrier(); + for (var k: u32 = 0u; k({outputs:[{dims:s,dataType:e.inputs[0].dataType,gpuDataType:0},{dims:s,dataType:e.inputs[0].dataType,gpuDataType:0},{dims:s,dataType:e.inputs[0].dataType,gpuDataType:0}],dispatchGroup:c,programUniforms:h}),getShaderSource:C},{inputs:p,outputs:[-1,-1,-1]})},ul=(e,t)=>{let s=Xi(e.inputs,t),[n,i,o]=Ji(e,s);return zn(e,n,i,o,e.inputs[4],void 0,void 0,void 0,e.inputs[5],s)}}),eo,dl,cl,to,hc=y(()=>{We(),Ot(),$t(),is(),qt(),eo=(e,t)=>{if(!e||e.length!==5)throw new Error("BatchNormalization requires 5 inputs");let s=(n,i,o)=>{let a=i.length;if(a!==n.length)throw new Error(`${o}: num dimensions != ${a}`);i.forEach((c,p)=>{if(c!==n[p])throw new Error(`${o}: dim[${p}] do not match`)})};if(e[0].dims.length>1){let n=t.format==="NHWC"?t.spatial?e[0].dims.slice(-1):e[0].dims.slice(-1).concat(e[0].dims.slice(1,e[0].dims.length-1)):e[0].dims.slice(1,t.spatial?2:void 0);s(e[1].dims,n,"Invalid input scale"),s(e[2].dims,n,"Invalid input B"),s(e[3].dims,n,"Invalid input mean"),s(e[4].dims,n,"Invalid input var")}else s(e[1].dims,[1],"Invalid input scale"),s(e[2].dims,[1],"Invalid input B"),s(e[3].dims,[1],"Invalid input mean"),s(e[4].dims,[1],"Invalid input var")},dl=(e,t)=>{let{epsilon:s,spatial:n,format:i}=t,o=e[0].dims,a=n?Gt(o[o.length-1]):1,c=i==="NHWC"&&o.length>1?a:1,p=De.size(o)/a,h=n,C=h?o.length:o,u=He("x",e[0].dataType,e[0].dims,a),k=He("scale",e[1].dataType,e[1].dims,c),B=He("bias",e[2].dataType,e[2].dims,c),R=He("inputMean",e[3].dataType,e[3].dims,c),z=He("inputVar",e[4].dataType,e[4].dims,c),ne=Ct("y",e[0].dataType,C,a),J=()=>{let ue="";if(n)ue=`let cOffset = ${o.length===1?"0u":i==="NHWC"?`outputIndices[${o.length-1}] / ${a}`:"outputIndices[1]"};`;else if(i==="NCHW")ue=` + ${ne.indicesSet("outputIndices","0","0")} + let cOffset = ${ne.indicesToOffset("outputIndices")};`;else{ue=`var cIndices = ${k.type.indices}(0); + cIndices[0] = outputIndices[${o.length-1}];`;for(let he=1;he` + const epsilon = ${s}; + ${ue.registerUniform("outputSize","u32").declareVariables(u,k,B,R,z,ne)} + ${ue.mainStart()} + ${ue.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + var outputIndices = ${ne.offsetToIndices(`global_idx * ${a}`)}; + ${J()} + let scale = ${k.getByOffset("cOffset")}; + let bias = ${B.getByOffset("cOffset")}; + let inputMean = ${R.getByOffset("cOffset")}; + let inputVar = ${z.getByOffset("cOffset")}; + let x = ${u.getByOffset("global_idx")}; + let value = (x - inputMean) * inverseSqrt(inputVar + epsilon) * scale + bias; + ${ne.setByOffset("global_idx","value")} + }`;return{name:"BatchNormalization",shaderCache:{hint:`${t.epsilon}_${t.format}_${n}_${a}`,inputDependencies:h?["rank","type","type","type","type"]:void 0},getShaderSource:W,getRunData:()=>({outputs:[{dims:e[0].dims,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:h?[{type:12,data:p},...Mt(o)]:[{type:12,data:p}]})}},cl=e=>jt(e),to=(e,t)=>{let{inputs:s,outputCount:n}=e,i=cl({...t,outputCount:n});if(F.webgpu.validateInputContent&&eo(s,i),t.trainingMode)throw new Error("BatchNormalization trainingMode is not supported yet.");e.compute(dl(s,i))}}),pl,so,hl,mc=y(()=>{$t(),qt(),pl=e=>{if(e[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![320,640,1280].includes(e[0].dims[2]))throw new Error("number of channels should be 320, 640 or 1280");if(e[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(e[0].dims[2]!==e[1].dims[0])throw new Error("last dimension of input and bias are not the same")},so=e=>{let t=e[0].dims,s=e[0].dims[2],n=De.size(t)/4,i=e[0].dataType,o=He("input",i,t,4),a=He("bias",i,[s],4),c=He("residual",i,t,4),p=Ct("output",i,t,4);return{name:"BiasAdd",getRunData:()=>({outputs:[{dims:t,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(n/64)}}),getShaderSource:h=>` + const channels = ${s}u / 4; + ${h.declareVariables(o,a,c,p)} + + ${h.mainStart()} + ${h.guardAgainstOutOfBoundsWorkgroupSizes(n)} + let value = ${o.getByOffset("global_idx")} + + ${a.getByOffset("global_idx % channels")} + ${c.getByOffset("global_idx")}; + ${p.setByOffset("global_idx","value")} + }`}},hl=e=>{pl(e.inputs),e.compute(so(e.inputs))}}),ro,ls,ml,no,fl,_l,io,gl,wl,oo,yl,Ml,bl,vl,ao,xl,Bn,lo,ii,Tl,uo,Pl,El,co,Cl,kl,po,Sl,$l,ho,Al,Il,mo,Fl,Ol,fo,Dl,oi,_o,Ll,zl,Bl,go,Rl,Nl,wo=y(()=>{Ot(),$t(),is(),qt(),ro=(e,t,s,n,i,o,a)=>{let c=Math.ceil(t/4),p="";typeof i=="string"?p=`${i}(a)`:p=i("a");let h=He("inputData",s,[c],4),C=Ct("outputData",n,[c],4),u=[{name:"vec_size",type:"u32"}];return a&&u.push(...a),` + ${e.registerUniforms(u).declareVariables(h,C)} + + ${o??""} + + ${e.mainStart()} + ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} + + let a = ${h.getByOffset("global_idx")}; + ${C.setByOffset("global_idx",p)} + }`},ls=(e,t,s,n,i,o=e.dataType,a,c)=>{let p=[{type:12,data:Math.ceil(De.size(e.dims)/4)}];return a&&p.push(...a),{name:t,shaderCache:{hint:i,inputDependencies:["type"]},getShaderSource:h=>ro(h,De.size(e.dims),e.dataType,o,s,n,c),getRunData:h=>({outputs:[{dims:e.dims,dataType:o}],dispatchGroup:{x:Math.ceil(De.size(h[0].dims)/64/4)},programUniforms:p})}},ml=e=>{e.compute(ls(e.inputs[0],"Abs","abs"))},no=e=>{e.compute(ls(e.inputs[0],"Acos","acos"))},fl=e=>{e.compute(ls(e.inputs[0],"Acosh","acosh"))},_l=e=>{e.compute(ls(e.inputs[0],"Asin","asin"))},io=e=>{e.compute(ls(e.inputs[0],"Asinh","asinh"))},gl=e=>{e.compute(ls(e.inputs[0],"Atan","atan"))},wl=e=>{e.compute(ls(e.inputs[0],"Atanh","atanh"))},oo=e=>jt(e),yl=(e,t)=>{let s;switch(t.to){case 10:s="vec4";break;case 1:s="vec4";break;case 12:s="vec4";break;case 6:s="vec4";break;case 9:s="vec4";break;default:throw new RangeError(`not supported type (specified in attribute 'to' from 'Cast' operator): ${t.to}`)}e.compute(ls(e.inputs[0],"Cast",s,void 0,t.cacheKey,t.to))},Ml=e=>{let t,s,n=e.length>=2&&e[1].data!==0,i=e.length>=3&&e[2].data!==0;switch(e[0].dataType){case 1:t=n?e[1].getFloat32Array()[0]:-34028234663852886e22,s=i?e[2].getFloat32Array()[0]:34028234663852886e22;break;case 10:t=n?e[1].getUint16Array()[0]:64511,s=i?e[2].getUint16Array()[0]:31743;break;default:throw new Error("Unsupport data type")}return jt({min:t,max:s})},bl=(e,t)=>{let s=t||Ml(e.inputs),n=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"Clip",i=>`clamp(${i}, vec4<${n}>(uniforms.min), vec4<${n}>(uniforms.max))`,void 0,s.cacheKey,void 0,[{type:e.inputs[0].dataType,data:s.min},{type:e.inputs[0].dataType,data:s.max}],[{name:"min",type:n},{name:"max",type:n}]),{inputs:[0]})},vl=e=>{e.compute(ls(e.inputs[0],"Ceil","ceil"))},ao=e=>{e.compute(ls(e.inputs[0],"Cos","cos"))},xl=e=>{e.compute(ls(e.inputs[0],"Cosh","cosh"))},Bn=e=>jt(e),lo=(e,t)=>{let s=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"Elu",n=>`elu_vf32(${n})`,` + const elu_alpha_ = ${s}(${t.alpha}); + + fn elu_f32(a: ${s}) -> ${s} { + return select((exp(a) - 1.0) * elu_alpha_, a, a >= 0.0); + } + + fn elu_vf32(v: vec4<${s}>) -> vec4<${s}> { + return vec4(elu_f32(v.x), elu_f32(v.y), elu_f32(v.z), elu_f32(v.w)); + }`,t.cacheKey))},ii=(e="f32")=>` +const r0: ${e} = 0.3275911; +const r1: ${e} = 0.254829592; +const r2: ${e} = -0.284496736; +const r3: ${e} = 1.421413741; +const r4: ${e} = -1.453152027; +const r5: ${e} = 1.061405429; + +fn erf_vf32(v: vec4<${e}>) -> vec4<${e}> { + let absv = abs(v); + let x = 1.0 / (1.0 + r0 * absv); + return sign(v) * (1.0 - ((((r5 * x + r4) * x + r3) * x + r2) * x + r1) * x * exp(-absv * absv)); +}`,Tl=e=>{let t=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"Erf",s=>`erf_vf32(${s})`,ii(t)))},uo=e=>{e.compute(ls(e.inputs[0],"Exp","exp"))},Pl=e=>{e.compute(ls(e.inputs[0],"Floor","floor"))},El=e=>{let t=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"Gelu",s=>`0.5 * ${s} * (1.0 + erf_vf32(${s} * 0.7071067811865475))`,ii(t)))},co=(e,t)=>{let s=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"LeakyRelu",n=>`select(leaky_relu_alpha_ * ${n}, ${n}, ${n} >= vec4<${s}>(0.0))`,`const leaky_relu_alpha_ = ${s}(${t.alpha});`,t.cacheKey))},Cl=e=>{e.compute(ls(e.inputs[0],"Not",t=>`!${t}`))},kl=e=>{e.compute(ls(e.inputs[0],"Neg",t=>`-${t}`))},po=e=>{e.compute(ls(e.inputs[0],"Reciprocal",t=>`1.0/${t}`))},Sl=e=>{let t=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"Relu",s=>`select(vec4<${t}>(0.0), ${s}, ${s} > vec4<${t}>(0.0))`))},$l=e=>{e.compute(ls(e.inputs[0],"Sigmoid",t=>`(1.0 / (1.0 + exp(-${t})))`))},ho=e=>jt(e),Al=(e,t)=>{let s=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"HardSigmoid",n=>`max(vec4<${s}>(0.0), min(vec4<${s}>(1.0), ${t.alpha} * ${n} + vec4<${s}>(${t.beta})))`,void 0,t.cacheKey))},Il=e=>{e.compute(ls(e.inputs[0],"Sin","sin"))},mo=e=>{e.compute(ls(e.inputs[0],"Sinh","sinh"))},Fl=e=>{e.compute(ls(e.inputs[0],"Sqrt","sqrt"))},Ol=e=>{e.compute(ls(e.inputs[0],"Tan","tan"))},fo=e=>`sign(${e}) * (1 - exp(-2 * abs(${e}))) / (1 + exp(-2 * abs(${e})))`,Dl=e=>{e.compute(ls(e.inputs[0],"Tanh",fo))},oi=(e="f32")=>` +const fast_gelu_a: ${e} = 0.5; +const fast_gelu_b: ${e} = 0.7978845608028654; +const fast_gelu_c: ${e} = 0.035677408136300125; + +fn tanh_v(v: vec4<${e}>) -> vec4<${e}> { + return ${fo("v")}; +} +`,_o=e=>`(fast_gelu_a + fast_gelu_a * tanh_v(${e} * (fast_gelu_c * ${e} * ${e} + fast_gelu_b))) * ${e}`,Ll=e=>{let t=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"FastGelu",_o,oi(t),void 0,e.inputs[0].dataType))},zl=(e,t)=>{let s=Cs(e.inputs[0].dataType);return e.compute(ls(e.inputs[0],"ThresholdedRelu",n=>`select(vec4<${s}>(0.0), ${n}, ${n} > thresholded_relu_alpha_)`,`const thresholded_relu_alpha_ = vec4<${s}>(${t.alpha});`,t.cacheKey)),0},Bl=e=>{e.compute(ls(e.inputs[0],"Log","log"))},go=(e,t)=>` +const alpha = vec4<${e}>(${t}); +const one = ${e}(1.0); +const zero = ${e}(0.0); + +fn quick_gelu_impl(x: vec4<${e}>) -> vec4<${e}> { + let v = x *alpha; + var x1 : vec4<${e}>; + for (var i = 0; i < 4; i = i + 1) { + if (v[i] >= zero) { + x1[i] = one / (one + exp(-v[i])); + } else { + x1[i] = one - one / (one + exp(v[i])); + } + } + return x * x1; +} +`,Rl=e=>`quick_gelu_impl(${e})`,Nl=(e,t)=>{let s=Cs(e.inputs[0].dataType);e.compute(ls(e.inputs[0],"QuickGelu",Rl,go(s,t.alpha),t.cacheKey,e.inputs[0].dataType))}}),jl,yo,Vl,fc=y(()=>{$t(),qt(),wo(),jl=e=>{if(e[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![2560,5120,10240].includes(e[0].dims[2]))throw new Error("hidden state should be 2560, 5120 or 10240");if(e[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(e[0].dims[2]!==e[1].dims[0])throw new Error("last dimension of input and bias are not the same")},yo=e=>{let t=e[0].dims.slice();t[2]=t[2]/2;let s=He("input",e[0].dataType,e[0].dims,4),n=He("bias",e[0].dataType,[e[0].dims[2]],4),i=Ct("output",e[0].dataType,t,4),o=De.size(t)/4,a=ds(e[0].dataType);return{name:"BiasSplitGelu",getRunData:()=>({outputs:[{dims:t,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(o/64)}}),getShaderSource:c=>` + const M_SQRT2 = sqrt(2.0); + const halfChannels = ${e[0].dims[2]/4/2}u; + + ${c.declareVariables(s,n,i)} + + ${ii(a)} + + ${c.mainStart()} + ${c.guardAgainstOutOfBoundsWorkgroupSizes(o)} + let biasIdx = global_idx % halfChannels; + let batchIndex = global_idx / halfChannels; + let inputOffset = biasIdx + batchIndex * halfChannels * 2; + let valueLeft = input[inputOffset] + bias[biasIdx]; + let valueRight = input[inputOffset + halfChannels] + bias[biasIdx + halfChannels]; + let geluRight = valueRight * 0.5 * (erf_vf32(valueRight / M_SQRT2) + 1); + + ${i.setByOffset("global_idx","valueLeft * geluRight")} + }`}},Vl=e=>{jl(e.inputs),e.compute(yo(e.inputs))}}),Ul,Wl,hr,Gl,Kl,Mo,Hl,ql,bo,Ql,Xl,vo,Yl,_c=y(()=>{Ot(),$t(),qt(),Ul=(e,t,s,n,i,o,a,c,p,h,C,u)=>{let k,B;typeof c=="string"?k=B=(W,ue)=>`${c}((${W}),(${ue}))`:typeof c=="function"?k=B=c:(k=c.scalar,B=c.vector);let R=Ct("outputData",C,n.length,4),z=He("aData",p,t.length,4),ne=He("bData",h,s.length,4),J;if(i)if(o){let W=De.size(t)===1,ue=De.size(s)===1,he=t.length>0&&t[t.length-1]%4===0,be=s.length>0&&s[s.length-1]%4===0;W||ue?J=R.setByOffset("global_idx",B(W?`${z.type.value}(${z.getByOffset("0")}.x)`:z.getByOffset("global_idx"),ue?`${ne.type.value}(${ne.getByOffset("0")}.x)`:ne.getByOffset("global_idx"))):J=` + let outputIndices = ${R.offsetToIndices("global_idx * 4u")}; + let offsetA = ${z.broadcastedIndicesToOffset("outputIndices",R)}; + let offsetB = ${ne.broadcastedIndicesToOffset("outputIndices",R)}; + ${R.setByOffset("global_idx",B(a||he?z.getByOffset("offsetA / 4u"):`${z.type.value}(${z.getByOffset("offsetA / 4u")}[offsetA % 4u])`,a||be?ne.getByOffset("offsetB / 4u"):`${ne.type.value}(${ne.getByOffset("offsetB / 4u")}[offsetB % 4u])`))} + `}else J=R.setByOffset("global_idx",B(z.getByOffset("global_idx"),ne.getByOffset("global_idx")));else{if(!o)throw new Error("no necessary to use scalar implementation for element-wise binary op implementation.");let W=(ue,he,be="")=>{let Be=`aData[indexA${he}][componentA${he}]`,Ie=`bData[indexB${he}][componentB${he}]`;return` + let outputIndices${he} = ${R.offsetToIndices(`global_idx * 4u + ${he}u`)}; + let offsetA${he} = ${z.broadcastedIndicesToOffset(`outputIndices${he}`,R)}; + let offsetB${he} = ${ne.broadcastedIndicesToOffset(`outputIndices${he}`,R)}; + let indexA${he} = offsetA${he} / 4u; + let indexB${he} = offsetB${he} / 4u; + let componentA${he} = offsetA${he} % 4u; + let componentB${he} = offsetB${he} % 4u; + ${ue}[${he}] = ${be}(${k(Be,Ie)}); + `};C===9?J=` + var data = vec4(0); + ${W("data",0,"u32")} + ${W("data",1,"u32")} + ${W("data",2,"u32")} + ${W("data",3,"u32")} + outputData[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:J=` + ${W("outputData[global_idx]",0)} + ${W("outputData[global_idx]",1)} + ${W("outputData[global_idx]",2)} + ${W("outputData[global_idx]",3)} + `}return` + ${e.registerUniform("vec_size","u32").declareVariables(z,ne,R)} + + ${u??""} + + ${e.mainStart()} + ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} + ${J} + }`},Wl=(e,t,s,n,i,o,a=s.dataType)=>{let c=s.dims.map(z=>Number(z)??1),p=n.dims.map(z=>Number(z)??1),h=!De.areEqual(c,p),C=c,u=De.size(c),k=!1,B=!1,R=[h];if(h){let z=Js.calcShape(c,p,!1);if(!z)throw new Error("Can't perform binary op on the given tensors");C=z.slice(),u=De.size(C);let ne=De.size(c)===1,J=De.size(p)===1,W=c.length>0&&c[c.length-1]%4===0,ue=p.length>0&&p[p.length-1]%4===0;R.push(ne),R.push(J),R.push(W),R.push(ue);let he=1;for(let be=1;bez.toString()).join("_"),inputDependencies:["rank","rank"]},getShaderSource:z=>Ul(z,c,p,C,k,h,B,i,s.dataType,n.dataType,a,o),getRunData:()=>({outputs:[{dims:C,dataType:a}],dispatchGroup:{x:Math.ceil(u/64/4)},programUniforms:[{type:12,data:Math.ceil(De.size(C)/4)},...Mt(c,p,C)]})}},hr=(e,t,s,n,i,o)=>{e.compute(Wl(t,i??"",e.inputs[0],e.inputs[1],s,n,o))},Gl=e=>{hr(e,"Add",(t,s)=>`${t}+${s}`)},Kl=e=>{hr(e,"Div",(t,s)=>`${t}/${s}`)},Mo=e=>{hr(e,"Equal",{scalar:(t,s)=>`u32(${t}==${s})`,vector:(t,s)=>`vec4(${t}==${s})`},void 0,void 0,9)},Hl=e=>{hr(e,"Mul",(t,s)=>`${t}*${s}`)},ql=e=>{let t=He("input",e.inputs[0].dataType,e.inputs[0].dims).type.value;hr(e,"Pow",{scalar:(s,n)=>`pow_custom(${s},${n})`,vector:(s,n)=>`pow_vector_custom(${s},${n})`},` + fn pow_custom(a : ${t}, b : ${t}) -> ${t} { + if (b == ${t}(0.0)) { + return ${t}(1.0); + } else if (a < ${t}(0.0) && f32(b) != floor(f32(b))) { + return ${t}(pow(f32(a), f32(b))); // NaN + } + return select(sign(a), ${t}(1.0), round(f32(abs(b) % ${t}(2.0))) != 1.0) * ${t}(${t==="i32"?"round":""}(pow(f32(abs(a)), f32(b)))); + } + fn pow_vector_custom(a : vec4<${t}>, b : vec4<${t}>) -> vec4<${t}> { + // TODO: implement vectorized pow + return vec4<${t}>(pow_custom(a.x, b.x), pow_custom(a.y, b.y), pow_custom(a.z, b.z), pow_custom(a.w, b.w)); + } + `)},bo=e=>{hr(e,"Sub",(t,s)=>`${t}-${s}`)},Ql=e=>{hr(e,"Greater",{scalar:(t,s)=>`u32(${t}>${s})`,vector:(t,s)=>`vec4(${t}>${s})`},void 0,void 0,9)},Xl=e=>{hr(e,"Less",{scalar:(t,s)=>`u32(${t}<${s})`,vector:(t,s)=>`vec4(${t}<${s})`},void 0,void 0,9)},vo=e=>{hr(e,"GreaterOrEqual",{scalar:(t,s)=>`u32(${t}>=${s})`,vector:(t,s)=>`vec4(${t}>=${s})`},void 0,void 0,9)},Yl=e=>{hr(e,"LessOrEqual",{scalar:(t,s)=>`u32(${t}<=${s})`,vector:(t,s)=>`vec4(${t}<=${s})`},void 0,void 0,9)}}),xo,Jl,Zl,ai,eu,tu,su=y(()=>{Ot(),$t(),is(),qt(),xo=(e,t)=>{if(!e||e.length<1)throw new Error("too few inputs");let s=0,n=e[s],i=n.dataType,o=n.dims.length;e.forEach((a,c)=>{if(c!==s){if(a.dataType!==i)throw new Error("input tensors should be one type");if(a.dims.length!==o)throw new Error("input tensors should have the same shape");a.dims.forEach((p,h)=>{if(h!==t&&p!==n.dims[h])throw new Error("non concat dimensions must match")})}})},Jl=(e,t)=>` + fn calculateInputIndex(index: u32) -> u32 { + let sizeInConcatAxis = array(${t}); + for (var i: u32 = 0u; i < ${e}; i += 1u ) { + if (index < sizeInConcatAxis[i]) { + return i; + } + } + return ${e}u; + }`,Zl=(e,t)=>{let s=e.length,n=[];for(let i=0;i{let i=De.size(s),o=new Array(e.length),a=new Array(e.length),c=0,p=[],h=[],C=[{type:12,data:i}];for(let z=0;z`uniforms.sizeInConcatAxis${z}`).join(","),R=z=>` + + ${(()=>{z.registerUniform("outputSize","u32");for(let ne=0;ne(${B}); + ${k} -= sizeInConcatAxis[inputIndex - 1u]; + } + + ${Zl(a,u)} + }`;return{name:"Concat",shaderCache:{hint:`${t}`,inputDependencies:p},getRunData:()=>({outputs:[{dims:s,dataType:n}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:C}),getShaderSource:R}},eu=(e,t)=>{let s=e.inputs,n=s[0].dims,i=De.normalizeAxis(t.axis,n.length);xo(s,i);let o=n.slice();o[i]=s.reduce((c,p)=>c+(p.dims.length>i?p.dims[i]:0),0);let a=s.filter(c=>De.size(c.dims)>0);e.compute(ai(a,i,o,s[0].dataType),{inputs:a})},tu=e=>jt({axis:e.axis})}),Vr,Zr,Ur,To,en=y(()=>{Ot(),$t(),Vr=(e,t,s="f32")=>{switch(e.activation){case"Relu":return`value = max(value, ${t}(0.0));`;case"Sigmoid":return`value = (${t}(1.0) / (${t}(1.0) + exp(-value)));`;case"Clip":return`value = clamp(value, ${t}(${s}(uniforms.clip_min)), ${t}(${s}(uniforms.clip_max)));`;case"HardSigmoid":return`value = max(${t}(0.0), min(${t}(1.0), ${s}(uniforms.alpha) * value + ${s}(uniforms.beta)));`;case"LeakyRelu":return`value = select(${s}(uniforms.alpha) * value, value, value >= ${t}(0.0));`;case"Tanh":return`let e2x = exp(-2.0 * abs(value)); + value = sign(value) * (1.0 - e2x) / (1.0 + e2x); + `;case"":return"";default:throw new Error(`Unsupported activation ${e.activation}`)}},Zr=(e,t)=>{e.activation==="Clip"?t.push({type:1,data:e.clipMax},{type:1,data:e.clipMin}):e.activation==="HardSigmoid"?t.push({type:1,data:e.alpha},{type:1,data:e.beta}):e.activation==="LeakyRelu"&&t.push({type:1,data:e.alpha})},Ur=(e,t)=>{e.activation==="Clip"?t.push({name:"clip_max",type:"f32"},{name:"clip_min",type:"f32"}):e.activation==="HardSigmoid"?t.push({name:"alpha",type:"f32"},{name:"beta",type:"f32"}):e.activation==="LeakyRelu"&&t.push({name:"alpha",type:"f32"})},To=e=>{let t=e?.activation||"";if(t==="HardSigmoid"){let[s,n]=e?.activation_params||[.2,.5];return{activation:t,alpha:s,beta:n}}else if(t==="Clip"){let[s,n]=e?.activation_params||[Es,Hs];return{activation:t,clipMax:n,clipMin:s}}else if(t==="LeakyRelu"){let[s]=e?.activation_params||[.01];return{activation:t,alpha:s}}return{activation:t}}}),qs,Po,Eo=y(()=>{qs=(e,t)=>{switch(e){case 1:return t;case 2:return`vec2<${t}>`;case 3:return`vec3<${t}>`;case 4:return`vec4<${t}>`;default:throw new Error(`${e}-component is not supported.`)}},Po=e=>` + ${e?"value = value + getBiasByOutputCoords(coords);":""} + `}),ru,gc=y(()=>{ru=e=>` +fn getIndexFromCoords4D(coords : vec4, shape : vec4) -> i32 { + return dot(coords, vec4( + shape.y * shape.z * shape.w, shape.z * shape.w, shape.w, 1)); +} +fn getOutputIndexFromCoords(coords : vec4) -> i32 { + return dot(coords, vec4( + i32(${e}.x), i32(${e}.y), i32(${e}.z), 1)); +} +`}),wn,Co,ko=y(()=>{Ot(),$t(),qt(),en(),wn=(e,t,s,n,i)=>{let o=n-s;return` + ${Array.from({length:s}).map((a,c)=>` + if (${Tt(t.shape,c,t.rank)} != 1) { + ${t.indicesSet(e,c,Tt(i,c+o,n))} + } else { + ${t.indicesSet(e,c,0)} + }`).join("")} +`},Co=(e,t,s,n,i=!1,o)=>{let a=e[0].dims,c=e[1].dims,p=a[a.length-2],h=c[c.length-1],C=a[a.length-1],u=Gt(h),k=Gt(C),B=Gt(p),R=De.size(s)/u/B,z=e.length>2,ne=n?n.slice(0,-2):s.slice(0,-2),J=[De.size(ne),p,h],W=[{type:12,data:R},{type:12,data:p},{type:12,data:h},{type:12,data:C}];Zr(t,W),W.push(...Mt(ne,a,c)),z&&W.push(...Mt(e[2].dims)),W.push(...Mt(J));let ue=he=>{let be=Ii("batch_dims",e[0].dataType,ne.length),Be=He("a",e[0].dataType,a.length,k),Ie=He("b",e[1].dataType,c.length,u),nt=Ct("output",e[0].dataType,J.length,u),dt=ds(nt.type.tensor),Et=Vr(t,nt.type.value,dt),zt=[Be,Ie],It="";if(z){let Vt=i?u:1;zt.push(He("bias",e[2].dataType,e[2].dims.length,Vt)),It=`${i?`value += bias[col / ${Vt}];`:`value += ${nt.type.value}(bias[row + i]);`}`}let ht=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"}];Ur(t,ht);let Jt=()=>{let Vt=`var a_data: ${Be.type.value};`;for(let St=0;St; + for (var k: u32 = 0u; k < uniforms.K; k = k + ${k}) { + ${Jt()} + } + for (var i = 0u; i < ${B}u; i++) { + var value = values[i]; + ${It} + ${Et} + let cur_indices = ${nt.type.indices}(batch, row + i, col); + let offset = ${nt.indicesToOffset("cur_indices")}; + ${nt.setByOffset(`offset / ${u}`,"value")}; + } + } + `};return{name:"MatMulNaive",shaderCache:{hint:`${t.activation};${u};${k};${B};${i}`,inputDependencies:z?["rank","rank","rank"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:o?o(s):s,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(R/64)},programUniforms:W}),getShaderSource:ue}}}),So,nu,$o,li,iu,Ao,Io,ui,Fo=y(()=>{Ot(),$t(),qt(),en(),ko(),Eo(),So=(e,t)=>e?` + mm_Asub[inputRow][inputCol] = mm_readA(batch, + kStart + inputRow, + globalRowStart / innerElementSize + inputCol${t?", batchIndices":""}); + `:` + mm_Asub[inputRow][inputCol] = mm_readA(batch, + globalRow + innerRow, + kStart / innerElementSize + inputCol${t?", batchIndices":""}); + `,nu=(e,t)=>e?` + let ACached0 = mm_Asub[k * innerElementSize][localRow]; + let ACached1 = mm_Asub[k * innerElementSize + 1][localRow]; + let ACached2 = mm_Asub[k * innerElementSize + 2][localRow]; + ${t===3?"":"let ACached3 = mm_Asub[k * innerElementSize + 3][localRow];"} + for (var i = 0; i < rowPerThread; i = i + 1) { + acc[i] = BCached0 * ACached0[i] + acc[i]; + acc[i] = BCached1 * ACached1[i] + acc[i]; + acc[i] = BCached2 * ACached2[i] + acc[i]; + ${t===3?"":"acc[i] = BCached3 * ACached3[i] + acc[i];"} + }`:` + for (var i = 0; i < rowPerThread; i = i + 1) { + let ACached = mm_Asub[tileRow + i][k]; + acc[i] = BCached0 * ACached.x + acc[i]; + acc[i] = BCached1 * ACached.y + acc[i]; + acc[i] = BCached2 * ACached.z + acc[i]; + ${t===3?"":"acc[i] = BCached3 * ACached.w + acc[i];"} + }`,$o=(e,t,s="f32",n,i=!1,o=32,a=!1,c=32)=>{let p=t[1]*e[1],h=t[0]*e[0],C=i?p:o,u=i?o:p,k=C/t[0],B=o/t[1];if(!((i&&k===4&&e[1]===4||!i&&(k===3||k===4))&&C%t[0]===0&&o%t[1]===0&&e[0]===4))throw new Error(`If transposeA ${i} is true, innerElementSize ${k} and workPerThread[1] ${e[1]} must be 4. + Otherwise, innerElementSize ${k} must be 3 or 4. + tileAWidth ${C} must be divisible by workgroupSize[0]${t[0]}. tileInner ${o} must be divisible by workgroupSize[1] ${t[1]}. colPerThread ${e[0]} must be 4.`);return` +var mm_Asub: array, ${C/k}>, ${u}>; +var mm_Bsub: array, ${h/e[0]}>, ${o}>; + +const rowPerThread = ${e[1]}; +const colPerThread = ${e[0]}; +const innerElementSize = ${k}; +const tileInner = ${o}; + +@compute @workgroup_size(${t[0]}, ${t[1]}, ${t[2]}) +fn main(@builtin(local_invocation_id) localId : vec3, + @builtin(global_invocation_id) globalId : vec3, + @builtin(workgroup_id) workgroupId : vec3) { + let localRow = i32(localId.y); + let tileRow = localRow * rowPerThread; + let tileCol = i32(localId.x); + + let globalRow =i32(globalId.y) * rowPerThread; + let globalCol = i32(globalId.x); + let batch = ${a?"0":"i32(globalId.z)"}; + ${n?`let batchIndices = ${n.offsetToIndices("u32(batch)")};`:""} + let globalRowStart = i32(workgroupId.y) * ${p}; + + let num_tiles = ${a?`${Math.ceil(c/o)}`:"(uniforms.dim_inner - 1) / tileInner + 1"}; + var kStart = ${a?`i32(globalId.z) * ${c}`:"0"}; + + var acc: array, rowPerThread>; + + // Loop over shared dimension. + let tileRowB = localRow * ${B}; + for (var t = 0; t < num_tiles; t = t + 1) { + // Load one tile of A into local memory. + for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + let inputRow = tileRow + innerRow; + let inputCol = tileCol; + ${So(i,n)} + } + + // Load one tile of B into local memory. + for (var innerRow = 0; innerRow < ${B}; innerRow = innerRow + 1) { + let inputRow = tileRowB + innerRow; + let inputCol = tileCol; + mm_Bsub[inputRow][inputCol] = mm_readB(batch, kStart + inputRow, globalCol${n?", batchIndices":""}); + } + kStart = kStart + tileInner; + workgroupBarrier(); + + // Compute acc values for a single thread. + for (var k = 0; k < tileInner / innerElementSize; k = k + 1) { + let BCached0 = mm_Bsub[k * innerElementSize][tileCol]; + let BCached1 = mm_Bsub[k * innerElementSize + 1][tileCol]; + let BCached2 = mm_Bsub[k * innerElementSize + 2][tileCol]; + ${k===3?"":"let BCached3 = mm_Bsub[k * innerElementSize + 3][tileCol];"} + + ${nu(i,k)} + } + + workgroupBarrier(); + } + + for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + mm_write(batch, globalRow + innerRow, globalCol, acc[innerRow]); + } +}`},li=(e,t)=>e?` + mm_Asub[inputRow][inputCol] = mm_readA(batch, + kStart + inputRow, + globalRowStart + inputCol${t?", batchIndices":""}); + `:` + mm_Asub[inputRow][inputCol] = mm_readA(batch, + globalRowStart + inputRow, + kStart + inputCol${t?", batchIndices":""}); + `,iu=e=>e?"let ACached = mm_Asub[k][tileRow + innerRow];":"let ACached = mm_Asub[tileRow + innerRow][k];",Ao=(e,t,s="f32",n,i=!1,o=32,a=!1,c=32,p=!1)=>{let h=e[1]*t[1],C=e[0]*t[0],u=i?h:o,k=i?o:h;if(!(k%t[1]===0&&u%t[0]===0&&o%t[1]===0))throw new Error(`tileAHight ${k} must be divisible by workgroupSize[1]${t[1]}, tileAWidth ${u} must be divisible by workgroupSize[0]${t[0]}, tileInner ${o} must be divisible by workgroupSize[1]${t[1]}`);let B=k/t[1],R=u/t[0],z=o/t[1],ne=p?` + let localRow = i32(localId.y); + let localCol = i32(localId.x); + let globalRowStart = i32(workgroupId.y) * ${h}; + let globalColStart = i32(workgroupId.x) * ${C}; + + // Loop over shared dimension. + for (var t = 0; t < num_tiles; t = t + 1) { + // Load one tile of A into local memory. + for (var inputRow = localRow; inputRow < ${k}; inputRow = inputRow + ${t[1]}) { + for (var inputCol = localCol; inputCol < ${u}; inputCol = inputCol + ${t[0]}) { + ${li(i,n)} + } + } + // Load one tile of B into local memory. + for (var inputRow = localRow; inputRow < ${o}; inputRow = inputRow + ${t[1]}) { + for (var inputCol = localCol; inputCol < ${C}; inputCol = inputCol + ${t[0]}) { + mm_Bsub[inputRow][inputCol] = mm_readB(batch, + kStart + inputRow, + globalColStart + inputCol${n?", batchIndices":""}); + } + } + kStart = kStart + tileInner; + workgroupBarrier(); + + // Compute acc values for a single thread. + var BCached : array<${s}, colPerThread>; + for (var k = 0; k < tileInner; k = k + 1) { + for (var inner = 0; inner < colPerThread; inner = inner + 1) { + BCached[inner] = mm_Bsub[k][localCol + inner * ${t[0]}]; + } + for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + let ACached = ${i?`mm_Asub[k][localRow + innerRow * ${t[1]}];`:`mm_Asub[localRow + innerRow * ${t[1]}][k];`} + for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { + acc[innerRow][innerCol] = acc[innerRow][innerCol] + + ACached * BCached[innerCol]; + } + } + } + workgroupBarrier(); + } + for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + let gRow = globalRowStart + localRow + innerRow * ${t[1]}; + for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { + let gCol = globalColStart + localCol + innerCol * ${t[0]}; + mm_write(batch, gRow, gCol, acc[innerRow][innerCol]); + } + } + `:` +let tileRow = i32(localId.y) * rowPerThread; +let tileCol = i32(localId.x) * colPerThread; + +let globalRow = i32(globalId.y) * rowPerThread; +let globalCol = i32(globalId.x) * colPerThread; +let globalRowStart = i32(workgroupId.y) * ${h}; + +let tileRowA = i32(localId.y) * ${B}; +let tileColA = i32(localId.x) * ${R}; +let tileRowB = i32(localId.y) * ${z}; +// Loop over shared dimension. +for (var t = 0; t < num_tiles; t = t + 1) { + // Load one tile of A into local memory. + for (var innerRow = 0; innerRow < ${B}; innerRow = innerRow + 1) { + for (var innerCol = 0; innerCol < ${R}; innerCol = innerCol + 1) { + let inputRow = tileRowA + innerRow; + let inputCol = tileColA + innerCol; + ${li(i,n)} + } + } + + // Load one tile of B into local memory. + for (var innerRow = 0; innerRow < ${z}; innerRow = innerRow + 1) { + for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { + let inputRow = tileRowB + innerRow; + let inputCol = tileCol + innerCol; + mm_Bsub[inputRow][inputCol] = mm_readB(batch, + kStart + inputRow, + globalCol + innerCol${n?", batchIndices":""}); + } + } + kStart = kStart + tileInner; + workgroupBarrier(); + + // Compute acc values for a single thread. + var BCached : array<${s}, colPerThread>; + for (var k = 0; k < tileInner; k = k + 1) { + for (var inner = 0; inner < colPerThread; inner = inner + 1) { + BCached[inner] = mm_Bsub[k][tileCol + inner]; + } + + for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + ${iu(i)} + for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { + acc[innerRow][innerCol] = acc[innerRow][innerCol] + ACached * BCached[innerCol]; + } + } + } + + workgroupBarrier(); +} + +for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { + for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { + mm_write(batch, globalRow + innerRow, globalCol + innerCol, + acc[innerRow][innerCol]); + } +} +`;return` + var mm_Asub : array, ${k}>; + var mm_Bsub : array, ${o}>; + const rowPerThread = ${e[1]}; + const colPerThread = ${e[0]}; + const tileInner = ${o}; + +@compute @workgroup_size(${t[0]}, ${t[1]}, ${t[2]}) +fn main(@builtin(local_invocation_id) localId : vec3, + @builtin(global_invocation_id) globalId : vec3, + @builtin(workgroup_id) workgroupId : vec3) { + let batch = ${a?"0":"i32(globalId.z)"}; + ${n?`let batchIndices = ${n.offsetToIndices("u32(batch)")};`:""} + let num_tiles = ${a?`${Math.ceil(c/o)}`:"(uniforms.dim_inner - 1) / tileInner + 1"}; + var kStart = ${a?`i32(globalId.z) * ${c}`:"0"}; + + var acc : array, rowPerThread>; + ${ne} + } +`},Io=(e,t,s,n,i=!1)=>{let[o,a,c,p]=n,h=ds(n[0].type.tensor);return` + fn mm_readA(batch: i32, row: i32, colIn: i32, batchIndices: ${o.type.indices}) -> ${qs(e,h)} { + var value = ${qs(e,h)}(0.0); + let col = colIn * ${e}; + if(row < uniforms.dim_a_outer && col < uniforms.dim_inner) + { + var aIndices: ${a.type.indices}; + ${wn("aIndices",a,a.rank-2,o.rank,"batchIndices")} + ${a.indicesSet("aIndices",a.rank-2,"u32(row)")} + ${a.indicesSet("aIndices",a.rank-1,"u32(colIn)")} + value = ${a.getByIndices("aIndices")}; + } + return value; + } + + fn mm_readB(batch: i32, row: i32, colIn: i32, batchIndices: ${o.type.indices}) -> ${qs(e,h)} { + var value = ${qs(e,h)}(0.0); + let col = colIn * ${e}; + if(row < uniforms.dim_inner && col < uniforms.dim_b_outer) + { + var bIndices: ${c.type.indices}; + ${wn("bIndices",c,c.rank-2,o.rank,"batchIndices")} + ${c.indicesSet("bIndices",c.rank-2,"u32(row)")} + ${c.indicesSet("bIndices",c.rank-1,"u32(colIn)")} + value = ${c.getByIndices("bIndices")}; + } + return value; + } + + fn mm_write(batch: i32, row: i32, colIn: i32, valueIn: ${qs(e,h)}) { + let col = colIn * ${e}; + if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) { + var value = valueIn; + let coords = vec3(batch, row, colIn); + ${t?`value = value + ${i?"bias[colIn]":`${qs(e,h)}(bias[row])`};`:""} + ${s} + ${p.setByIndices("vec3(coords)","value")} + } + } + `},ui=(e,t,s,n,i=!1,o)=>{let a=e[0].dims,c=e[1].dims,p=a.slice(0,-2),h=c.slice(0,-2),C=n?n.slice(0,-2):s.slice(0,-2),u=De.size(C),k=a[a.length-2],B=a[a.length-1],R=c[c.length-1],z=B%4===0&&R%4===0,ne=k<=8?[4,1,1]:[4,4,1],J=[8,8,1],W=[Math.ceil(R/J[0]/ne[0]),Math.ceil(k/J[1]/ne[1]),Math.ceil(u/J[2]/ne[2])],ue=z?4:1,he=[...p,k,B/ue],be=he.length,Be=[...h,B,R/ue],Ie=Be.length,nt=[u,k,R/ue],dt=[{type:6,data:k},{type:6,data:R},{type:6,data:B}];Zr(t,dt),dt.push(...Mt(C,he,Be));let Et=["rank","rank"],zt=e.length>2;zt&&(dt.push(...Mt(e[2].dims)),Et.push("rank")),dt.push(...Mt(nt));let It=ht=>{let Jt=C.length,Vt=Ii("batchDims",e[0].dataType,Jt,1),St=ds(e[0].dataType),ts=He("a",e[0].dataType,be,ue),Xt=He("b",e[1].dataType,Ie,ue),Ut=Ct("result",e[0].dataType,nt.length,ue),$s=[ts,Xt];if(zt){let xs=i?ue:1;$s.push(He("bias",e[2].dataType,e[2].dims.length,xs))}let ut=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"}];Ur(t,ut);let xt=ds(Ut.type.tensor),hs=Vr(t,Ut.type.value,xt),vs=Io(ue,zt,hs,[Vt,ts,Xt,Ut],i);return` + ${ht.registerUniforms(ut).registerInternalVariables(Vt).declareVariables(...$s,Ut)} + ${vs} + ${z?$o(ne,J,St,Vt):Ao(ne,J,St,Vt)} + `};return{name:"MatMul",shaderCache:{hint:`${ne};${t.activation};${z};${i}`,inputDependencies:Et},getRunData:()=>({outputs:[{dims:o?o(s):s,dataType:e[0].dataType}],dispatchGroup:{x:W[0],y:W[1],z:W[2]},programUniforms:dt}),getShaderSource:It}}}),Oo,ou,wc=y(()=>{Ot(),Te(),qt(),en(),Eo(),gc(),Fo(),Oo=(e,t,s,n,i=!1,o,a=4,c=4,p=4,h="f32")=>{let C=dt=>{switch(dt){case 1:return"resData = x[xIndex];";case 3:return`resData = vec3<${h}>(x[xIndex], x[xIndex + 1], x[xIndex + 2]);`;case 4:return"resData = x[xIndex / 4];";default:throw new Error(`innerElementSize ${dt} is not supported.`)}},u=dt=>{switch(dt){case 1:return"return w[row * i32(uniforms.w_shape[3]) + colIn];";case 4:return"return w[row * i32(uniforms.w_shape[3]) / 4 + colIn];";default:throw new Error(`innerElementSize ${dt} is not supported.`)}},k=e?` + let coord = vec4(batch, xRow, xCol, xCh); + `:` + let coord = vec4(batch, xCh, xRow, xCol); + `,B=e?` + let coords = vec4( + batch, + row / outWidth, + row % outWidth, + col); + `:` + let coords = vec4( + batch, + row, + col / outWidth, + col % outWidth); + `,R=e?"i32(uniforms.x_shape[1])":"i32(uniforms.x_shape[2])",z=e?"i32(uniforms.x_shape[2])":"i32(uniforms.x_shape[3])",ne=e?"row":"col",J=e?"col":"row",W=` + let inChannels = i32(uniforms.w_shape[2]); + let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; + let outRow = ${ne} / outWidth; + let outCol = ${ne} % outWidth; + + let WRow = ${J} / (i32(uniforms.w_shape[1]) * inChannels); + let WCol = ${J} / inChannels % i32(uniforms.w_shape[1]); + let xRow = outRow * uniforms.stride[0] + uniforms.dilation[0] * WRow - uniforms.pad[0]; + let xCol = outCol * uniforms.stride[1] + uniforms.dilation[1] * WCol - uniforms.pad[1]; + let xCh = ${J} % inChannels; + var resData = ${qs(a,h)}(0.0); + // The bounds checking is always needed since we use it to pad zero for + // the 'same' padding type. + if (xRow >= 0 && xRow < ${R} && xCol >= 0 && xCol < ${z}) { + ${k} + let xIndex = getIndexFromCoords4D(coord, vec4(uniforms.x_shape)); + ${C(a)} + } + return resData;`,ue=e?t&&n?` + let col = colIn * ${a}; + ${W}`:` + let col = colIn * ${a}; + if (row < uniforms.dim_a_outer && col < uniforms.dim_inner) { + ${W} + } + return ${qs(a,h)}(0.0);`:n&&s?` + let col = colIn * ${a}; + ${W}`:` + let col = colIn * ${a}; + if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) { + ${W} + } + return ${qs(a,h)}(0.0);`,he=e?n&&s?u(c):` + let col = colIn * ${c}; + if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) { + ${u(c)} + } + return ${qs(c,h)}(0.0);`:` + let col = colIn * ${c}; + if (row < uniforms.dim_inner && col < uniforms.dim_a_outer) { + ${u(c)} + } + return ${qs(c,h)}(0.0);`,be=qs(p,h),Be=qs(e?a:c,h),Ie=qs(e?c:a,h),nt=Vr(o,be,h);return` + fn mm_readA(batch: i32, row : i32, colIn : i32) -> ${Be} { + ${e?ue:he} + } + + fn mm_readB(batch: i32, row : i32, colIn : i32) -> ${Ie} { + ${e?he:ue} + } + + fn mm_write(batch: i32, row : i32, colIn : i32, valueIn : ${be}) { + let col = colIn * ${p}; + if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) + { + var value = valueIn; + let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; + ${B} + ${Po(i)} + ${nt} + setOutputAtCoords(coords[0], coords[1], coords[2], coords[3], value); + } + }`},ou=(e,t,s,n,i,o,a,c,p)=>{let h=t.format==="NHWC",C=h?e[0].dims[3]:e[0].dims[1],u=s[0],k=h?s[2]:s[3],B=h?s[1]:s[2],R=h?s[3]:s[1],z=h&&(C%4===0||C%3===0)&&R%4===0,ne=h?R:k*B,J=h?k*B:R,W=[8,8,1],ue=n<=8?[4,1,1]:[4,4,1],he=[Math.ceil(ne/W[0]/ue[0]),Math.ceil(J/W[1]/ue[1]),Math.ceil(u/W[2]/ue[2])];as("verbose",()=>`[conv2d_mm_webgpu] dispatch = ${he}`);let be=z?h&&C%4!==0?3:4:1,Be=W[1]*ue[1],Ie=W[0]*ue[0],nt=Math.max(W[0]*be,W[1]),dt=n%Be===0,Et=i%Ie===0,zt=o%nt===0,It=z?[be,4,4]:[1,1,1],ht=[{type:6,data:n},{type:6,data:i},{type:6,data:o},{type:6,data:[t.pads[0],t.pads[1]]},{type:6,data:t.strides},{type:6,data:t.dilations}];Zr(t,ht),ht.push(...Mt(e[0].dims,e[1].dims));let Jt=["rank","rank"];a&&(ht.push(...Mt(e[2].dims)),Jt.push("rank")),ht.push(...Mt(s));let Vt=St=>{let ts=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"},{name:"pad",type:"i32",length:2},{name:"stride",type:"i32",length:2},{name:"dilation",type:"i32",length:2}];Ur(t,ts);let Xt=z?4:1,Ut=ds(e[0].dataType),$s=` + fn setOutputAtIndex(flatIndex : i32, value : ${z?`vec4<${Ut}>`:Ut}) { + result[flatIndex] = ${z?`vec4<${Ut}>`:Ut}(value); + } + fn setOutputAtCoords(d0 : i32, d1 : i32, d2 : i32, d3 : i32, value : ${z?`vec4<${Ut}>`:Ut}) { + let flatIndex = getOutputIndexFromCoords(vec4(d0, d1, d2, d3)); + setOutputAtIndex(flatIndex ${z?"/ 4":""}, value); + }`,ut=He("x",e[0].dataType,e[0].dims.length,be===3?1:be),xt=He("w",e[1].dataType,e[1].dims.length,Xt),hs=[ut,xt],vs=Ct("result",e[0].dataType,s.length,Xt);if(a){let xs=He("bias",e[2].dataType,e[2].dims.length,Xt);hs.push(xs),$s+=` + fn getBiasByOutputCoords(coords : vec4) -> ${z?`vec4<${Ut}>`:Ut} { + return bias[coords.${h?"w":"y"}${z?"/ 4":""}]; + }`}return` + ${ru("uniforms.result_strides")} + //struct Uniforms { xShape : vec4, wShape : vec4, outShape : vec4, + // outShapeStrides: vec3, filterDims : vec2, pad : vec2, stride : vec2, + // dilation : vec2, dimAOuter : i32, dimBOuter : i32, dimInner : i32 }; + ${St.registerUniforms(ts).declareVariables(...hs,vs)} + ${$s} + ${Oo(h,dt,Et,zt,a,t,It[0],It[1],It[2],Ut)} + ${z?$o(ue,W,Ut,void 0,!h,nt):Ao(ue,W,Ut,void 0,!h,nt,!1,void 0,c)}`};return{name:"Conv2DMatMul",shaderCache:{hint:`${t.cacheKey};${be};${z};${dt};${Et};${zt};${Be};${Ie};${nt}`,inputDependencies:Jt},getRunData:()=>({outputs:[{dims:p?p(s):s,dataType:e[0].dataType}],dispatchGroup:{x:he[0],y:he[1],z:he[2]},programUniforms:ht}),getShaderSource:Vt}}}),Do,Lo,Rn,au,zo,di,lu,uu,yc=y(()=>{Ot(),Te(),$t(),qt(),en(),Eo(),Do=e=>{let t=1;for(let s=0;stypeof e=="number"?[e,e,e]:e,Rn=(e,t)=>t<=1?e:e+(e-1)*(t-1),au=(e,t,s,n=1)=>{let i=Rn(t,n);return Math.floor((e[0]*(s-1)-s+i)/2)},zo=(e,t,s,n,i)=>{i==null&&(i=au(e,t[0],n[0]));let o=[0,0,0,s];for(let a=0;a<3;a++)e[a]+2*i>=t[a]&&(o[a]=Math.trunc((e[a]-t[a]+2*i)/n[a]+1));return o},di=(e,t,s,n,i,o,a,c,p,h)=>{let C,u,k,B;if(e==="VALID"&&(e=0),typeof e=="number"){C={top:e,bottom:e,left:e,right:e,front:e,back:e};let R=zo([t,s,n,1],[c,p,h],1,[i,o,a],e);u=R[0],k=R[1],B=R[2]}else if(Array.isArray(e)){if(!e.every((z,ne,J)=>z===J[0]))throw Error(`Unsupported padding parameter: ${e}`);C={top:e[0],bottom:e[1],left:e[2],right:e[3],front:e[4],back:e[5]};let R=zo([t,s,n,1],[c,p,h],1,[i,o,a],e[0]);u=R[0],k=R[1],B=R[2]}else if(e==="SAME_UPPER"){u=Math.ceil(t/i),k=Math.ceil(s/o),B=Math.ceil(n/a);let R=(u-1)*i+c-t,z=(k-1)*o+p-s,ne=(B-1)*a+h-n,J=Math.floor(R/2),W=R-J,ue=Math.floor(z/2),he=z-ue,be=Math.floor(ne/2),Be=ne-be;C={top:ue,bottom:he,left:be,right:Be,front:J,back:W}}else throw Error(`Unknown padding parameter: ${e}`);return{padInfo:C,outDepth:u,outHeight:k,outWidth:B}},lu=(e,t,s,n,i,o=!1,a="channelsLast")=>{let c,p,h,C,u;if(a==="channelsLast")[c,p,h,C,u]=e;else if(a==="channelsFirst")[c,u,p,h,C]=e;else throw new Error(`Unknown dataFormat ${a}`);let[k,,B,R,z]=t,[ne,J,W]=Lo(s),[ue,he,be]=Lo(n),Be=Rn(B,ue),Ie=Rn(R,he),nt=Rn(z,be),{padInfo:dt,outDepth:Et,outHeight:zt,outWidth:It}=di(i,p,h,C,ne,J,W,Be,Ie,nt),ht=o?k*u:k,Jt=[0,0,0,0,0];return a==="channelsFirst"?Jt=[c,ht,Et,zt,It]:a==="channelsLast"&&(Jt=[c,Et,zt,It,ht]),{batchSize:c,dataFormat:a,inDepth:p,inHeight:h,inWidth:C,inChannels:u,outDepth:Et,outHeight:zt,outWidth:It,outChannels:ht,padInfo:dt,strideDepth:ne,strideHeight:J,strideWidth:W,filterDepth:B,filterHeight:R,filterWidth:z,effectiveFilterDepth:Be,effectiveFilterHeight:Ie,effectiveFilterWidth:nt,dilationDepth:ue,dilationHeight:he,dilationWidth:be,inShape:e,outShape:Jt,filterShape:t}},uu=(e,t,s,n,i,o)=>{let a=o==="channelsLast";a?e[0].dims[3]:e[0].dims[1];let c=[64,1,1],p={x:s.map((ne,J)=>J)},h=[Math.ceil(Do(p.x.map(ne=>s[ne]))/c[0]),1,1];as("verbose",()=>`[conv3d_naive_webgpu] dispatch = ${h}`);let C=1,u=De.size(s),k=[{type:12,data:u},{type:12,data:n},{type:12,data:i},{type:12,data:t.strides},{type:12,data:t.dilations}];Zr(t,k),k.push(...Mt(e[0].dims,e[1].dims));let B=["rank","rank"],R=e.length===3;R&&(k.push(...Mt(e[2].dims)),B.push("rank")),k.push(...Mt(s));let z=ne=>{let J=[{name:"output_size",type:"u32"},{name:"filter_dims",type:"u32",length:n.length},{name:"pads",type:"u32",length:i.length},{name:"strides",type:"u32",length:t.strides.length},{name:"dilations",type:"u32",length:t.dilations.length}];Ur(t,J);let W=1,ue=ds(e[0].dataType),he=He("x",e[0].dataType,e[0].dims.length,C),be=He("W",e[1].dataType,e[1].dims.length,W),Be=[he,be],Ie=Ct("result",e[0].dataType,s.length,W),nt="";if(R){let zt=He("bias",e[2].dataType,e[2].dims.length,W);Be.push(zt),nt+=` + fn getBiasByOutputCoords(coords : array) -> ${ue} { + return bias[${a?Tt("coords",4,5):Tt("coords",1,5)}]; + }`}let dt=qs(C,ue),Et=Vr(t,dt,ue);return` + ${nt} + fn getX(d0 : u32, d1 : u32, d2 : u32, d3 : u32, d4 : u32) -> f32 { + let aIndices = array(d0, d1, d2, d3, d4); + return ${he.getByIndices("aIndices")}; + } + fn getW(d0 : u32, d1 : u32, d2 : u32, d3 : u32, d4 : u32) -> f32 { + let aIndices = array(d0, d1, d2, d3, d4); + return ${be.getByIndices("aIndices")}; + } + ${ne.registerUniforms(J).declareVariables(...Be,Ie)} + ${ne.mainStart()} + ${ne.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let coords = ${Ie.offsetToIndices("global_idx")}; + let batch = ${Tt("coords",0,he.rank)}; + let d2 = ${a?Tt("coords",he.rank-1,he.rank):Tt("coords",1,he.rank)}; + let xFRCCorner = vec3(${a?Tt("coords",1,he.rank):Tt("coords",2,he.rank)}, + ${a?Tt("coords",2,he.rank):Tt("coords",3,he.rank)}, + ${a?Tt("coords",3,he.rank):Tt("coords",4,he.rank)}) * uniforms.strides - uniforms.pads; + let xFCorner = xFRCCorner.x; + let xRCorner = xFRCCorner.y; + let xCCorner = xFRCCorner.z; + let xShapeY = ${a?Tt("uniforms.x_shape",1,he.rank):Tt("uniforms.x_shape",2,he.rank)}; + let xShapeZ = ${a?Tt("uniforms.x_shape",2,he.rank):Tt("uniforms.x_shape",3,he.rank)}; + let xShapeW = ${a?Tt("uniforms.x_shape",3,he.rank):Tt("uniforms.x_shape",4,he.rank)}; + let xShapeU = ${a?Tt("uniforms.x_shape",4,he.rank):Tt("uniforms.x_shape",1,he.rank)}; + let inputDepthNearestVec4 = (xShapeU / 4) * 4; + let inputDepthVec4Remainder = xShapeU % 4; + + var value = 0.0; + for (var wF = 0u; wF < uniforms.filter_dims[0]; wF++) { + let xF = xFCorner + wF * uniforms.dilations[0]; + if (xF < 0 || xF >= xShapeY) { + continue; + } + + for (var wR = 0u; wR < uniforms.filter_dims[1]; wR++) { + let xR = xRCorner + wR * uniforms.dilations[1]; + if (xR < 0 || xR >= xShapeZ) { + continue; + } + + for (var wC = 0u; wC < uniforms.filter_dims[2]; wC++) { + let xC = xCCorner + wC * uniforms.dilations[2]; + if (xC < 0 || xC >= xShapeW) { + continue; + } + + for (var d1 = 0u; d1 < inputDepthNearestVec4; d1 += 4) { + ${a?`let xValues = vec4( + getX(batch, xF, xR, xC, d1), + getX(batch, xF, xR, xC, d1 + 1), + getX(batch, xF, xR, xC, d1 + 2), + getX(batch, xF, xR, xC, d1 + 3)); + `:`let xValues = vec4( + getX(batch, d1, xF, xR, xC), + getX(batch, d1 + 1, xF, xR, xC), + getX(batch, d1 + 2, xF, xR, xC), + getX(batch, d1 + 3, xF, xR, xC)); + `} + let wValues = vec4( + getW(d2, d1, wF, wR, wC), + getW(d2, d1 + 1, wF, wR, wC), + getW(d2, d1 + 2, wF, wR, wC), + getW(d2, d1 + 3, wF, wR, wC)); + value += dot(xValues, wValues); + } + if (inputDepthVec4Remainder == 1) { + ${a?`value += getX(batch, xF, xR, xC, inputDepthNearestVec4) + * getW(d2, inputDepthNearestVec4, wF, wR, wC);`:`value += getX(batch, inputDepthNearestVec4, xF, xR, xC) + * getW(d2, inputDepthNearestVec4, wF, wR, wC);`} + } else if (inputDepthVec4Remainder == 2) { + ${a?`let xValues = vec2( + getX(batch, xF, xR, xC, inputDepthNearestVec4), + getX(batch, xF, xR, xC, inputDepthNearestVec4 + 1)); + `:`let xValues = vec2( + getX(batch, inputDepthNearestVec4, xF, xR, xC), + getX(batch, inputDepthNearestVec4 + 1, xF, xR, xC)); + `} + let wValues = vec2( + getW(d2, inputDepthNearestVec4, wF, wR, wC), + getW(d2, inputDepthNearestVec4 + 1, wF, wR, wC)); + value += dot(xValues, wValues); + } else if (inputDepthVec4Remainder == 3) { + ${a?`let xValues = vec3( + getX(batch, xF, xR, xC, inputDepthNearestVec4), + getX(batch, xF, xR, xC, inputDepthNearestVec4 + 1), + getX(batch, xF, xR, xC, inputDepthNearestVec4 + 2)); + `:`let xValues = vec3( + getX(batch, inputDepthNearestVec4, xF, xR, xC), + getX(batch, inputDepthNearestVec4 + 1, xF, xR, xC), + getX(batch, inputDepthNearestVec4 + 2, xF, xR, xC)); + `} + let wValues = vec3( + getW(d2, inputDepthNearestVec4, wF, wR, wC), + getW(d2, inputDepthNearestVec4 + 1, wF, wR, wC), + getW(d2, inputDepthNearestVec4 + 2, wF, wR, wC)); + value += dot(xValues, wValues); + } + } + } + } + ${R?"value = value + getBiasByOutputCoords(coords)":""}; + ${Et} + result[global_idx] = f32(value); + }`};return{name:"Conv3DNaive",shaderCache:{hint:`${t.cacheKey};${a};${C};${R}`,inputDependencies:B},getRunData:()=>({outputs:[{dims:s,dataType:e[0].dataType}],dispatchGroup:{x:h[0],y:h[1],z:h[2]},programUniforms:k}),getShaderSource:z}}}),du,cu,pu=y(()=>{Ot(),$t(),qt(),en(),du=(e,t,s,n)=>{let i=e.length>2,o=i?"value += b[output_channel];":"",a=e[0].dims,c=e[1].dims,p=t.format==="NHWC",h=p?s[3]:s[1],C=h/t.group,u=p&&C>=4?Gt(h):1,k=De.size(s)/u,B=[{type:12,data:k},{type:12,data:t.dilations},{type:12,data:[t.strides[0],t.strides[1]]},{type:12,data:[t.pads[0],t.pads[1]]},{type:12,data:C}];Zr(t,B),B.push(...Mt(a,[c[0],c[1],c[2],c[3]/u]));let R=i?["rank","rank","rank"]:["rank","rank"];B.push(...Mt([s[0],s[1],s[2],s[3]/u]));let z=ne=>{let J=Ct("output",e[0].dataType,s.length,u),W=ds(J.type.tensor),ue=Vr(t,J.type.value,W),he=He("x",e[0].dataType,a.length),be=He("w",e[1].dataType,c.length,u),Be=[he,be];i&&Be.push(He("b",e[2].dataType,e[2].dims,u));let Ie=[{name:"output_size",type:"u32"},{name:"dilations",type:"u32",length:t.dilations.length},{name:"strides",type:"u32",length:2},{name:"pads",type:"u32",length:2},{name:"output_channels_per_group",type:"u32"}];Ur(t,Ie);let nt=p?` + for (var wHeight: u32 = 0u; wHeight < uniforms.w_shape[0]; wHeight++) { + let xHeight = xRCCorner.x + wHeight * uniforms.dilations[0]; + + if (xHeight < 0u || xHeight >= uniforms.x_shape[1]) { + continue; + } + + for (var wWidth: u32 = 0u; wWidth < uniforms.w_shape[1]; wWidth++) { + let xWidth = xRCCorner.y + wWidth * uniforms.dilations[1]; + if (xWidth < 0u || xWidth >= uniforms.x_shape[2]) { + continue; + } + + for (var wInChannel: u32 = 0u; wInChannel < uniforms.w_shape[2]; wInChannel++) { + let input_channel = in_channel_offset + wInChannel; + let xVal = ${he.get("batch","xHeight","xWidth","input_channel")}; + let wVal = ${be.get("wHeight","wWidth","wInChannel","output_channel")}; + value += xVal * wVal; + } + } + } + `:` + for (var wInChannel: u32 = 0u; wInChannel < uniforms.w_shape[1]; wInChannel++) { + let input_channel = in_channel_offset + wInChannel; + for (var wHeight: u32 = 0u; wHeight < uniforms.w_shape[2]; wHeight++) { + let xHeight = xRCCorner.x + wHeight * uniforms.dilations[0]; + + if (xHeight < 0u || xHeight >= uniforms.x_shape[2]) { + continue; + } + + for (var wWidth: u32 = 0u; wWidth < uniforms.w_shape[3]; wWidth++) { + let xWidth = xRCCorner.y + wWidth * uniforms.dilations[1]; + if (xWidth < 0u || xWidth >= uniforms.x_shape[3]) { + continue; + } + + let xVal = ${he.get("batch","input_channel","xHeight","xWidth")}; + let wVal = ${be.get("output_channel","wInChannel","wHeight","wWidth")}; + value += xVal * wVal; + } + } + } + `;return` + ${ne.registerUniforms(Ie).declareVariables(...Be,J)} + + ${ne.mainStart()} + ${ne.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + + let outputIndices = ${J.offsetToIndices("global_idx")}; + let batch: u32 = outputIndices[0]; + let output_channel: u32 = outputIndices[${p?3:1}]; + let xRCCorner: vec2 = vec2(outputIndices[${p?1:2}], outputIndices[${p?2:3}]) * uniforms.strides - uniforms.pads; + let group_id: u32 = output_channel * ${u} / uniforms.output_channels_per_group; + var in_channel_offset = group_id * uniforms.w_shape[${p?2:1}]; + + var value: ${J.type.value} = ${J.type.value}(0); + ${nt} + ${o} + ${ue} + ${J.setByOffset("global_idx","value")} + }`};return{name:"GroupedConv",shaderCache:{hint:`${t.cacheKey}_${u}`,inputDependencies:R},getRunData:()=>({outputs:[{dims:n?n(s):s,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(k/64)},programUniforms:B}),getShaderSource:z}},cu=(e,t,s,n)=>{let i=e.length>2,o=Gt(s[3]),a=Gt(s[2]),c=De.size(s)/o/a,p=[e[0].dims[0],e[0].dims[1],e[0].dims[2],e[0].dims[3]/o],h=[e[1].dims[0],e[1].dims[1],e[1].dims[2],e[1].dims[3]/o],C=[s[0],s[1],s[2],s[3]/o],u=[{type:12,data:c},{type:6,data:[t.strides[0],t.strides[1]]},{type:6,data:[t.pads[0],t.pads[1]]}];Zr(t,u),u.push(...Mt(p,h,C));let k=(a-1)*t.strides[1]+h[1],B=R=>{let z=Ct("output",e[0].dataType,C.length,o),ne=ds(z.type.tensor),J=Vr(t,z.type.value,ne),W=He("x",e[0].dataType,p.length,o),ue=He("w",e[1].dataType,h.length,o),he=[W,ue];i&&he.push(He("b",e[2].dataType,e[2].dims,o));let be=i?"value += b[output_channel];":"",Be=[{name:"output_size",type:"u32"},{name:"strides",type:"i32",length:2},{name:"pads",type:"i32",length:2}];return Ur(t,Be),` + ${R.registerUniforms(Be).declareVariables(...he,z)} + ${R.mainStart()} + ${R.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let width0 = uniforms.output_shape[3]; + let output_channel = global_idx % width0; + var index1 = global_idx / width0; + let width1 = uniforms.output_shape[2] / ${a}u; + let col = (index1 % width1) * ${a}u; + index1 = index1 / width1; + let row = index1 % uniforms.output_shape[1]; + let batch = index1 / uniforms.output_shape[1]; + + let x_corner = vec2(i32(row), i32(col)) * uniforms.strides - uniforms.pads; + + var x_vals: array<${W.type.value}, ${k}>; + var values: array<${z.type.value}, ${a}>; + let input_channel = output_channel; + // Use constant instead of uniform can give better performance for w's height/width. + for (var w_height: u32 = 0u; w_height < ${h[0]}; w_height++) { + let x_height = x_corner.x + i32(w_height); + if (x_height >= 0 && u32(x_height) < uniforms.x_shape[1]) { + for (var i = 0; i < ${k}; i++) { + let x_width = x_corner.y + i; + if (x_width >= 0 && u32(x_width) < uniforms.x_shape[2]) { + x_vals[i] = ${W.get("batch","u32(x_height)","u32(x_width)","input_channel")}; + } else { + x_vals[i] = ${W.type.value}(0); + } + } + for (var w_width: u32 = 0u; w_width < ${h[1]}; w_width++) { + let w_val = ${ue.get("w_height","w_width","0","output_channel")}; + for (var i = 0u; i < ${a}u; i++) { + values[i] = fma(x_vals[i * u32(uniforms.strides[1]) + w_width], w_val, values[i]); + } + } + } + } + + for (var i = 0u; i < ${a}u; i++) { + var value = values[i]; + ${be} + ${J} + ${z.set("batch","row","col + i","output_channel","value")}; + } + }`};return{name:"GroupedConv-Vectorize",shaderCache:{hint:`${t.cacheKey};${o};${a};${k};${h[0]};${h[1]}`,inputDependencies:i?["rank","rank","type"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:n?n(s):s,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(c/64)},programUniforms:u}),getShaderSource:B}}}),hu,ci,Bo,pi,Ro,No,mu,jo,Vo,Mc=y(()=>{$t(),wc(),yc(),Fo(),pu(),en(),ko(),jr(),hu=(e,t,s,n,i,o)=>{let a=e[0],c=e.slice(o?1:2,o?3:4),p=c.length,h=t[0],C=t.slice(2).map((k,B)=>k+(k-1)*(s[B]-1)),u=c.map((k,B)=>k+n[B]+n[B+p]).map((k,B)=>Math.floor((k-C[B]+i[B])/i[B]));return u.splice(0,0,a),u.splice(o?3:1,0,h),u},ci=[2,3,1,0],Bo=(e,t)=>{if(!e||e.length!==2&&e.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(e[0].dims.length>5)throw new Error("greater than 5D is not supported");if(e[0].dims.length!==e[1].dims.length)throw new Error("filter does not have same dimension as input");let s=e[0].dims[t.format==="NHWC"?e[0].dims.length-1:1],n=e[1].dims[1]*t.group;if(s!==n)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");if(e.length===3&&(e[2].dims.length!==1||e[1].dims[0]!==e[2].dims[0]))throw new Error("invalid bias");let i=e[0].dims.length-2;if(t.dilations.length!==i)throw new Error(`dilations should be ${i}D`);if(t.strides.length!==i)throw new Error(`strides should be ${i}D`);if(t.pads.length!==i*2)throw new Error(`pads should be ${i*2}D`);if(t.kernelShape.length!==0&&t.kernelShape.length!==e[1].dims.length-2)throw new Error("invalid kernel shape")},pi=(e,t)=>{let s=e.kernelShape.slice();s.length{let t=To(e),s=e.format,n=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][e.auto_pad],i=e.dilations,o=e.group,a=e.kernel_shape,c=e.pads,p=e.strides,h=e.w_is_const();return{autoPad:n,format:s,dilations:i,group:o,kernelShape:a,pads:c,strides:p,wIsConst:h,...t,cacheKey:`${e.format};${t.activation};`}},No=(e,t,s,n)=>{let i=s.format==="NHWC",o=hu(t[0].dims,t[1].dims,s.dilations,s.pads,s.strides,i);if(s.group!==1){let Be=[t[0]];if(i){let Ie=e.kernelCustomData.wT??e.compute(cr(t[1],ci),{inputs:[1],outputs:[s.wIsConst?-2:-1]})[0];s.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=Ie),Be.push(Ie)}else Be.push(t[1]);t.length===3&&Be.push(t[2]),!e.adapterInfo.isArchitecture("ampere")&&i&&t[1].dims[0]===s.group&&t[1].dims[1]===1&&s.dilations[0]===1&&s.dilations[1]===1?e.compute(cu(Be,s,o,n),{inputs:Be}):e.compute(du(Be,s,o,n),{inputs:Be});return}let a=t.length===3,c=t[0].dims[i?1:2],p=t[0].dims[i?2:3],h=t[0].dims[i?3:1],C=t[1].dims[2],u=t[1].dims[3],k=o[i?1:2],B=o[i?2:3],R=o[i?3:1],z=i&&C===c&&u===p&&s.pads[0]===0&&s.pads[1]===0;if(z||C===1&&u===1&&s.dilations[0]===1&&s.dilations[1]===1&&s.strides[0]===1&&s.strides[1]===1&&s.pads[0]===0&&s.pads[1]===0){let Be=o[0],Ie,nt,dt,Et=[];if(i){let ht=e.kernelCustomData.wT??e.compute(cr(t[1],ci),{inputs:[1],outputs:[s.wIsConst?-2:-1]})[0];if(s.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=ht),z){let Jt=c*p*h;Ie=t[0].reshape([1,Be,Jt]),nt=ht.reshape([1,Jt,R]),dt=[1,Be,R]}else Ie=t[0].reshape([Be,c*p,h]),nt=ht.reshape([1,h,R]),dt=[Be,k*B,R];Et.push(Ie),Et.push(nt)}else Ie=t[0].reshape([Be,h,c*p]),nt=t[1].reshape([1,R,h]),dt=[Be,R,k*B],Et.push(nt),Et.push(Ie);a&&Et.push(t[2]);let zt=dt[2],It=Et[0].dims[Et[0].dims.length-1];zt<8&&It<8?e.compute(Co(Et,s,o,dt,i,n),{inputs:Et}):e.compute(ui(Et,s,o,dt,i,n),{inputs:Et});return}let ne=!0,J=e.kernelCustomData.wT??e.compute(cr(t[1],ci),{inputs:[1],outputs:[s.wIsConst?-2:-1]})[0];s.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=J);let W=[t[0],J];a&&W.push(t[2]);let ue=i?k*B:R,he=i?R:k*B,be=C*u*h;e.compute(ou(W,s,o,ue,he,be,a,ne,n),{inputs:W})},mu=(e,t)=>{let s=t.format==="NHWC",n=[e.inputs[0].reshape(s?[e.inputs[0].dims[0],1,e.inputs[0].dims[1],e.inputs[0].dims[2]]:[e.inputs[0].dims[0],e.inputs[0].dims[1],1,e.inputs[0].dims[2]]),e.inputs[1].reshape([e.inputs[1].dims[0],e.inputs[1].dims[1],1,e.inputs[1].dims[2]])];e.inputs.length===3&&n.push(e.inputs[2]);let i=[0,t.pads[0],0,t.pads[1]],o=[1].concat(t.strides),a=[1].concat(t.dilations),c=[1].concat(t.kernelShape),p=pi({...t,pads:i,strides:o,dilations:a,kernelShape:c},n);No(e,n,p,h=>s?[h[0],h[2],h[3]]:[h[0],h[1],h[3]])},jo=(e,t,s)=>{let n=s.format==="NHWC"?"channelsLast":"channelsFirst",i=pi(s,t),o=s.autoPad==="NOTSET"?s.pads:s.autoPad,a=lu(t[0].dims,t[1].dims,s.strides,s.dilations,o,!1,n);e.compute(uu(t,i,a.outShape,[a.filterDepth,a.filterHeight,a.filterWidth],[a.padInfo.front,a.padInfo.top,a.padInfo.left],n))},Vo=(e,t)=>{if(Bo(e.inputs,t),e.inputs[0].dims.length===3)mu(e,t);else if(e.inputs[0].dims.length===5)jo(e,e.inputs,t);else{let s=pi(t,e.inputs);No(e,e.inputs,s)}}}),Uo,bc=y(()=>{Ot(),Te(),$t(),qt(),Uo=(e,t,s)=>{let n=e.length>2,i=t.outputShape,o=t.format==="NHWC",a=t.group,c=e[1].dims,p=c[2]/a,h=c[3],C=o?Gt(p):1,u=o?Gt(h):1,k=o?h===1?C:u:1,B=De.size(i)/u,R=[Math.ceil(B/64),1,1];as("verbose",()=>`[conv2d_backprop_webgpu] dispatch = ${R}`);let z=["rank","rank"],ne=[t.strides[0],t.strides[1]],J=[t.kernelShape[o?1:2],t.kernelShape[o?2:3]],W=[t.dilations[0],t.dilations[1]],ue=[J[0]+(t.dilations[0]<=1?0:(t.kernelShape[o?1:2]-1)*(t.dilations[0]-1)),J[1]+(t.dilations[1]<=1?0:(t.kernelShape[o?2:3]-1)*(t.dilations[1]-1))],he=[ue[0]-1-Math.floor((t.pads[0]+t.pads[2])/2),ue[1]-1-Math.floor((t.pads[1]+t.pads[3])/2)],be=[{type:12,data:B},{type:12,data:ne},{type:12,data:J},{type:12,data:W},{type:12,data:ue},{type:6,data:he},{type:12,data:p},{type:12,data:h},...Mt(e[0].dims,e[1].dims)];n&&(be.push(...Mt(e[2].dims)),z.push("rank")),be.push(...Mt(i));let Be=Ie=>{let nt=[{name:"output_size",type:"u32"},{name:"strides",type:"u32",length:ne.length},{name:"filter_dims",type:"u32",length:J.length},{name:"dilations",type:"u32",length:J.length},{name:"effective_filter_dims",type:"u32",length:ue.length},{name:"pads",type:"i32",length:he.length},{name:"input_channels_per_group",type:"u32"},{name:"output_channels_per_group",type:"u32"}],dt=ds(e[0].dataType),Et=o?1:2,zt=o?2:3,It=o?3:1,ht=He("W",e[1].dataType,e[1].dims.length,k),Jt=He("Dy",e[0].dataType,e[0].dims.length,C),Vt=[Jt,ht];n&&Vt.push(He("bias",e[2].dataType,[i[It]].length,u));let St=Ct("result",e[0].dataType,i.length,u),ts=()=>{let Ut="";if(C===1)Ut+=` + let w_offset = ${ht.indicesToOffset(`${ht.type.indices}(u32(wRPerm), u32(wCPerm), inputChannel, wOutChannel)`)}; + let wValue = ${ht.getByOffset(`w_offset / ${k}`)}; + dotProd = dotProd + xValue * wValue;`;else if(h===1)Ut+=` + let wValue = ${ht.getByOffset(`${ht.indicesToOffset(`${ht.type.indices}(u32(wRPerm), u32(wCPerm), inputChannel, wOutChannel)`)} / ${k}`)}; + dotProd = dotProd + dot(xValue, wValue);`;else for(let $s=0;$s(i32(r), i32(c)) - uniforms.pads; + let dyRCorner = dyCorner.x; + let dyCCorner = dyCorner.y; + let groupId = d1 / uniforms.output_channels_per_group; + let wOutChannel = d1 - groupId * uniforms.output_channels_per_group; + // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1). + // ? = to be determined. : = across all values in that axis. + var dotProd = ${St.type.value}(0.0); + for (var wR: u32 = 0; wR < uniforms.effective_filter_dims.x; wR = wR + 1) { + if (wR % uniforms.dilations.x != 0) { + continue; + } + let dyR = (${dt}(dyRCorner) + ${dt}(wR)) / ${dt}(uniforms.strides[0]); + let wRPerm = uniforms.filter_dims.x - 1 - wR / uniforms.dilations.x; + if (dyR < 0.0 || dyR >= ${dt}(uniforms.Dy_shape[${Et}]) || fract(dyR) > 0.0 || + wRPerm < 0) { + continue; + } + wR = wR + uniforms.strides[0] - 1; + let idyR: u32 = u32(dyR); + + for (var wC: u32 = 0; wC < uniforms.effective_filter_dims.y; wC = wC + 1) { + if (wC % uniforms.dilations.y != 0) { + continue; + } + let dyC = (${dt}(dyCCorner) + ${dt}(wC)) / ${dt}(uniforms.strides.y); + let wCPerm = uniforms.filter_dims.y - 1 - wC / uniforms.dilations.y; + if (dyC < 0.0 || dyC >= ${dt}(uniforms.Dy_shape[${zt}]) || + fract(dyC) > 0.0 || wCPerm < 0) { + continue; + } + wC = wC + uniforms.strides.y - 1; + let idyC: u32 = u32(dyC); + var inputChannel = groupId * uniforms.input_channels_per_group; + for (var d2: u32 = 0; d2 < uniforms.input_channels_per_group; d2 = d2 + ${C}) { + let xValue = ${o?Jt.getByOffset(`${Jt.indicesToOffset(`${Jt.type.indices}(batch, idyR, idyC, inputChannel)`)} / ${C}`):Jt.get("batch","inputChannel","idyR","idyC")}; + ${ts()} + inputChannel = inputChannel + ${C}; + } + } + } + let value = dotProd${n?` + bias[d1 / ${u}]`:""}; + ${St.setByOffset("global_idx","value")}; + `;return` + ${Ie.registerUniforms(nt).declareVariables(...Vt,St)} + ${Ie.mainStart()} + ${Ie.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}; + ${Xt}}`};return{name:"ConvTranspose2D",shaderCache:{hint:`${t.cacheKey};${C}${k}${u}${h===1}`,inputDependencies:z},getRunData:()=>({dispatchGroup:{x:R[0],y:R[1],z:R[2]},outputs:[{dims:s?s(i):i,dataType:e[0].dataType}],programUniforms:be}),getShaderSource:Be}}}),fu,Wo,_u,Go,Ko,gu,Ho,wu,yu,Mu=y(()=>{bc(),en(),jr(),fu=(e,t,s,n,i,o)=>(e-1)*t+s+(n-1)*i+1-o,Wo=(e,t,s,n,i)=>{let o=Math.floor(e/2);t==="SAME_UPPER"?(s[n]=o,s[i]=e-o):t==="SAME_LOWER"&&(s[n]=e-o,s[i]=o)},_u=(e,t,s,n,i,o,a,c,p,h)=>{let C=e.length-2,u=h.length===0;p.length{let s=e.kernelShape.slice();if(e.kernelShape.length===0||e.kernelShape.reduce((u,k)=>u*k,1)===0){s.length=0;for(let u=2;uu+k,0)===0){let u=t[0].dims.length-2;p=new Array(u).fill(1)}let h=e.strides.slice();if(h.reduce((u,k)=>u+k,0)===0){let u=t[0].dims.length-2;h=new Array(u).fill(1)}_u(c,s,p,e.autoPad,e.group,i,h,n,a,o);let C=Object.assign({},e);return Object.assign(C,{kernelShape:s,pads:i,outputPadding:a,outputShape:o,dilations:p,strides:h}),C},Ko=e=>{let t=To(e),s=e.format,n=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][typeof e.autoPad>"u"?0:e.autoPad],i=e.dilations,o=e.group,a=e.kernelShape,c=e.pads,p=e.strides,h=e.wIsConst(),C=e.outputPadding,u=e.outputShape;return{autoPad:n,format:s,dilations:i,group:o,kernelShape:a,outputPadding:C,outputShape:u,pads:c,strides:p,wIsConst:h,...t,cacheKey:`${e.format};${t.activation};`}},gu=(e,t)=>{if(!e||e.length!==2&&e.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(e[0].dims.length!==4&&e[0].dims.length!==3)throw new Error("currently only support 2-dimensional conv");if(e[0].dims.length!==e[1].dims.length)throw new Error("filter does not have same dimension as input");let s=e[0].dims[t.format==="NHWC"?e[0].dims.length-1:1],n=e[1].dims[0];if(s!==n)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");let i=e[1].dims[1]*t.group;if(e.length===3&&(e[2].dims.length!==1||e[2].dims[0]!==i))throw new Error("invalid bias");let o=e[0].dims.length-2;if(t.dilations.reduce((a,c)=>a+c,0)>0&&t.dilations.length!==o)throw new Error(`dilations should be ${o}D`);if(t.strides.reduce((a,c)=>a+c,0)>0&&t.strides.length!==o)throw new Error(`strides should be ${o}D`);if(t.pads.reduce((a,c)=>a+c,0)>0&&t.pads.length!==o*2)throw new Error(`pads should be ${o*2}D`);if(t.outputPadding.length!==o&&t.outputPadding.length!==0)throw new Error(`output_padding should be ${o}D`);if(t.kernelShape.reduce((a,c)=>a+c,0)>0&&t.kernelShape.length!==0&&t.kernelShape.length!==e[1].dims.length-2)throw new Error("invalid kernel shape");if(t.outputShape.length!==0&&t.outputShape.length!==e[0].dims.length-2)throw new Error("invalid output shape")},Ho=(e,t,s,n)=>{let i=e.kernelCustomData.wT??e.compute(cr(t[1],[2,3,0,1]),{inputs:[1],outputs:[s.wIsConst?-2:-1]})[0];s.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=i);let o=[t[0],i];t.length===3&&o.push(t[2]),e.compute(Uo(o,s,n),{inputs:o})},wu=(e,t)=>{let s=t.format==="NHWC",n=[e.inputs[0].reshape(s?[e.inputs[0].dims[0],1,e.inputs[0].dims[1],e.inputs[0].dims[2]]:[e.inputs[0].dims[0],e.inputs[0].dims[1],1,e.inputs[0].dims[2]]),e.inputs[1].reshape([e.inputs[1].dims[0],e.inputs[1].dims[1],1,e.inputs[1].dims[2]])];e.inputs.length===3&&n.push(e.inputs[2]);let i=t.kernelShape;(i.length===0||i[0]===0)&&(i=[e.inputs[1].dims[2]]);let o=t.dilations;(o.length===0||o[0]===0)&&(o=[1]);let a=t.strides;(a.length===0||a[0]===0)&&(a=[1]);let c=t.pads;c.length===0&&(c=[0,0]),c=[0,c[0],0,c[1]],a=[1].concat(a),o=[1].concat(o),i=[1].concat(i);let p=Go({...t,pads:c,strides:a,dilations:o,kernelShape:i},n);Ho(e,n,p,h=>s?[h[0],h[2],h[3]]:[h[0],h[1],h[3]])},yu=(e,t)=>{if(gu(e.inputs,t),e.inputs[0].dims.length===3)wu(e,t);else{let s=Go(t,e.inputs);Ho(e,e.inputs,s)}}}),bu,vu,xu,vc=y(()=>{Ot(),$t(),is(),qt(),bu=(e,t,s,n)=>{let i=De.size(t),o=t.length,a=He("input",e,o),c=Ct("output",e,o),p=s.dataType===6?s.getInt32Array()[0]:Number(s.getBigInt64Array()[0]),h=De.normalizeAxis(p,o),C=u=>{let k=` i32(${a.indicesGet("inputIndices","uniforms.axis")}) `,B=Tt("uniforms.input_shape","uniforms.axis",o),R=n.reverse?k+(n.exclusive?" + 1":""):"0",z=n.reverse?B:k+(n.exclusive?"":" + 1");return` + ${u.registerUniform("outputSize","u32").registerUniform("axis","u32").declareVariables(a,c)} + ${u.mainStart()} + ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + var inputIndices = ${c.offsetToIndices("global_idx")}; + var sum = ${c.type.value}(0); + let first : i32 = ${R}; + let last : i32 = ${z}; + for (var i : i32 = first; i < last; i++) { + ${a.indicesSet("inputIndices","uniforms.axis","u32(i)")}; + sum = sum + ${a.getByIndices("inputIndices")}; + } + ${c.setByOffset("global_idx","sum")}; + }`};return{name:"CumSum",shaderCache:{hint:n.cacheKey,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:t,dataType:e}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:[{type:12,data:i},{type:12,data:h},...Mt(t,t)]}),getShaderSource:C}},vu=(e,t)=>{let s=e.inputs[0].dims,n=e.inputs[0].dataType,i=e.inputs[1];e.compute(bu(n,s,i,t),{inputs:[0]})},xu=e=>{let t=e.exclusive===1,s=e.reverse===1;return jt({exclusive:t,reverse:s})}}),Tu,Pu,qo,Eu,Cu,ku=y(()=>{Ot(),$t(),is(),qt(),Tu=e=>{if(!e||e.length!==1)throw new Error("DepthToSpace requires 1 input.");if(e[0].dims.length!==4)throw new Error("DepthToSpace requires 4D input.")},Pu=(e,t,s,n)=>{let i=[];i.push(`fn perm(i: ${n.type.indices}) -> ${s.type.indices} { + var a: ${s.type.indices};`);for(let o=0;o{let s,n,i,o,a,c,p=t.format==="NHWC",h=t.blocksize,C=t.mode==="DCR";p?([s,n,i,o]=e.dims,a=C?[s,n,i,h,h,o/h**2]:[s,n,i,o/h**2,h,h],c=C?[0,1,3,2,4,5]:[0,1,4,2,5,3]):([s,n,i,o]=[e.dims[0],e.dims[2],e.dims[3],e.dims[1]],a=C?[s,h,h,o/h**2,n,i]:[s,o/h**2,h,h,n,i],c=C?[0,3,4,1,5,2]:[0,1,4,2,5,3]);let u=e.reshape(a),k=u.dims.length,B=e.dataType,R=He("a",B,k),z=Ct("output",B,k),ne=J=>` + ${J.registerUniform("output_size","u32").declareVariables(R,z)} + + ${Pu(c,k,R,z)} + + ${J.mainStart()} + ${J.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + + let indices = ${z.offsetToIndices("global_idx")}; + let aIndices = perm(indices); + + ${z.setByOffset("global_idx",R.getByIndices("aIndices"))} + }`;return{name:"DepthToSpace",shaderCache:{hint:`${e.dims};${t.blocksize};${t.mode}`,inputDependencies:["rank"]},getRunData:J=>{let W=p?[s,n*h,i*h,o/h**2]:[s,o/h**2,n*h,i*h],ue=De.size(W),he=u.dims,be=De.sortBasedOnPerm(he,c);return{outputs:[{dims:W,dataType:J[0].dataType}],dispatchGroup:{x:Math.ceil(ue/64)},programUniforms:[{type:12,data:ue},...Mt(he,be)]}},getShaderSource:ne}},Eu=(e,t)=>{Tu(e.inputs),e.compute(qo(e.inputs[0],t))},Cu=e=>jt({blocksize:e.blocksize,mode:e.mode,format:e.format})}),hi,Nn,Sr,Su,$u,Au,Iu,mi,Fu,Ou,Du,xc=y(()=>{Ot(),$t(),is(),qt(),hi="[a-zA-Z]|\\.\\.\\.",Nn="("+hi+")+",Sr="^"+Nn+"$",Su="("+Nn+",)*"+Nn,$u="^"+Su+"$",Au=class{constructor(e=-1){this.symbolToIndices=new Map,this.inputIndex=e}addSymbol(e,t){let s=this.symbolToIndices.get(e);s===void 0?s=[t]:s.push(t),this.symbolToIndices.set(e,s)}},Iu=class{constructor(e,t){this.equation=t,this.hasEllipsis=!1,this.symbolToInfo=new Map,this.lhs=new Array,this.outputDims=[];let[s,n]=t.includes("->")?t.split("->",2):[t,""];if(!s.match(RegExp($u)))throw new Error("Invalid LHS term");if(s.split(",").forEach((i,o)=>{let a=e[o].dims.slice();if(!i.match(RegExp(Sr)))throw new Error("Invalid LHS term");let c=this.processTerm(i,!0,a,o);this.lhs.push(c)}),n==="")n+=[...this.symbolToInfo.entries()].filter(([i,o])=>o.count===1||i==="...").map(([i])=>i).join("");else if(!n.match(RegExp(Nn)))throw new Error("Invalid RHS");n.match(RegExp(hi,"g"))?.forEach(i=>{if(i==="...")this.outputDims=this.outputDims.concat(this.ellipsisDims);else{let o=this.symbolToInfo.get(i);if(o===void 0)throw new Error("Invalid RHS symbol");this.outputDims.push(o.dimValue)}}),this.rhs=this.processTerm(n,!1,this.outputDims)}addSymbol(e,t,s){let n=this.symbolToInfo.get(e);if(n!==void 0){if(n.dimValue!==t&&n.count!==1)throw new Error("Dimension mismatch");n.count++,n.inputIndices.push(s)}else n={count:1,dimValue:t,inputIndices:[s]};this.symbolToInfo.set(e,n)}processTerm(e,t,s,n=-1){let i=s.length,o=!1,a=[],c=0;if(!e.match(RegExp(Sr))&&!t&&e!=="")throw new Error("Invalid LHS term");let p=e.match(RegExp(hi,"g")),h=new Au(n);return p?.forEach((C,u)=>{if(C==="..."){if(o)throw new Error("Only one ellipsis is allowed per input term");o=!0;let k=i-p.length+1;if(k<0)throw new Error("Ellipsis out of bounds");if(a=s.slice(c,c+k),this.hasEllipsis){if(this.ellipsisDims.length!==a.length||this.ellipsisDims.toString()!==a.toString())throw new Error("Ellipsis dimensions mismatch")}else if(t)this.hasEllipsis=!0,this.ellipsisDims=a;else throw new Error("Ellipsis must be specified in the LHS");for(let B=0;Be+"_max",Fu=(e,t,s,n)=>{let i=e.map(h=>h.length).map((h,C)=>He(`input${C}`,t,h)),o=De.size(n),a=Ct("output",t,n.length),c=[...s.symbolToInfo.keys()].filter(h=>!s.rhs.symbolToIndices.has(h)),p=h=>{let C=[],u="var prod = 1.0;",k="var sum = 0.0;",B="sum += prod;",R=[],z=[],ne=[],J=[],W=s.symbolToInfo.size===s.rhs.symbolToIndices.size;s.symbolToInfo.forEach((he,be)=>{if(s.rhs.symbolToIndices.has(be)){let Be=s.rhs.symbolToIndices.get(be)?.[0];Be!==void 0&&s.lhs.forEach((Ie,nt)=>{if(he.inputIndices.includes(nt)){let dt=Ie.symbolToIndices.get(be);if(dt===void 0)throw new Error("Invalid symbol error");dt.forEach(Et=>{C.push(`${i[nt].indicesSet(`input${nt}Indices`,Et,a.indicesGet("outputIndices",Be))}`)})}})}else s.lhs.forEach((Be,Ie)=>{if(he.inputIndices.includes(Ie)){let nt=Be.symbolToIndices.get(be);if(nt===void 0)throw new Error("Invalid symbol error");nt.forEach(dt=>{R.push(`${i[Ie].indicesSet(`input${Ie}Indices`,dt,`${be}`)}`)}),J.push(`prod *= ${i[Ie].getByIndices(`input${Ie}Indices`)};`)}}),z.push(`for(var ${be}: u32 = 0; ${be} < uniforms.${mi(be)}; ${be}++) {`),ne.push("}")});let ue=W?[...C,`let sum = ${i.map((he,be)=>he.getByIndices(`input${be}Indices`)).join(" * ")};`]:[...C,k,...z,...R,u,...J,B,...ne];return` + ${h.registerUniforms(c.map(he=>({name:`${mi(he)}`,type:"u32"}))).registerUniform("outputSize","u32").declareVariables(...i,a)} + + ${h.mainStart()} + ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + var outputIndices = ${a.offsetToIndices("global_idx")}; + ${i.map((he,be)=>`var input${be}Indices: ${i[be].type.indices};`).join(` +`)} + ${ue.join(` +`)}; + ${a.setByOffset("global_idx","sum")}; + }`};return{name:"Einsum",shaderCache:{hint:s.equation,inputDependencies:e.map(()=>"rank")},getRunData:()=>{let h=c.filter(u=>s.symbolToInfo.has(u)).map(u=>({type:12,data:s.symbolToInfo.get(u)?.dimValue||0}));h.push({type:12,data:o});let C=e.map((u,k)=>[...Mt(u)]).reduce((u,k)=>u.concat(k),h);return C.push(...Mt(n)),{outputs:[{dims:n,dataType:t}],dispatchGroup:{x:Math.ceil(o/64)},programUniforms:C}},getShaderSource:p}},Ou=(e,t)=>{let s=new Iu(e.inputs,t.equation),n=s.outputDims,i=e.inputs.map((o,a)=>o.dims);e.compute(Fu(i,e.inputs[0].dataType,s,n))},Du=e=>{let t=e.equation.replace(/\s+/g,"");return jt({equation:t})}}),fi,Qo,Lu,zu,jn,Tc=y(()=>{Ot(),$t(),qt(),fi=e=>{if(!e||e.length!==2)throw new Error("Expand requires 2 input.");let t=e[0].dims,s=Array.from(e[1].getBigInt64Array(),Number),n=s.length{let s=e.length-t.length,n=[];for(let i=0;ie.length>t.length?Qo(e,t):Qo(t,e),zu=e=>{let t=e[0].dims,s=Array.from(e[1].getBigInt64Array(),Number),n=Lu(t,s),i=e[0].dataType,o=i===9||De.size(t)===1,a=i===9||t.length>0&&t[t.length-1]%4===0?4:1,c=o||n.length>0&&n[n.length-1]%4===0?4:1,p=Math.ceil(De.size(n)/c),h=u=>{let k=He("input",i,t.length,a),B=Ct("output",i,n.length,c),R;if(i===9){let z=(ne,J,W="")=>` + let outputIndices${J} = ${B.offsetToIndices(`outputOffset + ${J}u`)}; + let offset${J} = ${k.broadcastedIndicesToOffset(`outputIndices${J}`,B)}; + let index${J} = offset${J} / 4u; + let component${J} = offset${J} % 4u; + ${ne}[${J}] = ${W}(${k.getByOffset(`index${J}`)}[component${J}]); + `;R=` + let outputOffset = global_idx * ${c}; + var data = vec4(0); + ${z("data",0,"u32")} + ${z("data",1,"u32")} + ${z("data",2,"u32")} + ${z("data",3,"u32")} + ${B.setByOffset("global_idx","data")} + }`}else R=` + let outputIndices = ${B.offsetToIndices(`global_idx * ${c}`)}; + let inputOffset = ${k.broadcastedIndicesToOffset("outputIndices",B)}; + let data = ${B.type.value}(${k.getByOffset(`inputOffset / ${a}`)}); + ${B.setByOffset("global_idx","data")} + }`;return` + ${u.registerUniform("vec_size","u32").declareVariables(k,B)} + ${u.mainStart()} + ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} + ${R}`},C=[{type:12,data:p},...Mt(t,n)];return{name:"Expand",shaderCache:{hint:`${n.length};${a}${c}`,inputDependencies:["rank"]},getShaderSource:h,getRunData:()=>({outputs:[{dims:n,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:C})}},jn=e=>{fi(e.inputs),e.compute(zu(e.inputs),{inputs:[0]})}}),Bu,Ru,Pc=y(()=>{Ot(),$t(),qt(),wo(),Bu=e=>{let t=e[0].dataType,s=De.size(e[0].dims),n=De.size(e[1].dims),i=n%4===0,o=a=>{let c=He("x",t,[1],4),p=He("bias",t,[1],4),h=Ct("y",t,[1],4),C=[{name:"output_vec_size",type:"u32"},{name:"bias_size",type:"u32"}],u=B=>` + let bias${B}_offset: u32 = (global_idx * 4 + ${B}) % uniforms.bias_size; + let bias${B} = ${p.getByOffset(`bias${B}_offset / 4`)}[bias${B}_offset % 4];`,k=i?` + let bias = ${p.getByOffset("global_idx % (uniforms.bias_size / 4)")};`:`${u(0)}${u(1)}${u(2)}${u(3)} + let bias = ${c.type.value}(bias0, bias1, bias2, bias3);`;return`${a.registerUniforms(C).declareVariables(c,p,h)} + + ${oi(Cs(t))} + + ${a.mainStart(sr)} + ${a.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_vec_size")} + + let x = ${c.getByOffset("global_idx")}; + ${k} + let x_in = x + bias; + ${h.setByOffset("global_idx",_o("x_in"))} + }`};return{name:"FastGeluWithBias",shaderCache:{hint:`${i}`,inputDependencies:["type","type"]},getShaderSource:o,getRunData:a=>({outputs:[{dims:a[0].dims,dataType:a[0].dataType}],programUniforms:[{type:12,data:Math.ceil(s/4)},{type:12,data:n}],dispatchGroup:{x:Math.ceil(s/sr/4)}})}},Ru=e=>{e.inputs.length<2||De.size(e.inputs[1].dims)===0?Ll(e):e.compute(Bu(e.inputs))}}),_i,Nu,ju,Vu,Bp=y(()=>{Ot(),$t(),is(),qt(),_i=e=>{if(!e||e.length!==2)throw new Error("Gather requires 2 inputs.")},Nu=(e,t)=>{let s=e[0].dims,n=e[1].dims,i=s.length,o=De.normalizeAxis(t.axis,i),a=s.slice(0);a.splice(o,1,...n);let c=s[o],p=e[0].dataType===9?4:1,h=Math.ceil(De.size(a)/p),C=[{type:12,data:h},{type:6,data:c},{type:12,data:o},...Mt(e[0].dims,e[1].dims,a)],u=k=>{let B=He("data",e[0].dataType,e[0].dims.length,p),R=He("inputIndices",e[1].dataType,e[1].dims.length),z=Ct("output",e[0].dataType,a.length,p),ne=W=>{let ue=n.length,he=`var indicesIndices${W} = ${R.type.indices}(0);`;for(let be=0;be1?`indicesIndices${W}[${be}]`:`indicesIndices${W}`} = ${a.length>1?`outputIndices${W}[uniforms.axis + ${be}]`:`outputIndices${W}`};`;he+=` + var idx${W} = ${R.getByIndices(`indicesIndices${W}`)}; + if (idx${W} < 0) { + idx${W} = idx${W} + uniforms.axisDimLimit; + } + var dataIndices${W} : ${B.type.indices}; + `;for(let be=0,Be=0;be1?`dataIndices${W}[${be}]`:`dataIndices${W}`} = u32(idx${W});`,Be+=ue):(he+=`${i>1?`dataIndices${W}[${be}]`:`dataIndices${W}`} = ${a.length>1?`outputIndices${W}[${Be}]`:`outputIndices${W}`};`,Be++);return he},J;if(e[0].dataType===9){let W=(ue,he,be="")=>` + let outputIndices${he} = ${z.offsetToIndices(`outputOffset + ${he}u`)}; + ${ne(he)}; + let offset${he} = ${B.indicesToOffset(`dataIndices${he}`)}; + let index${he} = offset${he} / 4u; + let component${he} = offset${he} % 4u; + ${ue}[${he}] = ${be}(${B.getByOffset(`index${he}`)}[component${he}]); + `;J=` + let outputOffset = global_idx * ${p}; + var value = vec4(0); + ${W("value",0,"u32")} + ${W("value",1,"u32")} + ${W("value",2,"u32")} + ${W("value",3,"u32")} + ${z.setByOffset("global_idx","value")} + `}else J=` + let outputIndices = ${z.offsetToIndices("global_idx")}; + ${ne("")}; + let value = ${B.getByIndices("dataIndices")}; + ${z.setByOffset("global_idx","value")}; + `;return` + ${k.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(B,R,z)} + ${k.mainStart()} + ${k.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + ${J} + }`};return{name:"Gather",shaderCache:{hint:t.cacheKey,inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:a,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(h/64)},programUniforms:C}),getShaderSource:u}},ju=e=>jt({axis:e.axis}),Vu=(e,t)=>{let s=e.inputs;_i(s),e.compute(Nu(e.inputs,t))}}),Uu,Wu,Gu,Vn=y(()=>{Ot(),$t(),qt(),Uu=(e,t,s,n,i,o,a,c,p)=>{let h=[{type:12,data:o},{type:12,data:n},{type:12,data:i},{type:12,data:s},{type:12,data:a},{type:12,data:c},{type:12,data:p}],C=[o];h.push(...Mt(t.dims,C));let u=k=>{let B=He("indices_data",t.dataType,t.dims.length),R=Ct("input_slice_offsets_data",12,1,1),z=[B,R],ne=[{name:"output_size",type:"u32"},{name:"batch_dims",type:"u32"},{name:"input_dims",type:"u32",length:i.length},{name:"sizes_from_slice_dims_data",type:"u32",length:s.length},{name:"num_slices_per_batch",type:"u32"},{name:"input_batch_stride",type:"u32"},{name:"num_slice_dims",type:"u32"}];return` + ${k.registerUniforms(ne).declareVariables(...z)} + ${k.mainStart()} + ${k.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let batch_idx = global_idx / uniforms.num_slices_per_batch; + let base_offset = batch_idx * uniforms.input_batch_stride; + + let slice_indices_base_offset = global_idx * uniforms.num_slice_dims; + var relative_slice_offset = 0; + for (var dim_idx = 0u; dim_idx < uniforms.num_slice_dims; dim_idx ++) { + var index = i32(indices_data[dim_idx + slice_indices_base_offset].x); + let input_dim_idx = uniforms.batch_dims + dim_idx; + if (index < 0) { + ${i.length===1?"index += i32(uniforms.input_dims);":"index += i32(uniforms.input_dims[input_dim_idx]);"} + } + ${s.length===1?"relative_slice_offset += index * i32(uniforms.sizes_from_slice_dims_data);":"relative_slice_offset += index * i32(uniforms.sizes_from_slice_dims_data[dim_idx]);"} + } + + input_slice_offsets_data[global_idx] = base_offset + u32(relative_slice_offset); + }`};return e.compute({name:"computeSliceOffsets",shaderCache:{hint:`${i.length}_${s.length}`,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:C,dataType:e.inputs[1].dataType}],dispatchGroup:{x:Math.ceil(o/64)},programUniforms:h}),getShaderSource:u},{inputs:[t],outputs:[-1]})[0]},Wu=(e,t)=>{let s=e.inputs,n=s[0].dims,i=s[0].dataType,o=s[1].dims,a=o[o.length-1],c=De.sizeToDimension(o,o.length-1),p=De.sizeFromDimension(n,t.batchDims+a),h=De.sizeToDimension(n,t.batchDims),C=De.sizeFromDimension(n,t.batchDims),u=c/h,k=new Array(a),B=p;for(let he=0;hen.length)throw new Error("last dimension of indices must not be larger than rank of input tensor");let ne=o.slice(0,-1).concat(n.slice(z)),J=De.size(ne),W=[{type:12,data:J},{type:12,data:p},...Mt(s[0].dims,R.dims,ne)],ue=he=>{let be=He("data",s[0].dataType,s[0].dims.length),Be=He("slice_offsets",12,R.dims.length),Ie=Ct("output",s[0].dataType,ne.length);return` + ${he.registerUniform("output_size","u32").registerUniform("slice_size","u32").declareVariables(be,Be,Ie)} + ${he.mainStart()} + ${he.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let slice_offset = slice_offsets[global_idx / uniforms.slice_size]; + output[global_idx] = data[u32(slice_offset) + global_idx % uniforms.slice_size]; + }`};e.compute({name:"GatherND",shaderCache:{hint:t.cacheKey,inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:ne,dataType:i}],dispatchGroup:{x:Math.ceil(J/64)},programUniforms:W}),getShaderSource:ue},{inputs:[s[0],R]})},Gu=e=>({batchDims:e.batch_dims,cacheKey:""})}),Ku,Hu,qu,Qu,Ec=y(()=>{Ot(),$t(),is(),qt(),Ku=(e,t)=>{if(e.length<3||e.length>4)throw new Error("GatherBlockQuantized requires 3 or 4 inputs.");let s=De.normalizeAxis(t.quantizeAxis,e[0].dims.length),n=t.blockSize,i=e[0],o=e[2],a=e.length===4?e[3]:void 0;if(o.dims.length!==i.dims.length||!i.dims.map((c,p)=>p===s?Math.ceil(c/n)===o.dims[p]:c===o.dims[p]).reduce((c,p)=>c&&p,!0))throw new Error("Scales must have the same rank as the input tensor and the dims should match except on gatherAxis.");if(a){if(a.dataType!==i.dataType)throw new Error("Zero point must have the same data type as the input tensor.");if(a.dims.length!==o.dims.length||!a.dims.map((c,p)=>c===o.dims[p]).reduce((c,p)=>c&&p,!0))throw new Error("Zero point must have the same rank as the input tensor and the dims should match except on quantizeAxis.")}},Hu=(e,t)=>{let s=e[0].dims,n=e[1].dims,i=s.length,o=De.normalizeAxis(t.gatherAxis,i),a=De.normalizeAxis(t.quantizeAxis,i),c=s.slice(0);c.splice(o,1,...n);let p=De.size(c),h=e[2].dataType,C=e[0].dataType===22,u=[{type:12,data:p},{type:12,data:a},{type:12,data:o},{type:12,data:t.blockSize},...Mt(...e.map((B,R)=>B.dims),c)],k=B=>{let R=He("data",e[0].dataType,e[0].dims.length),z=He("inputIndices",e[1].dataType,e[1].dims.length),ne=He("scales",e[2].dataType,e[2].dims.length),J=e.length>3?He("zeroPoint",e[3].dataType,e[3].dims.length):void 0,W=Ct("output",h,c.length),ue=[R,z,ne];J&&ue.push(J);let he=[{name:"output_size",type:"u32"},{name:"quantize_axis",type:"u32"},{name:"gather_axis",type:"u32"},{name:"block_size",type:"u32"}];return` + ${B.registerUniforms(he).declareVariables(...ue,W)} + ${B.mainStart()} + let output_indices = ${W.offsetToIndices("global_idx")}; + var indices_indices = ${z.type.indices}(0); + ${n.length>1?` + for (var i: u32 = 0; i < ${n.length}; i++) { + let index = ${W.indicesGet("output_indices","uniforms.gather_axis + i")}; + ${z.indicesSet("indices_indices","i","index")}; + }`:`indices_indices = ${W.indicesGet("output_indices","uniforms.gather_axis")};`}; + var data_indices = ${R.type.indices}(0); + for (var i: u32 = 0; i < uniforms.gather_axis; i++) { + let index = ${W.indicesGet("output_indices","i")}; + ${R.indicesSet("data_indices","i","index")}; + } + var index_from_indices = ${z.getByIndices("indices_indices")}; + if (index_from_indices < 0) { + index_from_indices += ${s[o]}; + } + ${R.indicesSet("data_indices","uniforms.gather_axis","u32(index_from_indices)")}; + for (var i = uniforms.gather_axis + 1; i < ${c.length}; i++) { + let index = ${W.indicesGet("output_indices",`i + ${n.length} - 1`)}; + ${R.indicesSet("data_indices","i","index")}; + } + let data_offset = ${R.indicesToOffset("data_indices")}; + let data_index = data_offset % 8; + // Convert 4-bit packed data to 8-bit packed data. + let packed_4bit_quantized_data = ${R.getByOffset("data_offset / 8")}; + let packed_8bit_quantized_data = (packed_4bit_quantized_data >> (4 * (data_index % 2))) & 0x0f0f0f0f; + let quantized_data_vec = ${C?"unpack4xI8":"unpack4xU8"}(u32(packed_8bit_quantized_data)); + let quantized_data = quantized_data_vec[data_index / 2]; + var scale_indices = data_indices; + let quantize_axis_index = ${ne.indicesGet("data_indices","uniforms.quantize_axis")} / uniforms.block_size; + ${ne.indicesSet("scale_indices","uniforms.quantize_axis","quantize_axis_index")}; + var scale = ${ne.getByIndices("scale_indices")}; + ${J?` + let zero_point_indices = scale_indices; + let zero_point_offset = ${J.indicesToOffset("zero_point_indices")}; + let zero_point_index = zero_point_offset % 8; + let packed_4bit_zero_points = ${J.getByOffset("zero_point_offset / 8")}; + let packed_8bit_zero_points = (packed_4bit_zero_points >> (4 * (zero_point_index % 2))) & 0x0f0f0f0f; + let zero_point_vec = ${C?"unpack4xI8":"unpack4xU8"}(u32(packed_8bit_zero_points)); + let zero_point = zero_point_vec[zero_point_index / 2];`:"var zero_point = 0"}; + let dequantized_data = ${Cs(h)}(quantized_data - zero_point) * scale; + ${W.setByOffset("global_idx","dequantized_data")}; + }`};return{name:"GatherBlockQuantized",shaderCache:{hint:`${t.cacheKey};${e.filter((B,R)=>R!==1).map(B=>B.dims.join("_")).join(";")}`,inputDependencies:Array.from({length:e.length},(B,R)=>"rank")},getRunData:()=>({outputs:[{dims:c,dataType:h}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:u}),getShaderSource:k}},qu=(e,t)=>{let s=e.inputs;Ku(s,t),e.compute(Hu(e.inputs,t))},Qu=e=>jt({blockSize:e.blockSize,gatherAxis:e.gatherAxis,quantizeAxis:e.quantizeAxis})}),Xu,Yu,gi,Cc,kc=y(()=>{Ot(),$t(),is(),qt(),Xu=e=>{if(!e||e.length!==2)throw new Error("GatherElements requires 2 inputs.");if(e[0].dims.length<1)throw new Error("GatherElements requires that the data input be rank >= 1.");if(e[0].dims.length!==e[1].dims.length)throw new Error(`GatherElements requires that the data input and + indices input tensors be of same rank.`)},Yu=(e,t)=>{let s=e[0].dims,n=e[0].dataType,i=s.length,o=e[1].dims,a=e[1].dataType,c=De.normalizeAxis(t.axis,i),p=s[c],h=o.slice(0),C=De.size(h),u=He("input",n,i),k=He("indicesInput",a,o.length),B=Ct("output",n,h.length),R=[{type:12,data:C},{type:6,data:p},{type:12,data:c}];return R.push(...Mt(s,o,h)),{name:"GatherElements",shaderCache:{inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:h,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(C/64)},programUniforms:R}),getShaderSource:z=>` + ${z.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(u,k,B)} + ${z.mainStart()} + ${z.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + + let outputIndices = ${B.offsetToIndices("global_idx")}; + + var idx = ${k.getByOffset("global_idx")}; + if (idx < 0) { + idx = idx + uniforms.axisDimLimit; + } + var inputIndices = ${u.type.indices}(outputIndices); + ${u.indicesSet("inputIndices","uniforms.axis","u32(idx)")}; + let value = ${u.getByIndices("inputIndices")}; + + ${B.setByOffset("global_idx","value")}; + }`}},gi=e=>jt({axis:e.axis}),Cc=(e,t)=>{let s=e.inputs;Xu(s),e.compute(Yu(e.inputs,t))}}),Ju,Zu,ed,td,sd=y(()=>{Ot(),$t(),qt(),Ju=e=>{if(!e)throw new Error("Input is missing");if(e.length<2||e.length>3)throw new Error("Invaid input number.");if(e.length===3&&e[2].dims.length>2)throw new Error("Invalid input shape of C");if(e[0].dataType!==e[1].dataType||e.length===3&&e[0].dataType!==e[2].dataType)throw new Error("Input types are mismatched")},Zu=(e,t)=>{let s=e[0].dims.slice(),n=e[1].dims.slice(),[i,o,a]=kr.getShapeOfGemmResult(s,t.transA,n,t.transB,e.length===3?e[2].dims:void 0),c=[i,o];if(!c)throw new Error("Can't use gemm on the given tensors");let p=16,h=Math.ceil(o/p),C=Math.ceil(i/p),u=!0,k=De.size(c),B=[{type:12,data:u?h:k},{type:12,data:i},{type:12,data:o},{type:12,data:a},{type:1,data:t.alpha},{type:1,data:t.beta}],R=["type","type"];e.length===3&&(B.push(...Mt(e[2].dims)),R.push("rank")),B.push(...Mt(c));let z=J=>{let W="";t.transA&&t.transB?W="value += a[k * uniforms.M + m] * b[n * uniforms.K + k];":t.transA&&!t.transB?W="value += a[k * uniforms.M + m] * b[k * uniforms.N + n];":!t.transA&&t.transB?W="value += a[m * uniforms.K + k] * b[n * uniforms.K + k];":!t.transA&&!t.transB&&(W="value += a[m * uniforms.K + k] * b[k * uniforms.N + n];");let ue=t.alpha===1?"":"value *= uniforms.alpha;",he=He("a",e[0].dataType,e[0].dims),be=He("b",e[1].dataType,e[1].dims),Be=he.type.value,Ie=null,nt=[he,be];e.length===3&&(Ie=He("c",e[2].dataType,e[2].dims.length),nt.push(Ie));let dt=Ct("output",e[0].dataType,c.length);nt.push(dt);let Et=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"},{name:"alpha",type:"f32"},{name:"beta",type:"f32"}];return` + ${J.registerUniforms(Et).declareVariables(...nt)} + + ${J.mainStart()} + ${J.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + + let m = global_idx / uniforms.N; + let n = global_idx % uniforms.N; + + var value = ${Be}(0); + for (var k: u32 = 0u; k < uniforms.K; k++) { + ${W} + } + + ${ue} + ${Ie!=null?`let cOffset = ${Ie.broadcastedIndicesToOffset("vec2(m, n)",dt)}; value += ${Be}(uniforms.beta) * ${Ie.getByOffset("cOffset")};`:""} + output[global_idx] = value; + }`},ne=J=>{let W=He("a",e[0].dataType,e[0].dims),ue=He("b",e[1].dataType,e[1].dims),he=null,be=[W,ue];e.length===3&&(he=He("c",e[2].dataType,e[2].dims.length),be.push(he));let Be=Ct("output",e[0].dataType,c.length);be.push(Be);let Ie=[{name:"num_tile_n",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"},{name:"alpha",type:"f32"},{name:"beta",type:"f32"}],nt="",dt="";t.transA&&t.transB?(dt=` + var col = tile_row_start + local_id.x; + var row = k_start + local_id.y; + if (col < uniforms.M && row < uniforms.K) { + tile_a[local_id.y][local_id.x] = a[row * uniforms.M + col]; + } else { + tile_a[local_id.y][local_id.x] = ${W.type.value}(0); + } + + col = k_start + local_id.x; + row = tile_col_start + local_id.y; + if (col < uniforms.K && row < uniforms.N) { + tile_b[local_id.y][local_id.x] = b[row * uniforms.K + col]; + } else { + tile_b[local_id.y][local_id.x] = ${ue.type.value}(0); + } + `,nt="value += tile_a[k][local_id.y] * tile_b[local_id.x][k];"):t.transA&&!t.transB?(dt=` + var col = tile_row_start + local_id.x; + var row = k_start + local_id.y; + if (col < uniforms.M && row < uniforms.K) { + tile_a[local_id.y][local_id.x] = a[row * uniforms.M + col]; + } else { + tile_a[local_id.y][local_id.x] = ${W.type.value}(0); + } + + col = tile_col_start + local_id.x; + row = k_start + local_id.y; + if (col < uniforms.N && row < uniforms.K) { + tile_b[local_id.y][local_id.x] = b[row * uniforms.N + col]; + } else { + tile_b[local_id.y][local_id.x] = ${ue.type.value}(0); + } + `,nt="value += tile_a[k][local_id.y] * tile_b[k][local_id.x];"):!t.transA&&t.transB?(dt=` + var col = k_start + local_id.x; + var row = tile_row_start + local_id.y; + if (col < uniforms.K && row < uniforms.M) { + tile_a[local_id.y][local_id.x] = a[row * uniforms.K + col]; + } else { + tile_a[local_id.y][local_id.x] = ${W.type.value}(0); + } + + col = k_start + local_id.x; + row = tile_col_start + local_id.y; + if (col < uniforms.K && row < uniforms.N) { + tile_b[local_id.y][local_id.x] = b[row * uniforms.K + col]; + } else { + tile_b[local_id.y][local_id.x] = ${ue.type.value}(0); + } + `,nt="value += tile_a[local_id.y][k] * tile_b[local_id.x][k];"):!t.transA&&!t.transB&&(dt=` + var col = k_start + local_id.x; + var row = tile_row_start + local_id.y; + if (col < uniforms.K && row < uniforms.M) { + tile_a[local_id.y][local_id.x] = a[row * uniforms.K + col]; + } else { + tile_a[local_id.y][local_id.x] = ${W.type.value}(0); + } + + col = tile_col_start + local_id.x; + row = k_start + local_id.y; + if (col < uniforms.N && row < uniforms.K) { + tile_b[local_id.y][local_id.x] = b[row * uniforms.N + col]; + } else { + tile_b[local_id.y][local_id.x] = ${ue.type.value}(0); + } + `,nt="value += tile_a[local_id.y][k] * tile_b[k][local_id.x];");let Et=t.alpha===1?"":"value *= uniforms.alpha;";return` + ${J.registerUniforms(Ie).declareVariables(...be)} + var tile_a: array, ${p}>; + var tile_b: array, ${p}>; + ${J.mainStart([p,p,1])} + let tile_col_start = (workgroup_index % uniforms.num_tile_n) * ${p}; + let tile_row_start = (workgroup_index / uniforms.num_tile_n) * ${p}; + let num_tiles = (uniforms.K - 1) / ${p} + 1; + var k_start = 0u; + var value = ${Be.type.value}(0); + for (var t: u32 = 0u; t < num_tiles; t++) { + ${dt} + k_start = k_start + ${p}; + workgroupBarrier(); + + for (var k: u32 = 0u; k < ${p}; k++) { + ${nt} + } + workgroupBarrier(); + } + + ${Et} + let m = tile_row_start + local_id.y; + let n = tile_col_start + local_id.x; + ${he!=null?`let cOffset = ${he.broadcastedIndicesToOffset("vec2(m, n)",Be)}; value += ${Be.type.value}(uniforms.beta) * ${he.getByOffset("cOffset")};`:""} + if (m < uniforms.M && n < uniforms.N) { + output[m * uniforms.N + n] = value; + } + }`};return u?{name:"GemmShared",shaderCache:{hint:`${t.cacheKey}`,inputDependencies:R},getRunData:()=>({outputs:[{dims:c,dataType:e[0].dataType}],dispatchGroup:{x:h*C},programUniforms:B}),getShaderSource:ne}:{name:"Gemm",shaderCache:{hint:`${t.cacheKey}`,inputDependencies:R},getRunData:()=>({outputs:[{dims:c,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(k/64)},programUniforms:B}),getShaderSource:z}},ed=e=>{let t=e.transA,s=e.transB,n=e.alpha,i=e.beta;return{transA:t,transB:s,alpha:n,beta:i,cacheKey:`${e.transA};${e.transB};${e.alpha===1}`}},td=(e,t)=>{Ju(e.inputs),e.compute(Zu(e.inputs,t))}}),vr,$r,Wr,tn,rd,Xo,nd,id,wi,od,ad,ld,ud,Yo,Jo=y(()=>{Ot(),$t(),is(),qt(),[vr,$r,Wr,tn]=[0,1,2,3],rd=e=>{if(e[0].dims.length!==4)throw new Error("only 4-D tensor is supported.");if(e[0].dims.length!==e[1].dims.length)throw new Error("input dimensions must be equal to grid dimensions");if(e[0].dims.length-2!==e[1].dims[e[1].dims.length-1])throw new Error(`last dimension of grid must be equal to ${e[0].dims.length-2}`);if(e[0].dims[0]!==e[1].dims[0])throw new Error("grid batch size must match input batch size")},Xo=` + fn gs_get_cubic_coeffs(x: f32) -> vec4 { + let cubic_alpha = -0.75f; + let x_abs = abs(x); + var coeffs: vec4; + coeffs[0] = (((cubic_alpha * (x_abs + 1) - 5 * cubic_alpha) * (x_abs + 1) + 8 * cubic_alpha) * (x_abs + 1) - 4 * cubic_alpha); + coeffs[1] = (((cubic_alpha + 2) * x_abs - (cubic_alpha + 3)) * x_abs * x_abs + 1); + coeffs[2] = (((cubic_alpha + 2) * (1 - x_abs) - (cubic_alpha + 3)) * (1 - x_abs) * (1 - x_abs) + 1); + coeffs[3] = (((cubic_alpha * (2 - x_abs) - 5 * cubic_alpha) * (2 - x_abs) + 8 * cubic_alpha) * (2 - x_abs) - 4 * cubic_alpha); + return coeffs; + } +`,nd=e=>` + fn gs_bicubic_interpolate(p: mat4x4<${e}>, x: f32, y: f32) -> ${e} { + var v: vec4; + var coeffs = gs_get_cubic_coeffs(x); + for (var i = 0; i < 4; i++) { + v[i] = coeffs[0] * p[i][0] + coeffs[1] * p[i][1] + coeffs[2] * p[i][2] + coeffs[3] * p[i][3]; + } + coeffs = gs_get_cubic_coeffs(y); + let pixel = ${e}(coeffs[0] * v[0] + coeffs[1] * v[1] + coeffs[2] * v[2] + coeffs[3] * v[3]); + return pixel; + } +`,id=e=>` + fn gs_denormalize(n: f32, length: i32) -> f32 { + ${e.alignCorners===0?` + // alignCorners: false => [-1, 1] to [-0.5, length - 0.5] + return ((n + 1.0) * f32(length) - 1.0) / 2.0; + `:` + // alignCorners: true => [-1, 1] to [0, length - 1] + return (n + 1.0) / 2.0 * (f32(length - 1)); + `} + } +`,wi=e=>` + ${e.paddingMode==="reflection"?` + fn gs_reflect(x: i32, x_min: f32, x_max: f32) -> u32 { + var dx = 0.0; + var fx = f32(x); + let range = x_max - x_min; + if (fx < x_min) { + dx = x_min - fx; + let n = u32(dx / range); + let r = dx - f32(n) * range; + if (n % 2 == 0) { + fx = x_min + r; + } else { + fx = x_max - r; + } + } else if (fx > x_max) { + dx = fx - x_max; + let n = u32(dx / range); + let r = dx - f32(n) * range; + if (n % 2 == 0) { + fx = x_max - r; + } else { + fx = x_min + r; + } + } + return u32(fx); + }`:""} +`,od=(e,t,s)=>` + fn pixel_at_grid(r: i32, c: i32, H: i32, W: i32, batch: u32, channel: u32, border: vec4) -> ${t} { + var pixel = ${t}(0); + var indices = vec4(0); + indices[${vr}] = batch; + indices[${$r}] = channel;`+(()=>{switch(s.paddingMode){case"zeros":return` + if (r >= 0 && r < H && c >=0 && c < W) { + indices[${Wr}] = u32(r); + indices[${tn}] = u32(c); + } + `;case"border":return` + indices[${Wr}] = u32(clamp(r, 0, H - 1)); + indices[${tn}] = u32(clamp(c, 0, W - 1)); + `;case"reflection":return` + indices[${Wr}] = gs_reflect(r, border[1], border[3]); + indices[${tn}] = gs_reflect(c, border[0], border[2]); + `;default:throw new Error(`padding mode ${s.paddingMode} is not supported`)}})()+` + return ${e.getByIndices("indices")}; + } +`,ad=(e,t,s)=>(()=>{switch(s.mode){case"nearest":return` + let result = pixel_at_grid(i32(round(y)), i32(round(x)), H_in, W_in, indices[${vr}], indices[${$r}], border); + `;case"bilinear":return` + let x1 = i32(floor(x)); + let y1 = i32(floor(y)); + let x2 = x1 + 1; + let y2 = y1 + 1; + + let p11 = pixel_at_grid(y1, x1, H_in, W_in, indices[${vr}], indices[${$r}], border); + let p12 = pixel_at_grid(y1, x2, H_in, W_in, indices[${vr}], indices[${$r}], border); + let p21 = pixel_at_grid(y2, x1, H_in, W_in, indices[${vr}], indices[${$r}], border); + let p22 = pixel_at_grid(y2, x2, H_in, W_in, indices[${vr}], indices[${$r}], border); + + let dx2 = ${t}(f32(x2) - x); + let dx1 = ${t}(x - f32(x1)); + let dy2 = ${t}(f32(y2) - y); + let dy1 = ${t}(y - f32(y1)); + let result = dy2 * (dx2 * p11 + dx1 * p12) + dy1 * (dx2 * p21 + dx1 * p22); + `;case"bicubic":return` + let x0 = i32(floor(x)) - 1; + let y0 = i32(floor(y)) - 1; + var p: mat4x4<${t}>; + for (var h = 0; h < 4; h++) { + for (var w = 0; w < 4; w++) { + p[h][w] = pixel_at_grid(h + y0, w + x0, H_in, W_in, indices[${vr}], indices[${$r}], border); + } + } + + let dx = x - f32(x0 + 1); + let dy = y - f32(y0 + 1); + let result = gs_bicubic_interpolate(p, dx, dy); + `;default:throw new Error(`mode ${s.mode} is not supported`)}})()+`${e.setByOffset("global_idx","result")}`,ld=(e,t)=>{let s=He("x",e[0].dataType,e[0].dims.length),n=[e[1].dims[0],e[1].dims[1],e[1].dims[2]],i=He("grid",e[1].dataType,n.length,2),o=[e[0].dims[0],e[0].dims[1],e[1].dims[1],e[1].dims[2]];t.format==="NHWC"&&(o=[e[0].dims[0],e[1].dims[1],e[1].dims[2],e[0].dims[3]],[vr,$r,Wr,tn]=[0,3,1,2]);let a=Ct("output",e[0].dataType,o.length),c=s.type.value,p=De.size(o),h=[{type:12,data:p},...Mt(e[0].dims,n,o)],C=u=>` + ${u.registerUniform("output_size","u32").declareVariables(s,i,a)} + ${Xo} + ${nd(c)} + ${id(t)} + ${wi(t)} + ${od(s,c,t)} + + ${u.mainStart()} + ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let H_in = i32(uniforms.x_shape[${Wr}]); + let W_in = i32(uniforms.x_shape[${tn}]); + + ${t.alignCorners===0?` + let x_min = -0.5; + let x_max = f32(W_in) - 0.5; + let y_min = -0.5; + let y_max = f32(H_in) - 0.5; + `:` + let x_min = 0.0; + let x_max = f32(W_in) - 1.0; + let y_min = 0.0; + let y_max = f32(H_in) - 1.0; + `}; + let border = vec4(x_min, y_min, x_max, y_max); + + let indices = ${a.offsetToIndices("global_idx")}; + var grid_indices = vec3(indices[${vr}], indices[${Wr}], indices[${tn}]); + let nxy = ${i.getByIndices("grid_indices")}; + var x = gs_denormalize(f32(nxy[0]), W_in); + var y = gs_denormalize(f32(nxy[1]), H_in); + + ${ad(a,c,t)} + }`;return{name:"GridSample",shaderCache:{hint:`${t.cacheKey}`,inputDependencies:["type","type"]},getRunData:u=>{let k=De.size(o);return{outputs:[{dims:o,dataType:u[0].dataType}],dispatchGroup:{x:Math.ceil(k/64)},programUniforms:h}},getShaderSource:C}},ud=(e,t)=>{rd(e.inputs),e.compute(ld(e.inputs,t))},Yo=e=>jt({alignCorners:e.align_corners,mode:e.mode,paddingMode:e.padding_mode,format:e.format})}),rr,dd,cd,yi,pd,Un,Zo,hd=y(()=>{Ot(),$t(),is(),ce(),Zi(),qt(),jr(),rr=(e,t)=>e.length>t&&e[t].dims.length>0?e[t]:void 0,dd=(e,t)=>{let s=e[0],n=rr(e,1),i=rr(e,2),o=rr(e,3),a=rr(e,4),c=rr(e,5),p=rr(e,6),h=rr(e,7);if(s.dims.length!==3&&s.dims.length!==5)throw new Error("Input query is expected to have 3 or 5 dimensions");let C=s.dims[0],u=s.dims[1],k=s.dims.length===3?s.dims[2]:t.numHeads*s.dims[4],B=u,R=0,z=0,ne=Math.floor(k/t.numHeads);if(p&&h&&De.size(p.dims)&&De.size(h.dims)){if(p.dims.length!==4)throw new Error('Input "past_key" is expected to have 4 dimensions');if(p.dims[0]!==C||p.dims[1]!==t.numHeads||p.dims[3]!==ne)throw new Error('Input "past_key" shape (batch_size, num_heads, past_sequence_length, head_size)');if(h.dims[0]!==C||h.dims[1]!==t.numHeads||h.dims[3]!==ne)throw new Error('Input "past_value" shape (batch_size, num_heads, past_sequence_length, head_size)');if(p.dims[2]!==h.dims[2])throw new Error('Input "past_key" and "past_value" shall have same dim 2 (past_sequence_length)');if(h.dims.length!==4)throw new Error('Input "past_value" is expected to have 4 dimensions');R=p.dims[2],z=p.dims[2]}else if(p&&De.size(p.dims)||h&&De.size(h.dims))throw new Error('Input "past_key" and "past_value" shall be both present or both absent');let J;if(n&&De.size(n.dims)>0){if(s.dims.length!==3)throw new Error('Input "query" is expected to have 3 dimensions when key is given');if(n.dims.length<3||n.dims.length>5)throw new Error('Input "key" is expected to have 3, 4, or 5 dimensions');if(s.dims[0]!==n.dims[0])throw new Error('Input "query" and "key" shall have same dim 0 (batch size)');if(n.dims.length===3){if(n.dims[2]!==s.dims[2])throw new Error('Input "query" and "key" shall have same dim 2 (hidden_size)');J=2,B=n.dims[1]}else if(n.dims.length===5){if(n.dims[2]!==t.numHeads||n.dims[3]!==2||n.dims[4]!==ne)throw new Error('Expect "key" shape (batch_size, kv_sequence_length, num_heads, 2, head_size) for packed kv');if(i)throw new Error('Expect "value" be none when "key" has packed kv format.');J=5,B=n.dims[1]}else{if(n.dims[1]!==t.numHeads||n.dims[3]!==ne)throw new Error('Expect "key" shape (batch_size, num_heads, kv_sequence_length, head_size) for past_key');J=0,B=n.dims[2]}}else{if(s.dims.length!==5)throw new Error('Input "query" is expected to have 5 dimensions when key is empty');if(s.dims[2]!==t.numHeads||s.dims[3]!==3)throw new Error('Expect "query" shape (batch_size, kv_sequence_length, num_heads, 3, head_size) for packed kv');J=3}if(o&&De.size(o.dims)>0){if(o.dims.length!==1)throw new Error('Input "bias" is expected to have 1 dimension');if(n&&n.dims.length===5&&n.dims[3]===2)throw new Error("bias is not allowed for packed kv.")}let W=R+B,ue=0;if(a&&De.size(a.dims)>0){ue=8;let Ie=a.dims;throw Ie.length===1?Ie[0]===C?ue=1:Ie[0]===3*C+2&&(ue=3):Ie.length===2&&Ie[0]===C&&Ie[1]===W&&(ue=5),ue===8?new Error('Input "key_padding_mask" shape shall be (batch_size) or (batch_size, total_sequence_length)'):new Error("Mask not supported")}let he=!1,be=k;if(i&&De.size(i.dims)>0){if(i.dims.length!==3&&i.dims.length!==4)throw new Error('Input "value" is expected to have 3 or 4 dimensions');if(s.dims[0]!==i.dims[0])throw new Error('Input "query" and "value" shall have same dim 0 (batch_size)');if(i.dims.length===3){if(B!==i.dims[1])throw new Error('Input "key" and "value" shall have the same dim 1 (kv_sequence_length)');be=i.dims[2]}else{if(B!==i.dims[2])throw new Error('Input "key" and "value" shall have the same dim 2 (kv_sequence_length)');be=i.dims[1]*i.dims[3],he=!0}}let Be=!1;if(a&&De.size(a.dims)>0)throw new Error("Key padding mask is not supported");if(c&&De.size(c.dims)>0){if(c.dims.length!==4)throw new Error('Input "attention_bias" is expected to have 4 dimensions');if(c.dims[0]!==C||c.dims[1]!==t.numHeads||c.dims[2]!==u||c.dims[3]!==W)throw new Error('Expect "attention_bias" shape (batch_size, num_heads, sequence_length, total_sequence_length)')}return{batchSize:C,sequenceLength:u,pastSequenceLength:R,kvSequenceLength:B,totalSequenceLength:W,maxSequenceLength:z,inputHiddenSize:0,hiddenSize:k,vHiddenSize:be,headSize:ne,vHeadSize:Math.floor(be/t.numHeads),numHeads:t.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:t.maskFilterValue,maskType:ue,scale:t.scale,broadcastResPosBias:Be,passPastInKv:he,qkvFormat:J}},cd=e=>jt({...e}),yi=jt({perm:[0,2,1,3]}),pd=(e,t,s,n,i,o,a)=>{let c=[n,i,o],p=De.size(c),h=[{type:12,data:p},{type:12,data:a},{type:12,data:o}],C=u=>{let k=Ct("qkv_with_bias",t.dataType,c),B=He("qkv",t.dataType,c),R=He("bias",s.dataType,c),z=[{name:"output_size",type:"u32"},{name:"bias_offset",type:"u32"},{name:"hidden_size",type:"u32"}];return` + ${u.registerUniforms(z).declareVariables(B,R,k)} + ${u.mainStart()} + ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let bias_offset_idx = (global_idx % uniforms.hidden_size) + uniforms.bias_offset; + + qkv_with_bias[global_idx] = qkv[global_idx] + bias[bias_offset_idx]; + }`};return e.compute({name:"MultiHeadAttentionAddBias",shaderCache:{inputDependencies:["type","type"]},getRunData:()=>({outputs:[{dims:c,dataType:t.dataType,gpuDataType:0}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:h}),getShaderSource:C},{inputs:[t,s],outputs:[-1]})[0]},Un=(e,t,s,n,i,o,a,c)=>{let p=o;if(a&&De.size(a.dims)>0){if(n===1)throw new Error("AddBiasReshape is not implemented. Please export your model with packed QKV or KV");return p=pd(e,o,a,t,n,s*i,c),p=p.reshape([t,n,s,i]),s===1||n===1?p:e.compute(cr(p,yi.perm),{inputs:[p],outputs:[-1]})[0]}else return o.dims.length===3&&(p=o.reshape([t,n,s,i])),s===1||n===1?p:e.compute(cr(p,yi.perm),{inputs:[p],outputs:[-1]})[0]},Zo=(e,t)=>{let s=dd(e.inputs,t),n=e.inputs[0],i=rr(e.inputs,1),o=rr(e.inputs,2),a=rr(e.inputs,3),c=rr(e.inputs,4),p=rr(e.inputs,5),h=rr(e.inputs,6),C=rr(e.inputs,7);if(n.dims.length===5)throw new Error("Packed QKV is not implemented");if(i?.dims.length===5)throw new Error("Packed KV is not implemented");let u=i&&o&&i.dims.length===4&&o.dims.length===4,k=Un(e,s.batchSize,s.numHeads,s.sequenceLength,s.headSize,n,a,0);if(u)return zn(e,k,i,o,c,void 0,h,C,p,s);if(!i||!o)throw new Error("key and value must be provided");let B=Un(e,s.batchSize,s.numHeads,s.kvSequenceLength,s.headSize,i,a,s.hiddenSize),R=Un(e,s.batchSize,s.numHeads,s.kvSequenceLength,s.vHeadSize,o,a,2*s.hiddenSize);zn(e,k,B,R,c,void 0,h,C,p,s)}}),md,ea,Sc,$c,Mi,ta,fd,_d=y(()=>{Ot(),$t(),is(),qt(),md=e=>{if(!e||e.length<1)throw new Error("too few inputs")},ea=(e,t)=>{let s=[],n=t.numOutputs;return e[1].dims[0]>0&&(e[1].getBigInt64Array().forEach(i=>s.push(Number(i))),n=s.length),jt({numOutputs:n,axis:t.axis,splitSizes:s})},Sc=e=>` +fn calculateOutputIndex(index: u32) -> u32 { + for (var i: u32 = 0u; i < ${e}u; i += 1u ) { + if (index < ${Tt("uniforms.size_in_split_axis","i",e)}) { + return i; + } + } + return ${e}u; +}`,$c=e=>{let t=e.length,s=[];for(let n=0;n{let s=e[0].dims,n=De.size(s),i=e[0].dataType,o=De.normalizeAxis(t.axis,s.length),a=new Array(t.numOutputs),c=He("input",i,s.length),p=new Array(t.numOutputs),h=[],C=[],u=0,k=[{type:12,data:n}];for(let R=0;R` + ${R.registerUniform("input_size","u32").registerUniform("size_in_split_axis","u32",p.length).declareVariables(c,...a)} + ${Sc(p.length)} + ${$c(a)} + + ${R.mainStart()} + ${R.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.input_size")} + + var indices = ${c.offsetToIndices("global_idx")}; + var index = ${c.indicesGet("indices",o)}; + let output_number = calculateOutputIndex(index); + if (output_number != 0) { + index -= ${Tt("uniforms.size_in_split_axis","output_number - 1u",p.length)}; + ${c.indicesSet("indices",o,"index")}; + } + writeBufferData(output_number, indices, global_idx); + }`;return{name:"Split",shaderCache:{hint:t.cacheKey,inputDependencies:["rank"]},getShaderSource:B,getRunData:()=>({outputs:h,dispatchGroup:{x:Math.ceil(n/64)},programUniforms:k})}},ta=(e,t)=>{md(e.inputs);let s=e.inputs.length===1?t:ea(e.inputs,t);e.compute(Mi(e.inputs,s),{inputs:[0]})},fd=e=>{let t=e.axis,s=e.splitSizes,n=e.numOutputs<0?s.length:e.numOutputs;if(n!==s.length)throw new Error("numOutputs and splitSizes lengh must be equal");return jt({axis:t,numOutputs:n,splitSizes:s})}}),sa,gd,ra,na,Ac=y(()=>{is(),Zi(),hd(),_d(),jr(),sa=(e,t)=>{if(t.doRotary)throw new Error("GroupQuerryAttention do_rotary attribute is not supported");if(t.doRotary&&e.length<=7)throw new Error("cos_cache and sin_cache inputs are required if do_rotary is specified");let s=e[0],n=e[1],i=e[2],o=e[3],a=e[4];if(t.localWindowSize!==-1)throw new Error("Local attention is not supported");if(t.softcap!==0)throw new Error("Softcap is not supported");if(t.rotaryInterleaved!==0)throw new Error("Rotary interleaved is not supported");if(t.smoothSoftmax)throw new Error("Smooth softmax is not supported");if(s.dims.length!==3&&s.dims.length!==5)throw new Error("Input query is expected to have 3 or 5 dimensions");let c=!1,p=s.dims[0],h=s.dims[1],C=s.dims.length===3?c?s.dims[2]/3:s.dims[2]:t.numHeads*s.dims[4],u=h,k=0,B=!n||n.dims.length===0,R=Math.floor(B?C/(t.numHeads+2*t.kvNumHeads):C/t.numHeads);B&&(C=R*t.numHeads);let z=o&&o.dims.length!==0,ne=a&&a.dims.length!==0;if(z&&o.dims.length===4&&o.dims[0]===p&&o.dims[1]!==t.kvNumHeads&&o.dims[2]===t.kvNumHeads&&o.dims[3]===R)throw new Error("BSNH pastKey/pastValue is not supported");if(z&&ne){if(o.dims.length!==4)throw new Error('Input "past_key" is expected to have 4 dimensions');if(a.dims.length!==4)throw new Error('Input "past_value" is expected to have 4 dimensions');k=o.dims[2]}else if(z||ne)throw new Error('Input "past_key" and "past_value" shall be both present or both absent');let J=1;if(n&&n.dims.length>0){if(s.dims.length!==3)throw new Error('Input "query" is expected to have 3 dimensions when key is given');if(n.dims.length<3||n.dims.length>5)throw new Error('Input "key" is expected to have 3, 4, or 5 dimensions');if(s.dims[0]!==n.dims[0])throw new Error('Input "query" and "key" shall have same dim 0 (batch size)');if(n.dims.length===3){if(s.dims[2]%n.dims[2]!==0)throw new Error('Dimension 2 of "query" should be a multiple of "key"');u=n.dims[1]}else if(n.dims.length===5){if(n.dims[2]!==t.numHeads||n.dims[3]!==2||n.dims[4]!==R)throw new Error('Expect "key" shape (batch_size, kv_sequence_length, num_heads, 2, head_size) for packed kv');if(i)throw new Error('Expect "value" be none when "key" has packed kv format.');u=n.dims[1]}else{if(n.dims[1]!==t.numHeads||n.dims[3]!==R)throw new Error('Expect "key" shape (batch_size, num_heads, kv_sequence_length, head_size) for past_key');u=n.dims[2]}}else{if(s.dims.length!==3&&s.dims.length!==5)throw new Error('Input "query" is expected to have 3 or 5 dimensions when key is empty');if(s.dims.length===5&&(s.dims[2]!==t.numHeads||s.dims[3]!==3))throw new Error('Expect "query" shape (batch_size, kv_sequence_length, num_heads, 3, head_size) for packed kv');J=3}let W=0,ue=!1,he=t.kvNumHeads?R*t.kvNumHeads:C;if(i&&i.dims.length>0){if(i.dims.length!==3&&i.dims.length!==4)throw new Error('Input "value" is expected to have 3 or 4 dimensions');if(s.dims[0]!==i.dims[0])throw new Error('Input "query" and "value" shall have same dim 0 (batch_size)');if(i.dims.length===3){if(u!==i.dims[1])throw new Error('Input "key" and "value" shall have the same dim 1 (kv_sequence_length)');he=i.dims[2]}else{if(u!==i.dims[2])throw new Error('Input "past_key" and "past_value" shall have the same dim 2 (kv_sequence_length)');he=i.dims[1]*i.dims[3],ue=!0}}let be=e.length>4?e[5]:void 0;if(be&&be.dims.length!==1&&be.dims[0]!==p)throw new Error('Input "seqlens" is expected to have 1 dimension and the same dim 0 as batch_size');return{batchSize:p,sequenceLength:h,pastSequenceLength:k,kvSequenceLength:u,totalSequenceLength:-1,maxSequenceLength:-1,inputHiddenSize:0,hiddenSize:C,vHiddenSize:he,headSize:R,vHeadSize:Math.floor(he/t.kvNumHeads),numHeads:t.numHeads,kvNumHeads:t.kvNumHeads,nReps:t.numHeads/t.kvNumHeads,pastPresentShareBuffer:!1,maskType:W,scale:t.scale,broadcastResPosBias:!1,passPastInKv:ue,qkvFormat:J}},gd=jt({perm:[0,2,1,3]}),ra=(e,t,s)=>{let n=t,i=s.kvNumHeads;return t.dims.length===3&&s.kvSequenceLength!==0&&(n=t.reshape([s.batchSize,s.kvSequenceLength,i,s.headSize]),n=e.compute(cr(n,gd.perm),{inputs:[n],outputs:[-1]})[0]),n},na=(e,t)=>{let s=sa(e.inputs,t);if(e.inputs[0].dims.length===5)throw new Error("Packed QKV is not implemented");if(e.inputs[1]?.dims.length===5)throw new Error("Packed KV is not implemented");let n=e.inputs[0],i=e.inputs[1]&&e.inputs[1].dims.length>0?e.inputs[1]:void 0,o=e.inputs[2]&&e.inputs[2].dims.length>0?e.inputs[2]:void 0,a=e.inputs[3]&&e.inputs[3].dims.length!==0?e.inputs[3]:void 0,c=e.inputs[4]&&e.inputs[4].dims.length!==0?e.inputs[4]:void 0,p=e.inputs.length>4?e.inputs[5]:void 0,h=e.inputs.length>5?e.inputs[6]:void 0,C=s.kvNumHeads?s.kvNumHeads:s.numHeads,u=jt({axis:2,numOutputs:3,splitSizes:[s.numHeads*s.headSize,C*s.headSize,C*s.headSize]}),[k,B,R]=!i&&!o?e.compute(Mi([n],u),{inputs:[n],outputs:[-1,-1,-1]}):[n,i,o],z=Un(e,s.batchSize,s.numHeads,s.sequenceLength,s.headSize,k,void 0,0);zn(e,z,ra(e,B,s),ra(e,R,s),void 0,void 0,a,c,void 0,s,p,h)}}),ia,oa,wd,yd,Ic=y(()=>{Ot(),$t(),jr(),qt(),ia=(e,t,s,n,i,o,a,c)=>{let p=Gt(o),h=p===1?"f32":`vec${p}f`,C=p===1?"vec2f":`mat2x${p}f`,u=i*a,k=64;u===1&&(k=256);let B=[i,a,o/p],R=[i,a,2],z=["rank","type","type"],ne=[];ne.push(...Mt(B,R));let J=W=>{let ue=He("x",t.dataType,3,p),he=He("scale",s.dataType,s.dims),be=He("bias",n.dataType,n.dims),Be=Ct("output",1,3,2),Ie=[ue,he,be,Be];return` + var workgroup_shared : array<${C}, ${k}>; + const workgroup_size = ${k}u; + ${W.declareVariables(...Ie)} + ${W.mainStart(k)} + let batch = workgroup_index / uniforms.x_shape[1]; + let channel = workgroup_index % uniforms.x_shape[1]; + let hight = uniforms.x_shape[2]; + // initialize workgroup memory + var sum = ${h}(0); + var squared_sum = ${h}(0); + for (var h = local_idx; h < hight; h += workgroup_size) { + let value = ${h}(${ue.get("batch","channel","h")}); + sum += value; + squared_sum += value * value; + } + workgroup_shared[local_idx] = ${C}(sum, squared_sum); + workgroupBarrier(); + + for (var currSize = workgroup_size >> 1; currSize > 0; currSize = currSize >> 1) { + if (local_idx < currSize) { + workgroup_shared[local_idx] = workgroup_shared[local_idx] + workgroup_shared[local_idx + currSize]; + } + workgroupBarrier(); + } + if (local_idx == 0) { + let sum_final = ${js("workgroup_shared[0][0]",p)} / f32(hight * ${p}); + let squared_sum_final = ${js("workgroup_shared[0][1]",p)} / f32(hight * ${p}); + + let inv_std_dev = inverseSqrt(squared_sum_final - sum_final * sum_final + f32(${c})); + let channel_scale = inv_std_dev * f32(scale[channel]); + let channel_shift = f32(bias[channel]) - sum_final * channel_scale; + output[workgroup_index] = vec2f(channel_scale, channel_shift); + } + }`};return e.compute({name:"InstanceNormComputeChannelScaleShift",shaderCache:{hint:`${p};${c};${k}`,inputDependencies:z},getRunData:()=>({outputs:[{dims:R,dataType:1}],dispatchGroup:{x:u},programUniforms:ne}),getShaderSource:J},{inputs:[t,s,n],outputs:[-1]})[0]},oa=(e,t,s)=>{let n=t[0].dims,i=n,o=2,a=n[0],c=n[1],p=De.sizeFromDimension(n,o),h=Gt(p),C=De.size(i)/h,u=ia(e,t[0],t[1],t[2],a,p,c,s.epsilon),k=[a,c,p/h],B=[a,c],R=["type","none"],z=ne=>{let J=He("x",t[0].dataType,k.length,h),W=He("scale_shift",1,B.length,2),ue=Ct("output",t[0].dataType,k.length,h),he=[J,W,ue];return` + ${ne.registerUniform("output_size","u32").declareVariables(...he)} + ${ne.mainStart()} + ${ne.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let outputIndices = ${ue.offsetToIndices("global_idx")}; + let batch = outputIndices[0]; + let channel = outputIndices[1]; + let scale_shift = ${W.getByIndices("vec2(batch, channel)")}; + let value = ${J.getByOffset("global_idx")} * ${ue.type.value}(scale_shift.x) + ${ue.type.value}(scale_shift.y); + ${ue.setByOffset("global_idx","value")}; + }`};e.compute({name:"InstanceNormalization",shaderCache:{hint:`${h}`,inputDependencies:R},getRunData:()=>({outputs:[{dims:i,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(C/64)},programUniforms:[{type:12,data:C},...Mt(k,B,k)]}),getShaderSource:z},{inputs:[t[0],u]})},wd=(e,t,s)=>{let n=t[0].dims,i=n,o=n[0],a=n[n.length-1],c=De.sizeFromDimension(n,1)/a,p=Gt(a),h=De.size(i)/p,C=[{type:12,data:c},{type:12,data:Math.floor(a/p)}],u=["type","type"],k=!1,B=[0,n.length-1];for(let J=0;Jn[B[W]])),z=ia(e,R,t[1],t[2],o,c,a,s.epsilon),ne=J=>{let W=ds(t[0].dataType),ue=p===1?"vec2f":`mat${p}x2f`,he=Ie=>{let nt=Ie===0?"x":"y",dt=p===1?"f32":`vec${p}f`;switch(p){case 1:return`${W}(${dt}(scale.${nt}))`;case 2:return`vec2<${W}>(${dt}(scale[0].${nt}, scale[1].${nt}))`;case 4:return`vec4<${W}>(${dt}(scale[0].${nt}, scale[1].${nt}, scale[2].${nt}, scale[3].${nt}))`;default:throw new Error(`Not supported compoents ${p}`)}},be=He("input",t[0].dataType,t[0].dims,p),Be=Ct("output",t[0].dataType,i,p);return` + @group(0) @binding(0) var input : array<${be.type.storage}>; + @group(0) @binding(1) var scale_input : array<${ue}>; + @group(0) @binding(2) var output : array<${Be.type.storage}>; + struct Uniforms {H: u32, C : u32}; + @group(0) @binding(3) var uniforms: Uniforms; + + ${J.mainStart()} + let current_image_number = global_idx / (uniforms.C * uniforms.H); + let current_channel_number = global_idx % uniforms.C; + + let scale_offset = current_image_number * uniforms.C + current_channel_number; + let scale = scale_input[scale_offset]; + output[global_idx] = fma(input[global_idx], ${he(0)}, ${he(1)}); + }`};e.compute({name:"InstanceNormalizationNHWC",shaderCache:{hint:`${p}`,inputDependencies:u},getRunData:()=>({outputs:[{dims:i,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(h/64)},programUniforms:C}),getShaderSource:ne},{inputs:[t[0],z]})},yd=(e,t)=>{t.format==="NHWC"?wd(e,e.inputs,t):oa(e,e.inputs,t)}}),Md,bd,vd,Fc=y(()=>{Ot(),$t(),qt(),Md=e=>{if(!e||e.length<2)throw new Error("layerNorm requires at least 2 inputs.")},bd=(e,t,s)=>{let n=t.simplified,i=e[0].dims,o=e[1],a=!n&&e[2],c=i,p=De.normalizeAxis(t.axis,i.length),h=De.sizeToDimension(i,p),C=De.sizeFromDimension(i,p),u=De.size(o.dims),k=a?De.size(a.dims):0;if(u!==C||a&&k!==C)throw new Error(`Size of X.shape()[axis:] == ${C}. + Size of scale and bias (if provided) must match this. + Got scale size of ${u} and bias size of ${k}`);let B=[];for(let be=0;be1,W=s>2,ue=be=>{let Be=ds(e[0].dataType),Ie=[He("x",e[0].dataType,e[0].dims,R),He("scale",o.dataType,o.dims,R)];a&&Ie.push(He("bias",a.dataType,a.dims,R)),Ie.push(Ct("output",e[0].dataType,c,R)),J&&Ie.push(Ct("mean_data_output",1,B)),W&&Ie.push(Ct("inv_std_output",1,B));let nt=[{name:"norm_count",type:"u32"},{name:"norm_size",type:"f32"},{name:"norm_size_vectorized",type:"u32"},{name:"epsilon",type:"f32"}];return` + ${be.registerUniforms(nt).declareVariables(...Ie)} + ${be.mainStart()} + ${be.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.norm_count")} + let offset = global_idx * uniforms.norm_size_vectorized; + var mean_vector = ${Is("f32",R)}; + var mean_square_vector = ${Is("f32",R)}; + + for (var h: u32 = 0u; h < uniforms.norm_size_vectorized; h++) { + let value = ${ks(Be,R,"x[h + offset]")}; + mean_vector += value; + mean_square_vector += value * value; + } + let mean = ${js("mean_vector",R)} / uniforms.norm_size; + let inv_std_dev = inverseSqrt(${js("mean_square_vector",R)} / uniforms.norm_size ${n?"":"- mean * mean"} + uniforms.epsilon); + + for (var j: u32 = 0; j < uniforms.norm_size_vectorized; j++) { + let f32input = ${ks(Be,R,"x[j + offset]")}; + let f32scale = ${ks(Be,R,"scale[j]")}; + output[j + offset] = ${Ie[0].type.value}((f32input ${n?"":"- mean"}) * inv_std_dev * f32scale + ${a?`+ ${ks(Be,R,"bias[j]")}`:""} + ); + } + + ${J?"mean_data_output[global_idx] = mean":""}; + ${W?"inv_std_output[global_idx] = inv_std_dev":""}; + }`},he=[{dims:c,dataType:e[0].dataType}];return J&&he.push({dims:B,dataType:1}),W&&he.push({dims:B,dataType:1}),{name:"LayerNormalization",shaderCache:{hint:`${R};${s};${n}`,inputDependencies:z},getRunData:()=>({outputs:he,dispatchGroup:{x:Math.ceil(h/64)},programUniforms:ne}),getShaderSource:ue}},vd=(e,t)=>{Md(e.inputs),e.compute(bd(e.inputs,t,e.outputCount))}}),xd,Td,Pd=y(()=>{$t(),ko(),Fo(),xd=e=>{if(!e||e.length!==2)throw new Error("MatMul requires 2 inputs.");if(e[0].dims[e[0].dims.length-1]!==e[1].dims[e[1].dims.length-2])throw new Error("shared dimension does not match.")},Td=e=>{xd(e.inputs);let t=Js.calcShape(e.inputs[0].dims,e.inputs[1].dims,!0);if(!t)throw new Error("Can't use matmul on the given tensors");let s=t[t.length-1],n=e.inputs[0].dims[e.inputs[0].dims.length-1];if(s<8&&n<8)e.compute(Co(e.inputs,{activation:""},t));else{let i=t[t.length-2],o=De.size(e.inputs[0].dims.slice(0,-2)),a=De.size(e.inputs[1].dims.slice(0,-2));if(o!==1&&i===1&&a===1){let c=e.inputs[0].reshape([1,o,n]),p=e.inputs[1].reshape([1,n,s]),h=[1,o,s],C=[c,p];e.compute(ui(C,{activation:""},t,h),{inputs:C})}else e.compute(ui(e.inputs,{activation:""},t))}}}),Ed,Cd,aa,kd,Sd,fs=y(()=>{Ot(),$t(),is(),qt(),Ed=(e,t)=>{if(e.length<3||e.length>4)throw new Error("MatMulNBits requires 3 or 4 inputs");let s=e[0],n=s.dims.length;if(s.dims[n-1]!==t.k)throw new Error("The last dim of input shape does not match the k value");let i=Math.floor((t.k+t.blockSize-1)/t.blockSize),o=t.blockSize/8*t.bits,a=e[1];if(!De.areEqual(a.dims,[t.n,i,o]))throw new Error("The second inputs must be 3D tensor with shape N X nBlocksPerCol X blobSize");let c=e[2].dims;if(De.size(c)!==t.n*i)throw new Error("scales input size error.");if(e.length===4){let p=e[3].dims,h=t.bits>4?t.n*i:t.n*Math.floor((i+1)/2);if(De.size(p)!==h)throw new Error("zeroPoints input size error.")}},Cd=(e,t)=>{let s=e[0].dims,n=s.length,i=s[n-2],o=t.k,a=t.n,c=s.slice(0,n-2),p=De.size(c),h=e[1].dims[2]/4,C=e[0].dataType,u=Gt(t.k),k=Gt(h),B=Gt(a),R=c.concat([i,a]),z=i>1&&a/B%2===0?2:1,ne=De.size(R)/B/z,J=64,W=[],ue=[p,i,o/u],he=De.convertShape(e[1].dims).slice();he.splice(-1,1,h/k),W.push(...Mt(ue)),W.push(...Mt(he)),W.push(...Mt(e[2].dims)),e.length===4&&W.push(...Mt(De.convertShape(e[3].dims)));let be=[p,i,a/B];W.push(...Mt(be));let Be=Ie=>{let nt=ue.length,dt=He("a",e[0].dataType,nt,u),Et=He("b",12,he.length,k),zt=He("scales",e[2].dataType,e[2].dims.length),It=[dt,Et,zt],ht=e.length===4?He("zero_points",12,e[3].dims.length):void 0;ht&&It.push(ht);let Jt=be.length,Vt=Ct("output",e[0].dataType,Jt,B),St=ds(e[0].dataType),ts=(()=>{switch(u){case 1:return`array<${St}, 8>`;case 2:return`mat4x2<${St}>`;case 4:return`mat2x4<${St}>`;default:throw new Error(`${u}-component is not supported.`)}})(),Xt=()=>{let ut=` + // reuse a data + var input_offset = ${dt.indicesToOffset(`${dt.type.indices}(batch, row, word_offset)`)}; + var a_data: ${ts}; + for (var j: u32 = 0; j < ${8/u}; j++) { + a_data[j] = ${dt.getByOffset("input_offset")}; + input_offset++; + } + `;for(let xt=0;xt> 4) & b_mask); + b_quantized_values = ${ts}(${Array.from({length:4},(hs,vs)=>`${St}(b_value_lower[${vs}]), ${St}(b_value_upper[${vs}])`).join(", ")}); + b_dequantized_values = ${u===1?`${ts}(${Array.from({length:8},(hs,vs)=>`(b_quantized_values[${vs}] - ${ht?`zero_point${xt}`:"zero_point"}) * scale${xt}`).join(", ")});`:`(b_quantized_values - ${ts}(${Array(8).fill(`${ht?`zero_point${xt}`:"zero_point"}`).join(",")})) * scale${xt};`}; + workgroup_shared[local_id.x * ${z} + ${Math.floor(xt/B)}]${B>1?`[${xt%B}]`:""} += ${Array.from({length:8/u},(hs,vs)=>`${u===1?`a_data[${vs}] * b_dequantized_values[${vs}]`:`dot(a_data[${vs}], b_dequantized_values[${vs}])`}`).join(" + ")}; + `;return ut},Ut=()=>{let ut=` + var col_index = col * ${B}; + ${ht?` + let zero_point_bytes_per_col = (nBlocksPerCol + 1) / 2; + var zero_point_byte_count: u32; + var zero_point_word_index: u32; + var zero_point_byte_offset: u32; + let zero_point_nibble_offset: u32 = block & 0x1u; + var zero_point_bits_offset: u32; + var zero_point_word: u32;`:` + // The default zero point is 8 for unsigned 4-bit quantization. + let zero_point = ${St}(8);`} + `;for(let xt=0;xt> 0x1u); + zero_point_word_index = zero_point_byte_count >> 0x2u; + zero_point_byte_offset = zero_point_byte_count & 0x3u; + zero_point_bits_offset = (zero_point_byte_offset << 3) + (zero_point_nibble_offset << 2); + zero_point_word = ${ht.getByOffset("zero_point_word_index")} >> zero_point_bits_offset; + let zero_point${xt} = ${St}((zero_point_word) & 0xFu);`:""} + col_index += 1;`;return ut},$s=()=>{let ut=`col_index = col * ${B};`;for(let xt=0;xt; + var b_value_upper: vec4; + var b_quantized_values: ${ts}; + var b_dequantized_values: ${ts};`,ut};return` + var workgroup_shared: array<${Vt.type.value}, ${z*J}>; + ${Ie.declareVariables(...It,Vt)} + ${Ie.mainStart([J,1,1])} + let output_indices = ${Vt.offsetToIndices(`(global_idx / ${J}) * ${z}`)}; + let col = output_indices[2]; + let row = output_indices[1]; + let batch = output_indices[0]; + let nBlocksPerCol = uniforms.b_shape[1]; + + for (var block = local_id.x; block < nBlocksPerCol; block += ${J}) { + //process one block + var word_offset: u32 = block * ${t.blockSize/u}; + ${Ut()} + for (var word: u32 = 0; word < ${h}; word += ${k}) { + ${$s()} + for (var i: u32 = 0; i < ${k}; i++) { + ${Xt()} + word_offset += ${8/u}; + } + } + } + workgroupBarrier(); + + if (local_id.x < ${z}) { + var output_value: ${Vt.type.value} = ${Vt.type.value}(0); + var workgroup_shared_offset: u32 = local_id.x; + for (var b: u32 = 0u; b < ${J}u; b++) { + output_value += workgroup_shared[workgroup_shared_offset]; + workgroup_shared_offset += ${z}; + } + ${Vt.setByIndices(`${Vt.type.indices}(batch, row, col + local_id.x)`,"output_value")}; + } + }`};return{name:"MatMulNBits",shaderCache:{hint:`${t.blockSize};${t.bits};${u};${k};${B};${z};${J}`,inputDependencies:Array(e.length).fill("rank")},getRunData:()=>({outputs:[{dims:R,dataType:C}],dispatchGroup:{x:ne},programUniforms:W}),getShaderSource:Be}},aa=(e,t)=>{let s=e[0].dims,n=s.length,i=s[n-2],o=t.k,a=t.n,c=s.slice(0,n-2),p=De.size(c),h=e[1].dims[2]/4,C=e[0].dataType,u=Gt(t.k),k=Gt(h),B=c.concat([i,a]),R=128,z=a%8===0?8:a%4===0?4:1,ne=R/z,J=ne*k*8,W=J/u,ue=J/t.blockSize,he=De.size(B)/z,be=[],Be=[p,i,o/u],Ie=De.convertShape(e[1].dims).slice();Ie.splice(-1,1,h/k),be.push(...Mt(Be)),be.push(...Mt(Ie)),be.push(...Mt(e[2].dims)),e.length===4&&be.push(...Mt(De.convertShape(e[3].dims)));let nt=[p,i,a];be.push(...Mt(nt));let dt=Et=>{let zt=Be.length,It=He("a",e[0].dataType,zt,u),ht=He("b",12,Ie.length,k),Jt=He("scales",e[2].dataType,e[2].dims.length),Vt=[It,ht,Jt],St=e.length===4?He("zero_points",12,e[3].dims.length):void 0;St&&Vt.push(St);let ts=nt.length,Xt=Ct("output",e[0].dataType,ts),Ut=ds(e[0].dataType),$s=()=>{switch(u){case 1:return` + let a_data0 = vec4<${Ut}>(sub_a[word_offset], sub_a[word_offset + 1], sub_a[word_offset + 2], sub_a[word_offset + 3]); + let a_data1 = vec4<${Ut}>(sub_a[word_offset + 4], sub_a[word_offset + 5], sub_a[word_offset + 6], sub_a[word_offset + 7]);`;case 2:return` + let a_data0 = vec4<${Ut}>(sub_a[word_offset], sub_a[word_offset + 1]); + let a_data1 = vec4<${Ut}>(sub_a[word_offset + 2], sub_a[word_offset + 3]);`;case 4:return` + let a_data0 = sub_a[word_offset]; + let a_data1 = sub_a[word_offset + 1];`;default:throw new Error(`${u}-component is not supported.`)}};return` + var sub_a: array<${It.type.value}, ${W}>; + var inter_results: array, ${z}>; + ${Et.declareVariables(...Vt,Xt)} + ${Et.mainStart([ne,z,1])} + let output_indices = ${Xt.offsetToIndices(`workgroup_index * ${z}`)}; + let col = output_indices[2]; + let row = output_indices[1]; + let batch = output_indices[0]; + let n_blocks_per_col = uniforms.b_shape[1]; + let num_tiles = (n_blocks_per_col - 1) / ${ue} + 1; + + // Loop over shared dimension. + for (var tile: u32 = 0; tile < num_tiles; tile += 1) { + let a_col_start = tile * ${W}; + // load one tile A data into shared memory. + for (var a_offset = local_idx; a_offset < ${W}; a_offset += ${R}) + { + let a_col = a_col_start + a_offset; + if (a_col < uniforms.a_shape[2]) + { + sub_a[a_offset] = ${It.getByIndices(`${It.type.indices}(batch, row, a_col)`)}; + } else { + sub_a[a_offset] = ${It.type.value}(0); + } + } + workgroupBarrier(); + + // each thread process one block + let b_row = col + local_id.y; + let block = tile * ${ue} + local_id.x; + ${St?` + let zero_point_bytes_per_col = (n_blocks_per_col + 1) / 2; + let zero_point_byte_count = b_row * zero_point_bytes_per_col + (block >> 0x1u); + let zero_point_word_index = zero_point_byte_count >> 0x2u; + let zero_point_byte_offset = zero_point_byte_count & 0x3u; + let zero_point_nibble_offset: u32 = block & 0x1u; + let zero_point_bits_offset = (zero_point_byte_offset << 3) + (zero_point_nibble_offset << 2); + let zero_point_word = ${St.getByOffset("zero_point_word_index")} >> zero_point_bits_offset; + let zero_point = ${Ut}((zero_point_word) & 0xFu);`:` + // The default zero point is 8 for unsigned 4-bit quantization. + let zero_point = ${Ut}(8);`} + let scale = ${Jt.getByOffset("b_row * n_blocks_per_col + block")}; + let b_data = ${ht.getByIndices(`${ht.type.indices}(b_row, block, 0)`)}; + var word_offset = local_id.x * ${t.blockSize/u}; + for (var i: u32 = 0; i < ${k}; i++) { + ${$s()} + let b_value = ${k===1?"b_data":"b_data[i]"}; + let b_value_lower = unpack4xU8(b_value & 0x0F0F0F0Fu); + let b_value_upper = unpack4xU8((b_value >> 4) & 0x0F0F0F0Fu); + let b_quantized_values = mat2x4<${Ut}>(${Array.from({length:4},(ut,xt)=>`${Ut}(b_value_lower[${xt}]), ${Ut}(b_value_upper[${xt}])`).join(", ")}); + let b_dequantized_values = (b_quantized_values - mat2x4<${Ut}>(${Array(8).fill("zero_point").join(",")})) * scale; + inter_results[local_id.y][local_id.x] += ${Array.from({length:2},(ut,xt)=>`${`dot(a_data${xt}, b_dequantized_values[${xt}])`}`).join(" + ")}; + word_offset += ${8/u}; + } + workgroupBarrier(); + } + + if (local_idx < ${z}) { + var output_value: ${Xt.type.value} = ${Xt.type.value}(0); + for (var b = 0u; b < ${ne}; b++) { + output_value += inter_results[local_idx][b]; + } + if (col + local_idx < uniforms.output_shape[2]) + { + ${Xt.setByIndices(`${Xt.type.indices}(batch, row, col + local_idx)`,"output_value")} + } + } + }`};return{name:"BlockwiseMatMulNBits32",shaderCache:{hint:`${t.blockSize};${u};${k};${ne};${z}`,inputDependencies:Array(e.length).fill("rank")},getRunData:()=>({outputs:[{dims:B,dataType:C}],dispatchGroup:{x:he},programUniforms:be}),getShaderSource:dt}},kd=(e,t)=>{Ed(e.inputs,t),t.blockSize===32&&e.adapterInfo.isVendor("intel")&&e.adapterInfo.isArchitecture("gen-12lp")?e.compute(aa(e.inputs,t)):e.compute(Cd(e.inputs,t))},Sd=e=>jt(e)}),Oc,Dc,Lc,la,$d,Ad,Id,Fd,ua,Od=y(()=>{Ot(),$t(),qt(),Oc=e=>{if(!e||e.length<1)throw new Error("Too few inputs");if(e[0].dataType!==1&&e[0].dataType!==10)throw new Error("Input type must be float or float16.");if(e.length>=2){let t=e[0].dims.length*2===e[1].dims[0];if(e.length===4&&(t=e[3].dims[0]*2===e[1].dims[0]),!t)throw new Error("The pads should be a 1D tensor of shape [2 * input_rank] or [2 * num_axes].")}},Dc=(e,t,s)=>{let n="";for(let i=t-1;i>=0;--i)n+=` + k = i32(${e.indicesGet("indices",i)}) - ${Tt("uniforms.pads",i,s)}; + if (k < 0) { + break; + } + if (k >= i32(${Tt("uniforms.x_shape",i,t)})) { + break; + } + offset += k * i32(${Tt("uniforms.x_strides",i,t)}); + `;return` + value = ${e.type.value}(uniforms.constant_value); + for (var i = 0; i < 1; i++) { + var offset = 0; + var k = 0; + ${n} + value = x[offset]; + } + `},Lc=(e,t,s)=>{let n="";for(let i=t-1;i>=0;--i)n+=` + k = i32(${e.indicesGet("indices",i)}) - ${Tt("uniforms.pads",i,s)}; + if (k < 0) { + k = -k; + } + { + let _2n_1 = 2 * (i32(${Tt("uniforms.x_shape",i,t)}) - 1); + k = k % _2n_1; + if(k >= i32(${Tt("uniforms.x_shape",i,t)})) { + k = _2n_1 - k; + } + } + offset += k * i32(${Tt("uniforms.x_strides",i,t)}); + `;return` + var offset = 0; + var k = 0; + ${n} + value = x[offset]; + `},la=(e,t,s)=>{let n="";for(let i=t-1;i>=0;--i)n+=` + k = i32(${e.indicesGet("indices",i)}) - ${Tt("uniforms.pads",i,s)}; + if (k < 0) { + k = 0; + } + if (k >= i32(${Tt("uniforms.x_shape",i,t)})) { + k = i32(${Tt("uniforms.x_shape",i,t)}) - 1; + } + offset += k * i32(${Tt("uniforms.x_strides",i,t)}); + `;return` + var offset = 0; + var k = 0; + ${n} + value = x[offset]; + `},$d=(e,t,s)=>{let n="";for(let i=t-1;i>=0;--i)n+=` + k = i32(${e.indicesGet("indices",i)}) - ${Tt("uniforms.pads",i,s)}; + if (k < 0) { + k += i32(${Tt("uniforms.x_shape",i,t)}]); + } + if (k >= i32(${Tt("uniforms.x_shape",i,t)})) { + k -= i32(${Tt("uniforms.x_shape",i,t)}); + } + offset += k * i32(${Tt("uniforms.x_strides",i,t)}); + `;return` + var offset = 0; + var k = 0; + ${n} + value = x[offset]; + `},Ad=(e,t,s)=>{switch(s.mode){case 0:return Dc(e,t,s.pads.length);case 1:return Lc(e,t,s.pads.length);case 2:return la(e,t,s.pads.length);case 3:return $d(e,t,s.pads.length);default:throw new Error("Invalid mode")}},Id=(e,t)=>{let s=De.padShape(e[0].dims.slice(),t.pads),n=e[0].dims,i=De.size(s),o=[{type:12,data:i},{type:6,data:t.pads}],a=e.length>=3&&e[2].data;t.mode===0&&o.push({type:a?e[2].dataType:1,data:t.value}),o.push(...Mt(e[0].dims,s));let c=["rank"],p=h=>{let C=Ct("output",e[0].dataType,s.length),u=He("x",e[0].dataType,n.length),k=u.type.value,B=Ad(C,n.length,t),R=[{name:"output_size",type:"u32"},{name:"pads",type:"i32",length:t.pads.length}];return t.mode===0&&R.push({name:"constant_value",type:a?k:"f32"}),` + ${h.registerUniforms(R).declareVariables(u,C)} + ${h.mainStart()} + ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + + let indices = ${C.offsetToIndices("global_idx")}; + + var value = ${k}(0); + ${B} + output[global_idx] = value; + }`};return{name:"Pad",shaderCache:{hint:`${t.mode}${a}`,inputDependencies:c},getRunData:()=>({outputs:[{dims:s,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(De.size(s)/64)},programUniforms:o}),getShaderSource:p}},Fd=(e,t)=>{if(e.length>1){let s=e[1].getBigInt64Array(),n=e.length>=3&&e[2].data?e[2].dataType===10?e[2].getUint16Array()[0]:e[2].getFloat32Array()[0]:0,i=e[0].dims.length,o=new Int32Array(2*i).fill(0);if(e.length>=4){let c=e[3].getBigInt64Array();for(let p=0;po[Number(p)]=Number(c));let a=[];return o.forEach(c=>a.push(c)),{mode:t.mode,value:n,pads:a}}else return t},ua=(e,t)=>{Oc(e.inputs);let s=Fd(e.inputs,t);e.compute(Id(e.inputs,s),{inputs:[0]})}}),bi,da,ca,vi,Dd,zc,Ld,pa,ha,zd,Bd,ma,Rd,Nd,fa,jd,Vd,Ud,Bc,Rc=y(()=>{We(),Ot(),$t(),qt(),bi=e=>{if(F.webgpu.validateInputContent&&(!e||e.length!==1))throw new Error("Pool ops requires 1 input.")},da=(e,t,s)=>{let n=t.format==="NHWC",i=e.dims.slice();n&&i.splice(1,0,i.pop());let o=Object.hasOwnProperty.call(t,"dilations"),a=t.kernelShape.slice(),c=t.strides.slice(),p=o?t.dilations.slice():[],h=t.pads.slice();Xs.adjustPoolAttributes(s,i,a,c,p,h);let C=Xs.computePoolOutputShape(s,i,c,p,a,h,t.autoPad),u=Object.assign({},t);o?Object.assign(u,{kernelShape:a,strides:c,pads:h,dilations:p,cacheKey:t.cacheKey}):Object.assign(u,{kernelShape:a,strides:c,pads:h,cacheKey:t.cacheKey});let k=C.slice();return k.push(k.splice(1,1)[0]),[u,n?k:C]},ca=(e,t)=>{let s=t.format==="NHWC",n=De.size(e),i=De.size(t.kernelShape),o=[{type:12,data:n},{type:12,data:i}],a=[{name:"outputSize",type:"u32"},{name:"kernelSize",type:"u32"}];if(t.kernelShape.length<=2){let c=t.kernelShape[t.kernelShape.length-1],p=t.strides[t.strides.length-1],h=t.pads[t.pads.length/2-1],C=t.pads[t.pads.length-1],u=!!(h+C);o.push({type:12,data:c},{type:12,data:p},{type:12,data:h},{type:12,data:C}),a.push({name:"kw",type:"u32"},{name:"sw",type:"u32"},{name:"pwStart",type:"u32"},{name:"pwEnd",type:"u32"});let k=!1;if(t.kernelShape.length===2){let B=t.kernelShape[t.kernelShape.length-2],R=t.strides[t.strides.length-2],z=t.pads[t.pads.length/2-2],ne=t.pads[t.pads.length-2];k=!!(z+ne),o.push({type:12,data:B},{type:12,data:R},{type:12,data:z},{type:12,data:ne}),a.push({name:"kh",type:"u32"},{name:"sh",type:"u32"},{name:"phStart",type:"u32"},{name:"phEnd",type:"u32"})}return[o,a,!0,u,k]}else{if(s)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let c=De.computeStrides(t.kernelShape);o.push({type:12,data:c},{type:12,data:t.pads},{type:12,data:t.strides}),a.push({name:"kernelStrides",type:"u32",length:c.length},{name:"pads",type:"u32",length:t.pads.length},{name:"strides",type:"u32",length:t.strides.length});let p=t.pads.reduce((h,C)=>h+C);return[o,a,!!p,!1,!1]}},vi=(e,t,s,n,i,o,a,c,p,h,C,u)=>{let k=i.format==="NHWC",B=t.type.value,R=Ct("output",t.type.tensor,n);if(i.kernelShape.length<=2){let z="",ne="",J="",W=s-(k?2:1);if(C?z=` + for (var i: u32 = 0u; i < uniforms.kw; i++) { + xIndices[${W}] = indices[${W}] * uniforms.sw - uniforms.pwStart + i; + if (xIndices[${W}] < 0 || xIndices[${W}] + >= uniforms.x_shape[${W}]) { + pad++; + continue; + } + let x_val = x[${t.indicesToOffset("xIndices")}]; + ${o} + }`:z=` + for (var i: u32 = 0u; i < uniforms.kw; i++) { + xIndices[${W}] = indices[${W}] * uniforms.sw - uniforms.pwStart + i; + let x_val = x[${t.indicesToOffset("xIndices")}]; + ${o} + }`,i.kernelShape.length===2){let ue=s-(k?3:2);u?ne=` + for (var j: u32 = 0u; j < uniforms.kh; j++) { + xIndices[${ue}] = indices[${ue}] * uniforms.sh - uniforms.phStart + j; + if (xIndices[${ue}] < 0 || xIndices[${ue}] >= uniforms.x_shape[${ue}]) { + pad += i32(uniforms.kw); + continue; + } + `:ne=` + for (var j: u32 = 0u; j < uniforms.kh; j++) { + xIndices[${ue}] = indices[${ue}] * uniforms.sh - uniforms.phStart + j; + `,J=` + } + `}return` + ${e.registerUniforms(p).declareVariables(t,R)} + + ${e.mainStart()} + ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + + let indices = ${R.offsetToIndices("global_idx")}; + var xIndices = ${R.offsetToIndices("global_idx")}; + + var value = ${B}(${c}); + var pad = 0; + ${ne} + ${z} + ${J} + ${a} + + output[global_idx] = value; + }`}else{if(k)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let z=i.kernelShape.length,ne=i.pads.length,J="";return h?J=` + if (xIndices[j] >= uniforms.x_shape[j]) { + pad++; + isPad = true; + break; + } + } + if (!isPad) { + let x_val = x[${t.indicesToOffset("xIndices")}]; + ${o} + }`:J=` + } + let x_val = x[${t.indicesToOffset("xIndices")}]; + ${o} + `,` + ${e.registerUniforms(p).declareVariables(t,R)} + + ${e.mainStart()} + ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + let indices = ${R.offsetToIndices("global_idx")}; + var xIndices = ${R.offsetToIndices("global_idx")}; + + var offsets: array; + + var value = ${B}(${c}); + var pad = 0; + var isPad = false; + + for (var i: u32 = 0u; i < uniforms.kernelSize; i++) { + var offset = i; + for (var j = 0u; j < ${z-1}u; j++) { + offsets[j] = offset / ${Tt("uniforms.kernelStrides","j",z)}; + offset -= offsets[j] * ${Tt("uniforms.kernelStrides","j",z)}; + } + offsets[${z-1}] = offset; + + isPad = false; + for (var j = ${s-z}u; j < ${s}u; j++) { + xIndices[j] = indices[j] * ${Tt("uniforms.strides",`j - ${s-z}u`,z)} + + offsets[j - ${s-z}u] - ${Tt("uniforms.pads","j - 2u",ne)}; + ${J} + } + ${a} + + output[global_idx] = value; + }`}},Dd=e=>`${e.format};${e.ceilMode};${e.autoPad};${e.kernelShape.length}`,zc=e=>`${Dd(e)};${e.countIncludePad}`,Ld=e=>`${Dd(e)};${e.storageOrder};${e.dilations}`,pa=e=>({format:e.format,autoPad:["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][e.auto_pad],ceilMode:e.ceil_mode,kernelShape:e.kernel_shape,strides:e.strides,pads:e.pads}),ha=(e,t,s,n)=>{let[i,o]=da(t,n,s),a=He("x",t.dataType,t.dims.length),c=a.type.value,p="value += x_val;",h="";i.countIncludePad?h+=`value /= ${c}(uniforms.kernelSize);`:h+=`value /= ${c}(i32(uniforms.kernelSize) - pad);`;let[C,u,k,B,R]=ca(o,i);C.push(...Mt(t.dims,o));let z=["rank"];return{name:e,shaderCache:{hint:`${n.cacheKey};${k};${B};${R}`,inputDependencies:z},getRunData:()=>({outputs:[{dims:o,dataType:t.dataType}],dispatchGroup:{x:Math.ceil(De.size(o)/64)},programUniforms:C}),getShaderSource:ne=>vi(ne,a,t.dims.length,o.length,i,p,h,0,u,k,B,R)}},zd=e=>{let t=e.count_include_pad!==0,s=pa(e);if(s.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for AveragePool");let n={countIncludePad:t,...s,cacheKey:""};return{...n,cacheKey:zc(n)}},Bd=(e,t)=>{bi(e.inputs),e.compute(ha("AveragePool",e.inputs[0],!1,t))},ma={autoPad:"",ceilMode:0,countIncludePad:!1,kernelShape:[],strides:[],pads:[],storageOrder:0,dilations:[]},Rd=e=>{let t=e.format;return{format:t,...ma,cacheKey:t}},Nd=(e,t)=>{bi(e.inputs),e.compute(ha("GlobalAveragePool",e.inputs[0],!0,t))},fa=(e,t,s,n)=>{let[i,o]=da(t,n,s),a=` + value = max(x_val, value); + `,c="",p=He("x",t.dataType,t.dims.length),h=["rank"],[C,u,k,B,R]=ca(o,i);return C.push(...Mt(t.dims,o)),{name:e,shaderCache:{hint:`${n.cacheKey};${k};${B};${R}`,inputDependencies:h},getRunData:()=>({outputs:[{dims:o,dataType:t.dataType}],dispatchGroup:{x:Math.ceil(De.size(o)/64)},programUniforms:C}),getShaderSource:z=>vi(z,p,t.dims.length,o.length,i,a,c,t.dataType===10?-65504:-1e5,u,k,B,R)}},jd=(e,t)=>{bi(e.inputs),e.compute(fa("MaxPool",e.inputs[0],!1,t))},Vd=e=>{let t=e.storage_order,s=e.dilations,n=pa(e);if(t!==0)throw new Error("column major storage order is not yet supported for MaxPool");if(n.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for MaxPool");let i={storageOrder:t,dilations:s,...n,cacheKey:""};return{...i,cacheKey:Ld(i)}},Ud=e=>{let t=e.format;return{format:t,...ma,cacheKey:t}},Bc=(e,t)=>{bi(e.inputs),e.compute(fa("GlobalMaxPool",e.inputs[0],!0,t))}}),Wd,Gd,Kd,Hd,Nc=y(()=>{Ot(),$t(),is(),qt(),Wd=(e,t)=>{if(e.length<2||e.length>3)throw new Error("DequantizeLinear requires 2 or 3 inputs.");if(e.length===3&&e[1].dims===e[2].dims)throw new Error("x-scale and x-zero-point must have the same shape.");if(e.length===3&&e[0].dataType!==e[2].dataType)throw new Error("x and x-zero-point must have the same data type.");if(e[0].dataType===6&&e.length>2)throw new Error("In the case of dequantizing int32 there is no zero point.");if(e[1].dims.length!==0&&e[1].dims.length!==1&&e[1].dims.length!==e[0].dims.length)throw new Error("scale input must be a scalar, a 1D tensor, or have the same rank as the input tensor.");if(e.length>2){if(e[0].dataType!==e[2].dataType)throw new Error("x and x-zero-point must have the same data type.");if(e[1].dims.length!==e[2].dims.length)throw new Error("scale and zero-point inputs must have the same rank.");if(!e[1].dims.map((s,n)=>s===e[2].dims[n]).reduce((s,n)=>s&&n,!0))throw new Error("scale and zero-point inputs must have the same shape.")}if(t.blockSize>0){if(e[1].dims.length===0||e[1].dims.length===1&&e[1].dims[0]===1)throw new Error("blockSize must be set only for block quantization.");if(!e[1].dims.map((i,o)=>o===t.axis||i===e[0].dims[o]).reduce((i,o)=>i&&o,!0))throw new Error("For block qunatization, scale input shape to match the input shape except for the axis");if(e[1].dims.length!==e[0].dims.length)throw new Error("For block qunatization the scale input rank must be the same as the x rank.");let s=e[0].dims[t.axis],n=e[1].dims[t.axis];if(t.blockSizeMath.ceil(s/(n-1)-1))throw new Error("blockSize must be with in the range [ceil(dI / Si), ceil(dI / (Si - 1) - 1)].")}},Gd=(e,t)=>{let s=De.normalizeAxis(t.axis,e[0].dims.length),n=e[0].dataType,i=n===3,o=e[0].dims,a=e[1].dataType,c=De.size(o),p=n===3||n===2,h=p?[Math.ceil(De.size(e[0].dims)/4)]:e[0].dims,C=e[1].dims,u=e.length>2?e[2]:void 0,k=u?p?[Math.ceil(De.size(u.dims)/4)]:u.dims:void 0,B=C.length===0||C.length===1&&C[0]===1,R=B===!1&&C.length===1,z=Gt(c),ne=B&&(!p||z===4),J=ne?z:1,W=ne&&!p?z:1,ue=He("input",p?12:n,h.length,W),he=He("scale",a,C.length),be=u?He("zero_point",p?12:n,k.length):void 0,Be=Ct("output",a,o.length,J),Ie=[ue,he];be&&Ie.push(be);let nt=[h,C];u&&nt.push(k);let dt=[{type:12,data:c/J},{type:12,data:s},{type:12,data:t.blockSize},...Mt(...nt,o)],Et=zt=>{let It=[{name:"output_size",type:"u32"},{name:"axis",type:"u32"},{name:"block_size",type:"u32"}];return` + ${zt.registerUniforms(It).declareVariables(...Ie,Be)} + ${zt.mainStart()} + ${zt.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let output_indices = ${Be.offsetToIndices("global_idx")}; + + // Set input x + ${p?` + let input = ${ue.getByOffset("global_idx / 4")}; + let x_vec = ${i?"unpack4xI8(input)":"unpack4xU8(input)"}; + let x_value = ${J===1?"x_vec[global_idx % 4]":"x_vec"};`:`let x_value = ${ue.getByOffset("global_idx")};`}; + + // Set scale input + ${B?`let scale_value= ${he.getByOffset("0")}`:R?` + let scale_index = ${Be.indicesGet("output_indices","uniforms.axis")}; + let scale_value= ${he.getByOffset("scale_index")};`:` + var scale_indices: ${he.type.indices} = output_indices; + let index = ${he.indicesGet("scale_indices","uniforms.axis")} / uniforms.block_size; + ${he.indicesSet("scale_indices","uniforms.axis","index")}; + let scale_value= ${he.getByIndices("scale_indices")};`}; + + // Set zero-point input + ${be?B?p?` + let zero_point_input = ${be.getByOffset("0")}; + let zero_point_vec = ${i?"unpack4xI8(zero_point_input)":"unpack4xU8(zero_point_input)"}; + let zero_point_value= zero_point_vec[0]`:`let zero_point_value = ${be.getByOffset("0")}`:R?p?` + let zero_point_index = ${Be.indicesGet("output_indices","uniforms.axis")}; + let zero_point_input = ${be.getByOffset("zero_point_index / 4")}; + let zero_point_vec = ${i?"unpack4xI8(zero_point_input)":"unpack4xU8(zero_point_input)"}; + let zero_point_value = zero_point_vec[zero_point_index % 4]`:` + let zero_point_index = ${Be.indicesGet("output_indices","uniforms.axis")}; + let zero_point_value = ${be.getByOffset("zero_point_index")};`:p?` + let zero_point_offset = ${he.indicesToOffset("scale_indices")}; + let zero_point_input = ${be.getByOffset("zero_point_offset / 4")}; + let zero_point_vec = ${i?"unpack4xI8(zero_point_input)":"unpack4xU8(zero_point_input)"}; + let zero_point_value = zero_point_vec[zero_point_offset % 4];`:`let zero_point_value = ${be.getByIndices("scale_indices")};`:`let zero_point_value = ${p?i?"i32":"u32":ue.type.value}(0);`}; + // Compute and write output + ${Be.setByOffset("global_idx",`${Be.type.value}(x_value - zero_point_value) * scale_value`)}; + }`};return{name:"DequantizeLinear",shaderCache:{hint:t.cacheKey,inputDependencies:be?["rank","rank","rank"]:["rank","rank"]},getShaderSource:Et,getRunData:()=>({outputs:[{dims:o,dataType:a}],dispatchGroup:{x:Math.ceil(c/J/64),y:1,z:1},programUniforms:dt})}},Kd=(e,t)=>{Wd(e.inputs,t),e.compute(Gd(e.inputs,t))},Hd=e=>jt({axis:e.axis,blockSize:e.blockSize})}),jc,Vc,Uc,Rp=y(()=>{We(),Ot(),qt(),jc=(e,t,s)=>{let n=e===t,i=et&&s>0;if(n||i||o)throw new Error("Range these inputs' contents are invalid.")},Vc=(e,t,s,n)=>{let i=Math.abs(Math.ceil((t-e)/s)),o=[i],a=i,c=[{type:12,data:a},{type:n,data:e},{type:n,data:s},...Mt(o)],p=h=>{let C=Ct("output",n,o.length),u=C.type.value,k=[{name:"outputSize",type:"u32"},{name:"start",type:u},{name:"delta",type:u}];return` + ${h.registerUniforms(k).declareVariables(C)} + ${h.mainStart()} + ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + output[global_idx] = uniforms.start + ${u}(global_idx) * uniforms.delta; + }`};return{name:"Range",shaderCache:{hint:`${n}`},getShaderSource:p,getRunData:()=>({outputs:[{dims:o,dataType:n}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:c})}},Uc=e=>{let t=0,s=0,n=0;e.inputs[0].dataType===6?(t=e.inputs[0].getInt32Array()[0],s=e.inputs[1].getInt32Array()[0],n=e.inputs[2].getInt32Array()[0]):e.inputs[0].dataType===1&&(t=e.inputs[0].getFloat32Array()[0],s=e.inputs[1].getFloat32Array()[0],n=e.inputs[2].getFloat32Array()[0]),F.webgpu.validateInputContent&&jc(t,s,n),e.compute(Vc(t,s,n,e.inputs[0].dataType),{inputs:[]})}}),Wc,Gc,Kc,Hc,Np=y(()=>{Ot(),$t(),is(),qt(),Wc=(e,t,s,n)=>{if(e!=="none"&&n!=="i32"&&n!=="u32"&&n!=="f32")throw new Error(`Input ${n} is not supported with reduction ${e}.`);let i=`{ + var oldValue = 0; + loop { + let newValueF32 =`,o=`; + let newValue = bitcast(newValueF32); + let res = atomicCompareExchangeWeak(&${t}, oldValue, newValue); + if res.exchanged { + break; + } + oldValue = res.old_value; + } + }`;switch(e){case"none":return`${t}=${s};`;case"add":return n==="i32"||n==="u32"?`atomicAdd(&${t}, bitcast<${n}>(${s}));`:` + ${i}bitcast<${n}>(oldValue) + (${s})${o}`;case"max":return n==="i32"||n==="u32"?`atomicMax(&${t}, bitcast<${n}>(${s}));`:` + ${i}max(bitcast(oldValue), (${s}))${o}`;case"min":return n==="i32"||n==="u32"?`atomicMin(&${t}, bitcast<${n}>(${s}));`:`${i}min(bitcast<${n}>(oldValue), (${s}))${o}`;case"mul":return`${i}(bitcast<${n}>(oldValue) * (${s}))${o}`;default:throw new Error(`Reduction ${e} is not supported.`)}},Gc=(e,t)=>{let s=e[0].dims,n=e[1].dims,i=s,o=1,a=Math.ceil(De.size(n)/o),c=n[n.length-1],p=De.sizeFromDimension(s,c),h=[{type:12,data:a},{type:12,data:c},{type:12,data:p},...Mt(e[1].dims,e[2].dims,i)],C=u=>{let k=He("indices",e[1].dataType,e[1].dims.length),B=He("updates",e[2].dataType,e[2].dims.length,o),R=t.reduction!=="none"&&t.reduction!==""?Ea("output",e[0].dataType,i.length):Ct("output",e[0].dataType,i.length,o);return` + ${u.registerUniform("output_size","u32").registerUniform("last_index_dimension","u32").registerUniform("num_updates_elements","u32").declareVariables(k,B,R)} + ${u.mainStart()} + ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + var data_offset = 0u; + let indices_start = uniforms.last_index_dimension * global_idx; + let indices_end = indices_start + uniforms.last_index_dimension; + for (var i = indices_start; i < indices_end; i++) { + var index = i32(indices[i].x); + ${e[0].dims.length===1?` + let element_count_dim = uniforms.output_strides; + let dim_value = uniforms.output_shape;`:` + let element_count_dim = uniforms.output_strides[i - indices_start]; + let dim_value = uniforms.output_shape[i - indices_start + uniforms.last_index_dimension];`} + if (index >= 0) { + if (index >= i32(dim_value)) { + index = i32(dim_value - 1); + } + } else { + if (index < -i32(dim_value)) { + index = 0; + } else { + index += i32(dim_value); + } + } + data_offset += u32((u32(index) * element_count_dim)); + } + + for (var i = 0u; i < uniforms.num_updates_elements; i++) { + let value = updates[uniforms.num_updates_elements * global_idx + i]; + ${Wc(t.reduction,"output[data_offset + i]","value",R.type.value)} + } + + }`};return{name:"ScatterND",shaderCache:{hint:`${t.cacheKey}_${t.reduction}`,inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:i,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:h}),getShaderSource:C}},Kc=e=>jt({reduction:e.reduction}),Hc=(e,t)=>{e.compute(Gc(e.inputs,t),{inputs:[e.inputs[1],e.inputs[2]],outputs:[]})}}),qc,Qc,Xc,Yc,Jc,Zc,ep,tp,sp,rp,np,qd,ip,op,ap,lp,up,dp,cp,jp=y(()=>{Ot(),$t(),is(),qt(),qc=(e,t)=>{if(e.every(s=>s>0||(()=>{throw new Error("Resize requires scales input values to be positive")})),e.length>0){if(t.mode==="linear"){if(!(e.length===2||e.length===3||e.length===4&&e[0]===1&&e[1]===1||e.length===4&&e[0]===1&&e[3]===1||e.length===5&&e[0]===1&&e[1]===1))throw new Error(`For linear mode, Resize requires scales to be 2D, 3D, 4D with either two outermost or one innermost and + one outermost scale values equal to 1, or 5D with two outermost scale values equal to 1`)}else if(t.mode==="cubic"&&!(e.length===2||e.length===4&&e[0]===1&&e[1]===1||e.length===4&&e[0]===1&&e[3]===1))throw new Error("Resize requires scales input size to be 2 or 4 for cubic mode")}},Qc=(e,t,s)=>{t.every(i=>i>=0&&i{throw new Error("Resize requires axes input values to be positive and less than rank")}));let n=new Array(s).fill(1);return t.forEach((i,o)=>n[i]=e[o]),n},Xc=(e,t,s,n,i,o)=>{let[a,c,p]=s>10?[1,2,3]:[-1,e.length>1?1:-1,-1],h=e[0].dims.length;if(a>0&&e.length>a&&e[a].dims.length>0)e[a].getFloat32Array().forEach(C=>o.push(C));else if(t.coordinateTransformMode==="tf_crop_and_resize")throw new Error("Resize requires RoI input to be specified when coordinateTransformMode is tfCropAndResize");if(c>0&&e.length>c&&e[c].dims.length===1&&e[c].dims[0]>0){if(e[c].getFloat32Array().forEach(C=>n.push(C)),n.length!==0&&n.length!==h&&s>=18&&n.length!==t.axes.length)throw new Error("Resize requires scales input size to be same as input rank or axes size for opset 18 and up");qc(n,t),t.axes.length>0&&Qc(n,t.axes,h).forEach((C,u)=>n[u]=C)}if(p>0&&e.length>p&&e[p].dims.length===1&&e[p].dims[0]>0&&(e[p].getBigInt64Array().forEach(C=>i.push(Number(C))),i.length!==0&&i.length!==h&&s>=18&&i.length!==t.axes.length))throw new Error("Resize requires sizes input size to be same as input rank or axes size for opset 18 and up");if(t.axes.length>0){if(n.length!==0&&n.length!==t.axes.length)throw new Error('Resize requires "scales" input size to be of axes rank when axes attributes is specified');if(i.length!==0&&i.length!==t.axes.length)throw new Error('Resize requires "sizes" input size to be of rank axes rank when axes attributes is specified')}if(typeof n<"u"&&typeof i<"u"&&n.length>0&&i.length>h)throw new Error("Resize requires only of scales or sizes to be specified")},Yc=(e,t)=>`fn getOriginalCoordinateFromResizedCoordinate(xResized: u32, xScale: f32, lengthResized: u32, + lengthOriginal: u32, roiStart: f32, roiEnd: f32) -> ${t} { `+(()=>{switch(e){case"asymmetric":return`return ${t}(xResized) / ${t}(xScale);`;case"pytorch_half_pixel":return`if (lengthResized > 1) { + return (${t}(xResized) + 0.5) / ${t}(xScale) - 0.5; + } else { + return 0.0; + }`;case"tf_half_pixel_for_nn":return`return (${t}(xResized) + 0.5) / ${t}(xScale);`;case"align_corners":return`if (lengthResized == 1) { + return 0.0; + } else { + // The whole part and the fractional part are calculated separately due to inaccuracy of floating + // point division. As an example, f32(21) / f32(7) may evaluate to 2.99... instead of 3, causing an + // offset-by-one error later in floor(). + let whole = ${t}(xResized * (lengthOriginal - 1) / (lengthResized - 1)); + let fract = + ${t}(xResized * (lengthOriginal - 1) % (lengthResized - 1)) / ${t}(lengthResized - 1); + return whole + fract; + }`;case"tf_crop_and_resize":return`if (lengthResized > 1) { + return ${t}(roiStart) * ${t}(lengthOriginal - 1) + + (${t}(xResized) * ${t}(roiEnd - roiStart) * ${t}(lengthOriginal - 1)) / + ${t}(lengthResized - 1); + } else { + return 0.5 * ${t}(roiStart + roiEnd) * ${t}(lengthOriginal - 1); + }`;case"half_pixel_symmetric":return`const outputWidth = ${t}xScale * ${t}(lengthResized); + const adjustment = ${t}(lengthResized) / outputWidth; + const center = ${t}(lengthOriginal) / 2; + const offset = center * (1 - adjustment); + return offset + ((${t}(xResized) + 0.5) / ${t}(xScale)) - 0.5;`;case"half_pixel":return`return ((${t}(xResized) + 0.5) / ${t}(xScale)) - 0.5;`;default:throw new Error(`Coordinate transform mode ${e} is not supported`)}})()+"}",Jc=(e,t,s)=>`fn getNearestPixelFromOriginal(xOriginal: ${s}, isDownSample: bool) -> ${s} {`+(()=>{switch(e){case"round_prefer_ceil":return"if (fract(xOriginal) == 0.5) { return ceil(xOriginal); } else { return round(xOriginal); }";case"floor":return"return floor(xOriginal);";case"ceil":return"return ceil(xOriginal);";case"round_prefer_floor":return"if (fract(xOriginal) == 0.5) { return floor(xOriginal); } else { return round(xOriginal); }";case"simple":default:if(t<11)return"if (isDownSample) { return ceil(xOriginal); } else { return xOriginal; }";throw new Error(`Nearest mode ${e} is not supported`)}})()+"}",Zc=(e,t,s)=>{let n=new Array(s).fill(0).concat(new Array(s).fill(1)),i=e.length===0?n:e.slice();return t.length>0?(t.forEach((o,a)=>{n[o]=i[a],n[a+s]=i[t.length+a]}),n):i},ep=(e,t,s,n)=>{let i=[];if(s.length>0)if(n.length>0){if(e.forEach(o=>i.push(o)),Math.max(...n)>e.length)throw new Error("axes is out of bound");n.forEach((o,a)=>i[o]=s[a])}else s.forEach(o=>i.push(o));else{if(t.length===0)throw new Error("Resize requires either scales or sizes.");i=e.map((o,a)=>Math.round(o*t[a]))}return i},tp=(e,t,s)=>{let n=(()=>{switch(s.keepAspectRatioPolicy){case"not_larger":return s.axes.length>0?Math.min(...s.axes.map(o=>t[o]),Number.MAX_VALUE):Math.min(...t,Number.MAX_VALUE);case"not_smaller":return s.axes.length>0?Math.max(...s.axes.map(o=>t[o]),Number.MIN_VALUE):Math.max(...t,Number.MIN_VALUE);default:throw new Error(`Keep aspect ratio policy ${s.keepAspectRatioPolicy} is not supported`)}})();t.fill(1,0,t.length);let i=e.slice();return s.axes.length>0?(s.axes.forEach(o=>t[o]=n),s.axes.forEach(o=>i[o]=Math.round(e[o]*t[o]))):(t.fill(n,0,t.length),i.forEach((o,a)=>i[a]=Math.round(o*t[a]))),i},sp=(e,t,s,n,i)=>` + fn calculateOriginalIndicesFromOutputIndices(output_indices: ${e.type.indices}) -> array<${e.type.value}, ${s.length}> { + var original_indices: array<${e.type.value}, ${s.length}>; + for (var i:u32 = 0; i < ${s.length}; i++) { + var output_index = ${e.indicesGet("output_indices","i")}; + var scale = ${Tt("uniforms.scales","i",n)}; + var roi_low = ${Tt("uniforms.roi","i",i)}; + var roi_hi = ${Tt("uniforms.roi",`i + ${t.length}`,i)}; + if (scale == 1.0) { + original_indices[i] = ${e.type.value}(output_index); + } else { + var input_shape_i = ${Tt("uniforms.input_shape","i",t.length)}; + var output_shape_i = ${Tt("uniforms.output_shape","i",s.length)}; + original_indices[i] = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i, + input_shape_i, roi_low, roi_hi); + } + } + return original_indices; + }`,rp=(e,t,s,n,i,o,a)=>` + fn calculateInputIndicesFromOutputIndices(output_indices: ${t.type.indices}) -> ${e.type.indices} { + var input_indices: ${e.type.indices}; + for (var i:u32 = 0; i < ${n.length}; i++) { + var output_index = ${t.indicesGet("output_indices","i")}; + var input_index: u32; + var scale = ${Tt("uniforms.scales","i",i)}; + if (scale == 1.0) { + input_index = output_index; + } else { + var roi_low = ${Tt("uniforms.roi","i",o)}; + var roi_hi = ${Tt("uniforms.roi",`i + ${s.length}`,o)}; + var input_shape_i = ${Tt("uniforms.input_shape","i",s.length)}; + var output_shape_i = ${Tt("uniforms.output_shape","i",n.length)}; + var original_idx = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i, + input_shape_i, roi_low, roi_hi); + if (!${a} || (original_idx >= 0 && original_idx < ${t.type.value}(input_shape_i))) { + if (original_idx < 0) { + input_index = 0; + } else if (original_idx > ${t.type.value}(input_shape_i - 1)) { + input_index = input_shape_i - 1; + } else { + input_index = u32(getNearestPixelFromOriginal(original_idx, scale < 1)); + } + } else { + input_index = u32(original_idx); + } + } + ${e.indicesSet("input_indices","i"," input_index")} + } + return input_indices; + }`,np=(e,t)=>` + fn checkInputIndices(input_indices: ${e.type.indices}) -> bool { + for (var i:u32 = 0; i < ${t.length}; i++) { + var input_index = ${e.indicesGet("input_indices","i")}; + if (input_index < 0 || input_index >= ${Tt("uniforms.input_shape","i",t.length)}) { + return false; + } + } + return true; + }`,qd=(e,t,s,n)=>e.rank>n?` + ${e.indicesSet("input_indices",t,"channel")}; + ${e.indicesSet("input_indices",s,"batch")}; +`:"",ip=(e,t,s,n,i)=>{let[o,a,c,p]=s.length===2?[-1,0,1,-1]:[0,2,3,1],h=e.type.value;return` + fn getInputValue(batch: u32, channel: u32, row: u32, col: u32) -> ${h} { + var input_indices: ${e.type.indices}; + ${e.indicesSet("input_indices",a,`max(0, min(row, ${s[a]} - 1))`)}; + ${e.indicesSet("input_indices",c,`max(0, min(col, ${s[c]} - 1))`)}; + ${qd(e,p,o,2)} + return ${e.getByIndices("input_indices")}; + } + + fn bilinearInterpolation(output_indices: ${t.type.indices}) -> ${h} { + var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices); + var row:${h} = originalIndices[${a}]; + var col:${h} = originalIndices[${c}]; + ${n?`if (row < 0 || row > (${s[a]} - 1) || col < 0 || col > (${s[c]} - 1)) { + return ${i}; + }`:""}; + row = max(0, min(row, ${s[a]} - 1)); + col = max(0, min(col, ${s[c]} - 1)); + var row1: u32 = u32(row); + var col1: u32 = u32(col); + var row2: u32 = u32(row + 1); + var col2: u32 = u32(col + 1); + var channel: u32 = ${s.length>2?`u32(originalIndices[${p}])`:"0"}; + var batch: u32 = ${s.length>2?`u32(originalIndices[${o}])`:"0"}; + var x11: ${h} = getInputValue(batch, channel, row1, col1); + var x12: ${h} = getInputValue(batch, channel, row1, col2); + var x21: ${h} = getInputValue(batch, channel, row2, col1); + var x22: ${h} = getInputValue(batch, channel, row2, col2); + var dx1: ${h} = abs(row - ${h}(row1)); + var dx2: ${h} = abs(${h}(row2) - row); + var dy1: ${h} = abs(col - ${h}(col1)); + var dy2: ${h} = abs(${h}(col2) - col); + if (row1 == row2) { + dx1 = 0.5; + dx2 = 0.5; + } + if (col1 == col2) { + dy1 = 0.5; + dy2 = 0.5; + } + return (x11 * dx2 * dy2 + x12 * dx2 * dy1 + x21 * dx1 * dy2 + x22 * dx1 * dy1); + }`},op=(e,t,s,n,i,o,a,c,p,h)=>{let C=s.length===2,[u,k]=C?[0,1]:[2,3],B=e.type.value,R=z=>{let ne=z===u?"row":"col";return` + fn ${ne}CubicInterpolation(input_indices: ${e.type.indices}, output_indices: ${t.type.indices}) -> ${B} { + var output_index = ${t.indicesGet("output_indices",z)}; + var originalIdx: ${B} = getOriginalCoordinateFromResizedCoordinate(output_index, ${i[z]}, + ${n[z]}, ${s[z]}, ${o[z]}, ${o[z]} + ${s.length}); + var fractOriginalIdx: ${B} = originalIdx - floor(originalIdx); + var coefs = getCubicInterpolationCoefs(fractOriginalIdx); + + if (${c} && (originalIdx < 0 || originalIdx > (${s[z]} - 1))) { + return ${p}; + } + var data: array<${B}, 4> = array<${B}, 4>(0.0, 0.0, 0.0, 0.0); + for (var i: i32 = -1; i < 3; i++) { + var ${ne}: ${B} = originalIdx + ${B}(i); + if (${ne} < 0 || ${ne} >= ${s[z]}) { + ${h?`coefs[i + 1] = 0.0; + continue;`:c?`return ${p};`:`${ne} = max(0, min(${ne}, ${s[z]} - 1));`}; + } + var input_indices_copy: ${e.type.indices} = input_indices; + ${e.indicesSet("input_indices_copy",z,`u32(${ne})`)}; + data[i + 1] = ${z===u?e.getByIndices("input_indices_copy"):"rowCubicInterpolation(input_indices_copy, output_indices)"}; + } + return cubicInterpolation1D(data, coefs); + }`};return` + ${R(u)}; + ${R(k)}; + fn getCubicInterpolationCoefs(s: ${B}) -> array<${B}, 4> { + var absS = abs(s); + var coeffs: array<${B}, 4> = array<${B}, 4>(0.0, 0.0, 0.0, 0.0); + var oneMinusAbsS: ${B} = 1.0 - absS; + var twoMinusAbsS: ${B} = 2.0 - absS; + var onePlusAbsS: ${B} = 1.0 + absS; + coeffs[0] = ((${a} * onePlusAbsS - 5 * ${a}) * onePlusAbsS + 8 * ${a}) * onePlusAbsS - 4 * ${a}; + coeffs[1] = ((${a} + 2) * absS - (${a} + 3)) * absS * absS + 1; + coeffs[2] = ((${a} + 2) * oneMinusAbsS - (${a} + 3)) * oneMinusAbsS * oneMinusAbsS + 1; + coeffs[3] = ((${a} * twoMinusAbsS - 5 * ${a}) * twoMinusAbsS + 8 * ${a}) * twoMinusAbsS - 4 * ${a}; + return coeffs; + } + + fn cubicInterpolation1D(x: array<${B}, 4>, coefs: array<${B}, 4>) -> ${B} { + var coefsSum: ${B} = coefs[0] + coefs[1] + coefs[2] + coefs[3]; + return (x[0] * coefs[0] + x[1] * coefs[1]+ x[2] * coefs[2]+ x[3] * coefs[3]) / coefsSum; + } + + fn bicubicInterpolation(output_indices: ${t.type.indices}) -> ${B} { + var input_indices: ${e.type.indices} = output_indices; + return colCubicInterpolation(input_indices, output_indices); + } + `},ap=(e,t,s,n,i)=>{let[o,a,c,p,h]=s.length===3?[-1,0,1,2,-1]:[0,2,3,4,1],C=e.type.value;return` + fn getInputValue(batch: u32, channel: u32, depth:u32, height: u32, width: u32) -> ${C} { + var input_indices: ${e.type.indices}; + ${e.indicesSet("input_indices",a,`max(0, min(depth, ${s[a]} - 1))`)}; + ${e.indicesSet("input_indices",c,`max(0, min(height, ${s[c]} - 1))`)}; + ${e.indicesSet("input_indices",p,`max(0, min(width, ${s[p]} - 1))`)}; + ${qd(e,h,o,3)} + return ${e.getByIndices("input_indices")}; + } + + fn trilinearInterpolation(output_indices: ${t.type.indices}) -> ${C} { + var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices); + var depth:${C} = originalIndices[${a}]; + var height:${C} = originalIndices[${c}]; + var width:${C} = originalIndices[${p}]; + ${n?`if (depth < 0 || depth > (${s[a]} - 1) || height < 0 || height > (${s[c]} - 1) || width < 0 || (width > ${s[p]} - 1)) { + return ${i}; + }`:""}; + + depth = max(0, min(depth, ${s[a]} - 1)); + height = max(0, min(height, ${s[c]} - 1)); + width = max(0, min(width, ${s[p]} - 1)); + var depth1: u32 = u32(depth); + var height1: u32 = u32(height); + var width1: u32 = u32(width); + var depth2: u32 = u32(depth + 1); + var height2: u32 = u32(height + 1); + var width2: u32 = u32(width + 1); + var channel: u32 = ${s.length>3?`u32(originalIndices[${h}])`:"0"}; + var batch: u32 = ${s.length>3?`u32(originalIndices[${o}])`:"0"}; + + var x111: ${C} = getInputValue(batch, channel, depth1, height1, width1); + var x112: ${C} = getInputValue(batch, channel, depth1, height1, width2); + var x121: ${C} = getInputValue(batch, channel, depth1, height2, width1); + var x122: ${C} = getInputValue(batch, channel, depth1, height2, width2); + var x211: ${C} = getInputValue(batch, channel, depth2, height1, width1); + var x212: ${C} = getInputValue(batch, channel, depth2, height1, width2); + var x221: ${C} = getInputValue(batch, channel, depth2, height2, width1); + var x222: ${C} = getInputValue(batch, channel, depth2, height2, width2); + var dx1: ${C} = abs(depth - ${C}(depth1)); + var dx2: ${C} = abs(${C}(depth2) - depth); + var dy1: ${C} = abs(height - ${C}(height1)); + var dy2: ${C} = abs(${C}(height2) - height); + var dz1: ${C} = abs(width - ${C}(width1)); + var dz2: ${C} = abs(${C}(width2) - width); + if (depth1 == depth2) { + dx1 = 0.5; + dx2 = 0.5; + } + if (height1 == height2) { + dy1 = 0.5; + dy2 = 0.5; + } + if (width1 == width2) { + dz1 = 0.5; + dz2 = 0.5; + } + return (x111 * dx2 * dy2 * dz2 + x112 * dx2 * dy2 * dz1 + x121 * dx2 * dy1 *dz2 + x122 * dx2 * dy1 * dz1 + + x211 * dx1 * dy2 * dz2 + x212 * dx1 * dy2 * dz1 + x221 * dx1 * dy1 *dz2 + x222 * dx1 * dy1 * dz1); + }`},lp=(e,t,s,n,i,o)=>{let a=e.dims,c=Zc(o,t.axes,a.length),p=ep(a,n,i,t.axes),h=n.slice();n.length===0&&(h=a.map((W,ue)=>W===0?1:p[ue]/W),t.keepAspectRatioPolicy!=="stretch"&&(p=tp(a,h,t)));let C=Ct("output",e.dataType,p.length),u=He("input",e.dataType,a.length),k=De.size(p),B=a.length===p.length&&a.every((W,ue)=>W===p[ue]),R=t.coordinateTransformMode==="tf_crop_and_resize",z=t.extrapolationValue,ne=u.type.value,J=W=>` + ${B?"":` + ${Yc(t.coordinateTransformMode,ne)}; + ${(()=>{switch(t.mode){case"nearest":return` + ${np(u,a)}; + ${Jc(t.nearestMode,s,ne)}; + ${rp(u,C,a,p,h.length,c.length,R)}; + `;case"linear":return` + ${sp(C,a,p,h.length,c.length)}; + ${(()=>{if(a.length===2||a.length===4)return`${ip(u,C,a,R,z)}`;if(a.length===3||a.length===5)return`${ap(u,C,a,R,z)}`;throw Error("Linear mode only supports input dims 2, 3, 4 and 5 are supported in linear mode.")})()}; + `;case"cubic":return` + ${(()=>{if(a.length===2||a.length===4)return`${op(u,C,a,p,h,c,t.cubicCoeffA,R,t.extrapolationValue,t.excludeOutside)}`;throw Error("Cubic mode only supports input dims 2 and 4 are supported in linear mode.")})()}; + `;default:throw Error("Invalid resize mode")}})()}; + `} + ${W.registerUniform("output_size","u32").registerUniform("scales","f32",h.length).registerUniform("roi","f32",c.length).declareVariables(u,C)} + ${W.mainStart()} + ${W.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + ${B?"output[global_idx] = input[global_idx];":` + let output_indices = ${C.offsetToIndices("global_idx")}; + var input_indices: ${u.type.indices}; + ${(()=>{switch(t.mode){case"nearest":return`input_indices = calculateInputIndicesFromOutputIndices(output_indices); + if (checkInputIndices(input_indices)) { + output[global_idx] = ${u.getByIndices("input_indices")}; + } else { + output[global_idx] = ${t.extrapolationValue}; + }`;case"linear":return`output[global_idx] = ${a.length===2||a.length===4?"bilinearInterpolation":"trilinearInterpolation"}(output_indices);`;case"cubic":return"output[global_idx] = bicubicInterpolation(output_indices);";default:throw Error(`Unsupported resize mode: ${t.mode}`)}})()}; +`} + }`;return{name:"Resize",shaderCache:{hint:`${t.cacheKey}|${s}|${h.length>0?h:""}|${i.length>0?i:""}|${c.length>0?c:""}|${B}|${a}`,inputDependencies:["rank"]},getShaderSource:J,getRunData:()=>({outputs:[{dims:p,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(k/64)},programUniforms:[{type:12,data:k},{type:1,data:h},{type:1,data:c},...Mt(a,p)]})}},up=e=>{let t=e.customDataBuffer;return new Uint32Array(t,t.byteOffset,1)[0]},dp=(e,t)=>{let s=[],n=[],i=[],o=up(e);if(t.antialias!==0)throw Error("Only default value (0) for Antialias attribute is supported");Xc(e.inputs,t,o,s,n,i),e.compute(lp(e.inputs[0],t,o,s,n,i),{inputs:[0]})},cp=e=>{let t=e.antialias,s=e.axes,n=e.coordinateTransformMode,i=e.cubicCoeffA,o=e.excludeOutside!==0,a=e.extrapolationValue,c=e.keepAspectRatioPolicy,p=e.mode,h=e.nearestMode===""?"simple":e.nearestMode;return jt({antialias:t,axes:s,coordinateTransformMode:n,cubicCoeffA:i,excludeOutside:o,extrapolationValue:a,keepAspectRatioPolicy:c,mode:p,nearestMode:h})}}),pp,hp,Kt,mp=y(()=>{Ot(),$t(),is(),qt(),pp=(e,t)=>{let[s,n,i,o]=e,{numHeads:a,rotaryEmbeddingDim:c}=t;if(s.dims.length!==3&&s.dims.length!==4)throw new Error(`Input 'x' is expected to have 3 or 4 dimensions, got ${s.dims.length}`);if(!De.areEqual(n.dims,[])&&!De.areEqual(n.dims,[1])&&n.dims.length!==2)throw new Error(`Input 'position_ids' is expected to have 0, 1, or 2 dimensions, got ${n.dims.length}`);if(i.dims.length!==2)throw new Error(`Input 'cos_cache' is expected to have 2 dimensions, got ${i.dims.length}`);if(o.dims.length!==2)throw new Error(`Input 'sin_cache' is expected to have 2 dimensions, got ${o.dims.length}`);if(!De.areEqual(i.dims,o.dims))throw new Error("Inputs 'cos_cache' and 'sin_cache' are expected to have the same shape");if(c>0&&a===0)throw new Error("num_heads must be provided if rotary_embedding_dim is specified");let p=s.dims[0],h=s.dims[s.dims.length-2],C=i.dims[0],u=De.sizeFromDimension(s.dims,1)/h,k=c===0?i.dims[1]*2:u/a;if(c>k)throw new Error("rotary_embedding_dim must be less than or equal to head_size");if(n.dims.length===2){if(p!==n.dims[0])throw new Error(`Input 'position_ids' dimension 0 should be of size batch_size, got ${n.dims[0]}`);if(h!==n.dims[1])throw new Error(`Input 'position_ids' dimension 1 should be of size sequence_length, got ${n.dims[1]}`)}if(k/2!==i.dims[1]&&c/2!==i.dims[1])throw new Error(`Input 'cos_cache' dimension 1 should be same as head_size / 2 or rotary_embedding_dim / 2, got ${i.dims[1]}`);if(h>C)throw new Error("Updating cos_cache and sin_cache in RotaryEmbedding is not currently supported")},hp=(e,t)=>{let{interleaved:s,numHeads:n,rotaryEmbeddingDim:i,scale:o}=t,a=e[0].dims[0],c=De.sizeFromDimension(e[0].dims,1),p=e[0].dims[e[0].dims.length-2],h=c/p,C=e[2].dims[1],u=i===0?C*2:h/n,k=new Array(a,p,h/u,u-C),B=De.computeStrides(k),R=[{type:1,data:o},{type:12,data:k},{type:12,data:B},...e[0].dims.length===3?new Array({type:12,data:[c,h,u,1]}):[],...e[0].dims.length===4?new Array({type:12,data:[c,u,p*u,1]}):[],...Mt(e[0].dims,e[1].dims,e[2].dims,e[3].dims,e[0].dims)],z=ne=>{let J=He("input",e[0].dataType,e[0].dims.length),W=He("position_ids",e[1].dataType,e[1].dims.length),ue=He("cos_cache",e[2].dataType,e[2].dims.length),he=He("sin_cache",e[3].dataType,e[3].dims.length),be=Ct("output",e[0].dataType,e[0].dims.length);return ne.registerUniforms([{name:"scale",type:"f32"},{name:"global_shape",type:"u32",length:k.length},{name:"global_strides",type:"u32",length:B.length},{name:"input_output_strides",type:"u32",length:B.length}]),` + ${ne.declareVariables(J,W,ue,he,be)} + + ${ne.mainStart(sr)} + let half_rotary_emb_dim = uniforms.${ue.name}_shape[1]; + let bsnh = global_idx / uniforms.global_strides % uniforms.global_shape; + let size = uniforms.global_shape[0] * uniforms.global_strides[0]; + ${ne.guardAgainstOutOfBoundsWorkgroupSizes("size")} + + if (bsnh[3] < half_rotary_emb_dim) { + let position_ids_idx = + ${W.broadcastedIndicesToOffset("bsnh.xy",Ct("",W.type.tensor,2))}; + let position_id = + u32(${W.getByOffset("position_ids_idx")}) + select(0, bsnh[1], position_ids_idx == 0); + let i = dot(bsnh, uniforms.input_output_strides) + select(0, bsnh[3], ${s}); + let j = i + select(half_rotary_emb_dim, 1, ${s}); + let re = ${J.getByOffset("i")} * ${ue.get("position_id","bsnh[3]")} - + ${J.getByOffset("j")} * ${he.get("position_id","bsnh[3]")}; + ${be.setByOffset("i","re")} + let im = ${J.getByOffset("i")} * ${he.get("position_id","bsnh[3]")} + + ${J.getByOffset("j")} * ${ue.get("position_id","bsnh[3]")}; + ${be.setByOffset("j","im")} + } else { + let k = dot(bsnh, uniforms.input_output_strides) + half_rotary_emb_dim; + ${be.setByOffset("k",J.getByOffset("k"))} + } + }`};return{name:"RotaryEmbedding",shaderCache:{hint:jt({interleaved:s}).cacheKey,inputDependencies:["rank","rank","rank","rank"]},getShaderSource:z,getRunData:()=>({outputs:[{dims:e[0].dims,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(De.size(k)/sr)},programUniforms:R})}},Kt=(e,t)=>{pp(e.inputs,t),e.compute(hp(e.inputs,t))}}),Vs,Qs,Zs,yn=y(()=>{Ot(),$t(),qt(),Vs=e=>{if(!e||e.length<3)throw new Error("layerNorm requires at least 3 inputs.");let t=e[0],s=e[1],n=e[2];if(t.dataType!==s.dataType||t.dataType!==n.dataType)throw new Error("All inputs must have the same data type");if(t.dims.length!==3&&t.dims.length!==2)throw new Error("Input must be 2D or 3D");if(s.dims.length!==3&&s.dims.length!==2)throw new Error("Skip must be 2D or 3D");let i=t.dims[t.dims.length-1],o=t.dims[t.dims.length-2];if(s.dims[s.dims.length-1]!==i)throw new Error("Skip must have the same hidden size as input");if(s.dims[s.dims.length-2]!==o)throw new Error("Skip must have the same sequence length as input");if(n.dims.length!==1)throw new Error("Gamma must be 1D");if(n.dims[n.dims.length-1]!==i)throw new Error("Gamma must have the same hidden size as input");if(e.length>3){let a=e[3];if(a.dims.length!==1)throw new Error("Beta must be 1D");if(a.dims[a.dims.length-1]!==i)throw new Error("Beta must have the same hidden size as input")}if(e.length>4){let a=e[4];if(a.dims.length!==1)throw new Error("Bias must be 1D");if(a.dims[a.dims.length-1]!==i)throw new Error("Bias must have the same hidden size as input")}},Qs=(e,t,s,n)=>{let i=t.simplified,o=e[0].dims,a=De.size(o),c=o,p=a,h=o.slice(-1)[0],C=n?o.slice(0,-1).concat(1):[],u=!i&&e.length>3,k=e.length>4,B=n&&s>1,R=n&&s>2,z=s>3,ne=64,J=Gt(h),W=[{type:12,data:p},{type:12,data:J},{type:12,data:h},{type:1,data:t.epsilon}],ue=be=>{let Be=[{name:"output_size",type:"u32"},{name:"components",type:"u32"},{name:"hidden_size",type:"u32"},{name:"epsilon",type:"f32"}],Ie=[He("x",e[0].dataType,e[0].dims,J),He("skip",e[1].dataType,e[1].dims,J),He("gamma",e[2].dataType,e[2].dims,J)];u&&Ie.push(He("beta",e[3].dataType,e[3].dims,J)),k&&Ie.push(He("bias",e[4].dataType,e[4].dims,J)),Ie.push(Ct("output",e[0].dataType,c,J)),B&&Ie.push(Ct("mean_output",1,C)),R&&Ie.push(Ct("inv_std_output",1,C)),z&&Ie.push(Ct("input_skip_bias_sum",e[0].dataType,c,J));let nt=ds(e[0].dataType),dt=ds(1,J);return` + + ${be.registerUniforms(Be).declareVariables(...Ie)} + var sum_shared : array<${dt}, ${ne}>; + var sum_squared_shared : array<${dt}, ${ne}>; + + ${be.mainStart([ne,1,1])} + let ix = local_id.x; + let iy = global_id.x / ${ne}; + + let hidden_size_vectorized: u32 = uniforms.hidden_size / uniforms.components; + var stride = hidden_size_vectorized / ${ne}; + let offset = ix * stride + iy * hidden_size_vectorized; + let offset1d = stride * ix; + if (ix == ${ne-1}) { + stride = hidden_size_vectorized - stride * ix; + } + for (var i: u32 = 0; i < stride; i++) { + let skip_value = skip[offset + i]; + let bias_value = ${k?"bias[offset1d + i]":nt+"(0.0)"}; + let input_value = x[offset + i]; + let value = input_value + skip_value + bias_value; + ${z?"input_skip_bias_sum[offset + i] = value;":""} + output[offset + i] = value; + let f32_value = ${ks(nt,J,"value")}; + sum_shared[ix] += f32_value; + sum_squared_shared[ix] += f32_value * f32_value; + } + workgroupBarrier(); + + var reduce_size : u32 = ${ne}; + for (var curr_size = reduce_size >> 1; curr_size > 0; curr_size = reduce_size >> 1) { + reduce_size = curr_size + (reduce_size & 1); + if (ix < curr_size) { + sum_shared[ix] += sum_shared[ix + reduce_size]; + sum_squared_shared[ix] += sum_squared_shared[ix + reduce_size]; + } + workgroupBarrier(); + } + + let sum = sum_shared[0]; + let square_sum = sum_squared_shared[0]; + let mean = ${js("sum",J)} / f32(uniforms.hidden_size); + let inv_std_dev = inverseSqrt(${js("square_sum",J)} / f32(uniforms.hidden_size) ${i?"":"- mean * mean"} + uniforms.epsilon); + ${B?"mean_output[global_idx] = mean;":""} + ${R?"inv_std_output[global_idx] = inv_std_dev;":""} + + for (var i: u32 = 0; i < stride; i++) { + output[offset + i] = (output[offset + i] ${i?"":`- ${nt}(mean)`}) * + ${nt}(inv_std_dev) * gamma[offset1d + i] + ${u?"+ beta[offset1d + i]":""}; + } + }`},he=[{dims:c,dataType:e[0].dataType}];return s>1&&he.push({dims:C,dataType:1}),s>2&&he.push({dims:C,dataType:1}),s>3&&he.push({dims:o,dataType:e[0].dataType}),{name:"SkipLayerNormalization",shaderCache:{hint:`${J};${B};${R};${z}`,inputDependencies:e.map((be,Be)=>"type")},getShaderSource:ue,getRunData:()=>({outputs:he,dispatchGroup:{x:Math.ceil(p/h)},programUniforms:W})}},Zs=(e,t)=>{Vs(e.inputs);let s=[0];e.outputCount>1&&s.push(-3),e.outputCount>2&&s.push(-3),e.outputCount>3&&s.push(3),e.compute(Qs(e.inputs,t,e.outputCount,!1),{outputs:s})}}),fp,Wn,Qd,_,f,q,xe,$e,Le=y(()=>{Ot(),$t(),is(),qt(),fp=(e,t)=>{if(!e||e.length<1)throw new Error("too few inputs");if(t.axes.length!==0){if(t.axes.length!==t.starts.length||t.axes.length!==t.ends.length)throw new Error("axes, starts and ends must have the same length")}else if(t.starts.length!==t.ends.length)throw new Error("starts and ends must have the same length");e.slice(1).forEach((s,n)=>{if(e[n+1].dataType!==6&&e[n+1].dataType!==7)throw new Error(`Input ${n} must be an array of int32 or int64`)})},Wn=(e,t)=>{let s=[];if(e.length>t)if(e[t].dataType===7)e[t].getBigInt64Array().forEach(n=>s.push(Number(n)));else if(e[t].dataType===6)e[t].getInt32Array().forEach(n=>s.push(Number(n)));else throw new Error(`Input ${t} must be an array of int32 or int64`);return s},Qd=(e,t)=>{if(e.length>1){let s=Wn(e,1),n=Wn(e,2),i=Wn(e,3);return i.length===0&&(i=[...Array(e[0].dims.length).keys()]),jt({starts:s,ends:n,axes:i})}else return t},_=(e,t,s,n,i)=>{let o=e;return e<0&&(o+=s[n[t]]),i[t]<0?Math.max(0,Math.min(o,s[n[t]]-1)):Math.max(0,Math.min(o,s[n[t]]))},f=(e,t,s)=>`fn calculateInputIndices(output_indices: ${t.type.indices}) -> ${e.type.indices} { + var input_indices: ${e.type.indices}; + var carry = 0u; + for (var i = ${s.length}; i >= 0; i--) { + let input_shape_i = ${Tt("uniforms.input_shape","i",s.length)}; + let steps_i = ${Tt("uniforms.steps","i",s.length)}; + let signs_i = ${Tt("uniforms.signs","i",s.length)}; + let starts_i = ${Tt("uniforms.starts","i",s.length)}; + var output_index = ${t.indicesGet("output_indices","i")}; + var input_index = output_index * steps_i + starts_i + carry; + carry = input_index / input_shape_i; + input_index = input_index % input_shape_i; + if (signs_i < 0) { + input_index = input_shape_i - input_index - 1u + starts_i; + } + ${e.indicesSet("input_indices","i","input_index")}; + } + return input_indices; + }`,q=(e,t)=>{let s=e[0].dims,n=De.size(s),i=t.axes.length>0?De.normalizeAxes(t.axes,s.length):[...Array(s.length).keys()],o=Wn(e,4);o.forEach(J=>J!==0||(()=>{throw new Error("step cannot be 0")})),o.length===0&&(o=Array(i.length).fill(1));let a=t.starts.map((J,W)=>_(J,W,s,i,o)),c=t.ends.map((J,W)=>_(J,W,s,i,o));if(i.length!==a.length||i.length!==c.length)throw new Error("start, ends and axes should have the same number of elements");if(i.length!==s.length)for(let J=0;JMath.sign(J));o.forEach((J,W,ue)=>{if(J<0){let he=(c[W]-a[W])/J,be=a[W],Be=be+he*o[W];a[W]=Be,c[W]=be,ue[W]=-J}});let h=s.slice(0);i.forEach((J,W)=>{h[J]=Math.ceil((c[J]-a[J])/o[J])});let C={dims:h,dataType:e[0].dataType},u=Ct("output",e[0].dataType,h.length),k=He("input",e[0].dataType,e[0].dims.length),B=De.size(h),R=[{name:"outputSize",type:"u32"},{name:"starts",type:"u32",length:a.length},{name:"signs",type:"i32",length:p.length},{name:"steps",type:"u32",length:o.length}],z=[{type:12,data:B},{type:12,data:a},{type:6,data:p},{type:12,data:o},...Mt(e[0].dims,h)],ne=J=>` + ${J.registerUniforms(R).declareVariables(k,u)} + ${f(k,u,s)} + ${J.mainStart()} + ${J.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} + let output_indices = ${u.offsetToIndices("global_idx")}; + let input_indices = calculateInputIndices(output_indices); + ${u.setByOffset("global_idx",k.getByIndices("input_indices"))} + }`;return{name:"Slice",shaderCache:{hint:`${p.length}_${a.length}_${o.length}`,inputDependencies:["rank"]},getShaderSource:ne,getRunData:()=>({outputs:[C],dispatchGroup:{x:Math.ceil(n/64)},programUniforms:z})}},xe=(e,t)=>{fp(e.inputs,t);let s=Qd(e.inputs,t);e.compute(q(e.inputs,s),{inputs:[0]})},$e=e=>{let t=e.starts,s=e.ends,n=e.axes;return jt({starts:t,ends:s,axes:n})}}),rt,ot,_t,kt,Zt=y(()=>{Ot(),$t(),is(),jr(),qt(),rt=e=>{if(!e||e.length!==1)throw new Error("Softmax op requires 1 input.")},ot=(e,t)=>{let s=e.inputs[0],n=s.dims,i=De.size(n),o=n.length,a=De.normalizeAxis(t.axis,o),c=ant),h[a]=o-1,h[o-1]=a,p=e.compute(cr(s,h),{inputs:[s],outputs:[-1]})[0]):p=s;let C=p.dims,u=C[o-1],k=i/u,B=Gt(u),R=u/B,z=64;k===1&&(z=256);let ne=(Ie,nt)=>nt===4?`max(max(${Ie}.x, ${Ie}.y), max(${Ie}.z, ${Ie}.w))`:nt===2?`max(${Ie}.x, ${Ie}.y)`:nt===3?`max(max(${Ie}.x, ${Ie}.y), ${Ie}.z)`:Ie,J=He("x",p.dataType,p.dims,B),W=Ct("result",p.dataType,p.dims,B),ue=J.type.value,he=ds(p.dataType)==="f32"?`var threadMax = ${ue}(-3.402823e+38f);`:`var threadMax = ${ue}(-65504.0h);`,be=Ie=>` + var rowMaxShared : ${ue}; + var rowSumShared : ${ue}; + var threadShared : array<${ue}, ${z}>; + + fn getValue(row: i32, col: i32, row_stride: i32) -> ${ue} { + let index = row * row_stride + col; + return x[index]; + } + + fn setValue(row: i32, col: i32, row_stride: i32, value: ${ue}) { + let index = row * row_stride + col; + result[index] = value; + } + ${Ie.registerUniform("packedCols","i32").declareVariables(J,W)} + ${Ie.mainStart(z)} + let gindex = i32(global_idx); + let lindex = i32(local_idx); + const wg = ${z}; + let row = gindex / wg; + let cols = uniforms.packedCols; + let row_stride : i32 = uniforms.packedCols; + + // find the rows max + ${he} + for (var col = lindex; col < cols; col += wg) { + let value = getValue(row, col, row_stride); + threadMax = max(threadMax, value); + } + if (lindex < cols) { + threadShared[lindex] = threadMax; + } + workgroupBarrier(); + + var reduceSize = min(cols, wg); + for (var currSize = reduceSize >> 1; currSize > 0; currSize = reduceSize >> 1) { + reduceSize = currSize + (reduceSize & 1); + if (lindex < currSize) { + threadShared[lindex] = max(threadShared[lindex], threadShared[lindex + reduceSize]); + } + workgroupBarrier(); + } + if (lindex == 0) { + rowMaxShared = ${ue}(${ne("threadShared[0]",B)}); + } + workgroupBarrier(); + + // find the rows sum + var threadSum = ${ue}(0.0); + for (var col = lindex; col < cols; col += wg) { + let subExp = exp(getValue(row, col, row_stride) - rowMaxShared); + threadSum += subExp; + } + threadShared[lindex] = threadSum; + workgroupBarrier(); + + for (var currSize = wg >> 1; currSize > 0; currSize = currSize >> 1) { + if (lindex < currSize) { + threadShared[lindex] = threadShared[lindex] + threadShared[lindex + currSize]; + } + workgroupBarrier(); + } + if (lindex == 0) { + rowSumShared = ${ue}(${js("threadShared[0]",B)}); + } + workgroupBarrier(); + + // calculate final value for each element in the row + for (var col = lindex; col < cols; col += wg) { + let value = exp(getValue(row, col, row_stride) - rowMaxShared) / rowSumShared; + setValue(row, col, row_stride, value); + } + }`,Be=e.compute({name:"Softmax",shaderCache:{hint:`${B};${z}`,inputDependencies:["type"]},getRunData:()=>({outputs:[{dims:C,dataType:p.dataType}],dispatchGroup:{x:k},programUniforms:[{type:6,data:R}]}),getShaderSource:be},{inputs:[p],outputs:[c?-1:0]})[0];c&&e.compute(cr(Be,h),{inputs:[Be]})},_t=(e,t)=>{rt(e.inputs),ot(e,t)},kt=e=>jt({axis:e.axis})}),Wt,Dt,At,bs,Ht,Qt=y(()=>{Ot(),$t(),qt(),Wt=e=>Array.from(e.getBigInt64Array(),Number),Dt=e=>{if(!e||e.length!==2)throw new Error("Tile requires 2 inputs.");if(e[0].dataType!==1&&e[0].dataType!==10&&e[0].dataType!==6&&e[0].dataType!==12)throw new Error("Tile only support float, float16, int32, and uint32 data types");if(e[1].dataType!==7)throw new Error("Tile `repeats` input should be of int64 data type");if(e[1].dims.length!==1)throw new Error("Tile `repeats` input should be 1-D");if(Wt(e[1]).length!==e[0].dims.length)throw new Error("Tile `repeats` input should have same number of elements as rank of input data tensor")},At=(e,t)=>{let s=[];for(let n=0;n{let s=e[0].dims,n=t??Wt(e[1]),i=At(s,n),o=De.size(i),a=e[0].dataType,c=He("input",a,s.length),p=Ct("output",a,i.length),h=C=>` + const inputShape = ${c.indices(...s)}; + ${C.registerUniform("output_size","u32").declareVariables(c,p)} + ${C.mainStart()} + ${C.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} + let output_indices = ${p.offsetToIndices("global_idx")}; + var input_indices: ${c.type.indices}; + for (var i = 0; i < ${s.length}; i++) { + let input_dim_i = ${c.indicesGet("uniforms.input_shape","i")}; + let input_dim_value = ${p.indicesGet("output_indices","i")} % input_dim_i; + + ${c.indicesSet("input_indices","i","input_dim_value")} + } + ${p.setByOffset("global_idx",c.getByIndices("input_indices"))} + }`;return{name:"Tile",shaderCache:{hint:`${n}`,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:i,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(o/64)},programUniforms:[{type:12,data:o},...Mt(e[0].dims,i)]}),getShaderSource:h}},Ht=e=>{Dt(e.inputs),e.compute(bs(e.inputs),{inputs:[0]})}}),ps,ys,es,Us=y(()=>{Ot(),$t(),qt(),ps=(e,t,s,n,i)=>{let o=Ct("output_data",i,s.length,4),a=He("a_data",t[1].dataType,t[1].dims.length,4),c=He("b_data",t[2].dataType,t[2].dims.length,4),p=He("c_data",t[0].dataType,t[0].dims.length,4),h,C=(u,k,B)=>`select(${k}, ${u}, ${B})`;if(!n)h=o.setByOffset("global_idx",C(a.getByOffset("global_idx"),c.getByOffset("global_idx"),p.getByOffset("global_idx")));else{let u=(k,B,R="")=>{let z=`a_data[index_a${B}][component_a${B}]`,ne=`b_data[index_b${B}][component_b${B}]`,J=`bool(c_data[index_c${B}] & (0xffu << (component_c${B} * 8)))`;return` + let output_indices${B} = ${o.offsetToIndices(`global_idx * 4u + ${B}u`)}; + let offset_a${B} = ${a.broadcastedIndicesToOffset(`output_indices${B}`,o)}; + let offset_b${B} = ${c.broadcastedIndicesToOffset(`output_indices${B}`,o)}; + let offset_c${B} = ${p.broadcastedIndicesToOffset(`output_indices${B}`,o)}; + let index_a${B} = offset_a${B} / 4u; + let index_b${B} = offset_b${B} / 4u; + let index_c${B} = offset_c${B} / 4u; + let component_a${B} = offset_a${B} % 4u; + let component_b${B} = offset_b${B} % 4u; + let component_c${B} = offset_c${B} % 4u; + ${k}[${B}] = ${R}(${C(z,ne,J)}); + `};i===9?h=` + var data = vec4(0); + ${u("data",0,"u32")} + ${u("data",1,"u32")} + ${u("data",2,"u32")} + ${u("data",3,"u32")} + output_data[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:h=` + ${u("output_data[global_idx]",0)} + ${u("output_data[global_idx]",1)} + ${u("output_data[global_idx]",2)} + ${u("output_data[global_idx]",3)} + `}return` + ${e.registerUniform("vec_size","u32").declareVariables(p,a,c,o)} + ${e.mainStart()} + ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} + ${h} + }`},ys=e=>{let t=e[1].dims,s=e[2].dims,n=e[0].dims,i=e[1].dataType,o=!(De.areEqual(t,s)&&De.areEqual(s,n)),a=t,c=De.size(t);if(o){let h=Js.calcShape(Js.calcShape(t,s,!1),n,!1);if(!h)throw new Error("Can't perform where op on the given tensors");a=h,c=De.size(a)}let p=Math.ceil(c/4);return{name:"Where",shaderCache:{inputDependencies:["rank","rank","rank"]},getShaderSource:h=>ps(h,e,a,o,i),getRunData:()=>({outputs:[{dims:a,dataType:i}],dispatchGroup:{x:Math.ceil(c/64/4)},programUniforms:[{type:12,data:p},...Mt(n,t,s,a)]})}},es=e=>{e.compute(ys(e.inputs))}}),zs,Fs=y(()=>{pc(),Zi(),hc(),mc(),fc(),_c(),su(),Mc(),Mu(),vc(),ku(),xc(),Tc(),Pc(),Bp(),Vn(),Ec(),kc(),sd(),Jo(),Ac(),Ic(),Fc(),Pd(),fs(),hd(),Od(),Rc(),Nc(),Rp(),Np(),ri(),jp(),mp(),yn(),Le(),Zt(),_d(),Qt(),jr(),wo(),Us(),zs=new Map([["Abs",[ml]],["Acos",[no]],["Acosh",[fl]],["Add",[Gl]],["ArgMax",[qi,Qi]],["ArgMin",[ol,Qi]],["Asin",[_l]],["Asinh",[io]],["Atan",[gl]],["Atanh",[wl]],["Attention",[ul]],["AveragePool",[Bd,zd]],["BatchNormalization",[to]],["BiasAdd",[hl]],["BiasSplitGelu",[Vl]],["Cast",[yl,oo]],["Ceil",[vl]],["Clip",[bl]],["Concat",[eu,tu]],["Conv",[Vo,Ro]],["ConvTranspose",[yu,Ko]],["Cos",[ao]],["Cosh",[xl]],["CumSum",[vu,xu]],["DepthToSpace",[Eu,Cu]],["DequantizeLinear",[Kd,Hd]],["Div",[Kl]],["Einsum",[Ou,Du]],["Elu",[lo,Bn]],["Equal",[Mo]],["Erf",[Tl]],["Exp",[uo]],["Expand",[jn]],["FastGelu",[Ru]],["Floor",[Pl]],["FusedConv",[Vo,Ro]],["Gather",[Vu,ju]],["GatherElements",[Cc,gi]],["GatherBlockQuantized",[qu,Qu]],["GatherND",[Wu,Gu]],["Gelu",[El]],["Gemm",[td,ed]],["GlobalAveragePool",[Nd,Rd]],["GlobalMaxPool",[Bc,Ud]],["Greater",[Ql]],["GreaterOrEqual",[vo]],["GridSample",[ud,Yo]],["GroupQueryAttention",[na]],["HardSigmoid",[Al,ho]],["InstanceNormalization",[yd]],["LayerNormalization",[vd]],["LeakyRelu",[co,Bn]],["Less",[Xl]],["LessOrEqual",[Yl]],["Log",[Bl]],["MatMul",[Td]],["MatMulNBits",[kd,Sd]],["MaxPool",[jd,Vd]],["Mul",[Hl]],["MultiHeadAttention",[Zo,cd]],["Neg",[kl]],["Not",[Cl]],["Pad",[ua]],["Pow",[ql]],["QuickGelu",[Nl,Bn]],["Range",[Uc]],["Reciprocal",[po]],["ReduceMin",[sl]],["ReduceMean",[Za]],["ReduceMax",[Gi]],["ReduceSum",[Ki]],["ReduceProd",[rl]],["ReduceL1",[Wi]],["ReduceL2",[el]],["ReduceLogSum",[il]],["ReduceLogSumExp",[tl]],["ReduceSumSquare",[nl]],["Relu",[Sl]],["Resize",[dp,cp]],["RotaryEmbedding",[Kt]],["ScatterND",[Hc,Kc]],["Sigmoid",[$l]],["Sin",[Il]],["Sinh",[mo]],["Slice",[xe,$e]],["SkipLayerNormalization",[Zs]],["Split",[ta,fd]],["Sqrt",[Fl]],["Softmax",[_t,kt]],["Sub",[bo]],["Tan",[Ol]],["Tanh",[Dl]],["ThresholdedRelu",[zl,Bn]],["Tile",[Ht]],["Transpose",[Ia,Li]],["Where",[es]]])}),Bs,nr=y(()=>{We(),Te(),qt(),Bs=class{constructor(e){this.backend=e,this.repo=new Map,this.attributesBound=!1}getArtifact(e){return this.repo.get(e)}setArtifact(e,t){this.repo.set(e,t)}run(e,t,s,n,i){Ue(e.programInfo.name);let o=this.backend.device,a=this.backend.getComputePassEncoder();this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2);let c=[];for(let h of t)c.push({binding:c.length,resource:{buffer:h.buffer}});for(let h of s)c.push({binding:c.length,resource:{buffer:h.buffer}});i&&c.push({binding:c.length,resource:i});let p=o.createBindGroup({layout:e.computePipeline.getBindGroupLayout(0),entries:c,label:e.programInfo.name});if(this.backend.sessionStatus==="capturing"){let h={kernelId:this.backend.currentKernelId,computePipeline:e.computePipeline,bindGroup:p,dispatchGroup:n};this.backend.capturedCommandList.get(this.backend.currentSessionId).push(h)}a.setPipeline(e.computePipeline),a.setBindGroup(0,p),a.dispatchWorkgroups(...n),this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2+1),this.backend.pendingDispatchNumber++,(this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber||this.backend.queryType==="at-passes")&&this.backend.endComputePass(),this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber&&this.backend.flush(),ze(e.programInfo.name)}dispose(){}build(e,t){Ue(e.name);let s=this.backend.device,n=[];[{feature:"shader-f16",extension:"f16"},{feature:"subgroups",extension:"subgroups"},{feature:"subgroups-f16",extension:"subgroups_f16"}].forEach(h=>{s.features.has(h.feature)&&n.push(`enable ${h.extension};`)});let i=ka(t,this.backend.device.limits),o=e.getShaderSource(i),a=`${n.join(` +`)} +${i.additionalImplementations} +${o}`,c=s.createShaderModule({code:a,label:e.name});as("verbose",()=>`[WebGPU] ${e.name} shader code: ${a}`);let p=s.createComputePipeline({compute:{module:c,entryPoint:"main"},layout:"auto",label:e.name});return ze(e.name),{programInfo:e,computePipeline:p,uniformVariablesInfo:i.variablesInfo}}normalizeDispatchGroupSize(e){let t=typeof e=="number"?e:e.x,s=typeof e=="number"?1:e.y||1,n=typeof e=="number"?1:e.z||1,i=this.backend.device.limits.maxComputeWorkgroupsPerDimension;if(t<=i&&s<=i&&n<=i)return[t,s,n];let o=t*s*n,a=Math.ceil(Math.sqrt(o));if(a>i){if(a=Math.ceil(Math.cbrt(o)),a>i)throw new Error("Total dispatch size exceeds WebGPU maximum.");return[a,a,a]}else return[a,a,1]}}}),mr,_a,lr,Ar,Gn,Xd=y(()=>{We(),Ot(),Te(),Y(),Ms(),Fs(),nr(),mr=(e,t)=>{if(t.length!==e.length)throw new Error(`inputDependencies length ${t.length} is not equal to inputTensors length ${e.length}.`);let s=[];for(let n=0;n{let n=e.name;return e.shaderCache?.hint&&(n+="["+e.shaderCache.hint+"]"),n+=":"+s+`:${mr(t,e.shaderCache?.inputDependencies??new Array(t.length).fill("dims"))}`,n},lr=class{constructor(e){e&&(this.architecture=e.architecture,this.vendor=e.vendor)}isArchitecture(e){return this.architecture===e}isVendor(e){return this.vendor===e}},Ar=class{constructor(e){this.subgroupsSupported=e.features.has("subgroups"),this.subgroupsF16Supported=e.features.has("subgroups");let t=e.limits;!this.subgroupsSupported||!t.minSubgroupSize||!t.maxSubgroupSize?this.subgroupSizeRange=void 0:this.subgroupSizeRange=[t.minSubgroupSize,t.maxSubgroupSize]}},Gn=class{constructor(){this.currentSessionId=null,this.currentKernelId=null,this.commandEncoder=null,this.computePassEncoder=null,this.maxDispatchNumber=16,this.pendingDispatchNumber=0,this.pendingKernels=[],this.pendingQueries=new Map,this.sessionStatus="default",this.capturedCommandList=new Map,this.capturedPendingKernels=new Map,this.sessionExternalDataMapping=new Map}get currentKernelCustomData(){if(this.currentKernelId===null)throw new Error("currentKernelCustomData(): currentKernelId is null. (should not happen)");let e=this.kernelCustomData.get(this.currentKernelId);return e||(e={},this.kernelCustomData.set(this.currentKernelId,e)),e}async initialize(e,t){this.env=e;let s=[],n={requiredLimits:{maxComputeWorkgroupStorageSize:t.limits.maxComputeWorkgroupStorageSize,maxComputeWorkgroupsPerDimension:t.limits.maxComputeWorkgroupsPerDimension,maxStorageBufferBindingSize:t.limits.maxStorageBufferBindingSize,maxBufferSize:t.limits.maxBufferSize,maxComputeInvocationsPerWorkgroup:t.limits.maxComputeInvocationsPerWorkgroup,maxComputeWorkgroupSizeX:t.limits.maxComputeWorkgroupSizeX,maxComputeWorkgroupSizeY:t.limits.maxComputeWorkgroupSizeY,maxComputeWorkgroupSizeZ:t.limits.maxComputeWorkgroupSizeZ},requiredFeatures:s},i=o=>t.features.has(o)&&s.push(o)&&!0;i("chromium-experimental-timestamp-query-inside-passes")||i("timestamp-query"),i("shader-f16"),i("subgroups")&&i("subgroups-f16"),this.device=await t.requestDevice(n),this.deviceInfo=new Ar(this.device),this.adapterInfo=new lr(t.info||await t.requestAdapterInfo()),this.gpuDataManager=Yt(this),this.programManager=new Bs(this),this.kernels=new Map,this.kernelPersistentData=new Map,this.kernelCustomData=new Map,gn(e.logLevel,!!e.debug),this.device.onuncapturederror=o=>{o.error instanceof GPUValidationError&&console.error(`An uncaught WebGPU validation error was raised: ${o.error.message}`)},Object.defineProperty(this.env.webgpu,"device",{value:this.device,writable:!1,enumerable:!0,configurable:!1}),Object.defineProperty(this.env.webgpu,"adapter",{value:t,writable:!1,enumerable:!0,configurable:!1}),this.setQueryType()}dispose(){typeof this.querySet<"u"&&this.querySet.destroy(),this.gpuDataManager.dispose()}getCommandEncoder(){return this.commandEncoder||(this.commandEncoder=this.device.createCommandEncoder()),this.commandEncoder}getComputePassEncoder(){if(!this.computePassEncoder){let e=this.getCommandEncoder(),t={};this.queryType==="at-passes"&&(t.timestampWrites={querySet:this.querySet,beginningOfPassWriteIndex:this.pendingDispatchNumber*2,endOfPassWriteIndex:this.pendingDispatchNumber*2+1}),this.computePassEncoder=e.beginComputePass(t)}return this.computePassEncoder}endComputePass(){this.computePassEncoder&&(this.computePassEncoder.end(),this.computePassEncoder=null)}flush(){if(!this.commandEncoder)return;Ue(),this.endComputePass();let e;this.queryType!=="none"&&(this.commandEncoder.resolveQuerySet(this.querySet,0,this.pendingDispatchNumber*2,this.queryResolveBuffer,0),e=this.device.createBuffer({size:this.pendingDispatchNumber*2*8,usage:GPUBufferUsage.MAP_READ|GPUBufferUsage.COPY_DST}),this.pendingQueries.set(e,this.pendingKernels),this.pendingKernels=[],this.commandEncoder.copyBufferToBuffer(this.queryResolveBuffer,0,e,0,this.pendingDispatchNumber*2*8)),this.device.queue.submit([this.commandEncoder.finish()]),this.gpuDataManager.refreshPendingBuffers(),this.commandEncoder=null,this.pendingDispatchNumber=0,this.queryType!=="none"&&e.mapAsync(GPUMapMode.READ).then(()=>{let t=new BigUint64Array(e.getMappedRange()),s=this.pendingQueries.get(e);for(let n=0;n"u"&&(this.queryTimeBase=k);let R=Number(k-this.queryTimeBase),z=Number(B-this.queryTimeBase);if(!Number.isSafeInteger(R)||!Number.isSafeInteger(z))throw new RangeError("incorrect timestamp range");if(this.env.webgpu.profiling?.ondata)this.env.webgpu.profiling.ondata({version:1,inputsMetadata:C.map(ne=>({dims:ne.dims,dataType:fr(ne.dataType)})),outputsMetadata:u.map(ne=>({dims:ne.dims,dataType:fr(ne.dataType)})),kernelId:o,kernelType:c,kernelName:p,programName:h,startTime:R,endTime:z});else{let ne="";C.forEach((W,ue)=>{ne+=`input[${ue}]: [${W.dims}] | ${fr(W.dataType)}, `});let J="";u.forEach((W,ue)=>{J+=`output[${ue}]: [${W.dims}] | ${fr(W.dataType)}, `}),console.log(`[profiling] kernel "${o}|${c}|${p}|${h}" ${ne}${J}execution time: ${z-R} ns`)}Ke("GPU",`${h}::${k}::${B}`)}e.unmap(),this.pendingQueries.delete(e)}),ze()}run(e,t,s,n,i,o){Ue(e.name);let a=[];for(let W=0;Wue):s;if(C.length!==c.length)throw new Error(`Output size ${C.length} must be equal to ${c.length}.`);let u=[],k=[];for(let W=0;W=o)throw new Error(`Invalid output index: ${C[W]}`);if(C[W]===-3)continue;let ue=C[W]===-1,he=C[W]===-2,be=ue||he?i(c[W].dataType,c[W].dims):n(C[W],c[W].dataType,c[W].dims);if(u.push(be),be.data===0)continue;let Be=this.gpuDataManager.get(be.data);if(!Be)throw new Error(`no GPU data for output: ${be.data}`);if(ue&&this.temporaryData.push(Be),he){let Ie=this.kernelPersistentData.get(this.currentKernelId);Ie||(Ie=[],this.kernelPersistentData.set(this.currentKernelId,Ie)),Ie.push(Be)}k.push(Be)}if(a.length!==t.length||k.length!==u.length){if(k.length===0)return ze(e.name),u;throw new Error(`Program ${e.name} has zero-sized tensor(s) in inputs or outputs. This is not supported now.`)}let B;if(h){let W=0,ue=[];h.forEach(Ie=>{let nt=typeof Ie.data=="number"?[Ie.data]:Ie.data;if(nt.length===0)return;let dt=Ie.type===10?2:4,Et,zt;Ie.type===10?(zt=nt.length>4?16:nt.length>2?8:nt.length*dt,Et=nt.length>4?16:dt*nt.length):(zt=nt.length<=2?nt.length*dt:16,Et=16),W=Math.ceil(W/zt)*zt,ue.push(W);let It=Ie.type===10?8:4;W+=nt.length>4?Math.ceil(nt.length/It)*Et:nt.length*dt});let he=16;W=Math.ceil(W/he)*he;let be=new ArrayBuffer(W);h.forEach((Ie,nt)=>{let dt=ue[nt],Et=typeof Ie.data=="number"?[Ie.data]:Ie.data;if(Ie.type===6)new Int32Array(be,dt,Et.length).set(Et);else if(Ie.type===12)new Uint32Array(be,dt,Et.length).set(Et);else if(Ie.type===10)new Uint16Array(be,dt,Et.length).set(Et);else if(Ie.type===1)new Float32Array(be,dt,Et.length).set(Et);else throw new Error(`Unsupported uniform type: ${fr(Ie.type)}`)});let Be=this.gpuDataManager.create(W,GPUBufferUsage.COPY_DST|GPUBufferUsage.UNIFORM);this.device.queue.writeBuffer(Be.buffer,0,be,0,W),this.gpuDataManager.release(Be.id),B={offset:0,size:W,buffer:Be.buffer}}let R=this.programManager.normalizeDispatchGroupSize(p),z=R[1]===1&&R[2]===1,ne=_a(e,t,z),J=this.programManager.getArtifact(ne);if(J||(J=this.programManager.build(e,R),this.programManager.setArtifact(ne,J),as("info",()=>`[artifact] key: ${ne}, programName: ${e.name}`)),h&&J.uniformVariablesInfo){if(h.length!==J.uniformVariablesInfo.length)throw new Error(`Uniform variables count mismatch: expect ${J.uniformVariablesInfo.length}, got ${h.length} in program "${J.programInfo.name}".`);for(let W=0;W`[ProgramManager] run "${e.name}" (key=${ne}) with ${R[0]}x${R[1]}x${R[2]}`),this.queryType!=="none"||this.sessionStatus==="capturing"){let W={kernelId:this.currentKernelId,programName:J.programInfo.name,inputTensorViews:t,outputTensorViews:u};this.pendingKernels.push(W),this.sessionStatus==="capturing"&&this.capturedPendingKernels.get(this.currentSessionId).push(W)}return this.programManager.run(J,a,k,R,B),ze(e.name),u}upload(e,t){this.gpuDataManager.upload(e,t)}memcpy(e,t){this.gpuDataManager.memcpy(e,t)}async download(e,t){await this.gpuDataManager.download(e,t)}alloc(e){return this.gpuDataManager.create(e).id}free(e){return this.gpuDataManager.release(e)}createKernel(e,t,s,n){let i=zs.get(e);if(!i)throw new Error(`kernel not implemented: ${e}`);let o={kernelType:e,kernelName:n,kernelEntry:i[0],attributes:[i[1],s]};this.kernels.set(t,o)}releaseKernel(e){let t=this.kernelPersistentData.get(e);if(t){for(let s of t)this.gpuDataManager.release(s.id);this.kernelPersistentData.delete(e)}this.kernelCustomData.delete(e),this.kernels.delete(e)}computeKernel(e,t,s){let n=this.kernels.get(e);if(!n)throw new Error(`kernel not created: ${e}`);let i=n.kernelType,o=n.kernelName,a=n.kernelEntry,c=n.attributes;if(this.currentKernelId!==null)throw new Error(`kernel "[${i}] ${o}" is not allowed to be called recursively`);this.currentKernelId=e,c[0]&&(c[1]=c[0](c[1]),c[0]=void 0),as("info",()=>`[WebGPU] Start to run kernel "[${i}] ${o}"...`);let p=this.env.debug;this.temporaryData=[];try{return p&&this.device.pushErrorScope("validation"),a(t,c[1]),0}catch(h){return s.push(Promise.resolve(`[WebGPU] Kernel "[${i}] ${o}" failed. ${h}`)),1}finally{p&&s.push(this.device.popErrorScope().then(h=>h?`GPU validation error for kernel "[${i}] ${o}": ${h.message}`:null));for(let h of this.temporaryData)this.gpuDataManager.release(h.id);this.temporaryData=[],this.currentKernelId=null}}registerBuffer(e,t,s,n){let i=this.sessionExternalDataMapping.get(e);i||(i=new Map,this.sessionExternalDataMapping.set(e,i));let o=i.get(t),a=this.gpuDataManager.registerExternalBuffer(s,n,o);return i.set(t,[a,s]),a}unregisterBuffers(e){let t=this.sessionExternalDataMapping.get(e);t&&(t.forEach(s=>this.gpuDataManager.unregisterExternalBuffer(s[0])),this.sessionExternalDataMapping.delete(e))}getBuffer(e){let t=this.gpuDataManager.get(e);if(!t)throw new Error(`no GPU data for buffer: ${e}`);return t.buffer}createDownloader(e,t,s){return async()=>{let n=await pt(this,e,t);return M(n.buffer,s)}}writeTimestamp(e){this.queryType==="inside-passes"&&this.computePassEncoder.writeTimestamp(this.querySet,e)}setQueryType(){this.queryType="none",(this.env.webgpu.profiling?.mode==="default"||(typeof this.env.trace>"u"?this.env.wasm.trace:this.env.trace))&&(this.device.features.has("chromium-experimental-timestamp-query-inside-passes")?this.queryType="inside-passes":this.device.features.has("timestamp-query")&&(this.queryType="at-passes"),this.queryType!=="none"&&typeof this.querySet>"u"&&(this.querySet=this.device.createQuerySet({type:"timestamp",count:this.maxDispatchNumber*2}),this.queryResolveBuffer=this.device.createBuffer({size:this.maxDispatchNumber*2*8,usage:GPUBufferUsage.COPY_SRC|GPUBufferUsage.QUERY_RESOLVE})))}captureBegin(){as("info","captureBegin"),this.capturedCommandList.get(this.currentSessionId)||this.capturedCommandList.set(this.currentSessionId,[]),this.capturedPendingKernels.get(this.currentSessionId)||this.capturedPendingKernels.set(this.currentSessionId,[]),this.flush(),this.sessionStatus="capturing"}captureEnd(){as("info","captureEnd"),this.flush(),this.sessionStatus="default"}replay(){as("info","replay"),this.sessionStatus="replaying";let e=this.capturedCommandList.get(this.currentSessionId),t=this.capturedPendingKernels.get(this.currentSessionId),s=e.length;this.pendingKernels=[];for(let n=0;n=this.maxDispatchNumber||this.queryType==="at-passes")&&this.endComputePass(),this.pendingDispatchNumber>=this.maxDispatchNumber&&this.flush()}this.flush(),this.sessionStatus="default"}onCreateSession(){this.gpuDataManager.onCreateSession()}onReleaseSession(e){this.unregisterBuffers(e),this.capturedCommandList.has(e)&&this.capturedCommandList.delete(e),this.capturedPendingKernels.has(e)&&this.capturedPendingKernels.delete(e),this.gpuDataManager.onReleaseSession(e)}onRunStart(e){this.currentSessionId=e,this.setQueryType()}}}),xi,Mn,_p,ws,Os,Ir,sn,bn,ga=y(()=>{Te(),xi=1,Mn=()=>xi++,_p=new Map([["float32",32],["float16",16],["int32",32],["uint32",32],["int64",64],["uint64",64],["int8",8],["uint8",8],["int4",4],["uint4",4]]),ws=(e,t)=>{let s=_p.get(e);if(!s)throw new Error("Unsupported data type.");return t.length>0?Math.ceil(t.reduce((n,i)=>n*i)*s/8):0},Os=class{constructor(e){this.sessionId=e.sessionId,this.mlContext=e.context,this.mlTensor=e.tensor,this.dataType=e.dataType,this.tensorShape=e.shape}get tensor(){return this.mlTensor}get type(){return this.dataType}get shape(){return this.tensorShape}get byteLength(){return ws(this.dataType,this.tensorShape)}destroy(){as("verbose",()=>"[WebNN] TensorWrapper.destroy"),this.mlTensor.destroy()}write(e){this.mlContext.writeTensor(this.mlTensor,e)}async read(e){return e?this.mlContext.readTensor(this.mlTensor,e):this.mlContext.readTensor(this.mlTensor)}canReuseTensor(e,t,s){return this.mlContext===e&&this.dataType===t&&this.tensorShape.length===s.length&&this.tensorShape.every((n,i)=>n===s[i])}},Ir=class{constructor(e,t){this.tensorManager=e,this.wrapper=t}get tensorWrapper(){return this.wrapper}releaseTensor(){this.tensorWrapper&&(this.tensorManager.releaseTensor(this.tensorWrapper),this.wrapper=void 0)}async ensureTensor(e,t,s,n){if(this.wrapper){if(this.wrapper.canReuseTensor(e,t,s))return this.wrapper.tensor;if(n){if(this.wrapper.byteLength!==ws(t,s))throw new Error("Unable to copy data to tensor with different size.");this.activeUpload=new Uint8Array(await this.wrapper.read())}this.tensorManager.releaseTensor(this.wrapper)}let i=typeof MLTensorUsage>"u"?void 0:MLTensorUsage.READ|MLTensorUsage.WRITE;return this.wrapper=await this.tensorManager.getCachedTensor(t,s,i,!0,!0),n&&this.activeUpload&&(this.wrapper.write(this.activeUpload),this.activeUpload=void 0),this.wrapper.tensor}upload(e){if(this.wrapper)if(e.byteLength===this.wrapper.byteLength){this.wrapper.write(e);return}else as("verbose",()=>"Data size does not match tensor size. Releasing tensor."),this.releaseTensor();this.activeUpload?this.activeUpload.set(e):this.activeUpload=new Uint8Array(e)}async download(e){if(this.activeUpload)if(e){e instanceof ArrayBuffer?new Uint8Array(e).set(this.activeUpload):new Uint8Array(e.buffer,e.byteOffset,e.byteLength).set(this.activeUpload);return}else return this.activeUpload.buffer;if(!this.wrapper)throw new Error("Tensor has not been created.");return e?this.wrapper.read(e):this.wrapper.read()}},sn=class{constructor(e){this.backend=e,this.tensorTrackersById=new Map,this.freeTensors=[],this.externalTensors=new Set}reserveTensorId(){let e=Mn();return this.tensorTrackersById.set(e,new Ir(this)),e}releaseTensorId(e){let t=this.tensorTrackersById.get(e);t&&(this.tensorTrackersById.delete(e),t.tensorWrapper&&this.releaseTensor(t.tensorWrapper))}async ensureTensor(e,t,s,n){as("verbose",()=>`[WebNN] TensorManager.ensureTensor {tensorId: ${e}, dataType: ${t}, shape: ${s}, copyOld: ${n}}`);let i=this.tensorTrackersById.get(e);if(!i)throw new Error("Tensor not found.");return i.ensureTensor(this.backend.currentContext,t,s,n)}upload(e,t){let s=this.tensorTrackersById.get(e);if(!s)throw new Error("Tensor not found.");s.upload(t)}async download(e,t){as("verbose",()=>`[WebNN] TensorManager.download {tensorId: ${e}, dstBuffer: ${t?.byteLength}}`);let s=this.tensorTrackersById.get(e);if(!s)throw new Error("Tensor not found.");return s.download(t)}releaseTensorsForSession(e){for(let t of this.freeTensors)t.sessionId===e&&t.destroy();this.freeTensors=this.freeTensors.filter(t=>t.sessionId!==e)}registerTensor(e,t,s,n){let i=Mn(),o=new Os({sessionId:this.backend.currentSessionId,context:e,tensor:t,dataType:s,shape:n});return this.tensorTrackersById.set(i,new Ir(this,o)),this.externalTensors.add(o),i}async getCachedTensor(e,t,s,n,i){let o=this.backend.currentSessionId,a=this.backend.currentContext;for(let[p,h]of this.freeTensors.entries())if(h.canReuseTensor(a,e,t)){as("verbose",()=>`[WebNN] Reusing tensor {dataType: ${e}, shape: ${t}}`);let C=this.freeTensors.splice(p,1)[0];return C.sessionId=o,C}as("verbose",()=>`[WebNN] MLContext.createTensor {dataType: ${e}, shape: ${t}}`);let c=await a.createTensor({dataType:e,shape:t,dimensions:t,usage:s,writable:n,readable:i});return new Os({sessionId:o,context:a,tensor:c,dataType:e,shape:t})}releaseTensor(e){this.externalTensors.has(e)&&this.externalTensors.delete(e),this.freeTensors.push(e)}},bn=(...e)=>new sn(...e)}),Ti,wa,ya,Vp=y(()=>{Ot(),br(),Y(),ga(),Te(),Ti=new Map([[1,"float32"],[10,"float16"],[6,"int32"],[12,"uint32"],[7,"int64"],[13,"uint64"],[22,"int4"],[21,"uint4"],[3,"int8"],[2,"uint8"],[9,"uint8"]]),wa=(e,t)=>{if(e===t)return!0;if(e===void 0||t===void 0)return!1;let s=Object.keys(e).sort(),n=Object.keys(t).sort();return s.length===n.length&&s.every((i,o)=>i===n[o]&&e[i]===t[i])},ya=class{constructor(e){this.tensorManager=bn(this),this.mlContextBySessionId=new Map,this.sessionIdsByMLContext=new Map,this.mlContextCache=[],gn(e.logLevel,!!e.debug)}get currentSessionId(){if(this.activeSessionId===void 0)throw new Error("No active session");return this.activeSessionId}onRunStart(e){this.activeSessionId=e}async createMLContext(e){if(e instanceof GPUDevice){let s=this.mlContextCache.findIndex(n=>n.gpuDevice===e);if(s!==-1)return this.mlContextCache[s].mlContext;{let n=await navigator.ml.createContext(e);return this.mlContextCache.push({gpuDevice:e,mlContext:n}),n}}else if(e===void 0){let s=this.mlContextCache.findIndex(n=>n.options===void 0&&n.gpuDevice===void 0);if(s!==-1)return this.mlContextCache[s].mlContext;{let n=await navigator.ml.createContext();return this.mlContextCache.push({mlContext:n}),n}}let t=this.mlContextCache.findIndex(s=>wa(s.options,e));if(t!==-1)return this.mlContextCache[t].mlContext;{let s=await navigator.ml.createContext(e);return this.mlContextCache.push({options:e,mlContext:s}),s}}get currentContext(){let e=this.getMLContext(this.currentSessionId);if(!e)throw new Error(`No MLContext found for session ${this.currentSessionId}`);return e}registerMLContext(e,t){this.mlContextBySessionId.set(e,t);let s=this.sessionIdsByMLContext.get(t);s||(s=new Set,this.sessionIdsByMLContext.set(t,s)),s.add(e)}onReleaseSession(e){let t=this.mlContextBySessionId.get(e);if(!t)return;this.tensorManager.releaseTensorsForSession(e),this.mlContextBySessionId.delete(e);let s=this.sessionIdsByMLContext.get(t);if(s.delete(e),s.size===0){this.sessionIdsByMLContext.delete(t);let n=this.mlContextCache.findIndex(i=>i.mlContext===t);n!==-1&&this.mlContextCache.splice(n,1)}}getMLContext(e){return this.mlContextBySessionId.get(e)}reserveTensorId(){return this.tensorManager.reserveTensorId()}releaseTensorId(e){as("verbose",()=>`[WebNN] releaseTensorId {tensorId: ${e}}`),this.tensorManager.releaseTensorId(e)}async ensureTensor(e,t,s,n){let i=Ti.get(t);if(!i)throw new Error(`Unsupported ONNX data type: ${t}`);return this.tensorManager.ensureTensor(e,i,s,n)}uploadTensor(e,t){if(!gs().shouldTransferToMLTensor)throw new Error("Trying to upload to a MLTensor while shouldTransferToMLTensor is false");as("verbose",()=>`[WebNN] uploadTensor {tensorId: ${e}, data: ${t.byteLength}}`),this.tensorManager.upload(e,t)}async downloadTensor(e,t){return this.tensorManager.download(e,t)}createMLTensorDownloader(e,t){return async()=>{let s=await this.tensorManager.download(e);return M(s,t)}}registerMLTensor(e,t,s){let n=Ti.get(t);if(!n)throw new Error(`Unsupported ONNX data type: ${t}`);let i=this.tensorManager.registerTensor(this.currentContext,e,n,s);return as("verbose",()=>`[WebNN] registerMLTensor {tensor: ${e}, dataType: ${n}, dimensions: ${s}} -> {tensorId: ${i}}`),i}registerMLConstant(e,t,s,n,i,o){if(!o)throw new Error("External mounted files are not available.");let a=e;e.startsWith("./")&&(a=e.substring(2));let c=o.get(a);if(!c)throw new Error(`File with name ${a} not found in preloaded files.`);if(t+s>c.byteLength)throw new Error("Out of bounds: data offset and length exceed the external file data size.");let p=c.slice(t,t+s).buffer,h;switch(i.dataType){case"float32":h=new Float32Array(p);break;case"float16":h=new Uint16Array(p);break;case"int32":h=new Int32Array(p);break;case"uint32":h=new Uint32Array(p);break;case"int64":h=new BigInt64Array(p);break;case"uint64":h=new BigUint64Array(p);break;case"int8":h=new Int8Array(p);break;case"int4":case"uint4":case"uint8":h=new Uint8Array(p);break;default:throw new Error(`Unsupported data type: ${i.dataType} in creating WebNN Constant from external data.`)}return as("verbose",()=>`[WebNN] registerMLConstant {dataType: ${i.dataType}, shape: ${i.shape}}}`),n.constant(i,h)}flush(){}}}),Ma={};T(Ma,{init:()=>Yd});var vn,ba,Yd,Jd=y(()=>{Ot(),Xd(),Te(),$t(),Vp(),vn=class mf{constructor(t,s,n,i){this.module=t,this.dataType=s,this.data=n,this.dims=i}getFloat32Array(){if(this.dataType!==1)throw new Error("Invalid data type");let t=De.size(this.dims);return t===0?new Float32Array:new Float32Array(this.module.HEAP8.buffer,this.data,t)}getBigInt64Array(){if(this.dataType!==7)throw new Error("Invalid data type");let t=De.size(this.dims);return t===0?new BigInt64Array:new BigInt64Array(this.module.HEAP8.buffer,this.data,t)}getInt32Array(){if(this.dataType!==6)throw new Error("Invalid data type");let t=De.size(this.dims);return t===0?new Int32Array:new Int32Array(this.module.HEAP8.buffer,this.data,t)}getUint16Array(){if(this.dataType!==10&&this.dataType!==4)throw new Error("Invalid data type");let t=De.size(this.dims);return t===0?new Uint16Array:new Uint16Array(this.module.HEAP8.buffer,this.data,t)}reshape(t){if(De.size(t)!==De.size(this.dims))throw new Error("Invalid new shape");return new mf(this.module,this.dataType,this.data,t)}},ba=class{constructor(e,t,s){this.module=e,this.backend=t,this.customDataOffset=0,this.customDataSize=0,this.adapterInfo=t.adapterInfo,this.deviceInfo=t.deviceInfo;let n=e.PTR_SIZE,i=s/e.PTR_SIZE,o=n===4?"i32":"i64";this.opKernelContext=Number(e.getValue(n*i++,o));let a=Number(e.getValue(n*i++,o));this.outputCount=Number(e.getValue(n*i++,o)),this.customDataOffset=Number(e.getValue(n*i++,"*")),this.customDataSize=Number(e.getValue(n*i++,o));let c=[];for(let p=0;ptypeof a=="number"?this.inputs[a]:a)??this.inputs,n=t?.outputs??[],i=(a,c,p)=>new vn(this.module,c,this.output(a,p),p),o=(a,c)=>{let p=ar(a,c);if(!p)throw new Error(`Unsupported data type: ${a}`);let h=p>0?this.backend.gpuDataManager.create(p).id:0;return new vn(this.module,a,h,c)};return this.backend.run(e,s,n,i,o,this.outputCount)}output(e,t){let s=this.module.stackSave();try{let n=this.module.PTR_SIZE,i=n===4?"i32":"i64",o=this.module.stackAlloc((1+t.length)*n);this.module.setValue(o,t.length,i);for(let a=0;a{let i=t.jsepInit;if(!i)throw new Error("Failed to initialize JSEP. The WebAssembly module is not built with JSEP support.");if(e==="webgpu"){let o=new Gn;await o.initialize(s,n),i("webgpu",[o,a=>o.alloc(Number(a)),a=>o.free(a),(a,c,p,h=!1)=>{if(h)as("verbose",()=>`[WebGPU] jsepCopyGpuToGpu: src=${Number(a)}, dst=${Number(c)}, size=${Number(p)}`),o.memcpy(Number(a),Number(c));else{as("verbose",()=>`[WebGPU] jsepCopyCpuToGpu: dataOffset=${Number(a)}, gpuDataId=${Number(c)}, size=${Number(p)}`);let C=t.HEAPU8.subarray(Number(a>>>0),Number(a>>>0)+Number(p));o.upload(Number(c),C)}},async(a,c,p)=>{as("verbose",()=>`[WebGPU] jsepCopyGpuToCpu: gpuDataId=${a}, dataOffset=${c}, size=${p}`),await o.download(Number(a),()=>t.HEAPU8.subarray(Number(c)>>>0,Number(c+p)>>>0))},(a,c,p)=>o.createKernel(a,Number(c),p,t.UTF8ToString(t._JsepGetNodeName(Number(c)))),a=>o.releaseKernel(a),(a,c,p,h)=>{as("verbose",()=>`[WebGPU] jsepRun: sessionHandle=${p}, kernel=${a}, contextDataOffset=${c}`);let C=new ba(t,o,Number(c));return o.computeKernel(Number(a),C,h)},()=>o.captureBegin(),()=>o.captureEnd(),()=>o.replay()])}else{let o=new ya(s);i("webnn",[o,()=>o.reserveTensorId(),a=>o.releaseTensorId(a),async(a,c,p,h)=>o.ensureTensor(a,c,p,h),(a,c)=>{o.uploadTensor(a,c)},async(a,c)=>o.downloadTensor(a,c)])}}}),Pi,Zd,ec,rn,nn,ur,Up,Wp,Gp,Kp,Hp,qp,Ch=y(()=>{Jn(),Zn(),Ot(),br(),cn(),In(),Pi=(e,t)=>{gs()._OrtInit(e,t)!==0&&ns("Can't initialize onnxruntime.")},Zd=async e=>{Pi(e.wasm.numThreads,Xr(e.logLevel))},ec=async(e,t)=>{{let s=(Jd(),x(Ma)).init;if(t==="webgpu"){if(typeof navigator>"u"||!navigator.gpu)throw new Error("WebGPU is not supported in current environment");let n=e.webgpu.adapter;if(n){if(typeof n.limits!="object"||typeof n.features!="object"||typeof n.requestDevice!="function")throw new Error("Invalid GPU adapter set in `env.webgpu.adapter`. It must be a GPUAdapter object.")}else{let i=e.webgpu.powerPreference;if(i!==void 0&&i!=="low-power"&&i!=="high-performance")throw new Error(`Invalid powerPreference setting: "${i}"`);let o=e.webgpu.forceFallbackAdapter;if(o!==void 0&&typeof o!="boolean")throw new Error(`Invalid forceFallbackAdapter setting: "${o}"`);if(n=await navigator.gpu.requestAdapter({powerPreference:i,forceFallbackAdapter:o}),!n)throw new Error('Failed to get GPU adapter. You may need to enable flag "--enable-unsafe-webgpu" if you are using Chrome.')}await s("webgpu",gs(),e,n)}if(t==="webnn"){if(typeof navigator>"u"||!navigator.ml)throw new Error("WebNN is not supported in current environment");await s("webnn",gs(),e)}}},rn=new Map,nn=e=>{let t=gs(),s=t.stackSave();try{let n=t.PTR_SIZE,i=t.stackAlloc(2*n);t._OrtGetInputOutputCount(e,i,i+n)!==0&&ns("Can't get session input/output count.");let o=n===4?"i32":"i64";return[Number(t.getValue(i,o)),Number(t.getValue(i+n,o))]}finally{t.stackRestore(s)}},ur=e=>{let t=gs(),s=t._malloc(e.byteLength);if(s===0)throw new Error(`Can't create a session. failed to allocate a buffer of size ${e.byteLength}.`);return t.HEAPU8.set(e,s),[s,e.byteLength]},Up=async(e,t)=>{let s,n,i=gs();Array.isArray(e)?[s,n]=e:e.buffer===i.HEAPU8.buffer?[s,n]=[e.byteOffset,e.byteLength]:[s,n]=ur(e);let o=0,a=0,c=0,p=[],h=[],C=[];try{if([a,p]=An(t),t?.externalData&&i.mountExternalData){let W=[];for(let ue of t.externalData){let he=typeof ue=="string"?ue:ue.path;W.push(_n(typeof ue=="string"?ue:ue.data).then(be=>{i.mountExternalData(he,be)}))}await Promise.all(W)}for(let W of t?.executionProviders??[])if((typeof W=="string"?W:W.name)==="webnn"){if(i.shouldTransferToMLTensor=!1,typeof W!="string"){let ue=W,he=ue?.context,be=ue?.gpuDevice,Be=ue?.deviceType,Ie=ue?.powerPreference;he?i.currentContext=he:be?i.currentContext=await i.jsepCreateMLContext(be):i.currentContext=await i.jsepCreateMLContext({deviceType:Be,powerPreference:Ie})}else i.currentContext=await i.jsepCreateMLContext();break}o=await i._OrtCreateSession(s,n,a),o===0&&ns("Can't create a session."),i.jsepOnCreateSession?.(),i.currentContext&&(i.jsepRegisterMLContext(o,i.currentContext),i.currentContext=void 0,i.shouldTransferToMLTensor=!0);let[u,k]=nn(o),B=!!t?.enableGraphCapture,R=[],z=[],ne=[];for(let W=0;WW==="gpu-buffer"||W==="ml-tensor")&&(c=i._OrtCreateBinding(o),c===0&&ns("Can't create IO binding."),J={handle:c,outputPreferredLocations:ne,outputPreferredLocationsEncoded:ne.map(W=>fn(W))}),rn.set(o,[o,h,C,J,B,!1]),[o,R,z]}catch(u){throw h.forEach(k=>i._OrtFree(k)),C.forEach(k=>i._OrtFree(k)),c!==0&&i._OrtReleaseBinding(c)!==0&&ns("Can't release IO binding."),o!==0&&i._OrtReleaseSession(o)!==0&&ns("Can't release session."),u}finally{i._free(s),a!==0&&i._OrtReleaseSessionOptions(a)!==0&&ns("Can't release session options."),p.forEach(u=>i._free(u)),i.unmountExternalData?.()}},Wp=e=>{let t=gs(),s=rn.get(e);if(!s)throw new Error(`cannot release session. invalid session id: ${e}`);let[n,i,o,a,c]=s;a&&(c&&t._OrtClearBoundOutputs(a.handle)!==0&&ns("Can't clear bound outputs."),t._OrtReleaseBinding(a.handle)!==0&&ns("Can't release IO binding.")),t.jsepOnReleaseSession?.(e),i.forEach(p=>t._OrtFree(p)),o.forEach(p=>t._OrtFree(p)),t._OrtReleaseSession(n)!==0&&ns("Can't release session."),rn.delete(e)},Gp=(e,t,s,n,i,o=!1)=>{if(!e){t.push(0);return}let a=gs(),c=a.PTR_SIZE,p=e[0],h=e[1],C=e[3],u,k;if(p==="string"&&(C==="gpu-buffer"||C==="ml-tensor"))throw new Error("String tensor is not supported on GPU.");if(o&&C!=="gpu-buffer")throw new Error(`External buffer must be provided for input/output index ${i} when enableGraphCapture is true.`);if(C==="gpu-buffer"){let z=e[2].gpuBuffer;k=ar(Rr(p),h);let ne=a.jsepRegisterBuffer;if(!ne)throw new Error('Tensor location "gpu-buffer" is not supported without using WebGPU.');u=ne(n,i,z,k)}else if(C==="ml-tensor"){let z=e[2].mlTensor;k=ar(Rr(p),h);let ne=a.jsepRegisterMLTensor;if(!ne)throw new Error('Tensor location "ml-tensor" is not supported without using WebNN.');u=ne(z,Rr(p),h)}else{let z=e[2];if(Array.isArray(z)){k=c*z.length,u=a._malloc(k),s.push(u);for(let ne=0;nea.setValue(R+J*c,ne,c===4?"i32":"i64"));let z=a._OrtCreateTensor(Rr(p),u,k,R,h.length,fn(C));z===0&&ns(`Can't create tensor for input/output. session=${n}, index=${i}.`),t.push(z)}finally{a.stackRestore(B)}},Kp=async(e,t,s,n,i,o)=>{let a=gs(),c=a.PTR_SIZE,p=rn.get(e);if(!p)throw new Error(`cannot run inference. invalid session id: ${e}`);let h=p[0],C=p[1],u=p[2],k=p[3],B=p[4],R=p[5],z=t.length,ne=n.length,J=0,W=[],ue=[],he=[],be=[],Be=a.stackSave(),Ie=a.stackAlloc(z*c),nt=a.stackAlloc(z*c),dt=a.stackAlloc(ne*c),Et=a.stackAlloc(ne*c);try{a.jsepOnRunStart?.(h),[J,W]=zr(o);for(let ht=0;hter*Ss,1);Xt=fr(ut);let xn=k?.outputPreferredLocations[n[ht]];if(Xt==="string"){if(xn==="gpu-buffer"||xn==="ml-tensor")throw new Error("String tensor is not supported on GPU.");let er=[];for(let Ss=0;Ss0){let er=a.jsepGetBuffer;if(!er)throw new Error('preferredLocation "gpu-buffer" is not supported without using WebGPU.');let Ss=er(Ut),ir=ar(ut,xs);if(ir===void 0||!hn(Xt))throw new Error(`Unsupported data type: ${Xt}`);ts=!0,It.push([Xt,vs,{gpuBuffer:Ss,download:a.jsepCreateDownloader(Ss,ir,Xt),dispose:()=>{a._OrtReleaseTensor(Jt)!==0&&ns("Can't release tensor.")}},"gpu-buffer"])}else if(xn==="ml-tensor"&&xs>0){let er=a.jsepEnsureTensor;if(!er)throw new Error('preferredLocation "ml-tensor" is not supported without using WebNN.');if(ar(ut,xs)===void 0||!mn(Xt))throw new Error(`Unsupported data type: ${Xt}`);let Ss=await er(Ut,ut,vs,!1);ts=!0,It.push([Xt,vs,{mlTensor:Ss,download:a.jsepCreateMLTensorDownloader(Ut,Xt),dispose:()=>{a.jsepReleaseTensorId(Ut),a._OrtReleaseTensor(Jt)}},"ml-tensor"])}else{let er=pn(Xt),Ss=new er(xs);new Uint8Array(Ss.buffer,Ss.byteOffset,Ss.byteLength).set(a.HEAPU8.subarray(Ut,Ut+Ss.byteLength)),It.push([Xt,vs,Ss,"cpu"])}}finally{a.stackRestore(Vt),Xt==="string"&&Ut&&a._free(Ut),ts||a._OrtReleaseTensor(Jt)}}return k&&!B&&(a._OrtClearBoundOutputs(k.handle)!==0&&ns("Can't clear bound outputs."),rn.set(e,[h,C,u,k,B,!1])),It}finally{a.stackRestore(Be),ue.forEach(zt=>a._OrtReleaseTensor(zt)),he.forEach(zt=>a._OrtReleaseTensor(zt)),be.forEach(zt=>a._free(zt)),J!==0&&a._OrtReleaseRunOptions(J),W.forEach(zt=>a._free(zt))}},Hp=e=>{let t=gs(),s=rn.get(e);if(!s)throw new Error("invalid session id");let n=s[0],i=t._OrtEndProfiling(n);i===0&&ns("Can't get an profile file name."),t._OrtFree(i)},qp=e=>{let t=[];for(let s of e){let n=s[2];!Array.isArray(n)&&"buffer"in n&&t.push(n.buffer)}return t}}),Kn,Fr,va,tc,sc,gp,Qp,wp,Ei,Ci,kh,Sh,$h,Ah,Ih,Fh,Oh,Dh,Lh=y(()=>{We(),Ch(),br(),Lr(),Kn=()=>!!F.wasm.proxy&&typeof document<"u",va=!1,tc=!1,sc=!1,wp=new Map,Ei=(e,t)=>{let s=wp.get(e);s?s.push(t):wp.set(e,[t])},Ci=()=>{if(va||!tc||sc||!Fr)throw new Error("worker not ready")},kh=e=>{switch(e.data.type){case"init-wasm":va=!1,e.data.err?(sc=!0,Qp[1](e.data.err)):(tc=!0,Qp[0]()),gp&&(URL.revokeObjectURL(gp),gp=void 0);break;case"init-ep":case"copy-from":case"create":case"release":case"run":case"end-profiling":{let t=wp.get(e.data.type);e.data.err?t.shift()[1](e.data.err):t.shift()[0](e.data.out);break}}},Sh=async()=>{if(!tc){if(va)throw new Error("multiple calls to 'initWasm()' detected.");if(sc)throw new Error("previous call to 'initWasm()' failed.");if(va=!0,Kn())return new Promise((e,t)=>{Fr?.terminate(),qr().then(([s,n])=>{try{Fr=n,Fr.onerror=o=>t(o),Fr.onmessage=kh,Qp=[e,t];let i={type:"init-wasm",in:F};!i.in.wasm.wasmPaths&&(s||import.meta.url?.startsWith("file:"))&&(i.in.wasm.wasmPaths={wasm:new URL(r("./node_modules/onnxruntime-web/dist/ort-wasm-simd-threaded.jsep.wasm"),r.b).href}),Fr.postMessage(i),gp=s}catch(i){t(i)}},t)});try{await dn(F.wasm),await Zd(F),tc=!0}catch(e){throw sc=!0,e}finally{va=!1}}},$h=async e=>{if(Kn())return Ci(),new Promise((t,s)=>{Ei("init-ep",[t,s]);let n={type:"init-ep",in:{epName:e,env:F}};Fr.postMessage(n)});await ec(F,e)},Ah=async e=>Kn()?(Ci(),new Promise((t,s)=>{Ei("copy-from",[t,s]);let n={type:"copy-from",in:{buffer:e}};Fr.postMessage(n,[e.buffer])})):ur(e),Ih=async(e,t)=>{if(Kn()){if(t?.preferredOutputLocation)throw new Error('session option "preferredOutputLocation" is not supported for proxy.');return Ci(),new Promise((s,n)=>{Ei("create",[s,n]);let i={type:"create",in:{model:e,options:{...t}}},o=[];e instanceof Uint8Array&&o.push(e.buffer),Fr.postMessage(i,o)})}else return Up(e,t)},Fh=async e=>{if(Kn())return Ci(),new Promise((t,s)=>{Ei("release",[t,s]);let n={type:"release",in:e};Fr.postMessage(n)});Wp(e)},Oh=async(e,t,s,n,i,o)=>{if(Kn()){if(s.some(a=>a[3]!=="cpu"))throw new Error("input tensor on GPU is not supported for proxy.");if(i.some(a=>a))throw new Error("pre-allocated output tensor is not supported for proxy.");return Ci(),new Promise((a,c)=>{Ei("run",[a,c]);let p=s,h={type:"run",in:{sessionId:e,inputIndices:t,inputs:p,outputIndices:n,options:o}};Fr.postMessage(h,qp(p))})}else return Kp(e,t,s,n,i,o)},Dh=async e=>{if(Kn())return Ci(),new Promise((t,s)=>{Ei("end-profiling",[t,s]);let n={type:"end-profiling",in:e};Fr.postMessage(n)});Hp(e)}}),Xp,zh,Bh,Mf=y(()=>{We(),Lh(),Ot(),qe(),In(),Xp=(e,t)=>{switch(e.location){case"cpu":return[e.type,e.dims,e.data,"cpu"];case"gpu-buffer":return[e.type,e.dims,{gpuBuffer:e.gpuBuffer},"gpu-buffer"];case"ml-tensor":return[e.type,e.dims,{mlTensor:e.mlTensor},"ml-tensor"];default:throw new Error(`invalid data location: ${e.location} for ${t()}`)}},zh=e=>{switch(e[3]){case"cpu":return new te(e[0],e[2],e[1]);case"gpu-buffer":{let t=e[0];if(!hn(t))throw new Error(`not supported data type: ${t} for deserializing GPU tensor`);let{gpuBuffer:s,download:n,dispose:i}=e[2];return te.fromGpuBuffer(s,{dataType:t,dims:e[1],download:n,dispose:i})}case"ml-tensor":{let t=e[0];if(!mn(t))throw new Error(`not supported data type: ${t} for deserializing MLTensor tensor`);let{mlTensor:s,download:n,dispose:i}=e[2];return te.fromMLTensor(s,{dataType:t,dims:e[1],download:n,dispose:i})}default:throw new Error(`invalid data location: ${e[3]}`)}},Bh=class{async fetchModelAndCopyToWasmMemory(e){return Ah(await _n(e))}async loadModel(e,t){Ue();let s;typeof e=="string"?s=await this.fetchModelAndCopyToWasmMemory(e):s=e,[this.sessionId,this.inputNames,this.outputNames]=await Ih(s,t),ze()}async dispose(){return Fh(this.sessionId)}async run(e,t,s){Ue();let n=[],i=[];Object.entries(e).forEach(u=>{let k=u[0],B=u[1],R=this.inputNames.indexOf(k);if(R===-1)throw new Error(`invalid input '${k}'`);n.push(B),i.push(R)});let o=[],a=[];Object.entries(t).forEach(u=>{let k=u[0],B=u[1],R=this.outputNames.indexOf(k);if(R===-1)throw new Error(`invalid output '${k}'`);o.push(B),a.push(R)});let c=n.map((u,k)=>Xp(u,()=>`input "${this.inputNames[i[k]]}"`)),p=o.map((u,k)=>u?Xp(u,()=>`output "${this.outputNames[a[k]]}"`):null),h=await Oh(this.sessionId,i,c,a,p,s),C={};for(let u=0;uJp,initializeFlags:()=>Yp,wasmBackend:()=>Nh});var Yp,Jp,Nh,bf=y(()=>{We(),Lh(),Mf(),Yp=()=>{if((typeof F.wasm.initTimeout!="number"||F.wasm.initTimeout<0)&&(F.wasm.initTimeout=0),F.wasm.simd===!1&&console.warn('Deprecated property "env.wasm.simd" is set to false. non-SIMD build is no longer provided, and this setting will be ignored.'),typeof F.wasm.proxy!="boolean"&&(F.wasm.proxy=!1),typeof F.wasm.trace!="boolean"&&(F.wasm.trace=!1),typeof F.wasm.numThreads!="number"||!Number.isInteger(F.wasm.numThreads)||F.wasm.numThreads<=0)if(typeof self<"u"&&!self.crossOriginIsolated)F.wasm.numThreads=1;else{let e=typeof navigator>"u"?j("node:os").cpus().length:navigator.hardwareConcurrency;F.wasm.numThreads=Math.min(4,Math.ceil((e||1)/2))}},Jp=class{async init(e){Yp(),await Sh(),await $h(e)}async createInferenceSessionHandler(e,t){let s=new Bh;return await s.loadModel(e,t),Promise.resolve(s)}},Nh=new Jp});We(),We(),We();var vf="1.21.0-dev.20250114-228dd16893",xf=Se;{let e=(bf(),x(Rh)).wasmBackend;K("webgpu",e,5),K("webnn",e,5),K("cpu",e,10),K("wasm",e,10)}Object.defineProperty(F.versions,"web",{value:vf,enumerable:!0});/** + * @license + * Copyright 2021 Google LLC. All Rights Reserved. + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + * ============================================================================= + *//** + * @license + * Copyright 2020 Google LLC. All Rights Reserved. + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + * ============================================================================= + *//** + * @license + * Copyright 2019 Google LLC. All Rights Reserved. + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + * ============================================================================= + */},"./src/backends/onnx.js":(ke,A,r)=>{var g;r.r(A),r.d(A,{Tensor:()=>j.Tensor,createInferenceSession:()=>oe,deviceToExecutionProviders:()=>K,isONNXProxy:()=>H,isONNXTensor:()=>V});var $=r("./src/env.js"),N=r("?2ce3"),Z=r("./node_modules/onnxruntime-web/dist/ort.bundle.min.mjs?3a96"),j=r("./node_modules/onnxruntime-common/dist/esm/index.js");const y=Object.freeze({auto:null,gpu:null,cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",webnn:{name:"webnn",deviceType:"cpu"},"webnn-npu":{name:"webnn",deviceType:"npu"},"webnn-gpu":{name:"webnn",deviceType:"gpu"},"webnn-cpu":{name:"webnn",deviceType:"cpu"}}),T=[];let b,x;const v=Symbol.for("onnxruntime");if(v in globalThis)x=globalThis[v];else if($.apis.IS_NODE_ENV){switch(x=N??(g||(g=r.t(N,2))),process.platform){case"win32":T.push("dml");break;case"linux":process.arch==="x64"&&T.push("cuda");break}T.push("cpu"),b=["cpu"]}else x=Z,$.apis.IS_WEBNN_AVAILABLE&&T.push("webnn-npu","webnn-gpu","webnn-cpu","webnn"),$.apis.IS_WEBGPU_AVAILABLE&&T.push("webgpu"),T.push("wasm"),b=["wasm"];const L=x.InferenceSession;function K(I=null){if(!I)return b;switch(I){case"auto":return T;case"gpu":return T.filter(S=>["webgpu","cuda","dml","webnn-gpu"].includes(S))}if(T.includes(I))return[y[I]??I];throw new Error(`Unsupported device: "${I}". Should be one of: ${T.join(", ")}.`)}let se=null;async function oe(I,S,w){se&&await se;const P=L.create(I,S);se??=P;const F=await P;return F.config=w,F}function V(I){return I instanceof x.Tensor}const U=x?.env;U?.wasm&&(U.wasm.wasmPaths=`https://cdn.jsdelivr.net/npm/@huggingface/transformers@${$.env.version}/dist/`,U.wasm.proxy=!1,(typeof crossOriginIsolated>"u"||!crossOriginIsolated)&&(U.wasm.numThreads=1)),U?.webgpu&&(U.webgpu.powerPreference="high-performance");function H(){return U?.wasm?.proxy}$.env.backends.onnx=U},"./src/base/feature_extraction_utils.js":(ke,A,r)=>{r.r(A),r.d(A,{FeatureExtractor:()=>Z,validate_audio_inputs:()=>j});var g=r("./src/utils/constants.js"),$=r("./src/utils/generic.js"),N=r("./src/utils/hub.js");class Z extends $.Callable{constructor(T){super(),this.config=T}static async from_pretrained(T,b){const x=await(0,N.getModelJSON)(T,g.FEATURE_EXTRACTOR_NAME,!0,b);return new this(x)}}function j(y,T){if(!(y instanceof Float32Array||y instanceof Float64Array))throw new Error(`${T} expects input to be a Float32Array or a Float64Array, but got ${y?.constructor?.name??typeof y} instead. If using the feature extractor directly, remember to use \`read_audio(url, sampling_rate)\` to obtain the raw audio data of the file/url.`)}},"./src/base/image_processors_utils.js":(ke,A,r)=>{r.r(A),r.d(A,{ImageProcessor:()=>I,center_to_corners_format:()=>x,post_process_instance_segmentation:()=>H,post_process_object_detection:()=>v,post_process_panoptic_segmentation:()=>U,post_process_semantic_segmentation:()=>L});var g=r("./src/utils/generic.js"),$=r("./src/utils/tensor.js"),N=r("./src/utils/maths.js");r("./src/utils/image.js");var Z=r("./src/utils/core.js"),j=r("./src/utils/hub.js"),y=r("./src/utils/constants.js");function T(S,w,P=0,F=null){const ae=S/w;let ie=(0,N.bankers_round)(ae)*w;return F!==null&&ie>F&&(ie=Math.floor(ae)*w),iew&&X.push(Ee)}else{let Ee=(0,N.max)(_e.data)[1];if(Ee===re-1||(de=(0,N.softmax)(_e.data),de[Ee]Xe*Ce[(ee+1)%2])),Ae.boxes.push(Oe),Ae.classes.push(Ee),Ae.scores.push(de[Ee])}}Me.push(Ae)}return Me}function L(S,w=null){const P=S.logits,F=P.dims[0];if(w!==null&&w.length!==F)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");const ae=[];for(let ie=0;ieCe[X]&&(Ce[X]=_e[X],Ae[X]=je)}const Pe=new Array(ge.dims[0]);for(let je=0;jeje!==void 0);ae.push({segmentation:pe,labels:Je})}return ae}function K(S,w,P,F){const ae=[],ie=[],ye=[];for(let ge=0;geP&&(ae.push(Me),ie.push(Ae),ye.push(pe))}return[ae,ie,ye]}function se(S,w,P,F=.5,ae=.8){const ie=[];let ye=0,ge=0;const re=w[P].data;for(let pe=0;pe=F&&++ge;let Me=ye>0&&ge>0;return Me&&(Me=ye/ge>ae),[Me,ie]}function oe(S,w,P,F,ae,ie=null,ye=null){const[ge,re]=ye??S[0].dims,Me=new $.Tensor("int32",new Int32Array(ge*re),[ge,re]),pe=[];if(ye!==null)for(let je=0;jeAe[de]&&(Ce[de]=je,Ae[de]=X[de])}let Pe=0;const Je=Me.data;for(let je=0;je200)throw new Error(`absolute aspect ratio must be smaller than 200, got ${Math.max(S,w)/Math.min(S,w)}`);let ie=Math.round(S/P)*P,ye=Math.round(w/P)*P;if(ie*ye>ae){const ge=Math.sqrt(S*w/ae);ie=Math.floor(S/ge/P)*P,ye=Math.floor(w/ge/P)*P}else if(ie*yeie?Me=Math.floor(ie*re/ae):ie>ae&&(re=Math.floor(ae*Me/ie)),await w.resize(Me,re,{resample:F}))}async crop_margin(w,P=200){const F=w.clone().grayscale(),ae=(0,N.min)(F.data)[0],ye=(0,N.max)(F.data)[0]-ae;if(ye===0)return w;const ge=P/255;let re=F.width,Me=F.height,pe=0,Ce=0;const Ae=F.data;for(let Pe=0;Pethis.preprocess(ie)));return{pixel_values:(0,$.stack)(F.map(ie=>ie.pixel_values),0),original_sizes:F.map(ie=>ie.original_size),reshaped_input_sizes:F.map(ie=>ie.reshaped_input_size)}}static async from_pretrained(w,P){const F=await(0,j.getModelJSON)(w,y.IMAGE_PROCESSOR_NAME,!0,P);return new this(F)}}},"./src/base/processing_utils.js":(ke,A,r)=>{r.r(A),r.d(A,{Processor:()=>Z});var g=r("./src/utils/constants.js"),$=r("./src/utils/generic.js"),N=r("./src/utils/hub.js");class Z extends $.Callable{static classes=["image_processor_class","tokenizer_class","feature_extractor_class"];static uses_processor_config=!1;constructor(y,T){super(),this.config=y,this.components=T}get image_processor(){return this.components.image_processor}get tokenizer(){return this.components.tokenizer}get feature_extractor(){return this.components.feature_extractor}apply_chat_template(y,T={}){if(!this.tokenizer)throw new Error("Unable to apply chat template without a tokenizer.");return this.tokenizer.apply_chat_template(y,{tokenize:!1,...T})}batch_decode(...y){if(!this.tokenizer)throw new Error("Unable to decode without a tokenizer.");return this.tokenizer.batch_decode(...y)}decode(...y){if(!this.tokenizer)throw new Error("Unable to decode without a tokenizer.");return this.tokenizer.decode(...y)}async _call(y,...T){for(const b of[this.image_processor,this.feature_extractor,this.tokenizer])if(b)return b(y,...T);throw new Error("No image processor, feature extractor, or tokenizer found.")}static async from_pretrained(y,T){const[b,x]=await Promise.all([this.uses_processor_config?(0,N.getModelJSON)(y,g.PROCESSOR_NAME,!0,T):{},Promise.all(this.classes.filter(v=>v in this).map(async v=>{const L=await this[v].from_pretrained(y,T);return[v.replace(/_class$/,""),L]})).then(Object.fromEntries)]);return new this(b,x)}}},"./src/configs.js":(ke,A,r)=>{r.r(A),r.d(A,{AutoConfig:()=>T,PretrainedConfig:()=>y,getKeyValueShapes:()=>j});var g=r("./src/utils/core.js"),$=r("./src/utils/hub.js");async function N(b,x){return await(0,$.getModelJSON)(b,"config.json",!0,x)}function Z(b){const x={};let v={};switch(b.model_type){case"llava":case"paligemma":case"florence2":case"llava_onevision":case"idefics3":v=Z(b.text_config);break;case"moondream1":v=Z(b.phi_config);break;case"musicgen":v=Z(b.decoder);break;case"multi_modality":v=Z(b.language_config);break;case"gpt2":case"gptj":case"jais":case"codegen":case"gpt_bigcode":x.num_heads="n_head",x.num_layers="n_layer",x.hidden_size="n_embd";break;case"gpt_neox":case"stablelm":case"opt":case"falcon":x.num_heads="num_attention_heads",x.num_layers="num_hidden_layers",x.hidden_size="hidden_size";break;case"llama":case"olmo":case"olmo2":case"mobilellm":case"granite":case"cohere":case"mistral":case"starcoder2":case"qwen2":case"qwen2_vl":case"phi":case"phi3":case"phi3_v":x.num_heads="num_key_value_heads",x.num_layers="num_hidden_layers",x.hidden_size="hidden_size",x.num_attention_heads="num_attention_heads";break;case"gemma":case"gemma2":x.num_heads="num_key_value_heads",x.num_layers="num_hidden_layers",x.dim_kv="head_dim";break;case"openelm":x.num_heads="num_kv_heads",x.num_layers="num_transformer_layers",x.dim_kv="head_dim";break;case"gpt_neo":case"donut-swin":x.num_heads="num_heads",x.num_layers="num_layers",x.hidden_size="hidden_size";break;case"bloom":x.num_heads="n_head",x.num_layers="n_layer",x.hidden_size="hidden_size";break;case"mpt":x.num_heads="n_heads",x.num_layers="n_layers",x.hidden_size="d_model";break;case"exaone":x.num_heads="num_key_value_heads",x.num_layers="num_layers",x.dim_kv="head_dim",x.num_attention_heads="num_attention_heads";break;case"t5":case"mt5":case"longt5":x.num_decoder_layers="num_decoder_layers",x.num_decoder_heads="num_heads",x.decoder_dim_kv="d_kv",x.num_encoder_layers="num_layers",x.num_encoder_heads="num_heads",x.encoder_dim_kv="d_kv";break;case"bart":case"mbart":case"marian":case"whisper":case"m2m_100":case"blenderbot":case"blenderbot-small":case"florence2_language":x.num_decoder_layers="decoder_layers",x.num_decoder_heads="decoder_attention_heads",x.decoder_hidden_size="d_model",x.num_encoder_layers="encoder_layers",x.num_encoder_heads="encoder_attention_heads",x.encoder_hidden_size="d_model";break;case"speecht5":x.num_decoder_layers="decoder_layers",x.num_decoder_heads="decoder_attention_heads",x.decoder_hidden_size="hidden_size",x.num_encoder_layers="encoder_layers",x.num_encoder_heads="encoder_attention_heads",x.encoder_hidden_size="hidden_size";break;case"trocr":x.num_encoder_layers=x.num_decoder_layers="decoder_layers",x.num_encoder_heads=x.num_decoder_heads="decoder_attention_heads",x.encoder_hidden_size=x.decoder_hidden_size="d_model";break;case"musicgen_decoder":case"moonshine":x.num_encoder_layers=x.num_decoder_layers="num_hidden_layers",x.num_encoder_heads=x.num_decoder_heads="num_attention_heads",x.encoder_hidden_size=x.decoder_hidden_size="hidden_size";break;case"vision-encoder-decoder":const K=Z(b.decoder),se="num_decoder_layers"in K,oe=(0,g.pick)(b,["model_type","is_encoder_decoder"]);return se?(oe.num_decoder_layers=K.num_decoder_layers,oe.num_decoder_heads=K.num_decoder_heads,oe.decoder_hidden_size=K.decoder_hidden_size,oe.num_encoder_layers=K.num_encoder_layers,oe.num_encoder_heads=K.num_encoder_heads,oe.encoder_hidden_size=K.encoder_hidden_size):(oe.num_layers=K.num_layers,oe.num_heads=K.num_heads,oe.hidden_size=K.hidden_size),oe}const L={...v,...(0,g.pick)(b,["model_type","multi_query","is_encoder_decoder"])};for(const K in x)L[K]=b[x[K]];return L}function j(b,{prefix:x="past_key_values",batch_size:v=1}={}){const L={},K=b.normalized_config;if(K.is_encoder_decoder&&"num_encoder_heads"in K&&"num_decoder_heads"in K){const se=K.encoder_dim_kv??K.encoder_hidden_size/K.num_encoder_heads,oe=K.decoder_dim_kv??K.decoder_hidden_size/K.num_decoder_heads,V=[v,K.num_encoder_heads,0,se],U=[v,K.num_decoder_heads,0,oe];for(let H=0;H{r.r(A),r.d(A,{apis:()=>oe,env:()=>w});var g=r("?569f"),$=r("?3f59"),N=r("?154a");const Z="3.3.1",j=typeof window<"u"&&typeof window.document<"u",y=typeof self<"u"&&self.constructor?.name==="DedicatedWorkerGlobalScope",T=typeof self<"u"&&"caches"in self,b=typeof navigator<"u"&&"gpu"in navigator,x=typeof navigator<"u"&&"ml"in navigator,v=typeof process<"u",L=v&&process?.release?.name==="node",K=!P(g),se=!P($),oe=Object.freeze({IS_BROWSER_ENV:j,IS_WEBWORKER_ENV:y,IS_WEB_CACHE_AVAILABLE:T,IS_WEBGPU_AVAILABLE:b,IS_WEBNN_AVAILABLE:x,IS_PROCESS_AVAILABLE:v,IS_NODE_ENV:L,IS_FS_AVAILABLE:K,IS_PATH_AVAILABLE:se}),V=K&&se;let U="./";if(V){const F=Object(import.meta).url;F?U=$.dirname($.dirname(N.fileURLToPath(F))):typeof __dirname<"u"&&(U=$.dirname(__dirname))}const H=V?$.join(U,"/.cache/"):null,I="/models/",S=V?$.join(U,I):I,w={version:Z,backends:{onnx:{}},allowRemoteModels:!0,remoteHost:"https://huggingface.co/",remotePathTemplate:"{model}/resolve/{revision}/",allowLocalModels:!(j||y),localModelPath:S,useFS:K,useBrowserCache:T,useFSCache:K,cacheDir:H,useCustomCache:!1,customCache:null};function P(F){return Object.keys(F).length===0}},"./src/generation/configuration_utils.js":(ke,A,r)=>{r.r(A),r.d(A,{GenerationConfig:()=>$});var g=r("./src/utils/core.js");class ${max_length=20;max_new_tokens=null;min_length=0;min_new_tokens=null;early_stopping=!1;max_time=null;do_sample=!1;num_beams=1;num_beam_groups=1;penalty_alpha=null;use_cache=!0;temperature=1;top_k=50;top_p=1;typical_p=1;epsilon_cutoff=0;eta_cutoff=0;diversity_penalty=0;repetition_penalty=1;encoder_repetition_penalty=1;length_penalty=1;no_repeat_ngram_size=0;bad_words_ids=null;force_words_ids=null;renormalize_logits=!1;constraints=null;forced_bos_token_id=null;forced_eos_token_id=null;remove_invalid_values=!1;exponential_decay_length_penalty=null;suppress_tokens=null;streamer=null;begin_suppress_tokens=null;forced_decoder_ids=null;guidance_scale=null;num_return_sequences=1;output_attentions=!1;output_hidden_states=!1;output_scores=!1;return_dict_in_generate=!1;pad_token_id=null;bos_token_id=null;eos_token_id=null;encoder_no_repeat_ngram_size=0;decoder_start_token_id=null;generation_kwargs={};constructor(Z){Object.assign(this,(0,g.pick)(Z,Object.getOwnPropertyNames(this)))}}},"./src/generation/logits_process.js":(ke,A,r)=>{r.r(A),r.d(A,{ClassifierFreeGuidanceLogitsProcessor:()=>V,ForcedBOSTokenLogitsProcessor:()=>y,ForcedEOSTokenLogitsProcessor:()=>T,LogitsProcessor:()=>N,LogitsProcessorList:()=>j,LogitsWarper:()=>Z,MinLengthLogitsProcessor:()=>K,MinNewTokensLengthLogitsProcessor:()=>se,NoBadWordsLogitsProcessor:()=>oe,NoRepeatNGramLogitsProcessor:()=>v,RepetitionPenaltyLogitsProcessor:()=>L,SuppressTokensAtBeginLogitsProcessor:()=>b,TemperatureLogitsWarper:()=>U,TopKLogitsWarper:()=>I,TopPLogitsWarper:()=>H,WhisperTimeStampLogitsProcessor:()=>x});var g=r("./src/utils/generic.js");r("./src/utils/tensor.js");var $=r("./src/utils/maths.js");class N extends g.Callable{_call(w,P){throw Error("`_call` should be implemented in a subclass")}}class Z extends g.Callable{_call(w,P){throw Error("`_call` should be implemented in a subclass")}}class j extends g.Callable{constructor(){super(),this.processors=[]}push(w){this.processors.push(w)}extend(w){this.processors.push(...w)}_call(w,P){let F=P;for(const ae of this.processors)F=ae(w,F);return F}[Symbol.iterator](){return this.processors.values()}}class y extends N{constructor(w){super(),this.bos_token_id=w}_call(w,P){for(let F=0;F=1&&ie[ie.length-1]>=this.timestamp_begin,ge=ie.length<2||ie[ie.length-2]>=this.timestamp_begin;if(ye&&(ge?ae.subarray(this.timestamp_begin).fill(-1/0):ae.subarray(0,this.eos_token_id).fill(-1/0)),w[F].length===this.begin_index&&this.max_initial_timestamp_index!==null){const Ce=this.timestamp_begin+this.max_initial_timestamp_index;ae.subarray(Ce+1).fill(-1/0)}const re=(0,$.log_softmax)(ae),Me=Math.log(re.subarray(this.timestamp_begin).map(Math.exp).reduce((Ce,Ae)=>Ce+Ae)),pe=(0,$.max)(re.subarray(0,this.timestamp_begin))[0];Me>pe&&ae.subarray(0,this.timestamp_begin).fill(-1/0)}return P}}class v extends N{constructor(w){super(),this.no_repeat_ngram_size=w}getNgrams(w){const P=w.length,F=[];for(let ie=0;ie1 to use the classifier free guidance processor, got guidance scale ${w}.`);this.guidance_scale=w}_call(w,P){if(P.dims[0]!==2*w.length)throw new Error(`Logits should have twice the batch size of the input ids, the first half of batches corresponding to the conditional inputs, and the second half of batches corresponding to the unconditional inputs. Got batch size ${P.dims[0]} for the logits and ${w.length} for the input ids.`);const F=w.length,ae=P.slice([0,F],null),ie=P.slice([F,P.dims[0]],null);for(let ye=0;ye1)throw new Error(`\`top_p\` must be a float > 0 and < 1, but is ${w}`);if(!Number.isInteger(F)||F<1)throw new Error(`\`min_tokens_to_keep\` must be a positive integer, but is ${F}`);this.top_p=w,this.filter_value=P,this.min_tokens_to_keep=F}}class I extends Z{constructor(w,{filter_value:P=-1/0,min_tokens_to_keep:F=1}={}){if(super(),!Number.isInteger(w)||w<0)throw new Error(`\`top_k\` must be a positive integer, but is ${w}`);this.top_k=Math.max(w,F),this.filter_value=P}}},"./src/generation/logits_sampler.js":(ke,A,r)=>{r.r(A),r.d(A,{LogitsSampler:()=>Z});var g=r("./src/utils/generic.js"),$=r("./src/utils/tensor.js"),N=r("./src/utils/maths.js");r("./src/generation/configuration_utils.js");class Z extends g.Callable{constructor(x){super(),this.generation_config=x}async _call(x){return this.sample(x)}async sample(x){throw Error("sample should be implemented in subclasses.")}getLogits(x,v){let L=x.dims.at(-1),K=x.data;if(v===-1)K=K.slice(-L);else{let se=v*L;K=K.slice(se,se+L)}return K}randomSelect(x){let v=0;for(let K=0;K1)return new T(x);if(x.num_return_sequences>1)throw Error(`num_return_sequences has to be 1 when doing greedy search, but is ${x.num_return_sequences}.`);return new j(x)}}class j extends Z{async sample(x){const v=(0,N.max)(x.data)[1];return[[BigInt(v),0]]}}class y extends Z{async sample(x){let v=x.dims.at(-1);this.generation_config.top_k>0&&(v=Math.min(this.generation_config.top_k,v));const[L,K]=await(0,$.topk)(x,v),se=(0,N.softmax)(L.data);return Array.from({length:this.generation_config.num_beams},()=>{const oe=this.randomSelect(se);return[K.data[oe],Math.log(se[oe])]})}}class T extends Z{async sample(x){let v=x.dims.at(-1);this.generation_config.top_k>0&&(v=Math.min(this.generation_config.top_k,v));const[L,K]=await(0,$.topk)(x,v),se=(0,N.softmax)(L.data);return Array.from({length:this.generation_config.num_beams},(oe,V)=>[K.data[V],Math.log(se[V])])}}},"./src/generation/stopping_criteria.js":(ke,A,r)=>{r.r(A),r.d(A,{EosTokenCriteria:()=>j,InterruptableStoppingCriteria:()=>y,MaxLengthCriteria:()=>Z,StoppingCriteria:()=>$,StoppingCriteriaList:()=>N});var g=r("./src/utils/generic.js");class $ extends g.Callable{_call(b,x){throw Error("StoppingCriteria needs to be subclassed")}}class N extends g.Callable{constructor(){super(),this.criteria=[]}push(b){this.criteria.push(b)}extend(b){b instanceof N?b=b.criteria:b instanceof $&&(b=[b]),this.criteria.push(...b)}_call(b,x){const v=new Array(b.length).fill(!1);for(const L of this.criteria){const K=L(b,x);for(let se=0;sex.length>=this.max_length)}}class j extends ${constructor(b){super(),Array.isArray(b)||(b=[b]),this.eos_token_id=b}_call(b,x){return b.map(v=>{const L=v.at(-1);return this.eos_token_id.some(K=>L==K)})}}class y extends ${constructor(){super(),this.interrupted=!1}interrupt(){this.interrupted=!0}reset(){this.interrupted=!1}_call(b,x){return new Array(b.length).fill(this.interrupted)}}},"./src/generation/streamers.js":(ke,A,r)=>{r.r(A),r.d(A,{BaseStreamer:()=>Z,TextStreamer:()=>y,WhisperTextStreamer:()=>T});var g=r("./src/utils/core.js"),$=r("./src/tokenizers.js"),N=r("./src/env.js");class Z{put(x){throw Error("Not implemented")}end(){throw Error("Not implemented")}}const j=N.apis.IS_PROCESS_AVAILABLE?b=>process.stdout.write(b):b=>console.log(b);class y extends Z{constructor(x,{skip_prompt:v=!1,callback_function:L=null,token_callback_function:K=null,skip_special_tokens:se=!0,decode_kwargs:oe={},...V}={}){super(),this.tokenizer=x,this.skip_prompt=v,this.callback_function=L??j,this.token_callback_function=K,this.decode_kwargs={skip_special_tokens:se,...oe,...V},this.token_cache=[],this.print_len=0,this.next_tokens_are_prompt=!0}put(x){if(x.length>1)throw Error("TextStreamer only supports batch size of 1");if(this.skip_prompt&&this.next_tokens_are_prompt){this.next_tokens_are_prompt=!1;return}const v=x[0];this.token_callback_function?.(v),this.token_cache=(0,g.mergeArrays)(this.token_cache,v);const L=this.tokenizer.decode(this.token_cache,this.decode_kwargs);let K;L.endsWith(` +`)?(K=L.slice(this.print_len),this.token_cache=[],this.print_len=0):L.length>0&&(0,$.is_chinese_char)(L.charCodeAt(L.length-1))?(K=L.slice(this.print_len),this.print_len+=K.length):(K=L.slice(this.print_len,L.lastIndexOf(" ")+1),this.print_len+=K.length),this.on_finalized_text(K,!1)}end(){let x;this.token_cache.length>0?(x=this.tokenizer.decode(this.token_cache,this.decode_kwargs).slice(this.print_len),this.token_cache=[],this.print_len=0):x="",this.next_tokens_are_prompt=!0,this.on_finalized_text(x,!0)}on_finalized_text(x,v){x.length>0&&this.callback_function?.(x),v&&this.callback_function===j&&N.apis.IS_PROCESS_AVAILABLE&&this.callback_function?.(` +`)}}class T extends y{constructor(x,{skip_prompt:v=!1,callback_function:L=null,token_callback_function:K=null,on_chunk_start:se=null,on_chunk_end:oe=null,on_finalize:V=null,time_precision:U=.02,skip_special_tokens:H=!0,decode_kwargs:I={}}={}){super(x,{skip_prompt:v,skip_special_tokens:H,callback_function:L,token_callback_function:K,decode_kwargs:I}),this.timestamp_begin=x.timestamp_begin,this.on_chunk_start=se,this.on_chunk_end=oe,this.on_finalize=V,this.time_precision=U,this.waiting_for_timestamp=!1}put(x){if(x.length>1)throw Error("WhisperTextStreamer only supports batch size of 1");const v=x[0];if(v.length===1){const L=Number(v[0])-this.timestamp_begin;if(L>=0){const K=L*this.time_precision;this.waiting_for_timestamp?this.on_chunk_end?.(K):this.on_chunk_start?.(K),this.waiting_for_timestamp=!this.waiting_for_timestamp,x=[[]]}}return super.put(x)}end(){super.end(),this.on_finalize?.()}}},"./src/models.js":(ke,A,r)=>{r.r(A),r.d(A,{ASTForAudioClassification:()=>Fi,ASTModel:()=>Sa,ASTPreTrainedModel:()=>qt,AlbertForMaskedLM:()=>as,AlbertForQuestionAnswering:()=>Ln,AlbertForSequenceClassification:()=>gn,AlbertModel:()=>Dn,AlbertPreTrainedModel:()=>Nr,AutoModel:()=>Vc,AutoModelForAudioClassification:()=>qd,AutoModelForAudioFrameClassification:()=>op,AutoModelForCTC:()=>np,AutoModelForCausalLM:()=>Np,AutoModelForDepthEstimation:()=>dp,AutoModelForDocumentQuestionAnswering:()=>ap,AutoModelForImageClassification:()=>Yc,AutoModelForImageFeatureExtraction:()=>pp,AutoModelForImageMatting:()=>lp,AutoModelForImageSegmentation:()=>Jc,AutoModelForImageToImage:()=>up,AutoModelForMaskGeneration:()=>rp,AutoModelForMaskedLM:()=>qc,AutoModelForNormalEstimation:()=>cp,AutoModelForObjectDetection:()=>tp,AutoModelForPoseEstimation:()=>jp,AutoModelForQuestionAnswering:()=>Qc,AutoModelForSemanticSegmentation:()=>Zc,AutoModelForSeq2SeqLM:()=>Wc,AutoModelForSequenceClassification:()=>Uc,AutoModelForSpeechSeq2Seq:()=>Gc,AutoModelForTextToSpectrogram:()=>Kc,AutoModelForTextToWaveform:()=>Hc,AutoModelForTokenClassification:()=>Rp,AutoModelForUniversalSegmentation:()=>ep,AutoModelForVision2Seq:()=>Xc,AutoModelForXVector:()=>ip,AutoModelForZeroShotObjectDetection:()=>sp,BartForConditionalGeneration:()=>rs,BartForSequenceClassification:()=>Yt,BartModel:()=>pt,BartPretrainedModel:()=>yt,BaseModelOutput:()=>Re,BeitForImageClassification:()=>Zl,BeitModel:()=>Jl,BeitPreTrainedModel:()=>xo,BertForMaskedLM:()=>Ke,BertForQuestionAnswering:()=>ze,BertForSequenceClassification:()=>Ne,BertForTokenClassification:()=>Ue,BertModel:()=>ve,BertPreTrainedModel:()=>te,BlenderbotForConditionalGeneration:()=>Xs,BlenderbotModel:()=>De,BlenderbotPreTrainedModel:()=>Js,BlenderbotSmallForConditionalGeneration:()=>Hs,BlenderbotSmallModel:()=>Es,BlenderbotSmallPreTrainedModel:()=>kr,BloomForCausalLM:()=>El,BloomModel:()=>Pl,BloomPreTrainedModel:()=>uo,CLIPModel:()=>ja,CLIPPreTrainedModel:()=>Jr,CLIPSegForImageSegmentation:()=>qa,CLIPSegModel:()=>Ha,CLIPSegPreTrainedModel:()=>Ni,CLIPTextModel:()=>uc,CLIPTextModelWithProjection:()=>Va,CLIPVisionModel:()=>dc,CLIPVisionModelWithProjection:()=>Ua,CamembertForMaskedLM:()=>Kr,CamembertForQuestionAnswering:()=>Hr,CamembertForSequenceClassification:()=>Pr,CamembertForTokenClassification:()=>Er,CamembertModel:()=>Lt,CamembertPreTrainedModel:()=>Mr,CausalLMOutput:()=>yn,CausalLMOutputWithPast:()=>fp,ChineseCLIPModel:()=>gr,ChineseCLIPPreTrainedModel:()=>cc,ClapAudioModelWithProjection:()=>ld,ClapModel:()=>od,ClapPreTrainedModel:()=>wi,ClapTextModelWithProjection:()=>ad,CodeGenForCausalLM:()=>ol,CodeGenModel:()=>Hi,CodeGenPreTrainedModel:()=>ri,CohereForCausalLM:()=>mc,CohereModel:()=>hl,CoherePreTrainedModel:()=>so,ConvBertForMaskedLM:()=>Nt,ConvBertForQuestionAnswering:()=>ms,ConvBertForSequenceClassification:()=>ss,ConvBertForTokenClassification:()=>Ts,ConvBertModel:()=>ft,ConvBertPreTrainedModel:()=>st,ConvNextForImageClassification:()=>Mc,ConvNextModel:()=>Vo,ConvNextPreTrainedModel:()=>jo,ConvNextV2ForImageClassification:()=>fu,ConvNextV2Model:()=>bc,ConvNextV2PreTrainedModel:()=>Uo,DPTForDepthEstimation:()=>Rn,DPTModel:()=>Lo,DPTPreTrainedModel:()=>Do,DebertaForMaskedLM:()=>Cr,DebertaForQuestionAnswering:()=>or,DebertaForSequenceClassification:()=>Dr,DebertaForTokenClassification:()=>Lr,DebertaModel:()=>qr,DebertaPreTrainedModel:()=>dr,DebertaV2ForMaskedLM:()=>Ft,DebertaV2ForQuestionAnswering:()=>dn,DebertaV2ForSequenceClassification:()=>Ys,DebertaV2ForTokenClassification:()=>Cn,DebertaV2Model:()=>vt,DebertaV2PreTrainedModel:()=>it,DecisionTransformerModel:()=>Md,DecisionTransformerPreTrainedModel:()=>Ic,DeiTForImageClassification:()=>ko,DeiTModel:()=>Co,DeiTPreTrainedModel:()=>wn,DepthAnythingForDepthEstimation:()=>zo,DepthAnythingPreTrainedModel:()=>au,DepthProForDepthEstimation:()=>cu,DepthProPreTrainedModel:()=>du,DetrForObjectDetection:()=>tu,DetrForSegmentation:()=>su,DetrModel:()=>eu,DetrObjectDetectionOutput:()=>Vr,DetrPreTrainedModel:()=>ai,DetrSegmentationOutput:()=>Zr,Dinov2ForImageClassification:()=>Go,Dinov2Model:()=>_u,Dinov2PreTrainedModel:()=>Wo,Dinov2WithRegistersForImageClassification:()=>Ho,Dinov2WithRegistersModel:()=>gu,Dinov2WithRegistersPreTrainedModel:()=>Ko,DistilBertForMaskedLM:()=>cn,DistilBertForQuestionAnswering:()=>ns,DistilBertForSequenceClassification:()=>Ls,DistilBertForTokenClassification:()=>Qr,DistilBertModel:()=>br,DistilBertPreTrainedModel:()=>gs,DonutSwinModel:()=>mu,DonutSwinPreTrainedModel:()=>No,EfficientNetForImageClassification:()=>md,EfficientNetModel:()=>hd,EfficientNetPreTrainedModel:()=>Zo,ElectraForMaskedLM:()=>tr,ElectraForQuestionAnswering:()=>Ns,ElectraForSequenceClassification:()=>Tr,ElectraForTokenClassification:()=>Gr,ElectraModel:()=>As,ElectraPreTrainedModel:()=>Ps,EsmForMaskedLM:()=>kn,EsmForSequenceClassification:()=>Sn,EsmForTokenClassification:()=>$n,EsmModel:()=>Jn,EsmPreTrainedModel:()=>zr,ExaoneForCausalLM:()=>al,ExaoneModel:()=>ni,ExaonePreTrainedModel:()=>Xi,FalconForCausalLM:()=>id,FalconModel:()=>nd,FalconPreTrainedModel:()=>Xo,FastViTForImageClassification:()=>fc,FastViTModel:()=>Vl,FastViTPreTrainedModel:()=>yo,Florence2ForConditionalGeneration:()=>La,Florence2PreTrainedModel:()=>Da,GLPNForDepthEstimation:()=>Ro,GLPNModel:()=>pi,GLPNPreTrainedModel:()=>Bo,GPT2LMHeadModel:()=>Xa,GPT2Model:()=>Qa,GPT2PreTrainedModel:()=>ji,GPTBigCodeForCausalLM:()=>il,GPTBigCodeModel:()=>nl,GPTBigCodePreTrainedModel:()=>Ki,GPTJForCausalLM:()=>rl,GPTJModel:()=>sl,GPTJPreTrainedModel:()=>Gi,GPTNeoForCausalLM:()=>Za,GPTNeoModel:()=>yr,GPTNeoPreTrainedModel:()=>Ui,GPTNeoXForCausalLM:()=>tl,GPTNeoXModel:()=>el,GPTNeoXPreTrainedModel:()=>Wi,Gemma2ForCausalLM:()=>_l,Gemma2Model:()=>fl,Gemma2PreTrainedModel:()=>no,GemmaForCausalLM:()=>ml,GemmaModel:()=>ls,GemmaPreTrainedModel:()=>ro,GraniteForCausalLM:()=>pl,GraniteModel:()=>hc,GranitePreTrainedModel:()=>to,GroundingDinoForObjectDetection:()=>yu,GroundingDinoPreTrainedModel:()=>wu,GroupViTModel:()=>jl,GroupViTPreTrainedModel:()=>wo,HieraForImageClassification:()=>$o,HieraModel:()=>nu,HieraPreTrainedModel:()=>So,HubertForCTC:()=>Wu,HubertForSequenceClassification:()=>Gu,HubertModel:()=>Uu,HubertPreTrainedModel:()=>Bp,IJepaForImageClassification:()=>Ol,IJepaModel:()=>Fl,IJepaPreTrainedModel:()=>mo,Idefics3ForConditionalGeneration:()=>zi,Idefics3PreTrainedModel:()=>Ra,ImageMattingOutput:()=>Wn,JAISLMHeadModel:()=>Ja,JAISModel:()=>Ya,JAISPreTrainedModel:()=>Vi,JinaCLIPModel:()=>si,JinaCLIPPreTrainedModel:()=>ti,JinaCLIPTextModel:()=>Ri,JinaCLIPVisionModel:()=>wr,LlamaForCausalLM:()=>pc,LlamaModel:()=>Qi,LlamaPreTrainedModel:()=>qi,LlavaForConditionalGeneration:()=>ei,LlavaOnevisionForConditionalGeneration:()=>Fa,LlavaPreTrainedModel:()=>jr,LongT5ForConditionalGeneration:()=>Fe,LongT5Model:()=>me,LongT5PreTrainedModel:()=>ce,M2M100ForConditionalGeneration:()=>Nn,M2M100Model:()=>hi,M2M100PreTrainedModel:()=>ku,MBartForCausalLM:()=>Ks,MBartForConditionalGeneration:()=>jt,MBartForSequenceClassification:()=>is,MBartModel:()=>Gs,MBartPreTrainedModel:()=>Ms,MPNetForMaskedLM:()=>Xr,MPNetForQuestionAnswering:()=>fn,MPNetForSequenceClassification:()=>hn,MPNetForTokenClassification:()=>mn,MPNetModel:()=>pn,MPNetPreTrainedModel:()=>ar,MT5ForConditionalGeneration:()=>wt,MT5Model:()=>gt,MT5PreTrainedModel:()=>Ye,MarianMTModel:()=>Cu,MarianModel:()=>Eu,MarianPreTrainedModel:()=>qo,MaskFormerForInstanceSegmentation:()=>ci,MaskFormerModel:()=>hu,MaskFormerPreTrainedModel:()=>pu,MaskedLMOutput:()=>Qs,MgpstrForSceneTextRecognition:()=>Td,MgpstrModelOutput:()=>Fc,MgpstrPreTrainedModel:()=>xd,MistralForCausalLM:()=>$r,MistralModel:()=>vr,MistralPreTrainedModel:()=>sd,MobileBertForMaskedLM:()=>Zn,MobileBertForQuestionAnswering:()=>fr,MobileBertForSequenceClassification:()=>Rr,MobileBertModel:()=>An,MobileBertPreTrainedModel:()=>Br,MobileLLMForCausalLM:()=>zn,MobileLLMModel:()=>ll,MobileLLMPreTrainedModel:()=>Yi,MobileNetV1ForImageClassification:()=>_d,MobileNetV1Model:()=>fd,MobileNetV1PreTrainedModel:()=>ta,MobileNetV2ForImageClassification:()=>ra,MobileNetV2Model:()=>gd,MobileNetV2PreTrainedModel:()=>sa,MobileNetV3ForImageClassification:()=>ia,MobileNetV3Model:()=>Ac,MobileNetV3PreTrainedModel:()=>na,MobileNetV4ForImageClassification:()=>yd,MobileNetV4Model:()=>wd,MobileNetV4PreTrainedModel:()=>oa,MobileViTForImageClassification:()=>Kl,MobileViTModel:()=>Gl,MobileViTPreTrainedModel:()=>hr,MobileViTV2ForImageClassification:()=>ql,MobileViTV2Model:()=>Hl,MobileViTV2PreTrainedModel:()=>Mo,ModelOutput:()=>Ve,ModernBertForMaskedLM:()=>mt,ModernBertForSequenceClassification:()=>lt,ModernBertForTokenClassification:()=>ct,ModernBertModel:()=>at,ModernBertPreTrainedModel:()=>Ze,Moondream1ForConditionalGeneration:()=>Oa,MoonshineForConditionalGeneration:()=>Ia,MoonshineModel:()=>cr,MoonshinePreTrainedModel:()=>Di,MptForCausalLM:()=>kl,MptModel:()=>Cl,MptPreTrainedModel:()=>co,MultiModalityCausalLM:()=>vd,MultiModalityPreTrainedModel:()=>bd,MusicgenForCausalLM:()=>$c,MusicgenForConditionalGeneration:()=>Mi,MusicgenModel:()=>Sc,MusicgenPreTrainedModel:()=>ea,NomicBertModel:()=>le,NomicBertPreTrainedModel:()=>O,OPTForCausalLM:()=>$l,OPTModel:()=>Sl,OPTPreTrainedModel:()=>po,Olmo2ForCausalLM:()=>cl,Olmo2Model:()=>dl,Olmo2PreTrainedModel:()=>eo,OlmoForCausalLM:()=>Zi,OlmoModel:()=>ul,OlmoPreTrainedModel:()=>Ji,OpenELMForCausalLM:()=>wl,OpenELMModel:()=>gl,OpenELMPreTrainedModel:()=>io,OwlViTForObjectDetection:()=>Xl,OwlViTModel:()=>Ql,OwlViTPreTrainedModel:()=>bo,Owlv2ForObjectDetection:()=>_c,Owlv2Model:()=>Yl,Owlv2PreTrainedModel:()=>vo,PaliGemmaForConditionalGeneration:()=>Ba,PaliGemmaPreTrainedModel:()=>za,PatchTSMixerForPrediction:()=>Sd,PatchTSMixerModel:()=>kd,PatchTSMixerPreTrainedModel:()=>aa,PatchTSTForPrediction:()=>Cd,PatchTSTModel:()=>Ed,PatchTSTPreTrainedModel:()=>Pd,Phi3ForCausalLM:()=>Tl,Phi3Model:()=>ii,Phi3PreTrainedModel:()=>lo,Phi3VForCausalLM:()=>pr,Phi3VPreTrainedModel:()=>Na,PhiForCausalLM:()=>Bn,PhiModel:()=>xl,PhiPreTrainedModel:()=>ao,PreTrainedModel:()=>ee,PretrainedMixin:()=>fs,PvtForImageClassification:()=>Ll,PvtModel:()=>_o,PvtPreTrainedModel:()=>oi,PyAnnoteForAudioFrameClassification:()=>Ou,PyAnnoteModel:()=>Fu,PyAnnotePreTrainedModel:()=>mi,QuestionAnsweringModelOutput:()=>Zs,Qwen2ForCausalLM:()=>Ml,Qwen2Model:()=>yl,Qwen2PreTrainedModel:()=>oo,Qwen2VLForConditionalGeneration:()=>vl,Qwen2VLPreTrainedModel:()=>bl,RTDetrForObjectDetection:()=>en,RTDetrModel:()=>To,RTDetrObjectDetectionOutput:()=>qs,RTDetrPreTrainedModel:()=>Ur,ResNetForImageClassification:()=>Ao,ResNetModel:()=>iu,ResNetPreTrainedModel:()=>li,RoFormerForMaskedLM:()=>Se,RoFormerForQuestionAnswering:()=>tt,RoFormerForSequenceClassification:()=>We,RoFormerForTokenClassification:()=>qe,RoFormerModel:()=>we,RoFormerPreTrainedModel:()=>Q,RobertaForMaskedLM:()=>_r,RobertaForQuestionAnswering:()=>Mt,RobertaForSequenceClassification:()=>ds,RobertaForTokenClassification:()=>Cs,RobertaModel:()=>sr,RobertaPreTrainedModel:()=>$t,SamImageSegmentationOutput:()=>Pu,SamModel:()=>Tu,SamPreTrainedModel:()=>vc,SapiensForDepthEstimation:()=>uu,SapiensForNormalEstimation:()=>yc,SapiensForSemanticSegmentation:()=>lu,SapiensPreTrainedModel:()=>di,SegformerForImageClassification:()=>dd,SegformerForSemanticSegmentation:()=>cd,SegformerModel:()=>rr,SegformerPreTrainedModel:()=>Jo,Seq2SeqLMOutput:()=>hp,SequenceClassifierOutput:()=>Kt,SiglipModel:()=>Wa,SiglipPreTrainedModel:()=>Bi,SiglipTextModel:()=>Ga,SiglipVisionModel:()=>Ka,SpeechT5ForSpeechToText:()=>kc,SpeechT5ForTextToSpeech:()=>Ju,SpeechT5HifiGan:()=>Zu,SpeechT5Model:()=>Cc,SpeechT5PreTrainedModel:()=>gi,SqueezeBertForMaskedLM:()=>In,SqueezeBertForQuestionAnswering:()=>On,SqueezeBertForSequenceClassification:()=>Fn,SqueezeBertModel:()=>_n,SqueezeBertPreTrainedModel:()=>Ot,StableLmForCausalLM:()=>Un,StableLmModel:()=>pd,StableLmPreTrainedModel:()=>yi,Starcoder2ForCausalLM:()=>rd,Starcoder2Model:()=>tn,Starcoder2PreTrainedModel:()=>Wr,StyleTextToSpeech2Model:()=>Yu,StyleTextToSpeech2PreTrainedModel:()=>Xu,Swin2SRForImageSuperResolution:()=>wc,Swin2SRModel:()=>ou,Swin2SRPreTrainedModel:()=>Oo,SwinForImageClassification:()=>Fo,SwinModel:()=>ui,SwinPreTrainedModel:()=>Io,T5ForConditionalGeneration:()=>Y,T5Model:()=>M,T5PreTrainedModel:()=>Te,TableTransformerForObjectDetection:()=>ru,TableTransformerModel:()=>Eo,TableTransformerObjectDetectionOutput:()=>gc,TableTransformerPreTrainedModel:()=>Po,TokenClassifierOutput:()=>Vs,TrOCRForCausalLM:()=>td,TrOCRPreTrainedModel:()=>ed,UniSpeechForCTC:()=>Lu,UniSpeechForSequenceClassification:()=>zu,UniSpeechModel:()=>Qo,UniSpeechPreTrainedModel:()=>fi,UniSpeechSatForAudioFrameClassification:()=>Pc,UniSpeechSatForCTC:()=>Bu,UniSpeechSatForSequenceClassification:()=>Ru,UniSpeechSatModel:()=>Tc,UniSpeechSatPreTrainedModel:()=>jn,ViTForImageClassification:()=>Il,ViTMAEModel:()=>Bl,ViTMAEPreTrainedModel:()=>zl,ViTMSNForImageClassification:()=>Nl,ViTMSNModel:()=>Rl,ViTMSNPreTrainedModel:()=>go,ViTModel:()=>Al,ViTPreTrainedModel:()=>ho,VisionEncoderDecoderModel:()=>Li,VitMatteForImageMatting:()=>Wl,VitMattePreTrainedModel:()=>Ul,VitPoseForPoseEstimation:()=>Dl,VitPosePreTrainedModel:()=>fo,VitsModel:()=>Yo,VitsModelOutput:()=>Qd,VitsPreTrainedModel:()=>ud,Wav2Vec2BertForCTC:()=>ju,Wav2Vec2BertForSequenceClassification:()=>Vu,Wav2Vec2BertModel:()=>Nu,Wav2Vec2BertPreTrainedModel:()=>_i,Wav2Vec2ForAudioFrameClassification:()=>Iu,Wav2Vec2ForCTC:()=>$u,Wav2Vec2ForSequenceClassification:()=>Au,Wav2Vec2Model:()=>Su,Wav2Vec2PreTrainedModel:()=>Sr,WavLMForAudioFrameClassification:()=>Ec,WavLMForCTC:()=>Hu,WavLMForSequenceClassification:()=>qu,WavLMForXVector:()=>Qu,WavLMModel:()=>Ku,WavLMPreTrainedModel:()=>Vn,WeSpeakerResNetModel:()=>xc,WeSpeakerResNetPreTrainedModel:()=>Du,WhisperForConditionalGeneration:()=>Aa,WhisperModel:()=>$a,WhisperPreTrainedModel:()=>Oi,XLMForQuestionAnswering:()=>Yr,XLMForSequenceClassification:()=>js,XLMForTokenClassification:()=>Tt,XLMModel:()=>Is,XLMPreTrainedModel:()=>Gt,XLMRobertaForMaskedLM:()=>Ea,XLMRobertaForQuestionAnswering:()=>ka,XLMRobertaForSequenceClassification:()=>Ii,XLMRobertaForTokenClassification:()=>Ca,XLMRobertaModel:()=>Ct,XLMRobertaPreTrainedModel:()=>He,XLMWithLMHeadModel:()=>ks,XVectorOutput:()=>mp,YolosForObjectDetection:()=>vu,YolosModel:()=>bu,YolosObjectDetectionOutput:()=>xu,YolosPreTrainedModel:()=>Mu});var g=r("./src/configs.js"),$=r("./src/backends/onnx.js"),N=r("./src/utils/dtypes.js"),Z=r("./src/utils/generic.js"),j=r("./src/utils/core.js"),y=r("./src/utils/hub.js"),T=r("./src/utils/constants.js"),b=r("./src/generation/logits_process.js"),x=r("./src/generation/configuration_utils.js"),v=r("./src/utils/tensor.js"),L=r("./src/utils/image.js"),K=r("./src/utils/maths.js"),se=r("./src/generation/stopping_criteria.js"),oe=r("./src/generation/logits_sampler.js"),V=r("./src/env.js"),U=r("./src/models/whisper/generation_whisper.js"),H=r("./src/models/whisper/common_whisper.js");const I={EncoderOnly:0,EncoderDecoder:1,Seq2Seq:2,Vision2Seq:3,DecoderOnly:4,MaskGeneration:5,ImageTextToText:6,Musicgen:7,MultiModality:8,Phi3V:9},S=new Map,w=new Map,P=new Map;async function F(_,f,q){const xe=q.config?.["transformers.js_config"]??{};let $e=q.device??xe.device;$e&&typeof $e!="string"&&($e.hasOwnProperty(f)?$e=$e[f]:(console.warn(`device not specified for "${f}". Using the default device.`),$e=null));const Le=$e??(V.apis.IS_NODE_ENV?"cpu":"wasm"),rt=(0,$.deviceToExecutionProviders)(Le);let ot=q.dtype??xe.dtype;if(typeof ot!="string"&&(ot&&ot.hasOwnProperty(f)?ot=ot[f]:(ot=N.DEFAULT_DEVICE_DTYPE_MAPPING[Le]??N.DATA_TYPES.fp32,console.warn(`dtype not specified for "${f}". Using the default dtype (${ot}) for this device (${Le}).`))),ot===N.DATA_TYPES.auto){let es=xe.dtype;typeof es!="string"&&(es=es[f]),es&&es!==N.DATA_TYPES.auto&&N.DATA_TYPES.hasOwnProperty(es)?ot=es:ot=N.DEFAULT_DEVICE_DTYPE_MAPPING[Le]??N.DATA_TYPES.fp32}const _t=ot;if(N.DEFAULT_DTYPE_SUFFIX_MAPPING.hasOwnProperty(_t)){if(_t===N.DATA_TYPES.fp16&&Le==="webgpu"&&!await(0,N.isWebGpuFp16Supported)())throw new Error(`The device (${Le}) does not support fp16.`)}else throw new Error(`Invalid dtype: ${_t}. Should be one of: ${Object.keys(N.DATA_TYPES).join(", ")}`);const kt=xe.kv_cache_dtype?typeof xe.kv_cache_dtype=="string"?xe.kv_cache_dtype:xe.kv_cache_dtype[_t]??"float32":void 0;if(kt&&!["float32","float16"].includes(kt))throw new Error(`Invalid kv_cache_dtype: ${kt}. Should be one of: float32, float16`);const Zt={dtype:_t,kv_cache_dtype:kt},Wt=N.DEFAULT_DTYPE_SUFFIX_MAPPING[_t],Dt=`${q.subfolder??""}/${f}${Wt}.onnx`,At={...q.session_options};At.executionProviders??=rt;const bs=xe.free_dimension_overrides;bs?At.freeDimensionOverrides??=bs:Le.startsWith("webnn")&&!At.freeDimensionOverrides&&console.warn('WebNN does not currently support dynamic shapes and requires `free_dimension_overrides` to be set in config.json as a field within "transformers.js_config". When `free_dimension_overrides` is not set, you may experience significant performance degradation.');const Ht=(0,y.getModelFile)(_,Dt,!0,q),Qt=q.use_external_data_format??xe.use_external_data_format;let ps=[];if(Qt&&(Qt===!0||typeof Qt=="object"&&Qt.hasOwnProperty(f)&&Qt[f]===!0)){if(V.apis.IS_NODE_ENV)throw new Error("External data format is not yet supported in Node.js");const es=`${f}${Wt}.onnx_data`,Us=`${q.subfolder??""}/${es}`;ps.push(new Promise(async(zs,Fs)=>{const Bs=await(0,y.getModelFile)(_,Us,!0,q);zs({path:es,data:Bs})}))}else At.externalData!==void 0&&(ps=At.externalData.map(async es=>{if(typeof es.data=="string"){const Us=await(0,y.getModelFile)(_,es.data,!0,q);return{...es,data:Us}}return es}));if(ps.length>0&&(At.externalData=await Promise.all(ps)),Le==="webgpu"){const es=(0,g.getKeyValueShapes)(q.config,{prefix:"present"});if(Object.keys(es).length>0&&!(0,$.isONNXProxy)()){const Us={};for(const zs in es)Us[zs]="gpu-buffer";At.preferredOutputLocation=Us}}return{buffer:await Ht,session_options:At,session_config:Zt}}async function ae(_,f,q){return Object.fromEntries(await Promise.all(Object.keys(f).map(async xe=>{const{buffer:$e,session_options:Le,session_config:rt}=await F(_,f[xe],q),ot=await(0,$.createInferenceSession)($e,Le,rt);return[xe,ot]})))}async function ie(_,f,q){return Object.fromEntries(await Promise.all(Object.keys(f).map(async xe=>{const $e=await(0,y.getModelJSON)(_,f[xe],!1,q);return[xe,$e]})))}function ye(_,f){const q=Object.create(null),xe=[];for(const rt of _.inputNames){const ot=f[rt];if(!(ot instanceof v.Tensor)){xe.push(rt);continue}q[rt]=(0,$.isONNXProxy)()?ot.clone():ot}if(xe.length>0)throw new Error(`An error occurred during model execution: "Missing the following inputs: ${xe.join(", ")}.`);const $e=Object.keys(f).length,Le=_.inputNames.length;if($e>Le){let rt=Object.keys(f).filter(ot=>!_.inputNames.includes(ot));console.warn(`WARNING: Too many inputs were provided (${$e} > ${Le}). The following inputs will be ignored: "${rt.join(", ")}".`)}return q}async function ge(_,f){const q=ye(_,f);try{const xe=Object.fromEntries(Object.entries(q).map(([Le,rt])=>[Le,rt.ort_tensor]));let $e=await _.run(xe);return $e=re($e),$e}catch(xe){const $e=Object.fromEntries(Object.entries(q).map(([Le,{type:rt,dims:ot,data:_t}])=>[Le,{type:rt,dims:ot,data:_t}]));throw console.error(`An error occurred during model execution: "${xe}".`),console.error("Inputs given to model:",$e),xe}}function re(_){for(let f in _)(0,$.isONNXTensor)(_[f])?_[f]=new v.Tensor(_[f]):typeof _[f]=="object"&&re(_[f]);return _}function Me(_){if(_ instanceof v.Tensor)return _;if(_.length===0)throw Error("items must be non-empty");if(Array.isArray(_[0])){if(_.some(f=>f.length!==_[0].length))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' and/or 'truncation=True' to have batched tensors with the same length.");return new v.Tensor("int64",BigInt64Array.from(_.flat().map(f=>BigInt(f))),[_.length,_[0].length])}else return new v.Tensor("int64",BigInt64Array.from(_.map(f=>BigInt(f))),[1,_.length])}function pe(_){return new v.Tensor("bool",[_],[1])}async function Ce(_,f){let{encoder_outputs:q,input_ids:xe,decoder_input_ids:$e,...Le}=f;if(!q){const ot=(0,j.pick)(f,_.sessions.model.inputNames);q=(await Ae(_,ot)).last_hidden_state}return Le.input_ids=$e,Le.encoder_hidden_states=q,_.sessions.decoder_model_merged.inputNames.includes("encoder_attention_mask")&&(Le.encoder_attention_mask=f.attention_mask),await Pe(_,Le,!0)}async function Ae(_,f){const q=_.sessions.model,xe=(0,j.pick)(f,q.inputNames);if(q.inputNames.includes("inputs_embeds")&&!xe.inputs_embeds){if(!f.input_ids)throw new Error("Both `input_ids` and `inputs_embeds` are missing in the model inputs.");xe.inputs_embeds=await _.encode_text({input_ids:f.input_ids})}if(q.inputNames.includes("token_type_ids")&&!xe.token_type_ids){if(!xe.input_ids)throw new Error("Both `input_ids` and `token_type_ids` are missing in the model inputs.");xe.token_type_ids=(0,v.zeros_like)(xe.input_ids)}if(q.inputNames.includes("pixel_mask")&&!xe.pixel_mask){if(!xe.pixel_values)throw new Error("Both `pixel_values` and `pixel_mask` are missing in the model inputs.");const $e=xe.pixel_values.dims;xe.pixel_mask=(0,v.ones)([$e[0],$e[2],$e[3]])}return await ge(q,xe)}async function Pe(_,f,q=!1){const xe=_.sessions[q?"decoder_model_merged":"model"],{past_key_values:$e,...Le}=f;if(xe.inputNames.includes("use_cache_branch")&&(Le.use_cache_branch=pe(!!$e)),xe.inputNames.includes("position_ids")&&Le.attention_mask&&!Le.position_ids){const ot=_.config.model_type==="paligemma"?1:0;Le.position_ids=X(Le,$e,ot)}_.addPastKeyValues(Le,$e);const rt=(0,j.pick)(Le,xe.inputNames);return await ge(xe,rt)}function Je({image_token_id:_,inputs_embeds:f,image_features:q,input_ids:xe,attention_mask:$e}){const Le=xe.tolist().map(kt=>kt.reduce((Zt,Wt,Dt)=>(Wt==_&&Zt.push(Dt),Zt),[])),rt=Le.reduce((kt,Zt)=>kt+Zt.length,0),ot=q.dims[0];if(rt!==ot)throw new Error(`Image features and image tokens do not match: tokens: ${rt}, features ${ot}`);let _t=0;for(let kt=0;ktLe.dims[1])){if($eot==_.config.image_token_index)){const ot=_.config.num_image_tokens;if(!ot)throw new Error("`num_image_tokens` is missing in the model configuration.");const _t=Le.dims[1]-($e-ot);q.input_ids=Le.slice(null,[-_t,null]),q.attention_mask=(0,v.ones)([1,$e+_t])}}}return q}function Ee(_,f,q,xe){return q.past_key_values&&(f=f.map($e=>[$e.at(-1)])),{...q,decoder_input_ids:Me(f)}}function Oe(_,...f){return _.config.is_encoder_decoder?Ee(_,...f):de(_,...f)}function Xe(_,f,q,xe){const $e=!!q.past_key_values;return xe.guidance_scale!==null&&xe.guidance_scale>1&&($e?q.input_ids=(0,v.cat)([q.input_ids,q.input_ids],0):(q.input_ids=(0,v.cat)([q.input_ids,(0,v.full_like)(q.input_ids,BigInt(xe.pad_token_id))],0),q.attention_mask=(0,v.cat)([q.attention_mask,(0,v.full_like)(q.attention_mask,0n)],0))),($e||!q.pixel_values)&&(q.pixel_values=(0,v.full)([0,0,3,384,384],1)),$e&&(q.images_seq_mask=new v.Tensor("bool",new Array(1).fill(!0).fill(!1,0,1),[1,1]),q.images_emb_mask=new v.Tensor("bool",new Array(0).fill(!1),[1,1,0])),q}class ee extends Z.Callable{main_input_name="input_ids";forward_params=["input_ids","attention_mask"];constructor(f,q,xe){super(),this.config=f,this.sessions=q,this.configs=xe;const $e=P.get(this.constructor),Le=S.get($e);switch(this.can_generate=!1,this._forward=null,this._prepare_inputs_for_generation=null,Le){case I.DecoderOnly:this.can_generate=!0,this._forward=Pe,this._prepare_inputs_for_generation=de;break;case I.Seq2Seq:case I.Vision2Seq:case I.Musicgen:this.can_generate=!0,this._forward=Ce,this._prepare_inputs_for_generation=Ee;break;case I.EncoderDecoder:this._forward=Ce;break;case I.ImageTextToText:this.can_generate=!0,this._forward=je,this._prepare_inputs_for_generation=Oe;break;case I.Phi3V:this.can_generate=!0,this._prepare_inputs_for_generation=Oe;break;case I.MultiModality:this.can_generate=!0,this._prepare_inputs_for_generation=Xe;break;default:this._forward=Ae;break}this.can_generate&&this.forward_params.push("past_key_values"),this.custom_config=this.config["transformers.js_config"]??{}}async dispose(){const f=[];for(const q of Object.values(this.sessions))q?.handler?.dispose&&f.push(q.handler.dispose());return await Promise.all(f)}static async from_pretrained(f,{progress_callback:q=null,config:xe=null,cache_dir:$e=null,local_files_only:Le=!1,revision:rt="main",model_file_name:ot=null,subfolder:_t="onnx",device:kt=null,dtype:Zt=null,use_external_data_format:Wt=null,session_options:Dt={}}={}){let At={progress_callback:q,config:xe,cache_dir:$e,local_files_only:Le,revision:rt,model_file_name:ot,subfolder:_t,device:kt,dtype:Zt,use_external_data_format:Wt,session_options:Dt};const bs=P.get(this),Ht=S.get(bs);xe=At.config=await g.AutoConfig.from_pretrained(f,At);let Qt;if(Ht===I.DecoderOnly)Qt=await Promise.all([ae(f,{model:At.model_file_name??"model"},At),ie(f,{generation_config:"generation_config.json"},At)]);else if(Ht===I.Seq2Seq||Ht===I.Vision2Seq)Qt=await Promise.all([ae(f,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},At),ie(f,{generation_config:"generation_config.json"},At)]);else if(Ht===I.MaskGeneration)Qt=await Promise.all([ae(f,{model:"vision_encoder",prompt_encoder_mask_decoder:"prompt_encoder_mask_decoder"},At)]);else if(Ht===I.EncoderDecoder)Qt=await Promise.all([ae(f,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},At)]);else if(Ht===I.ImageTextToText){const ps={embed_tokens:"embed_tokens",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};xe.is_encoder_decoder&&(ps.model="encoder_model"),Qt=await Promise.all([ae(f,ps,At),ie(f,{generation_config:"generation_config.json"},At)])}else if(Ht===I.Musicgen)Qt=await Promise.all([ae(f,{model:"text_encoder",decoder_model_merged:"decoder_model_merged",encodec_decode:"encodec_decode"},At),ie(f,{generation_config:"generation_config.json"},At)]);else if(Ht===I.MultiModality)Qt=await Promise.all([ae(f,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"language_model",lm_head:"lm_head",gen_head:"gen_head",gen_img_embeds:"gen_img_embeds",image_decode:"image_decode"},At),ie(f,{generation_config:"generation_config.json"},At)]);else if(Ht===I.Phi3V)Qt=await Promise.all([ae(f,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"model",vision_encoder:"vision_encoder"},At),ie(f,{generation_config:"generation_config.json"},At)]);else{if(Ht!==I.EncoderOnly){const ps=bs??xe?.model_type;ps!=="custom"&&console.warn(`Model type for '${ps}' not found, assuming encoder-only architecture. Please report this at ${T.GITHUB_ISSUE_URL}.`)}Qt=await Promise.all([ae(f,{model:At.model_file_name??"model"},At)])}return new this(xe,...Qt)}async _call(f){return await this.forward(f)}async forward(f){return await this._forward(this,f)}get generation_config(){return this.configs?.generation_config??null}_get_logits_warper(f){const q=new b.LogitsProcessorList;return f.temperature!==null&&f.temperature!==1&&q.push(new b.TemperatureLogitsWarper(f.temperature)),f.top_k!==null&&f.top_k!==0&&q.push(new b.TopKLogitsWarper(f.top_k)),f.top_p!==null&&f.top_p<1&&q.push(new b.TopPLogitsWarper(f.top_p)),q}_get_logits_processor(f,q,xe=null){const $e=new b.LogitsProcessorList;if(f.repetition_penalty!==null&&f.repetition_penalty!==1&&$e.push(new b.RepetitionPenaltyLogitsProcessor(f.repetition_penalty)),f.no_repeat_ngram_size!==null&&f.no_repeat_ngram_size>0&&$e.push(new b.NoRepeatNGramLogitsProcessor(f.no_repeat_ngram_size)),f.bad_words_ids!==null&&$e.push(new b.NoBadWordsLogitsProcessor(f.bad_words_ids,f.eos_token_id)),f.min_length!==null&&f.eos_token_id!==null&&f.min_length>0&&$e.push(new b.MinLengthLogitsProcessor(f.min_length,f.eos_token_id)),f.min_new_tokens!==null&&f.eos_token_id!==null&&f.min_new_tokens>0&&$e.push(new b.MinNewTokensLengthLogitsProcessor(q,f.min_new_tokens,f.eos_token_id)),f.forced_bos_token_id!==null&&$e.push(new b.ForcedBOSTokenLogitsProcessor(f.forced_bos_token_id)),f.forced_eos_token_id!==null&&$e.push(new b.ForcedEOSTokenLogitsProcessor(f.max_length,f.forced_eos_token_id)),f.begin_suppress_tokens!==null){const Le=q>1||f.forced_bos_token_id===null?q:q+1;$e.push(new b.SuppressTokensAtBeginLogitsProcessor(f.begin_suppress_tokens,Le))}return f.guidance_scale!==null&&f.guidance_scale>1&&$e.push(new b.ClassifierFreeGuidanceLogitsProcessor(f.guidance_scale)),xe!==null&&$e.extend(xe),$e}_prepare_generation_config(f,q,xe=x.GenerationConfig){const $e={...this.config};for(const rt of["decoder","generator","text_config"])rt in $e&&Object.assign($e,$e[rt]);const Le=new xe($e);return Object.assign(Le,this.generation_config??{}),f&&Object.assign(Le,f),q&&Object.assign(Le,(0,j.pick)(q,Object.getOwnPropertyNames(Le))),Le}_get_stopping_criteria(f,q=null){const xe=new se.StoppingCriteriaList;return f.max_length!==null&&xe.push(new se.MaxLengthCriteria(f.max_length,this.config.max_position_embeddings??null)),f.eos_token_id!==null&&xe.push(new se.EosTokenCriteria(f.eos_token_id)),q&&xe.extend(q),xe}_validate_model_class(){if(!this.can_generate){const f=[Od,vi,ua,la],q=P.get(this.constructor),xe=new Set,$e=this.config.model_type;for(const rt of f){const ot=rt.get($e);ot&&xe.add(ot[0])}let Le=`The current model class (${q}) is not compatible with \`.generate()\`, as it doesn't have a language model head.`;throw xe.size>0&&(Le+=` Please use the following class instead: ${[...xe].join(", ")}`),Error(Le)}}prepare_inputs_for_generation(...f){return this._prepare_inputs_for_generation(this,...f)}_update_model_kwargs_for_generation({generated_input_ids:f,outputs:q,model_inputs:xe,is_encoder_decoder:$e}){return xe.past_key_values=this.getPastKeyValues(q,xe.past_key_values),xe.input_ids=new v.Tensor("int64",f.flat(),[f.length,1]),$e||(xe.attention_mask=(0,v.cat)([xe.attention_mask,(0,v.ones)([xe.attention_mask.dims[0],1])],1)),xe.position_ids=null,xe}_prepare_model_inputs({inputs:f,bos_token_id:q,model_kwargs:xe}){const $e=(0,j.pick)(xe,this.forward_params),Le=this.main_input_name;if(Le in $e){if(f)throw new Error("`inputs`: {inputs}` were passed alongside {input_name} which is not allowed. Make sure to either pass {inputs} or {input_name}=...")}else $e[Le]=f;return{inputs_tensor:$e[Le],model_inputs:$e,model_input_name:Le}}async _prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:f,model_inputs:q,model_input_name:xe,generation_config:$e}){if(this.sessions.model.inputNames.includes("inputs_embeds")&&!q.inputs_embeds&&"_prepare_inputs_embeds"in this){const{input_ids:rt,pixel_values:ot,attention_mask:_t,...kt}=q,Zt=await this._prepare_inputs_embeds(q);q={...kt,...(0,j.pick)(Zt,["inputs_embeds","attention_mask"])}}let{last_hidden_state:Le}=await Ae(this,q);if($e.guidance_scale!==null&&$e.guidance_scale>1)Le=(0,v.cat)([Le,(0,v.full_like)(Le,0)],0),"attention_mask"in q&&(q.attention_mask=(0,v.cat)([q.attention_mask,(0,v.zeros_like)(q.attention_mask)],0));else if(q.decoder_input_ids){const rt=Me(q.decoder_input_ids).dims[0];if(rt!==Le.dims[0]){if(Le.dims[0]!==1)throw new Error(`The encoder outputs have a different batch size (${Le.dims[0]}) than the decoder inputs (${rt}).`);Le=(0,v.cat)(Array.from({length:rt},()=>Le),0)}}return q.encoder_outputs=Le,q}_prepare_decoder_input_ids_for_generation({batch_size:f,model_input_name:q,model_kwargs:xe,decoder_start_token_id:$e,bos_token_id:Le,generation_config:rt}){let{decoder_input_ids:ot,..._t}=xe;if(!(ot instanceof v.Tensor)){if(ot)Array.isArray(ot[0])||(ot=Array.from({length:f},()=>ot));else if($e??=Le,this.config.model_type==="musicgen")ot=Array.from({length:f*this.config.decoder.num_codebooks},()=>[$e]);else if(Array.isArray($e)){if($e.length!==f)throw new Error(`\`decoder_start_token_id\` expcted to have length ${f} but got ${$e.length}`);ot=$e}else ot=Array.from({length:f},()=>[$e]);ot=Me(ot)}return xe.decoder_attention_mask=(0,v.ones_like)(ot),{input_ids:ot,model_inputs:_t}}async generate({inputs:f=null,generation_config:q=null,logits_processor:xe=null,stopping_criteria:$e=null,streamer:Le=null,...rt}){this._validate_model_class(),q=this._prepare_generation_config(q,rt);let{inputs_tensor:ot,model_inputs:_t,model_input_name:kt}=this._prepare_model_inputs({inputs:f,model_kwargs:rt});const Zt=this.config.is_encoder_decoder;Zt&&("encoder_outputs"in _t||(_t=await this._prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:ot,model_inputs:_t,model_input_name:kt,generation_config:q})));let Wt;Zt?{input_ids:Wt,model_inputs:_t}=this._prepare_decoder_input_ids_for_generation({batch_size:_t[kt].dims.at(0),model_input_name:kt,model_kwargs:_t,decoder_start_token_id:q.decoder_start_token_id,bos_token_id:q.bos_token_id,generation_config:q}):Wt=_t[kt];let Dt=Wt.dims.at(-1);q.max_new_tokens!==null&&(q.max_length=Dt+q.max_new_tokens);const At=this._get_logits_processor(q,Dt,xe),bs=this._get_stopping_criteria(q,$e),Ht=_t[kt].dims.at(0),Qt=oe.LogitsSampler.getSampler(q),ps=new Array(Ht).fill(0),ys=Wt.tolist();Le&&Le.put(ys);let es,Us={};for(;;){if(_t=this.prepare_inputs_for_generation(ys,_t,q),es=await this.forward(_t),q.output_attentions&&q.return_dict_in_generate){const lr=this.getAttentions(es);for(const Ar in lr)Ar in Us||(Us[Ar]=[]),Us[Ar].push(lr[Ar])}const Bs=es.logits.slice(null,-1,null),nr=At(ys,Bs),mr=[];for(let lr=0;lrlr))break;_t=this._update_model_kwargs_for_generation({generated_input_ids:mr,outputs:es,model_inputs:_t,is_encoder_decoder:Zt})}Le&&Le.end();const zs=this.getPastKeyValues(es,_t.past_key_values,!0),Fs=new v.Tensor("int64",ys.flat(),[ys.length,ys[0].length]);if(q.return_dict_in_generate)return{sequences:Fs,past_key_values:zs,...Us};for(const Bs of Object.values(es))Bs.location==="gpu-buffer"&&Bs.dispose();return Fs}getPastKeyValues(f,q,xe=!1){const $e=Object.create(null);for(const Le in f)if(Le.startsWith("present")){const rt=Le.replace("present","past_key_values"),ot=Le.includes("encoder");if(ot&&q?$e[rt]=q[rt]:$e[rt]=f[Le],q&&(!ot||xe)){const _t=q[rt];_t.location==="gpu-buffer"&&_t.dispose()}}return $e}getAttentions(f){const q={};for(const xe of["cross_attentions","encoder_attentions","decoder_attentions"])for(const $e in f)$e.startsWith(xe)&&(xe in q||(q[xe]=[]),q[xe].push(f[$e]));return q}addPastKeyValues(f,q){if(q)Object.assign(f,q);else{const $e=(this.sessions.decoder_model_merged??this.sessions.model)?.config?.kv_cache_dtype??"float32",Le=$e==="float16"?new Uint16Array:[],rt=(f[this.main_input_name]??f.attention_mask)?.dims?.[0]??1,ot=(0,g.getKeyValueShapes)(this.config,{batch_size:rt});for(const _t in ot)f[_t]=new v.Tensor($e,Le,ot[_t])}}async encode_image({pixel_values:f}){const q=(await ge(this.sessions.vision_encoder,{pixel_values:f})).image_features;return this.config.num_image_tokens||(console.warn(`The number of image tokens was not set in the model configuration. Setting it to the number of features detected by the vision encoder (${q.dims[1]}).`),this.config.num_image_tokens=q.dims[1]),q}async encode_text({input_ids:f}){return(await ge(this.sessions.embed_tokens,{input_ids:f})).inputs_embeds}}class Ve{}class Re extends Ve{constructor({last_hidden_state:f,hidden_states:q=null,attentions:xe=null}){super(),this.last_hidden_state=f,this.hidden_states=q,this.attentions=xe}}class te extends ee{}class ve extends te{}class Ke extends te{async _call(f){return new Qs(await super._call(f))}}class Ne extends te{async _call(f){return new Kt(await super._call(f))}}class Ue extends te{async _call(f){return new Vs(await super._call(f))}}class ze extends te{async _call(f){return new Zs(await super._call(f))}}class Ze extends ee{}class at extends Ze{}class mt extends Ze{async _call(f){return new Qs(await super._call(f))}}class lt extends Ze{async _call(f){return new Kt(await super._call(f))}}class ct extends Ze{async _call(f){return new Vs(await super._call(f))}}class O extends ee{}class le extends O{}class Q extends ee{}class we extends Q{}class Se extends Q{async _call(f){return new Qs(await super._call(f))}}class We extends Q{async _call(f){return new Kt(await super._call(f))}}class qe extends Q{async _call(f){return new Vs(await super._call(f))}}class tt extends Q{async _call(f){return new Zs(await super._call(f))}}class st extends ee{}class ft extends st{}class Nt extends st{async _call(f){return new Qs(await super._call(f))}}class ss extends st{async _call(f){return new Kt(await super._call(f))}}class Ts extends st{async _call(f){return new Vs(await super._call(f))}}class ms extends st{async _call(f){return new Zs(await super._call(f))}}class Ps extends ee{}class As extends Ps{}class tr extends Ps{async _call(f){return new Qs(await super._call(f))}}class Tr extends Ps{async _call(f){return new Kt(await super._call(f))}}class Gr extends Ps{async _call(f){return new Vs(await super._call(f))}}class Ns extends Ps{async _call(f){return new Zs(await super._call(f))}}class Mr extends ee{}class Lt extends Mr{}class Kr extends Mr{async _call(f){return new Qs(await super._call(f))}}class Pr extends Mr{async _call(f){return new Kt(await super._call(f))}}class Er extends Mr{async _call(f){return new Vs(await super._call(f))}}class Hr extends Mr{async _call(f){return new Zs(await super._call(f))}}class dr extends ee{}class qr extends dr{}class Cr extends dr{async _call(f){return new Qs(await super._call(f))}}class Dr extends dr{async _call(f){return new Kt(await super._call(f))}}class Lr extends dr{async _call(f){return new Vs(await super._call(f))}}class or extends dr{async _call(f){return new Zs(await super._call(f))}}class it extends ee{}class vt extends it{}class Ft extends it{async _call(f){return new Qs(await super._call(f))}}class Ys extends it{async _call(f){return new Kt(await super._call(f))}}class Cn extends it{async _call(f){return new Vs(await super._call(f))}}class dn extends it{async _call(f){return new Zs(await super._call(f))}}class gs extends ee{}class br extends gs{}class Ls extends gs{async _call(f){return new Kt(await super._call(f))}}class Qr extends gs{async _call(f){return new Vs(await super._call(f))}}class ns extends gs{async _call(f){return new Zs(await super._call(f))}}class cn extends gs{async _call(f){return new Qs(await super._call(f))}}class zr extends ee{}class Jn extends zr{}class kn extends zr{async _call(f){return new Qs(await super._call(f))}}class Sn extends zr{async _call(f){return new Kt(await super._call(f))}}class $n extends zr{async _call(f){return new Vs(await super._call(f))}}class Br extends ee{}class An extends Br{}class Zn extends Br{async _call(f){return new Qs(await super._call(f))}}class Rr extends Br{async _call(f){return new Kt(await super._call(f))}}class fr extends Br{async _call(f){return new Zs(await super._call(f))}}class ar extends ee{}class pn extends ar{}class Xr extends ar{async _call(f){return new Qs(await super._call(f))}}class hn extends ar{async _call(f){return new Kt(await super._call(f))}}class mn extends ar{async _call(f){return new Vs(await super._call(f))}}class fn extends ar{async _call(f){return new Zs(await super._call(f))}}class Ot extends ee{}class _n extends Ot{}class In extends Ot{async _call(f){return new Qs(await super._call(f))}}class Fn extends Ot{async _call(f){return new Kt(await super._call(f))}}class On extends Ot{async _call(f){return new Zs(await super._call(f))}}class Nr extends ee{}class Dn extends Nr{}class gn extends Nr{async _call(f){return new Kt(await super._call(f))}}class Ln extends Nr{async _call(f){return new Zs(await super._call(f))}}class as extends Nr{async _call(f){return new Qs(await super._call(f))}}class Te extends ee{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"]}class M extends Te{}class Y extends Te{}class ce extends ee{}class me extends ce{}class Fe extends ce{}class Ye extends ee{}class gt extends Ye{}class wt extends Ye{}class yt extends ee{}class pt extends yt{}class rs extends yt{}class Yt extends yt{async _call(f){return new Kt(await super._call(f))}}class Ms extends ee{}class Gs extends Ms{}class jt extends Ms{}class is extends Ms{async _call(f){return new Kt(await super._call(f))}}class Ks extends Ms{}class Js extends ee{}class De extends Js{}class Xs extends Js{}class kr extends ee{}class Es extends kr{}class Hs extends kr{}class $t extends ee{}class sr extends $t{}class _r extends $t{async _call(f){return new Qs(await super._call(f))}}class ds extends $t{async _call(f){return new Kt(await super._call(f))}}class Cs extends $t{async _call(f){return new Vs(await super._call(f))}}class Mt extends $t{async _call(f){return new Zs(await super._call(f))}}class Gt extends ee{}class Is extends Gt{}class ks extends Gt{async _call(f){return new Qs(await super._call(f))}}class js extends Gt{async _call(f){return new Kt(await super._call(f))}}class Tt extends Gt{async _call(f){return new Vs(await super._call(f))}}class Yr extends Gt{async _call(f){return new Zs(await super._call(f))}}class He extends ee{}class Ct extends He{}class Ea extends He{async _call(f){return new Qs(await super._call(f))}}class Ii extends He{async _call(f){return new Kt(await super._call(f))}}class Ca extends He{async _call(f){return new Vs(await super._call(f))}}class ka extends He{async _call(f){return new Zs(await super._call(f))}}class qt extends ee{}class Sa extends qt{}class Fi extends qt{}class Oi extends ee{requires_attention_mask=!1;main_input_name="input_features";forward_params=["input_features","attention_mask","decoder_input_ids","decoder_attention_mask","past_key_values"]}class $a extends Oi{}class Aa extends Oi{_prepare_generation_config(f,q){return super._prepare_generation_config(f,q,U.WhisperGenerationConfig)}_retrieve_init_tokens(f){const q=[f.decoder_start_token_id];let xe=f.language;const $e=f.task;if(f.is_multilingual){xe||(console.warn("No language specified - defaulting to English (en)."),xe="en");const rt=`<|${(0,H.whisper_language_to_code)(xe)}|>`;q.push(f.lang_to_id[rt]),q.push(f.task_to_id[$e??"transcribe"])}else if(xe||$e)throw new Error("Cannot specify `task` or `language` for an English-only model. If the model is intended to be multilingual, pass `is_multilingual=true` to generate, or update the generation config.");return!f.return_timestamps&&f.no_timestamps_token_id&&q.at(-1)!==f.no_timestamps_token_id?q.push(f.no_timestamps_token_id):f.return_timestamps&&q.at(-1)===f.no_timestamps_token_id&&(console.warn("<|notimestamps|> prompt token is removed from generation_config since `return_timestamps` is set to `true`."),q.pop()),q.filter(Le=>Le!=null)}async generate({inputs:f=null,generation_config:q=null,logits_processor:xe=null,stopping_criteria:$e=null,...Le}){q=this._prepare_generation_config(q,Le);const rt=Le.decoder_input_ids??this._retrieve_init_tokens(q);if(q.return_timestamps&&(xe??=new b.LogitsProcessorList,xe.push(new b.WhisperTimeStampLogitsProcessor(q,rt))),q.begin_suppress_tokens&&(xe??=new b.LogitsProcessorList,xe.push(new b.SuppressTokensAtBeginLogitsProcessor(q.begin_suppress_tokens,rt.length))),q.return_token_timestamps){if(!q.alignment_heads)throw new Error("Model generation config has no `alignment_heads`, token-level timestamps not available. See https://gist.github.com/hollance/42e32852f24243b748ae6bc1f985b13a on how to add this property to the generation config.");q.task==="translate"&&console.warn("Token-level timestamps may not be reliable for task 'translate'."),q.output_attentions=!0,q.return_dict_in_generate=!0}const ot=await super.generate({inputs:f,generation_config:q,logits_processor:xe,decoder_input_ids:rt,...Le});return q.return_token_timestamps&&(ot.token_timestamps=this._extract_token_timestamps(ot,q.alignment_heads,q.num_frames)),ot}_extract_token_timestamps(f,q,xe=null,$e=.02){if(!f.cross_attentions)throw new Error("Model outputs must contain cross attentions to extract timestamps. This is most likely because the model was not exported with `output_attentions=True`.");xe==null&&console.warn("`num_frames` has not been set, meaning the entire audio will be analyzed. This may lead to inaccurate token-level timestamps for short audios (< 30 seconds).");let Le=this.config.median_filter_width;Le===void 0&&(console.warn("Model config has no `median_filter_width`, using default value of 7."),Le=7);const rt=f.cross_attentions,ot=Array.from({length:this.config.decoder_layers},(Ht,Qt)=>(0,v.cat)(rt.map(ps=>ps[Qt]),2)),_t=(0,v.stack)(q.map(([Ht,Qt])=>{if(Ht>=ot.length)throw new Error(`Layer index ${Ht} is out of bounds for cross attentions (length ${ot.length}).`);return xe?ot[Ht].slice(null,Qt,null,[0,xe]):ot[Ht].slice(null,Qt)})).transpose(1,0,2,3),[kt,Zt]=(0,v.std_mean)(_t,-2,0,!0),Wt=_t.clone();for(let Ht=0;Htps[Bs+1]-ps[Bs]),Us=(0,j.mergeArrays)([1],es).map(Fs=>!!Fs),zs=[];for(let Fs=0;FsDt.findIndex(At=>At==Le)),_t=ot.every(Dt=>Dt===-1),kt=ot.every(Dt=>Dt!==-1);if(!_t&&!kt)throw new Error("Every input should contain either 0 or 1 image token.");if(_t)return{inputs_embeds:f,attention_mask:$e};const Zt=[],Wt=[];for(let Dt=0;DtArray.from({length:f.dims[0]},es=>Array.from({length:f.dims[1]},Us=>1))),bs=q?q.tolist():[],Ht=xe?xe.tolist():[];let Qt=0,ps=0;for(let ys=0;ysDt[ys][Os]==1),zs=es.reduce((ws,Os,Ir)=>(Os==_t&&ws.push(Ir),ws),[]).map(ws=>es[ws+1]),Fs=zs.filter(ws=>ws==rt).length,Bs=zs.filter(ws=>ws==ot).length;let nr=[],mr=0,_a=Fs,lr=Bs;for(let ws=0;wsur>mr&&nn==rt),Ir=es.findIndex((nn,ur)=>ur>mr&&nn==ot),sn=_a>0&&Os!==-1?Os:es.length+1,bn=lr>0&&Ir!==-1?Ir:es.length+1;let ga,Ti,wa,ya;sn0?(0,K.max)(nr.at(-1))[0]+1:0;nr.push(Array.from({length:3*ba},(nn,ur)=>Yd+ur%ba));const Jd=ba+Yd,Pi=Vp*Ma*vn,Zd=Array.from({length:Pi},(nn,ur)=>Jd+Math.floor(ur/(Ma*vn))),ec=Array.from({length:Pi},(nn,ur)=>Jd+Math.floor(ur/vn)%Ma),rn=Array.from({length:Pi},(nn,ur)=>Jd+ur%vn);nr.push([Zd,ec,rn].flat()),mr=ga+Pi}if(mr0?(0,K.max)(nr.at(-1))[0]+1:0,Os=es.length-mr;nr.push(Array.from({length:3*Os},(Ir,sn)=>ws+sn%Os))}const Ar=nr.reduce((ws,Os)=>ws+Os.length,0),Gn=new Array(Ar);let Xd=0;for(let ws=0;ws<3;++ws)for(let Os=0;OsWt[Qt%Wt.length]),bs=Array.from({length:Dt[0]},(Ht,Qt)=>(0,K.max)(Wt.subarray(Dt[1]*Qt,Dt[1]*(Qt+1)))[0]+1n+BigInt(Dt[1]));return[new v.Tensor("int64",At,[3,...Dt]),new v.Tensor("int64",bs,[bs.length,1])]}else{const[Wt,Dt]=f.dims,At=BigInt64Array.from({length:3*Wt*Dt},(bs,Ht)=>BigInt(Math.floor(Ht%Dt/Wt)));return[new v.Tensor("int64",At,[3,...f.dims]),(0,v.zeros)([Wt,1])]}}async encode_image({pixel_values:f,image_grid_thw:q}){return(await ge(this.sessions.vision_encoder,{pixel_values:f,grid_thw:q})).image_features}_merge_input_ids_with_image_features(f){return Je({image_token_id:this.config.image_token_id,...f})}prepare_inputs_for_generation(f,q,xe){if(q.attention_mask&&!q.position_ids)if(!q.past_key_values)[q.position_ids,q.rope_deltas]=this.get_rope_index(q.input_ids,q.image_grid_thw,q.video_grid_thw,q.attention_mask);else{q.pixel_values=null;const $e=BigInt(Object.values(q.past_key_values)[0].dims.at(-2)),Le=q.rope_deltas.map(rt=>$e+rt);q.position_ids=(0,v.stack)([Le,Le,Le],0)}return q}}class ao extends ee{}class xl extends ao{}class Bn extends ao{}class lo extends ee{}class ii extends lo{}class Tl extends lo{}class uo extends ee{}class Pl extends uo{}class El extends uo{}class co extends ee{}class Cl extends co{}class kl extends co{}class po extends ee{}class Sl extends po{}class $l extends po{}class ho extends ee{}class Al extends ho{}class Il extends ho{async _call(f){return new Kt(await super._call(f))}}class mo extends ee{}class Fl extends mo{}class Ol extends mo{async _call(f){return new Kt(await super._call(f))}}class fo extends ee{}class Dl extends fo{}class oi extends ee{}class _o extends oi{}class Ll extends oi{async _call(f){return new Kt(await super._call(f))}}class zl extends ee{}class Bl extends zl{}class go extends ee{}class Rl extends go{}class Nl extends go{async _call(f){return new Kt(await super._call(f))}}class wo extends ee{}class jl extends wo{}class yo extends ee{}class Vl extends yo{}class fc extends yo{async _call(f){return new Kt(await super._call(f))}}class Ul extends ee{}class Wl extends Ul{async _call(f){return new Wn(await super._call(f))}}class hr extends ee{}class Gl extends hr{}class Kl extends hr{async _call(f){return new Kt(await super._call(f))}}class Mo extends ee{}class Hl extends Mo{}class ql extends Mo{async _call(f){return new Kt(await super._call(f))}}class bo extends ee{}class Ql extends bo{}class Xl extends bo{}class vo extends ee{}class Yl extends vo{}class _c extends vo{}class xo extends ee{}class Jl extends xo{}class Zl extends xo{async _call(f){return new Kt(await super._call(f))}}class ai extends ee{}class eu extends ai{}class tu extends ai{async _call(f){return new Vr(await super._call(f))}}class su extends ai{async _call(f){return new Zr(await super._call(f))}}class Vr extends Ve{constructor({logits:f,pred_boxes:q}){super(),this.logits=f,this.pred_boxes=q}}class Zr extends Ve{constructor({logits:f,pred_boxes:q,pred_masks:xe}){super(),this.logits=f,this.pred_boxes=q,this.pred_masks=xe}}class Ur extends ee{}class To extends Ur{}class en extends Ur{async _call(f){return new qs(await super._call(f))}}class qs extends Ve{constructor({logits:f,pred_boxes:q}){super(),this.logits=f,this.pred_boxes=q}}class Po extends ee{}class Eo extends Po{}class ru extends Po{async _call(f){return new gc(await super._call(f))}}class gc extends Vr{}class wn extends ee{}class Co extends wn{}class ko extends wn{async _call(f){return new Kt(await super._call(f))}}class So extends ee{}class nu extends So{}class $o extends So{async _call(f){return new Kt(await super._call(f))}}class li extends ee{}class iu extends li{}class Ao extends li{async _call(f){return new Kt(await super._call(f))}}class Io extends ee{}class ui extends Io{}class Fo extends Io{async _call(f){return new Kt(await super._call(f))}}class Oo extends ee{}class ou extends Oo{}class wc extends Oo{}class Do extends ee{}class Lo extends Do{}class Rn extends Do{}class au extends ee{}class zo extends au{}class di extends ee{}class lu extends di{}class uu extends di{}class yc extends di{}class du extends ee{}class cu extends du{}class pu extends ee{}class hu extends pu{}class ci extends pu{}class Bo extends ee{}class pi extends Bo{}class Ro extends Bo{}class No extends ee{}class mu extends No{}class jo extends ee{}class Vo extends jo{}class Mc extends jo{async _call(f){return new Kt(await super._call(f))}}class Uo extends ee{}class bc extends Uo{}class fu extends Uo{async _call(f){return new Kt(await super._call(f))}}class Wo extends ee{}class _u extends Wo{}class Go extends Wo{async _call(f){return new Kt(await super._call(f))}}class Ko extends ee{}class gu extends Ko{}class Ho extends Ko{async _call(f){return new Kt(await super._call(f))}}class wu extends ee{}class yu extends wu{}class Mu extends ee{}class bu extends Mu{}class vu extends Mu{async _call(f){return new xu(await super._call(f))}}class xu extends Ve{constructor({logits:f,pred_boxes:q}){super(),this.logits=f,this.pred_boxes=q}}class vc extends ee{}class Tu extends vc{async get_image_embeddings({pixel_values:f}){return await Ae(this,{pixel_values:f})}async forward(f){if((!f.image_embeddings||!f.image_positional_embeddings)&&(f={...f,...await this.get_image_embeddings(f)}),!f.input_labels&&f.input_points){const xe=f.input_points.dims.slice(0,-1),$e=xe.reduce((Le,rt)=>Le*rt,1);f.input_labels=new v.Tensor("int64",new BigInt64Array($e).fill(1n),xe)}const q={image_embeddings:f.image_embeddings,image_positional_embeddings:f.image_positional_embeddings};return f.input_points&&(q.input_points=f.input_points),f.input_labels&&(q.input_labels=f.input_labels),f.input_boxes&&(q.input_boxes=f.input_boxes),await ge(this.sessions.prompt_encoder_mask_decoder,q)}async _call(f){return new Pu(await super._call(f))}}class Pu extends Ve{constructor({iou_scores:f,pred_masks:q}){super(),this.iou_scores=f,this.pred_masks=q}}class qo extends ee{}class Eu extends qo{}class Cu extends qo{}class ku extends ee{}class hi extends ku{}class Nn extends ku{}class Sr extends ee{}class Su extends Sr{}class $u extends Sr{async _call(f){return new yn(await super._call(f))}}class Au extends Sr{async _call(f){return new Kt(await super._call(f))}}class Iu extends Sr{async _call(f){return new Vs(await super._call(f))}}class mi extends ee{}class Fu extends mi{}class Ou extends mi{async _call(f){return new Vs(await super._call(f))}}class Du extends ee{}class xc extends Du{}class fi extends ee{}class Qo extends fi{}class Lu extends fi{async _call(f){return new yn(await super._call(f))}}class zu extends fi{async _call(f){return new Kt(await super._call(f))}}class jn extends ee{}class Tc extends jn{}class Bu extends jn{async _call(f){return new yn(await super._call(f))}}class Ru extends jn{async _call(f){return new Kt(await super._call(f))}}class Pc extends jn{async _call(f){return new Vs(await super._call(f))}}class _i extends ee{}class Nu extends _i{}class ju extends _i{async _call(f){return new yn(await super._call(f))}}class Vu extends _i{async _call(f){return new Kt(await super._call(f))}}class Bp extends ee{}class Uu extends Sr{}class Wu extends Sr{async _call(f){return new yn(await super._call(f))}}class Gu extends Sr{async _call(f){return new Kt(await super._call(f))}}class Vn extends ee{}class Ku extends Vn{}class Hu extends Vn{async _call(f){return new yn(await super._call(f))}}class qu extends Vn{async _call(f){return new Kt(await super._call(f))}}class Qu extends Vn{async _call(f){return new mp(await super._call(f))}}class Ec extends Vn{async _call(f){return new Vs(await super._call(f))}}class Xu extends ee{}class Yu extends Xu{}class gi extends ee{}class Cc extends gi{}class kc extends gi{}class Ju extends gi{async generate_speech(f,q,{threshold:xe=.5,minlenratio:$e=0,maxlenratio:Le=20,vocoder:rt=null}={}){const ot={input_ids:f},{encoder_outputs:_t,encoder_attention_mask:kt}=await Ae(this,ot),Zt=_t.dims[1]/this.config.reduction_factor,Wt=Math.floor(Zt*Le),Dt=Math.floor(Zt*$e),At=this.config.num_mel_bins;let bs=[],Ht=null,Qt=null,ps=0;for(;;){++ps;const Us=pe(!!Qt);let zs;Qt?zs=Qt.output_sequence_out:zs=new v.Tensor("float32",new Float32Array(At),[1,1,At]);let Fs={use_cache_branch:Us,output_sequence:zs,encoder_attention_mask:kt,speaker_embeddings:q,encoder_hidden_states:_t};this.addPastKeyValues(Fs,Ht),Qt=await ge(this.sessions.decoder_model_merged,Fs),Ht=this.getPastKeyValues(Qt,Ht);const{prob:Bs,spectrum:nr}=Qt;if(bs.push(nr),ps>=Dt&&(Array.from(Bs.data).filter(mr=>mr>=xe).length>0||ps>=Wt))break}const ys=(0,v.cat)(bs),{waveform:es}=await ge(rt.sessions.model,{spectrogram:ys});return{spectrogram:ys,waveform:es}}}class Zu extends ee{main_input_name="spectrogram"}class ed extends ee{}class td extends ed{}class sd extends ee{}class vr extends sd{}class $r extends sd{}class Wr extends ee{}class tn extends Wr{}class rd extends Wr{}class Xo extends ee{}class nd extends Xo{}class id extends Xo{}class wi extends ee{}class od extends wi{}class ad extends wi{static async from_pretrained(f,q={}){return super.from_pretrained(f,{...q,model_file_name:q.model_file_name??"text_model"})}}class ld extends wi{static async from_pretrained(f,q={}){return super.from_pretrained(f,{...q,model_file_name:q.model_file_name??"audio_model"})}}class ud extends ee{}class Yo extends ud{async _call(f){return new Qd(await super._call(f))}}class Jo extends ee{}class rr extends Jo{}class dd extends Jo{}class cd extends Jo{}class yi extends ee{}class pd extends yi{}class Un extends yi{}class Zo extends ee{}class hd extends Zo{}class md extends Zo{async _call(f){return new Kt(await super._call(f))}}class ea extends ee{}class Sc extends ea{}class $c extends ea{}class Mi extends ee{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];_apply_and_filter_by_delay_pattern_mask(f){const[q,xe]=f.dims,$e=this.config.decoder.num_codebooks,Le=xe-$e;let rt=0;for(let kt=0;kt0&&Dt<=Le&&(f.data[rt++]=f.data[kt])}const ot=Math.floor(q/$e),_t=rt/(ot*$e);return new v.Tensor(f.type,f.data.slice(0,rt),[ot,$e,_t])}prepare_inputs_for_generation(f,q,xe){let $e=structuredClone(f);for(let rt=0;rt<$e.length;++rt)for(let ot=0;ot<$e[rt].length;++ot)rt%this.config.decoder.num_codebooks>=ot&&($e[rt][ot]=BigInt(this.config.decoder.pad_token_id));return xe.guidance_scale!==null&&xe.guidance_scale>1&&($e=$e.concat($e)),super.prepare_inputs_for_generation($e,q,xe)}async generate(f){const q=await super.generate(f),xe=this._apply_and_filter_by_delay_pattern_mask(q).unsqueeze_(0),{audio_values:$e}=await ge(this.sessions.encodec_decode,{audio_codes:xe});return $e}}class ta extends ee{}class fd extends ta{}class _d extends ta{async _call(f){return new Kt(await super._call(f))}}class sa extends ee{}class gd extends sa{}class ra extends sa{async _call(f){return new Kt(await super._call(f))}}class na extends ee{}class Ac extends na{}class ia extends na{async _call(f){return new Kt(await super._call(f))}}class oa extends ee{}class wd extends oa{}class yd extends oa{async _call(f){return new Kt(await super._call(f))}}class Ic extends ee{}class Md extends Ic{}class bd extends ee{}class vd extends bd{forward_params=["input_ids","pixel_values","images_seq_mask","images_emb_mask","attention_mask","position_ids","past_key_values"];constructor(...f){super(...f),this._generation_mode="text"}async forward(f){const q=this._generation_mode??"text";let xe;if(q==="text"||!f.past_key_values){const _t=this.sessions.prepare_inputs_embeds,kt=(0,j.pick)(f,_t.inputNames);xe=await ge(_t,kt)}else{const _t=this.sessions.gen_img_embeds,kt=(0,j.pick)({image_ids:f.input_ids},_t.inputNames);xe=await ge(_t,kt)}const $e={...f,...xe},Le=await Pe(this,$e),rt=this.sessions[q==="text"?"lm_head":"gen_head"];if(!rt)throw new Error(`Unable to find "${rt}" generation head`);const ot=await ge(rt,(0,j.pick)(Le,rt.inputNames));return{...xe,...Le,...ot}}async generate(f){return this._generation_mode="text",super.generate(f)}async generate_images(f){this._generation_mode="image";const q=(f.inputs??f[this.main_input_name]).dims[1],$e=(await super.generate(f)).slice(null,[q,null]),Le=this.sessions.image_decode,{decoded_image:rt}=await ge(Le,{generated_tokens:$e}),ot=rt.add_(1).mul_(255/2).clamp_(0,255).to("uint8"),_t=[];for(const kt of ot){const Zt=L.RawImage.fromTensor(kt);_t.push(Zt)}return _t}}class Fc extends Ve{constructor({char_logits:f,bpe_logits:q,wp_logits:xe}){super(),this.char_logits=f,this.bpe_logits=q,this.wp_logits=xe}get logits(){return[this.char_logits,this.bpe_logits,this.wp_logits]}}class xd extends ee{}class Td extends xd{async _call(f){return new Fc(await super._call(f))}}class Pd extends ee{}class Ed extends Pd{}class Cd extends Pd{}class aa extends ee{}class kd extends aa{}class Sd extends aa{}class fs{static MODEL_CLASS_MAPPINGS=null;static BASE_IF_FAIL=!1;static async from_pretrained(f,{progress_callback:q=null,config:xe=null,cache_dir:$e=null,local_files_only:Le=!1,revision:rt="main",model_file_name:ot=null,subfolder:_t="onnx",device:kt=null,dtype:Zt=null,use_external_data_format:Wt=null,session_options:Dt={}}={}){const At={progress_callback:q,config:xe,cache_dir:$e,local_files_only:Le,revision:rt,model_file_name:ot,subfolder:_t,device:kt,dtype:Zt,use_external_data_format:Wt,session_options:Dt};if(At.config=await g.AutoConfig.from_pretrained(f,At),!this.MODEL_CLASS_MAPPINGS)throw new Error("`MODEL_CLASS_MAPPINGS` not implemented for this type of `AutoClass`: "+this.name);for(const bs of this.MODEL_CLASS_MAPPINGS){const Ht=bs.get(At.config.model_type);if(Ht)return await Ht[1].from_pretrained(f,At)}if(this.BASE_IF_FAIL)return console.warn(`Unknown model class "${At.config.model_type}", attempting to construct from base class.`),await ee.from_pretrained(f,At);throw Error(`Unsupported model type: ${At.config.model_type}`)}}const Oc=new Map([["bert",["BertModel",ve]],["modernbert",["ModernBertModel",at]],["nomic_bert",["NomicBertModel",le]],["roformer",["RoFormerModel",we]],["electra",["ElectraModel",As]],["esm",["EsmModel",Jn]],["convbert",["ConvBertModel",ft]],["camembert",["CamembertModel",Lt]],["deberta",["DebertaModel",qr]],["deberta-v2",["DebertaV2Model",vt]],["mpnet",["MPNetModel",pn]],["albert",["AlbertModel",Dn]],["distilbert",["DistilBertModel",br]],["roberta",["RobertaModel",sr]],["xlm",["XLMModel",Is]],["xlm-roberta",["XLMRobertaModel",Ct]],["clap",["ClapModel",od]],["clip",["CLIPModel",ja]],["clipseg",["CLIPSegModel",Ha]],["chinese_clip",["ChineseCLIPModel",gr]],["siglip",["SiglipModel",Wa]],["jina_clip",["JinaCLIPModel",si]],["mobilebert",["MobileBertModel",An]],["squeezebert",["SqueezeBertModel",_n]],["wav2vec2",["Wav2Vec2Model",Su]],["wav2vec2-bert",["Wav2Vec2BertModel",Nu]],["unispeech",["UniSpeechModel",Qo]],["unispeech-sat",["UniSpeechSatModel",Tc]],["hubert",["HubertModel",Uu]],["wavlm",["WavLMModel",Ku]],["audio-spectrogram-transformer",["ASTModel",Sa]],["vits",["VitsModel",Yo]],["pyannote",["PyAnnoteModel",Fu]],["wespeaker-resnet",["WeSpeakerResNetModel",xc]],["detr",["DetrModel",eu]],["rt_detr",["RTDetrModel",To]],["table-transformer",["TableTransformerModel",Eo]],["vit",["ViTModel",Al]],["ijepa",["IJepaModel",Fl]],["pvt",["PvtModel",_o]],["vit_msn",["ViTMSNModel",Rl]],["vit_mae",["ViTMAEModel",Bl]],["groupvit",["GroupViTModel",jl]],["fastvit",["FastViTModel",Vl]],["mobilevit",["MobileViTModel",Gl]],["mobilevitv2",["MobileViTV2Model",Hl]],["owlvit",["OwlViTModel",Ql]],["owlv2",["Owlv2Model",Yl]],["beit",["BeitModel",Jl]],["deit",["DeiTModel",Co]],["hiera",["HieraModel",nu]],["convnext",["ConvNextModel",Vo]],["convnextv2",["ConvNextV2Model",bc]],["dinov2",["Dinov2Model",_u]],["dinov2_with_registers",["Dinov2WithRegistersModel",gu]],["resnet",["ResNetModel",iu]],["swin",["SwinModel",ui]],["swin2sr",["Swin2SRModel",ou]],["donut-swin",["DonutSwinModel",mu]],["yolos",["YolosModel",bu]],["dpt",["DPTModel",Lo]],["glpn",["GLPNModel",pi]],["hifigan",["SpeechT5HifiGan",Zu]],["efficientnet",["EfficientNetModel",hd]],["decision_transformer",["DecisionTransformerModel",Md]],["patchtst",["PatchTSTForPrediction",Ed]],["patchtsmixer",["PatchTSMixerForPrediction",kd]],["mobilenet_v1",["MobileNetV1Model",fd]],["mobilenet_v2",["MobileNetV2Model",gd]],["mobilenet_v3",["MobileNetV3Model",Ac]],["mobilenet_v4",["MobileNetV4Model",wd]],["maskformer",["MaskFormerModel",hu]],["mgp-str",["MgpstrForSceneTextRecognition",Td]],["style_text_to_speech_2",["StyleTextToSpeech2Model",Yu]]]),Dc=new Map([["t5",["T5Model",M]],["longt5",["LongT5Model",me]],["mt5",["MT5Model",gt]],["bart",["BartModel",pt]],["mbart",["MBartModel",Gs]],["marian",["MarianModel",Eu]],["whisper",["WhisperModel",$a]],["m2m_100",["M2M100Model",hi]],["blenderbot",["BlenderbotModel",De]],["blenderbot-small",["BlenderbotSmallModel",Es]]]),Lc=new Map([["bloom",["BloomModel",Pl]],["jais",["JAISModel",Ya]],["gpt2",["GPT2Model",Qa]],["gptj",["GPTJModel",sl]],["gpt_bigcode",["GPTBigCodeModel",nl]],["gpt_neo",["GPTNeoModel",yr]],["gpt_neox",["GPTNeoXModel",el]],["codegen",["CodeGenModel",Hi]],["llama",["LlamaModel",Qi]],["exaone",["ExaoneModel",ni]],["olmo",["OlmoModel",ul]],["olmo2",["Olmo2Model",dl]],["mobilellm",["MobileLLMModel",ll]],["granite",["GraniteModel",hc]],["cohere",["CohereModel",hl]],["gemma",["GemmaModel",ls]],["gemma2",["Gemma2Model",fl]],["openelm",["OpenELMModel",gl]],["qwen2",["Qwen2Model",yl]],["phi",["PhiModel",xl]],["phi3",["Phi3Model",ii]],["mpt",["MptModel",Cl]],["opt",["OPTModel",Sl]],["mistral",["MistralModel",vr]],["starcoder2",["Starcoder2Model",tn]],["falcon",["FalconModel",nd]],["stablelm",["StableLmModel",pd]]]),la=new Map([["speecht5",["SpeechT5ForSpeechToText",kc]],["whisper",["WhisperForConditionalGeneration",Aa]],["moonshine",["MoonshineForConditionalGeneration",Ia]]]),$d=new Map([["speecht5",["SpeechT5ForTextToSpeech",Ju]]]),Ad=new Map([["vits",["VitsModel",Yo]],["musicgen",["MusicgenForConditionalGeneration",Mi]]]),Id=new Map([["bert",["BertForSequenceClassification",Ne]],["modernbert",["ModernBertForSequenceClassification",lt]],["roformer",["RoFormerForSequenceClassification",We]],["electra",["ElectraForSequenceClassification",Tr]],["esm",["EsmForSequenceClassification",Sn]],["convbert",["ConvBertForSequenceClassification",ss]],["camembert",["CamembertForSequenceClassification",Pr]],["deberta",["DebertaForSequenceClassification",Dr]],["deberta-v2",["DebertaV2ForSequenceClassification",Ys]],["mpnet",["MPNetForSequenceClassification",hn]],["albert",["AlbertForSequenceClassification",gn]],["distilbert",["DistilBertForSequenceClassification",Ls]],["roberta",["RobertaForSequenceClassification",ds]],["xlm",["XLMForSequenceClassification",js]],["xlm-roberta",["XLMRobertaForSequenceClassification",Ii]],["bart",["BartForSequenceClassification",Yt]],["mbart",["MBartForSequenceClassification",is]],["mobilebert",["MobileBertForSequenceClassification",Rr]],["squeezebert",["SqueezeBertForSequenceClassification",Fn]]]),Fd=new Map([["bert",["BertForTokenClassification",Ue]],["modernbert",["ModernBertForTokenClassification",ct]],["roformer",["RoFormerForTokenClassification",qe]],["electra",["ElectraForTokenClassification",Gr]],["esm",["EsmForTokenClassification",$n]],["convbert",["ConvBertForTokenClassification",Ts]],["camembert",["CamembertForTokenClassification",Er]],["deberta",["DebertaForTokenClassification",Lr]],["deberta-v2",["DebertaV2ForTokenClassification",Cn]],["mpnet",["MPNetForTokenClassification",mn]],["distilbert",["DistilBertForTokenClassification",Qr]],["roberta",["RobertaForTokenClassification",Cs]],["xlm",["XLMForTokenClassification",Tt]],["xlm-roberta",["XLMRobertaForTokenClassification",Ca]]]),ua=new Map([["t5",["T5ForConditionalGeneration",Y]],["longt5",["LongT5ForConditionalGeneration",Fe]],["mt5",["MT5ForConditionalGeneration",wt]],["bart",["BartForConditionalGeneration",rs]],["mbart",["MBartForConditionalGeneration",jt]],["marian",["MarianMTModel",Cu]],["m2m_100",["M2M100ForConditionalGeneration",Nn]],["blenderbot",["BlenderbotForConditionalGeneration",Xs]],["blenderbot-small",["BlenderbotSmallForConditionalGeneration",Hs]]]),Od=new Map([["bloom",["BloomForCausalLM",El]],["gpt2",["GPT2LMHeadModel",Xa]],["jais",["JAISLMHeadModel",Ja]],["gptj",["GPTJForCausalLM",rl]],["gpt_bigcode",["GPTBigCodeForCausalLM",il]],["gpt_neo",["GPTNeoForCausalLM",Za]],["gpt_neox",["GPTNeoXForCausalLM",tl]],["codegen",["CodeGenForCausalLM",ol]],["llama",["LlamaForCausalLM",pc]],["exaone",["ExaoneForCausalLM",al]],["olmo",["OlmoForCausalLM",Zi]],["olmo2",["Olmo2ForCausalLM",cl]],["mobilellm",["MobileLLMForCausalLM",zn]],["granite",["GraniteForCausalLM",pl]],["cohere",["CohereForCausalLM",mc]],["gemma",["GemmaForCausalLM",ml]],["gemma2",["Gemma2ForCausalLM",_l]],["openelm",["OpenELMForCausalLM",wl]],["qwen2",["Qwen2ForCausalLM",Ml]],["phi",["PhiForCausalLM",Bn]],["phi3",["Phi3ForCausalLM",Tl]],["mpt",["MptForCausalLM",kl]],["opt",["OPTForCausalLM",$l]],["mbart",["MBartForCausalLM",Ks]],["mistral",["MistralForCausalLM",$r]],["starcoder2",["Starcoder2ForCausalLM",rd]],["falcon",["FalconForCausalLM",id]],["trocr",["TrOCRForCausalLM",td]],["stablelm",["StableLmForCausalLM",Un]],["phi3_v",["Phi3VForCausalLM",pr]]]),bi=new Map([["multi_modality",["MultiModalityCausalLM",vd]]]),da=new Map([["bert",["BertForMaskedLM",Ke]],["modernbert",["ModernBertForMaskedLM",mt]],["roformer",["RoFormerForMaskedLM",Se]],["electra",["ElectraForMaskedLM",tr]],["esm",["EsmForMaskedLM",kn]],["convbert",["ConvBertForMaskedLM",Nt]],["camembert",["CamembertForMaskedLM",Kr]],["deberta",["DebertaForMaskedLM",Cr]],["deberta-v2",["DebertaV2ForMaskedLM",Ft]],["mpnet",["MPNetForMaskedLM",Xr]],["albert",["AlbertForMaskedLM",as]],["distilbert",["DistilBertForMaskedLM",cn]],["roberta",["RobertaForMaskedLM",_r]],["xlm",["XLMWithLMHeadModel",ks]],["xlm-roberta",["XLMRobertaForMaskedLM",Ea]],["mobilebert",["MobileBertForMaskedLM",Zn]],["squeezebert",["SqueezeBertForMaskedLM",In]]]),ca=new Map([["bert",["BertForQuestionAnswering",ze]],["roformer",["RoFormerForQuestionAnswering",tt]],["electra",["ElectraForQuestionAnswering",Ns]],["convbert",["ConvBertForQuestionAnswering",ms]],["camembert",["CamembertForQuestionAnswering",Hr]],["deberta",["DebertaForQuestionAnswering",or]],["deberta-v2",["DebertaV2ForQuestionAnswering",dn]],["mpnet",["MPNetForQuestionAnswering",fn]],["albert",["AlbertForQuestionAnswering",Ln]],["distilbert",["DistilBertForQuestionAnswering",ns]],["roberta",["RobertaForQuestionAnswering",Mt]],["xlm",["XLMForQuestionAnswering",Yr]],["xlm-roberta",["XLMRobertaForQuestionAnswering",ka]],["mobilebert",["MobileBertForQuestionAnswering",fr]],["squeezebert",["SqueezeBertForQuestionAnswering",On]]]),vi=new Map([["vision-encoder-decoder",["VisionEncoderDecoderModel",Li]],["idefics3",["Idefics3ForConditionalGeneration",zi]]]),Dd=new Map([["llava",["LlavaForConditionalGeneration",ei]],["llava_onevision",["LlavaOnevisionForConditionalGeneration",Fa]],["moondream1",["Moondream1ForConditionalGeneration",Oa]],["florence2",["Florence2ForConditionalGeneration",La]],["qwen2-vl",["Qwen2VLForConditionalGeneration",vl]],["idefics3",["Idefics3ForConditionalGeneration",zi]],["paligemma",["PaliGemmaForConditionalGeneration",Ba]]]),zc=new Map([["vision-encoder-decoder",["VisionEncoderDecoderModel",Li]]]),Ld=new Map([["vit",["ViTForImageClassification",Il]],["ijepa",["IJepaForImageClassification",Ol]],["pvt",["PvtForImageClassification",Ll]],["vit_msn",["ViTMSNForImageClassification",Nl]],["fastvit",["FastViTForImageClassification",fc]],["mobilevit",["MobileViTForImageClassification",Kl]],["mobilevitv2",["MobileViTV2ForImageClassification",ql]],["beit",["BeitForImageClassification",Zl]],["deit",["DeiTForImageClassification",ko]],["hiera",["HieraForImageClassification",$o]],["convnext",["ConvNextForImageClassification",Mc]],["convnextv2",["ConvNextV2ForImageClassification",fu]],["dinov2",["Dinov2ForImageClassification",Go]],["dinov2_with_registers",["Dinov2WithRegistersForImageClassification",Ho]],["resnet",["ResNetForImageClassification",Ao]],["swin",["SwinForImageClassification",Fo]],["segformer",["SegformerForImageClassification",dd]],["efficientnet",["EfficientNetForImageClassification",md]],["mobilenet_v1",["MobileNetV1ForImageClassification",_d]],["mobilenet_v2",["MobileNetV2ForImageClassification",ra]],["mobilenet_v3",["MobileNetV3ForImageClassification",ia]],["mobilenet_v4",["MobileNetV4ForImageClassification",yd]]]),pa=new Map([["detr",["DetrForObjectDetection",tu]],["rt_detr",["RTDetrForObjectDetection",en]],["table-transformer",["TableTransformerForObjectDetection",ru]],["yolos",["YolosForObjectDetection",vu]]]),ha=new Map([["owlvit",["OwlViTForObjectDetection",Xl]],["owlv2",["Owlv2ForObjectDetection",_c]],["grounding-dino",["GroundingDinoForObjectDetection",yu]]]),zd=new Map([["detr",["DetrForSegmentation",su]],["clipseg",["CLIPSegForImageSegmentation",qa]]]),Bd=new Map([["segformer",["SegformerForSemanticSegmentation",cd]],["sapiens",["SapiensForSemanticSegmentation",lu]]]),ma=new Map([["detr",["DetrForSegmentation",su]],["maskformer",["MaskFormerForInstanceSegmentation",ci]]]),Rd=new Map([["sam",["SamModel",Tu]]]),Nd=new Map([["wav2vec2",["Wav2Vec2ForCTC",$u]],["wav2vec2-bert",["Wav2Vec2BertForCTC",ju]],["unispeech",["UniSpeechForCTC",Lu]],["unispeech-sat",["UniSpeechSatForCTC",Bu]],["wavlm",["WavLMForCTC",Hu]],["hubert",["HubertForCTC",Wu]]]),fa=new Map([["wav2vec2",["Wav2Vec2ForSequenceClassification",Au]],["wav2vec2-bert",["Wav2Vec2BertForSequenceClassification",Vu]],["unispeech",["UniSpeechForSequenceClassification",zu]],["unispeech-sat",["UniSpeechSatForSequenceClassification",Ru]],["wavlm",["WavLMForSequenceClassification",qu]],["hubert",["HubertForSequenceClassification",Gu]],["audio-spectrogram-transformer",["ASTForAudioClassification",Fi]]]),jd=new Map([["wavlm",["WavLMForXVector",Qu]]]),Vd=new Map([["unispeech-sat",["UniSpeechSatForAudioFrameClassification",Pc]],["wavlm",["WavLMForAudioFrameClassification",Ec]],["wav2vec2",["Wav2Vec2ForAudioFrameClassification",Iu]],["pyannote",["PyAnnoteForAudioFrameClassification",Ou]]]),Ud=new Map([["vitmatte",["VitMatteForImageMatting",Wl]]]),Bc=new Map([["patchtst",["PatchTSTForPrediction",Cd]],["patchtsmixer",["PatchTSMixerForPrediction",Sd]]]),Rc=new Map([["swin2sr",["Swin2SRForImageSuperResolution",wc]]]),Wd=new Map([["dpt",["DPTForDepthEstimation",Rn]],["depth_anything",["DepthAnythingForDepthEstimation",zo]],["glpn",["GLPNForDepthEstimation",Ro]],["sapiens",["SapiensForDepthEstimation",uu]],["depth_pro",["DepthProForDepthEstimation",cu]]]),Gd=new Map([["sapiens",["SapiensForNormalEstimation",yc]]]),Kd=new Map([["vitpose",["VitPoseForPoseEstimation",Dl]]]),Hd=new Map([["clip",["CLIPVisionModelWithProjection",Ua]],["siglip",["SiglipVisionModel",Ka]],["jina_clip",["JinaCLIPVisionModel",wr]]]),Nc=[[Oc,I.EncoderOnly],[Dc,I.EncoderDecoder],[Lc,I.DecoderOnly],[Id,I.EncoderOnly],[Fd,I.EncoderOnly],[ua,I.Seq2Seq],[la,I.Seq2Seq],[Od,I.DecoderOnly],[bi,I.MultiModality],[da,I.EncoderOnly],[ca,I.EncoderOnly],[vi,I.Vision2Seq],[Dd,I.ImageTextToText],[Ld,I.EncoderOnly],[zd,I.EncoderOnly],[ma,I.EncoderOnly],[Bd,I.EncoderOnly],[Ud,I.EncoderOnly],[Bc,I.EncoderOnly],[Rc,I.EncoderOnly],[Wd,I.EncoderOnly],[Gd,I.EncoderOnly],[Kd,I.EncoderOnly],[pa,I.EncoderOnly],[ha,I.EncoderOnly],[Rd,I.MaskGeneration],[Nd,I.EncoderOnly],[fa,I.EncoderOnly],[$d,I.Seq2Seq],[Ad,I.EncoderOnly],[jd,I.EncoderOnly],[Vd,I.EncoderOnly],[Hd,I.EncoderOnly]];for(const[_,f]of Nc)for(const[q,xe]of _.values())S.set(q,f),P.set(xe,q),w.set(q,xe);const jc=[["MusicgenForConditionalGeneration",Mi,I.Musicgen],["Phi3VForCausalLM",pr,I.Phi3V],["CLIPTextModelWithProjection",Va,I.EncoderOnly],["SiglipTextModel",Ga,I.EncoderOnly],["JinaCLIPTextModel",Ri,I.EncoderOnly],["ClapTextModelWithProjection",ad,I.EncoderOnly],["ClapAudioModelWithProjection",ld,I.EncoderOnly]];for(const[_,f,q]of jc)S.set(_,q),P.set(f,_),w.set(_,f);class Vc extends fs{static MODEL_CLASS_MAPPINGS=Nc.map(f=>f[0]);static BASE_IF_FAIL=!0}class Uc extends fs{static MODEL_CLASS_MAPPINGS=[Id]}class Rp extends fs{static MODEL_CLASS_MAPPINGS=[Fd]}class Wc extends fs{static MODEL_CLASS_MAPPINGS=[ua]}class Gc extends fs{static MODEL_CLASS_MAPPINGS=[la]}class Kc extends fs{static MODEL_CLASS_MAPPINGS=[$d]}class Hc extends fs{static MODEL_CLASS_MAPPINGS=[Ad]}class Np extends fs{static MODEL_CLASS_MAPPINGS=[Od]}class qc extends fs{static MODEL_CLASS_MAPPINGS=[da]}class Qc extends fs{static MODEL_CLASS_MAPPINGS=[ca]}class Xc extends fs{static MODEL_CLASS_MAPPINGS=[vi]}class Yc extends fs{static MODEL_CLASS_MAPPINGS=[Ld]}class Jc extends fs{static MODEL_CLASS_MAPPINGS=[zd]}class Zc extends fs{static MODEL_CLASS_MAPPINGS=[Bd]}class ep extends fs{static MODEL_CLASS_MAPPINGS=[ma]}class tp extends fs{static MODEL_CLASS_MAPPINGS=[pa]}class sp extends fs{static MODEL_CLASS_MAPPINGS=[ha]}class rp extends fs{static MODEL_CLASS_MAPPINGS=[Rd]}class np extends fs{static MODEL_CLASS_MAPPINGS=[Nd]}class qd extends fs{static MODEL_CLASS_MAPPINGS=[fa]}class ip extends fs{static MODEL_CLASS_MAPPINGS=[jd]}class op extends fs{static MODEL_CLASS_MAPPINGS=[Vd]}class ap extends fs{static MODEL_CLASS_MAPPINGS=[zc]}class lp extends fs{static MODEL_CLASS_MAPPINGS=[Ud]}class up extends fs{static MODEL_CLASS_MAPPINGS=[Rc]}class dp extends fs{static MODEL_CLASS_MAPPINGS=[Wd]}class cp extends fs{static MODEL_CLASS_MAPPINGS=[Gd]}class jp extends fs{static MODEL_CLASS_MAPPINGS=[Kd]}class pp extends fs{static MODEL_CLASS_MAPPINGS=[Hd]}class hp extends Ve{constructor({logits:f,past_key_values:q,encoder_outputs:xe,decoder_attentions:$e=null,cross_attentions:Le=null}){super(),this.logits=f,this.past_key_values=q,this.encoder_outputs=xe,this.decoder_attentions=$e,this.cross_attentions=Le}}class Kt extends Ve{constructor({logits:f,...q}){super(),this.logits=f;const xe=Object.values(q);xe.length>0&&(this.attentions=xe)}}class mp extends Ve{constructor({logits:f,embeddings:q}){super(),this.logits=f,this.embeddings=q}}class Vs extends Ve{constructor({logits:f}){super(),this.logits=f}}class Qs extends Ve{constructor({logits:f}){super(),this.logits=f}}class Zs extends Ve{constructor({start_logits:f,end_logits:q}){super(),this.start_logits=f,this.end_logits=q}}class yn extends Ve{constructor({logits:f}){super(),this.logits=f}}class fp extends Ve{constructor({logits:f,past_key_values:q}){super(),this.logits=f,this.past_key_values=q}}class Wn extends Ve{constructor({alphas:f}){super(),this.alphas=f}}class Qd extends Ve{constructor({waveform:f,spectrogram:q}){super(),this.waveform=f,this.spectrogram=q}}},"./src/models/audio_spectrogram_transformer/feature_extraction_audio_spectrogram_transformer.js":(ke,A,r)=>{r.r(A),r.d(A,{ASTFeatureExtractor:()=>N});var g=r("./src/base/feature_extraction_utils.js");r("./src/utils/tensor.js");var $=r("./src/utils/audio.js");class N extends g.FeatureExtractor{constructor(j){super(j);const y=this.config.sampling_rate,T=(0,$.mel_filter_bank)(256,this.config.num_mel_bins,20,Math.floor(y/2),y,null,"kaldi",!0);for(let b=0;b{r.r(A),r.d(A,{AutoFeatureExtractor:()=>Z});var g=r("./src/utils/constants.js"),$=r("./src/utils/hub.js");r("./src/base/feature_extraction_utils.js");var N=r("./src/models/feature_extractors.js");class Z{static async from_pretrained(y,T={}){const b=await(0,$.getModelJSON)(y,g.FEATURE_EXTRACTOR_NAME,!0,T),x=b.feature_extractor_type,v=N[x];if(!v)throw new Error(`Unknown feature_extractor_type: '${x}'. Please report this at ${g.GITHUB_ISSUE_URL}.`);return new v(b)}}},"./src/models/auto/image_processing_auto.js":(ke,A,r)=>{r.r(A),r.d(A,{AutoImageProcessor:()=>j});var g=r("./src/utils/constants.js"),$=r("./src/utils/hub.js"),N=r("./src/base/image_processors_utils.js"),Z=r("./src/models/image_processors.js");class j{static async from_pretrained(T,b={}){const x=await(0,$.getModelJSON)(T,g.IMAGE_PROCESSOR_NAME,!0,b),v=x.image_processor_type??x.feature_extractor_type;let L=Z[v];return L||(v!==void 0&&console.warn(`Image processor type '${v}' not found, assuming base ImageProcessor. Please report this at ${g.GITHUB_ISSUE_URL}.`),L=N.ImageProcessor),new L(x)}}},"./src/models/auto/processing_auto.js":(ke,A,r)=>{r.r(A),r.d(A,{AutoProcessor:()=>T});var g=r("./src/utils/constants.js"),$=r("./src/utils/hub.js"),N=r("./src/base/processing_utils.js"),Z=r("./src/models/processors.js"),j=r("./src/models/image_processors.js"),y=r("./src/models/feature_extractors.js");class T{static async from_pretrained(x,v={}){const L=await(0,$.getModelJSON)(x,g.IMAGE_PROCESSOR_NAME,!0,v),{image_processor_type:K,feature_extractor_type:se,processor_class:oe}=L;if(oe&&Z[oe])return Z[oe].from_pretrained(x,v);if(!K&&!se)throw new Error("No `image_processor_type` or `feature_extractor_type` found in the config.");const V={};if(K){const H=j[K];if(!H)throw new Error(`Unknown image_processor_type: '${K}'.`);V.image_processor=new H(L)}if(se){const H=j[se];if(H)V.image_processor=new H(L);else{const I=y[se];if(!I)throw new Error(`Unknown feature_extractor_type: '${se}'.`);V.feature_extractor=new I(L)}}const U={};return new N.Processor(U,V)}}},"./src/models/beit/image_processing_beit.js":(ke,A,r)=>{r.r(A),r.d(A,{BeitFeatureExtractor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/bit/image_processing_bit.js":(ke,A,r)=>{r.r(A),r.d(A,{BitImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/chinese_clip/image_processing_chinese_clip.js":(ke,A,r)=>{r.r(A),r.d(A,{ChineseCLIPFeatureExtractor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/clap/feature_extraction_clap.js":(ke,A,r)=>{r.r(A),r.d(A,{ClapFeatureExtractor:()=>N});var g=r("./src/base/feature_extraction_utils.js");r("./src/utils/tensor.js");var $=r("./src/utils/audio.js");class N extends g.FeatureExtractor{constructor(j){super(j),this.mel_filters=(0,$.mel_filter_bank)(this.config.nb_frequency_bins,this.config.feature_size,this.config.frequency_min,this.config.frequency_max,this.config.sampling_rate,null,"htk"),this.mel_filters_slaney=(0,$.mel_filter_bank)(this.config.nb_frequency_bins,this.config.feature_size,this.config.frequency_min,this.config.frequency_max,this.config.sampling_rate,"slaney","slaney"),this.window=(0,$.window_function)(this.config.fft_window_size,"hann")}async _get_input_mel(j,y,T,b){let x;const v=j.length-y;if(v>0)if(T==="rand_trunc"){const L=Math.floor(Math.random()*(v+1));j=j.subarray(L,L+y),x=await this._extract_fbank_features(j,this.mel_filters_slaney,this.config.nb_max_samples)}else throw new Error(`Truncation strategy "${T}" not implemented`);else{if(v<0){let L=new Float64Array(y);if(L.set(j),b==="repeat")for(let K=j.length;K{r.r(A),r.d(A,{CLIPFeatureExtractor:()=>N,CLIPImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/convnext/image_processing_convnext.js":(ke,A,r)=>{r.r(A),r.d(A,{ConvNextFeatureExtractor:()=>N,ConvNextImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{constructor(j){super(j),this.crop_pct=this.config.crop_pct??224/256}async resize(j){const y=this.size?.shortest_edge;if(y===void 0)throw new Error("Size dictionary must contain 'shortest_edge' key.");if(y<384){const T=Math.floor(y/this.crop_pct),[b,x]=this.get_resize_output_image_size(j,{shortest_edge:T});j=await j.resize(b,x,{resample:this.resample}),j=await j.center_crop(y,y)}else j=await j.resize(y,y,{resample:this.resample});return j}}class N extends ${}},"./src/models/deit/image_processing_deit.js":(ke,A,r)=>{r.r(A),r.d(A,{DeiTFeatureExtractor:()=>N,DeiTImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/detr/image_processing_detr.js":(ke,A,r)=>{r.r(A),r.d(A,{DetrFeatureExtractor:()=>Z,DetrImageProcessor:()=>N});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");class N extends g.ImageProcessor{async _call(y){const T=await super._call(y),b=[T.pixel_values.dims[0],64,64],x=(0,$.full)(b,1n);return{...T,pixel_mask:x}}post_process_object_detection(...y){return(0,g.post_process_object_detection)(...y)}post_process_panoptic_segmentation(...y){return(0,g.post_process_panoptic_segmentation)(...y)}post_process_instance_segmentation(...y){return(0,g.post_process_instance_segmentation)(...y)}}class Z extends N{}},"./src/models/donut/image_processing_donut.js":(ke,A,r)=>{r.r(A),r.d(A,{DonutFeatureExtractor:()=>N,DonutImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{pad_image(j,y,T,b={}){const[x,v,L]=y;let K=this.image_mean;Array.isArray(this.image_mean)||(K=new Array(L).fill(K));let se=this.image_std;Array.isArray(se)||(se=new Array(L).fill(K));const oe=K.map((V,U)=>-V/se[U]);return super.pad_image(j,y,T,{center:!0,constant_values:oe,...b})}}class N extends ${}},"./src/models/dpt/image_processing_dpt.js":(ke,A,r)=>{r.r(A),r.d(A,{DPTFeatureExtractor:()=>N,DPTImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/efficientnet/image_processing_efficientnet.js":(ke,A,r)=>{r.r(A),r.d(A,{EfficientNetImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{constructor(Z){super(Z),this.include_top=this.config.include_top??!0,this.include_top&&(this.image_std=this.image_std.map(j=>j*j))}}},"./src/models/feature_extractors.js":(ke,A,r)=>{r.r(A),r.d(A,{ASTFeatureExtractor:()=>g.ASTFeatureExtractor,ClapFeatureExtractor:()=>$.ClapFeatureExtractor,ImageFeatureExtractor:()=>v.ImageProcessor,MoonshineFeatureExtractor:()=>N.MoonshineFeatureExtractor,PyAnnoteFeatureExtractor:()=>Z.PyAnnoteFeatureExtractor,SeamlessM4TFeatureExtractor:()=>j.SeamlessM4TFeatureExtractor,SpeechT5FeatureExtractor:()=>y.SpeechT5FeatureExtractor,Wav2Vec2FeatureExtractor:()=>T.Wav2Vec2FeatureExtractor,WeSpeakerFeatureExtractor:()=>b.WeSpeakerFeatureExtractor,WhisperFeatureExtractor:()=>x.WhisperFeatureExtractor});var g=r("./src/models/audio_spectrogram_transformer/feature_extraction_audio_spectrogram_transformer.js"),$=r("./src/models/clap/feature_extraction_clap.js"),N=r("./src/models/moonshine/feature_extraction_moonshine.js"),Z=r("./src/models/pyannote/feature_extraction_pyannote.js"),j=r("./src/models/seamless_m4t/feature_extraction_seamless_m4t.js"),y=r("./src/models/speecht5/feature_extraction_speecht5.js"),T=r("./src/models/wav2vec2/feature_extraction_wav2vec2.js"),b=r("./src/models/wespeaker/feature_extraction_wespeaker.js"),x=r("./src/models/whisper/feature_extraction_whisper.js"),v=r("./src/base/image_processors_utils.js")},"./src/models/florence2/processing_florence2.js":(ke,A,r)=>{r.r(A),r.d(A,{Florence2Processor:()=>Z});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");class Z extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor;constructor(y,T){super(y,T);const{tasks_answer_post_processing_type:b,task_prompts_without_inputs:x,task_prompts_with_input:v}=this.image_processor.config;this.tasks_answer_post_processing_type=new Map(Object.entries(b??{})),this.task_prompts_without_inputs=new Map(Object.entries(x??{})),this.task_prompts_with_input=new Map(Object.entries(v??{})),this.regexes={quad_boxes:/(.+?)/gm,bboxes:/([^<]+)?/gm},this.size_per_bin=1e3}construct_prompts(y){typeof y=="string"&&(y=[y]);const T=[];for(const b of y)if(this.task_prompts_without_inputs.has(b))T.push(this.task_prompts_without_inputs.get(b));else{for(const[x,v]of this.task_prompts_with_input)if(b.includes(x)){T.push(v.replaceAll("{input}",b).replaceAll(x,""));break}T.length!==y.length&&T.push(b)}return T}post_process_generation(y,T,b){const x=this.tasks_answer_post_processing_type.get(T)??"pure_text";y=y.replaceAll("","").replaceAll("","");let v;switch(x){case"pure_text":v=y;break;case"description_with_bboxes":case"bboxes":case"phrase_grounding":case"ocr":const L=x==="ocr"?"quad_boxes":"bboxes",K=y.matchAll(this.regexes[L]),se=[],oe=[];for(const[V,U,...H]of K)se.push(U?U.trim():se.at(-1)??""),oe.push(H.map((I,S)=>(Number(I)+.5)/this.size_per_bin*b[S%2]));v={labels:se,[L]:oe};break;default:throw new Error(`Task "${T}" (of type "${x}") not yet implemented.`)}return{[T]:v}}async _call(y,T=null,b={}){if(!y&&!T)throw new Error("Either text or images must be provided");const x=await this.image_processor(y,b),v=T?this.tokenizer(T,b):{};return{...x,...v}}}},"./src/models/glpn/image_processing_glpn.js":(ke,A,r)=>{r.r(A),r.d(A,{GLPNFeatureExtractor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/grounding_dino/image_processing_grounding_dino.js":(ke,A,r)=>{r.r(A),r.d(A,{GroundingDinoImageProcessor:()=>N});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");class N extends g.ImageProcessor{async _call(j){const y=await super._call(j),T=y.pixel_values.dims,b=(0,$.ones)([T[0],T[2],T[3]]);return{...y,pixel_mask:b}}}},"./src/models/grounding_dino/processing_grounding_dino.js":(ke,A,r)=>{r.r(A),r.d(A,{GroundingDinoProcessor:()=>y});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js"),Z=r("./src/base/image_processors_utils.js");function j(T,b){const v=T.dims.at(-1)-1,L=T.tolist();L.fill(!1,0,1),L.fill(!1,v);const K=b.tolist();return L.map((se,oe)=>se?oe:null).filter(se=>se!==null).map(se=>K[se])}class y extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor;async _call(b,x,v={}){const L=b?await this.image_processor(b,v):{};return{...x?this.tokenizer(x,v):{},...L}}post_process_grounded_object_detection(b,x,{box_threshold:v=.25,text_threshold:L=.25,target_sizes:K=null}={}){const{logits:se,pred_boxes:oe}=b,V=se.dims[0];if(K!==null&&K.length!==V)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");const U=se.dims.at(1),H=se.sigmoid(),I=H.max(-1).tolist(),S=oe.tolist().map(P=>P.map(F=>(0,Z.center_to_corners_format)(F))),w=[];for(let P=0;Pre.map((Me,pe)=>Me*F[(pe+1)%2])));const ae=I[P],ie=[],ye=[],ge=[];for(let re=0;re{r.r(A),r.d(A,{Idefics3ImageProcessor:()=>N});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");class N extends g.ImageProcessor{constructor(j){super(j),this.do_image_splitting=j.do_image_splitting??!0,this.max_image_size=j.max_image_size}get_resize_for_vision_encoder(j,y){let[T,b]=j.dims.slice(-2);const x=b/T;return b>=T?(b=Math.ceil(b/y)*y,T=Math.floor(b/x),T=Math.ceil(T/y)*y):(T=Math.ceil(T/y)*y,b=Math.floor(T*x),b=Math.ceil(b/y)*y),{height:T,width:b}}async _call(j,{do_image_splitting:y=null,return_row_col_info:T=!1}={}){let b;if(!Array.isArray(j))b=[[j]];else{if(j.length===0||!j[0])throw new Error("No images provided.");Array.isArray(j[0])?b=j:b=[j]}let x=[],v=[],L=[];const K=[],se=[];for(const P of b){let F=await Promise.all(P.map(ye=>this.preprocess(ye)));K.push(...F.map(ye=>ye.original_size)),se.push(...F.map(ye=>ye.reshaped_input_size)),F.forEach(ye=>ye.pixel_values.unsqueeze_(0));const{longest_edge:ae}=this.max_image_size;let ie;if(y??this.do_image_splitting){let ye=new Array(F.length),ge=new Array(F.length);ie=await Promise.all(F.map(async(re,Me)=>{const pe=this.get_resize_for_vision_encoder(re.pixel_values,ae),Ce=await(0,$.interpolate_4d)(re.pixel_values,{size:[pe.height,pe.width]}),{frames:Ae,num_splits_h:Pe,num_splits_w:Je}=await this.split_image(Ce,this.max_image_size);return ye[Me]=Pe,ge[Me]=Je,(0,$.cat)(Ae,0)})),v.push(ye),L.push(ge)}else{const ye=[ae,ae];ie=await Promise.all(F.map(ge=>(0,$.interpolate_4d)(ge.pixel_values,{size:ye}))),v.push(new Array(F.length).fill(0)),L.push(new Array(F.length).fill(0))}x.push((0,$.cat)(ie,0))}const oe=x.length,[V,U,H,I]=x[0].dims;let S,w;if(oe===1)S=x[0].unsqueeze_(0),w=(0,$.full)([oe,V,H,I],!0);else{const P=Math.max(...x.map(ie=>ie.dims.at(0)));w=(0,$.full)([oe,P,H,I],!0);const F=w.data,ae=P*H*I;for(let ie=0;ieT||L>b){K=Math.ceil(v/T),se=Math.ceil(L/b);const oe=Math.ceil(v/K),V=Math.ceil(L/se);for(let I=0;I{r.r(A),r.d(A,{Idefics3Processor:()=>b});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");r("./src/utils/image.js");var Z=r("./src/utils/core.js");function j(x,v,L,K,se,oe){let V="";for(let U=0;U`+se.repeat(x);V+=` +`}return V+=` +${K}${oe}`+se.repeat(x)+`${K}`,V}function y(x,v,L,K){return`${v}${K}`+L.repeat(x)+`${v}`}function T(x,v,L,K,se,oe){return x===0&&v===0?y(L,K,se,oe):j(L,x,v,K,se,oe)}class b extends g.Processor{static image_processor_class=$.AutoImageProcessor;static tokenizer_class=N.AutoTokenizer;static uses_processor_config=!0;fake_image_token="";image_token="";global_img_token="";async _call(v,L=null,K={}){K.return_row_col_info??=!0;let se;L&&(se=await this.image_processor(L,K)),Array.isArray(v)||(v=[v]);const oe=se.rows??[new Array(v.length).fill(0)],V=se.cols??[new Array(v.length).fill(0)],U=this.config.image_seq_len,H=[],I=[];for(let w=0;wT(re,ae[Me],U,this.fake_image_token,this.image_token,this.global_img_token)),ye=P.split(this.image_token);if(ye.length===0)throw new Error("The image token should be present in the text.");let ge=ye[0];for(let re=0;re{r.r(A),r.d(A,{BeitFeatureExtractor:()=>g.BeitFeatureExtractor,BitImageProcessor:()=>$.BitImageProcessor,CLIPFeatureExtractor:()=>Z.CLIPFeatureExtractor,CLIPImageProcessor:()=>Z.CLIPImageProcessor,ChineseCLIPFeatureExtractor:()=>N.ChineseCLIPFeatureExtractor,ConvNextFeatureExtractor:()=>j.ConvNextFeatureExtractor,ConvNextImageProcessor:()=>j.ConvNextImageProcessor,DPTFeatureExtractor:()=>x.DPTFeatureExtractor,DPTImageProcessor:()=>x.DPTImageProcessor,DeiTFeatureExtractor:()=>y.DeiTFeatureExtractor,DeiTImageProcessor:()=>y.DeiTImageProcessor,DetrFeatureExtractor:()=>T.DetrFeatureExtractor,DetrImageProcessor:()=>T.DetrImageProcessor,DonutFeatureExtractor:()=>b.DonutFeatureExtractor,DonutImageProcessor:()=>b.DonutImageProcessor,EfficientNetImageProcessor:()=>v.EfficientNetImageProcessor,GLPNFeatureExtractor:()=>L.GLPNFeatureExtractor,GroundingDinoImageProcessor:()=>K.GroundingDinoImageProcessor,Idefics3ImageProcessor:()=>se.Idefics3ImageProcessor,JinaCLIPImageProcessor:()=>V.JinaCLIPImageProcessor,LlavaOnevisionImageProcessor:()=>U.LlavaOnevisionImageProcessor,Mask2FormerImageProcessor:()=>H.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>I.MaskFormerFeatureExtractor,MaskFormerImageProcessor:()=>I.MaskFormerImageProcessor,MobileNetV1FeatureExtractor:()=>S.MobileNetV1FeatureExtractor,MobileNetV1ImageProcessor:()=>S.MobileNetV1ImageProcessor,MobileNetV2FeatureExtractor:()=>w.MobileNetV2FeatureExtractor,MobileNetV2ImageProcessor:()=>w.MobileNetV2ImageProcessor,MobileNetV3FeatureExtractor:()=>P.MobileNetV3FeatureExtractor,MobileNetV3ImageProcessor:()=>P.MobileNetV3ImageProcessor,MobileNetV4FeatureExtractor:()=>F.MobileNetV4FeatureExtractor,MobileNetV4ImageProcessor:()=>F.MobileNetV4ImageProcessor,MobileViTFeatureExtractor:()=>ae.MobileViTFeatureExtractor,MobileViTImageProcessor:()=>ae.MobileViTImageProcessor,NougatImageProcessor:()=>ie.NougatImageProcessor,OwlViTFeatureExtractor:()=>ge.OwlViTFeatureExtractor,OwlViTImageProcessor:()=>ge.OwlViTImageProcessor,Owlv2ImageProcessor:()=>ye.Owlv2ImageProcessor,Phi3VImageProcessor:()=>re.Phi3VImageProcessor,PvtImageProcessor:()=>Me.PvtImageProcessor,Qwen2VLImageProcessor:()=>pe.Qwen2VLImageProcessor,RTDetrImageProcessor:()=>Ce.RTDetrImageProcessor,SamImageProcessor:()=>Ae.SamImageProcessor,SegformerFeatureExtractor:()=>Pe.SegformerFeatureExtractor,SegformerImageProcessor:()=>Pe.SegformerImageProcessor,SiglipImageProcessor:()=>Je.SiglipImageProcessor,Swin2SRImageProcessor:()=>je.Swin2SRImageProcessor,VLMImageProcessor:()=>oe.VLMImageProcessor,ViTFeatureExtractor:()=>_e.ViTFeatureExtractor,ViTImageProcessor:()=>_e.ViTImageProcessor,VitMatteImageProcessor:()=>X.VitMatteImageProcessor,VitPoseImageProcessor:()=>de.VitPoseImageProcessor,YolosFeatureExtractor:()=>Ee.YolosFeatureExtractor,YolosImageProcessor:()=>Ee.YolosImageProcessor});var g=r("./src/models/beit/image_processing_beit.js"),$=r("./src/models/bit/image_processing_bit.js"),N=r("./src/models/chinese_clip/image_processing_chinese_clip.js"),Z=r("./src/models/clip/image_processing_clip.js"),j=r("./src/models/convnext/image_processing_convnext.js"),y=r("./src/models/deit/image_processing_deit.js"),T=r("./src/models/detr/image_processing_detr.js"),b=r("./src/models/donut/image_processing_donut.js"),x=r("./src/models/dpt/image_processing_dpt.js"),v=r("./src/models/efficientnet/image_processing_efficientnet.js"),L=r("./src/models/glpn/image_processing_glpn.js"),K=r("./src/models/grounding_dino/image_processing_grounding_dino.js"),se=r("./src/models/idefics3/image_processing_idefics3.js"),oe=r("./src/models/janus/image_processing_janus.js"),V=r("./src/models/jina_clip/image_processing_jina_clip.js"),U=r("./src/models/llava_onevision/image_processing_llava_onevision.js"),H=r("./src/models/mask2former/image_processing_mask2former.js"),I=r("./src/models/maskformer/image_processing_maskformer.js"),S=r("./src/models/mobilenet_v1/image_processing_mobilenet_v1.js"),w=r("./src/models/mobilenet_v2/image_processing_mobilenet_v2.js"),P=r("./src/models/mobilenet_v3/image_processing_mobilenet_v3.js"),F=r("./src/models/mobilenet_v4/image_processing_mobilenet_v4.js"),ae=r("./src/models/mobilevit/image_processing_mobilevit.js"),ie=r("./src/models/nougat/image_processing_nougat.js"),ye=r("./src/models/owlv2/image_processing_owlv2.js"),ge=r("./src/models/owlvit/image_processing_owlvit.js"),re=r("./src/models/phi3_v/image_processing_phi3_v.js"),Me=r("./src/models/pvt/image_processing_pvt.js"),pe=r("./src/models/qwen2_vl/image_processing_qwen2_vl.js"),Ce=r("./src/models/rt_detr/image_processing_rt_detr.js"),Ae=r("./src/models/sam/image_processing_sam.js"),Pe=r("./src/models/segformer/image_processing_segformer.js"),Je=r("./src/models/siglip/image_processing_siglip.js"),je=r("./src/models/swin2sr/image_processing_swin2sr.js"),_e=r("./src/models/vit/image_processing_vit.js"),X=r("./src/models/vitmatte/image_processing_vitmatte.js"),de=r("./src/models/vitpose/image_processing_vitpose.js"),Ee=r("./src/models/yolos/image_processing_yolos.js")},"./src/models/janus/image_processing_janus.js":(ke,A,r)=>{r.r(A),r.d(A,{VLMImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{constructor(Z){super({do_pad:!0,pad_size:{width:Z.image_size,height:Z.image_size},...Z}),this.constant_values=this.config.background_color.map(j=>j*this.rescale_factor)}pad_image(Z,j,y,T){return super.pad_image(Z,j,y,{constant_values:this.constant_values,center:!0,...T})}}},"./src/models/janus/processing_janus.js":(ke,A,r)=>{r.r(A),r.d(A,{VLChatProcessor:()=>T});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js"),Z=r("./src/utils/core.js"),j=r("./src/utils/tensor.js"),y=r("./src/utils/image.js");class T extends g.Processor{static image_processor_class=$.AutoImageProcessor;static tokenizer_class=N.AutoTokenizer;static uses_processor_config=!0;constructor(x,v){super(x,v),this.image_tag=this.config.image_tag,this.image_start_tag=this.config.image_start_tag,this.image_end_tag=this.config.image_end_tag,this.num_image_tokens=this.config.num_image_tokens}async _call(x,{images:v=null,chat_template:L="default"}={}){v?Array.isArray(v)||(v=[v]):v=await Promise.all(x.filter(ie=>ie.images).flatMap(ie=>ie.images).map(ie=>y.RawImage.read(ie)));const K=this.tokenizer,se=K.apply_chat_template(x,{tokenize:!1,add_generation_prompt:!0,chat_template:L}),oe=ie=>K.encode(ie,{add_special_tokens:!1}),V=se.split(this.image_tag),U=V.length-1;if(v.length!==U)throw new Error(`Number of images provided (${v.length}) does not match number of "${this.image_tag}" image tags (${U})`);const[H,I,S]=K.model.convert_tokens_to_ids([this.image_tag,this.image_start_tag,this.image_end_tag]);let w=oe(V[0]),P=new Array(w.length).fill(!1);for(let ie=1;ie0){const ie=await this.image_processor(v);return ie.pixel_values.unsqueeze_(0),{...ae,...ie}}return ae}}},"./src/models/jina_clip/image_processing_jina_clip.js":(ke,A,r)=>{r.r(A),r.d(A,{JinaCLIPImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{constructor(Z){const{resize_mode:j,fill_color:y,interpolation:T,size:b,...x}=Z,v=j==="squash"?{width:b,height:b}:j==="shortest"?{shortest_edge:b}:{longest_edge:b},L=T==="bicubic"?3:2;super({...x,size:v,resample:L,do_center_crop:!0,crop_size:b,do_normalize:!0})}}},"./src/models/jina_clip/processing_jina_clip.js":(ke,A,r)=>{r.r(A),r.d(A,{JinaCLIPProcessor:()=>Z});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");class Z extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor;async _call(y=null,T=null,b={}){if(!y&&!T)throw new Error("Either text or images must be provided");const x=y?this.tokenizer(y,b):{},v=T?await this.image_processor(T,b):{};return{...x,...v}}}},"./src/models/llava_onevision/image_processing_llava_onevision.js":(ke,A,r)=>{r.r(A),r.d(A,{LlavaOnevisionImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/mask2former/image_processing_mask2former.js":(ke,A,r)=>{r.r(A),r.d(A,{Mask2FormerImageProcessor:()=>$});var g=r("./src/models/maskformer/image_processing_maskformer.js");class $ extends g.MaskFormerImageProcessor{}},"./src/models/maskformer/image_processing_maskformer.js":(ke,A,r)=>{r.r(A),r.d(A,{MaskFormerFeatureExtractor:()=>N,MaskFormerImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_panoptic_segmentation(...j){return(0,g.post_process_panoptic_segmentation)(...j)}post_process_instance_segmentation(...j){return(0,g.post_process_instance_segmentation)(...j)}}class N extends ${}},"./src/models/mgp_str/processing_mgp_str.js":(ke,A,r)=>{r.r(A),r.d(A,{MgpstrProcessor:()=>y});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js"),Z=r("./src/utils/maths.js");const j={char:["char_decode",1],bpe:["bpe_decode",2],wp:["wp_decode",102]};class y extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor;get char_tokenizer(){return this.components.char_tokenizer}get bpe_tokenizer(){return this.components.bpe_tokenizer}get wp_tokenizer(){return this.components.wp_tokenizer}_decode_helper(b,x){if(!j.hasOwnProperty(x))throw new Error(`Format ${x} is not supported.`);const[v,L]=j[x],K=this[v].bind(this),[se,oe]=b.dims,V=[],U=[],H=b.tolist();for(let S=0;S0?F.reduce((ie,ye)=>ie*ye,1):0;U.push(P),V.push(ae)}return[K(U),V]}char_decode(b){return this.char_tokenizer.batch_decode(b).map(x=>x.replaceAll(" ",""))}bpe_decode(b){return this.bpe_tokenizer.batch_decode(b)}wp_decode(b){return this.wp_tokenizer.batch_decode(b).map(x=>x.replaceAll(" ",""))}batch_decode([b,x,v]){const[L,K]=this._decode_helper(b,"char"),[se,oe]=this._decode_helper(x,"bpe"),[V,U]=this._decode_helper(v,"wp"),H=[],I=[];for(let S=0;S{r.r(A),r.d(A,{MobileNetV1FeatureExtractor:()=>N,MobileNetV1ImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/mobilenet_v2/image_processing_mobilenet_v2.js":(ke,A,r)=>{r.r(A),r.d(A,{MobileNetV2FeatureExtractor:()=>N,MobileNetV2ImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/mobilenet_v3/image_processing_mobilenet_v3.js":(ke,A,r)=>{r.r(A),r.d(A,{MobileNetV3FeatureExtractor:()=>N,MobileNetV3ImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/mobilenet_v4/image_processing_mobilenet_v4.js":(ke,A,r)=>{r.r(A),r.d(A,{MobileNetV4FeatureExtractor:()=>N,MobileNetV4ImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/mobilevit/image_processing_mobilevit.js":(ke,A,r)=>{r.r(A),r.d(A,{MobileViTFeatureExtractor:()=>N,MobileViTImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/moonshine/feature_extraction_moonshine.js":(ke,A,r)=>{r.r(A),r.d(A,{MoonshineFeatureExtractor:()=>N});var g=r("./src/base/feature_extraction_utils.js"),$=r("./src/utils/tensor.js");class N extends g.FeatureExtractor{async _call(j){(0,g.validate_audio_inputs)(j,"MoonshineFeatureExtractor"),j instanceof Float64Array&&(j=new Float32Array(j));const y=[1,j.length];return{input_values:new $.Tensor("float32",j,y)}}}},"./src/models/moonshine/processing_moonshine.js":(ke,A,r)=>{r.r(A),r.d(A,{MoonshineProcessor:()=>Z});var g=r("./src/models/auto/feature_extraction_auto.js"),$=r("./src/tokenizers.js"),N=r("./src/base/processing_utils.js");class Z extends N.Processor{static tokenizer_class=$.AutoTokenizer;static feature_extractor_class=g.AutoFeatureExtractor;async _call(y){return await this.feature_extractor(y)}}},"./src/models/nougat/image_processing_nougat.js":(ke,A,r)=>{r.r(A),r.d(A,{NougatImageProcessor:()=>$});var g=r("./src/models/donut/image_processing_donut.js");class $ extends g.DonutImageProcessor{}},"./src/models/owlv2/image_processing_owlv2.js":(ke,A,r)=>{r.r(A),r.d(A,{Owlv2ImageProcessor:()=>$});var g=r("./src/models/owlvit/image_processing_owlvit.js");class $ extends g.OwlViTImageProcessor{}},"./src/models/owlvit/image_processing_owlvit.js":(ke,A,r)=>{r.r(A),r.d(A,{OwlViTFeatureExtractor:()=>N,OwlViTImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_object_detection(...j){return(0,g.post_process_object_detection)(...j)}}class N extends ${}},"./src/models/owlvit/processing_owlvit.js":(ke,A,r)=>{r.r(A),r.d(A,{OwlViTProcessor:()=>Z});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");class Z extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor}},"./src/models/paligemma/processing_paligemma.js":(ke,A,r)=>{r.r(A),r.d(A,{PaliGemmaProcessor:()=>y});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");const Z="";function j(T,b,x,v,L){return`${v.repeat(x*L)}${b}${T} +`}class y extends g.Processor{static tokenizer_class=N.AutoTokenizer;static image_processor_class=$.AutoImageProcessor;static uses_processor_config=!1;async _call(b,x=null,v={}){x||(console.warn("You are using PaliGemma without a text prefix. It will perform as a picture-captioning model."),x=""),Array.isArray(b)||(b=[b]),Array.isArray(x)||(x=[x]);const L=this.tokenizer.bos_token,K=this.image_processor.config.image_seq_length;let se;x.some(U=>U.includes(Z))?se=x.map(U=>{const H=U.replaceAll(Z,Z.repeat(K)),I=H.lastIndexOf(Z),S=I===-1?0:I+Z.length;return H.slice(0,S)+L+H.slice(S)+` +`}):(console.warn("You are passing both `text` and `images` to `PaliGemmaProcessor`. The processor expects special image tokens in the text, as many tokens as there are images per each text. It is recommended to add `` tokens in the very beginning of your text. For this call, we will infer how many images each text has and add special tokens."),se=x.map(U=>j(U,L,K,Z,b.length)));const oe=this.tokenizer(se,v);return{...await this.image_processor(b,v),...oe}}}},"./src/models/phi3_v/image_processing_phi3_v.js":(ke,A,r)=>{r.r(A),r.d(A,{Phi3VImageProcessor:()=>b});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");const N=336,Z=[2,3],{ceil:j,floor:y,sqrt:T}=Math;class b extends g.ImageProcessor{constructor(v){super({...v,do_normalize:!0,do_pad:!0,pad_size:"custom",do_convert_rgb:!0,do_resize:!0}),this._num_crops=v.num_crops}calc_num_image_tokens_from_image_size(v,L){const{num_img_tokens:K}=this.config;return y((y(L/N)*y(v/N)+1)*K+1+(y(L/N)+1)*T(K))}get_resize_output_image_size(v,L){const K=this._num_crops,[se,oe]=v.size;let V=se/oe,U=1;for(;U*Math.ceil(U/V)<=K;)U+=1;U-=1;const H=Math.floor(U*336),I=Math.floor(H/V);return[H,I]}pad_image(v,L,K,se={}){const[oe,V]=L,U=N*j(oe/N),H=N*j(V/N),I=[1,1,1].map((S,w)=>(S-this.image_mean[w])/this.image_std[w]);return super.pad_image(v,L,{width:H,height:U},{center:!0,constant_values:I,...se})}async _call(v,{num_crops:L=null}={}){if(this._num_crops=L??=this.config.num_crops,L<4||T(L)%1!==0)throw new Error("num_crops must be a square number >= 4");Array.isArray(v)||(v=[v]);const K=v.length,se=await Promise.all(v.map(P=>this.preprocess(P))),oe=se.map(P=>P.original_size),V=se.map(P=>P.reshaped_input_size),U=[];for(const{pixel_values:P}of se){P.unsqueeze_(0);const[F,ae]=P.dims.slice(-2),ie=await(0,$.interpolate_4d)(P,{size:[N,N],mode:"bicubic"});if(L>0){const ye=[],ge=T(L),re=y(ae/ge),Me=y(F/ge);for(let Ce=0;CeP.map(F=>N*j(F/N))),S=new $.Tensor("int64",I.flat(),[K,2]),w=I.map(([P,F])=>this.calc_num_image_tokens_from_image_size(F,P));return{pixel_values:H,original_sizes:oe,reshaped_input_sizes:V,image_sizes:S,num_img_tokens:w}}}},"./src/models/phi3_v/processing_phi3_v.js":(ke,A,r)=>{r.r(A),r.d(A,{Phi3VProcessor:()=>y});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");r("./src/utils/image.js");const Z="<|image|>",j=/<\|image_\d+\|>/g;class y extends g.Processor{static image_processor_class=$.AutoImageProcessor;static tokenizer_class=N.AutoTokenizer;async _call(b,x=null,{padding:v=!0,truncation:L=!0,num_crops:K=null}={}){Array.isArray(b)||(b=[b]);let se,oe;if(x){oe=await this.image_processor(x,{num_crops:K});const{num_img_tokens:V}=oe,U=b.map((I,S)=>I.split(j).join(Z.repeat(V[S])));se=this.tokenizer(U,{padding:v,truncation:L});const H=this.tokenizer.model.convert_tokens_to_ids([Z])[0];se.input_ids.map_(I=>I==H?-I:I)}else se=this.tokenizer(b);return{...se,...oe}}}},"./src/models/processors.js":(ke,A,r)=>{r.r(A),r.d(A,{Florence2Processor:()=>g.Florence2Processor,GroundingDinoProcessor:()=>$.GroundingDinoProcessor,Idefics3Processor:()=>N.Idefics3Processor,JinaCLIPProcessor:()=>j.JinaCLIPProcessor,MgpstrProcessor:()=>y.MgpstrProcessor,MoonshineProcessor:()=>T.MoonshineProcessor,OwlViTProcessor:()=>b.OwlViTProcessor,PaliGemmaProcessor:()=>v.PaliGemmaProcessor,Phi3VProcessor:()=>x.Phi3VProcessor,PyAnnoteProcessor:()=>L.PyAnnoteProcessor,Qwen2VLProcessor:()=>K.Qwen2VLProcessor,SamProcessor:()=>se.SamProcessor,SpeechT5Processor:()=>oe.SpeechT5Processor,VLChatProcessor:()=>Z.VLChatProcessor,Wav2Vec2ProcessorWithLM:()=>V.Wav2Vec2ProcessorWithLM,WhisperProcessor:()=>U.WhisperProcessor});var g=r("./src/models/florence2/processing_florence2.js"),$=r("./src/models/grounding_dino/processing_grounding_dino.js"),N=r("./src/models/idefics3/processing_idefics3.js"),Z=r("./src/models/janus/processing_janus.js"),j=r("./src/models/jina_clip/processing_jina_clip.js"),y=r("./src/models/mgp_str/processing_mgp_str.js"),T=r("./src/models/moonshine/processing_moonshine.js"),b=r("./src/models/owlvit/processing_owlvit.js"),x=r("./src/models/phi3_v/processing_phi3_v.js"),v=r("./src/models/paligemma/processing_paligemma.js"),L=r("./src/models/pyannote/processing_pyannote.js"),K=r("./src/models/qwen2_vl/processing_qwen2_vl.js"),se=r("./src/models/sam/processing_sam.js"),oe=r("./src/models/speecht5/processing_speecht5.js"),V=r("./src/models/wav2vec2/processing_wav2vec2.js"),U=r("./src/models/whisper/processing_whisper.js")},"./src/models/pvt/image_processing_pvt.js":(ke,A,r)=>{r.r(A),r.d(A,{PvtImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/pyannote/feature_extraction_pyannote.js":(ke,A,r)=>{r.r(A),r.d(A,{PyAnnoteFeatureExtractor:()=>Z});var g=r("./src/base/feature_extraction_utils.js"),$=r("./src/utils/tensor.js"),N=r("./src/utils/maths.js");class Z extends g.FeatureExtractor{async _call(y){(0,g.validate_audio_inputs)(y,"PyAnnoteFeatureExtractor"),y instanceof Float64Array&&(y=new Float32Array(y));const T=[1,1,y.length];return{input_values:new $.Tensor("float32",y,T)}}samples_to_frames(y){return(y-this.config.offset)/this.config.step}post_process_speaker_diarization(y,T){const b=T/this.samples_to_frames(T)/this.config.sampling_rate,x=[];for(const v of y.tolist()){const L=[];let K=-1;for(let se=0;se({id:se,start:oe*b,end:V*b,confidence:U/(V-oe)})))}return x}}},"./src/models/pyannote/processing_pyannote.js":(ke,A,r)=>{r.r(A),r.d(A,{PyAnnoteProcessor:()=>N});var g=r("./src/base/processing_utils.js"),$=r("./src/models/pyannote/feature_extraction_pyannote.js");class N extends g.Processor{static feature_extractor_class=$.PyAnnoteFeatureExtractor;async _call(j){return await this.feature_extractor(j)}post_process_speaker_diarization(...j){return this.feature_extractor.post_process_speaker_diarization(...j)}get sampling_rate(){return this.feature_extractor.config.sampling_rate}}},"./src/models/qwen2_vl/image_processing_qwen2_vl.js":(ke,A,r)=>{r.r(A),r.d(A,{Qwen2VLImageProcessor:()=>N});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");class N extends g.ImageProcessor{async _call(j,...y){const{pixel_values:T,original_sizes:b,reshaped_input_sizes:x}=await super._call(j,...y);let v=T;const{temporal_patch_size:L,merge_size:K,patch_size:se}=this.config;v.dims[0]===1&&(v=(0,$.cat)(Array.from({length:L},()=>v),0));const oe=v.dims[0]/L,V=v.dims[1],U=Math.floor(v.dims[2]/se),H=Math.floor(v.dims[3]/se),I=v.view(oe,L,V,Math.floor(U/K),K,se,Math.floor(H/K),K,se).permute(0,3,6,4,7,2,1,5,8).view(oe*U*H,V*L*se*se),S=new $.Tensor("int64",[oe,U,H],[1,3]);return{pixel_values:I,image_grid_thw:S,original_sizes:b,reshaped_input_sizes:x}}}},"./src/models/qwen2_vl/processing_qwen2_vl.js":(ke,A,r)=>{r.r(A),r.d(A,{Qwen2VLProcessor:()=>Z});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js"),N=r("./src/tokenizers.js");r("./src/utils/image.js");class Z extends g.Processor{static image_processor_class=$.AutoImageProcessor;static tokenizer_class=N.AutoTokenizer;async _call(y,T=null,...b){Array.isArray(y)||(y=[y]);let x,v;if(T&&(x=await this.image_processor(T),v=x.image_grid_thw),v){let K=this.image_processor.config.merge_size**2,se=0;const oe=v.tolist();y=y.map(V=>{for(;V.includes("<|image_pad|>");){const U=Number(oe[se++].reduce((H,I)=>H*I,1n));V=V.replace("<|image_pad|>","<|placeholder|>".repeat(Math.floor(U/K)))}return V.replaceAll("<|placeholder|>","<|image_pad|>")})}return{...this.tokenizer(y),...x}}}},"./src/models/rt_detr/image_processing_rt_detr.js":(ke,A,r)=>{r.r(A),r.d(A,{RTDetrImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_object_detection(...Z){return(0,g.post_process_object_detection)(...Z)}}},"./src/models/sam/image_processing_sam.js":(ke,A,r)=>{r.r(A),r.d(A,{SamImageProcessor:()=>Z});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/core.js"),N=r("./src/utils/tensor.js");class Z extends g.ImageProcessor{reshape_input_points(y,T,b,x=!1){y=structuredClone(y);let v=(0,$.calculateDimensions)(y);if(v.length===3)x||(v=[1,...v]),y=[y];else if(v.length!==4)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");for(let L=0;Lx!==T.dims[v]))throw Error(`The first ${b.length} dimensions of 'input_points' and 'input_labels' must be the same.`);return new N.Tensor("int64",y.flat(1/0).map(BigInt),b)}async _call(y,{input_points:T=null,input_labels:b=null,input_boxes:x=null}={}){const v=await super._call(y);if(T&&(v.input_points=this.reshape_input_points(T,v.original_sizes,v.reshaped_input_sizes)),b){if(!v.input_points)throw Error("`input_points` must be provided if `input_labels` are provided.");v.input_labels=this.add_input_labels(b,v.input_points)}return x&&(v.input_boxes=this.reshape_input_points(x,v.original_sizes,v.reshaped_input_sizes,!0)),v}async post_process_masks(y,T,b,{mask_threshold:x=0,binarize:v=!0,pad_size:L=null}={}){const K=[];L=L??this.pad_size;const se=[L.height,L.width];for(let oe=0;oex&&(S[w]=1);H=new N.Tensor("bool",S,H.dims)}K.push(H)}return K}generate_crop_boxes(y,T,{crop_n_layers:b=0,overlap_ratio:x=512/1500,points_per_crop:v=32,crop_n_points_downscale_factor:L=1}={}){}}},"./src/models/sam/processing_sam.js":(ke,A,r)=>{r.r(A),r.d(A,{SamProcessor:()=>N});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/image_processing_auto.js");class N extends g.Processor{static image_processor_class=$.AutoImageProcessor;async _call(...j){return await this.image_processor(...j)}post_process_masks(...j){return this.image_processor.post_process_masks(...j)}reshape_input_points(...j){return this.image_processor.reshape_input_points(...j)}}},"./src/models/seamless_m4t/feature_extraction_seamless_m4t.js":(ke,A,r)=>{r.r(A),r.d(A,{SeamlessM4TFeatureExtractor:()=>Z});var g=r("./src/base/feature_extraction_utils.js"),$=r("./src/utils/tensor.js"),N=r("./src/utils/audio.js");class Z extends g.FeatureExtractor{constructor(y){super(y);const T=this.config.sampling_rate,b=(0,N.mel_filter_bank)(256,this.config.num_mel_bins,20,Math.floor(T/2),T,null,"kaldi",!0);for(let x=0;xb*32768),(0,N.spectrogram)(y,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,max_num_frames:T,transpose:!0})}async _call(y,{padding:T=!0,pad_to_multiple_of:b=2,do_normalize_per_mel_bins:x=!0,return_attention_mask:v=!0}={}){(0,g.validate_audio_inputs)(y,"SeamlessM4TFeatureExtractor");let L=await this._extract_fbank_features(y,this.config.max_length);if(x){const[S,w]=L.dims,P=L.data;for(let F=0;F0){const ae=new Float32Array(w*(S+F));ae.set(P),ae.fill(this.config.padding_value,P.length);const ie=S+F;L=new $.Tensor(L.type,ae,[ie,w]),v&&(K=new $.Tensor("int64",new BigInt64Array(ie),[1,ie]),K.data.fill(1n,0,S))}}const[se,oe]=L.dims,V=this.config.stride;if(se%V!==0)throw new Error(`The number of frames (${se}) must be a multiple of the stride (${V}).`);const H=L.view(1,Math.floor(se/V),oe*V),I={input_features:H};if(v){const S=H.dims[1],w=new BigInt64Array(S);if(K){const P=K.data;for(let F=1,ae=0;F{r.r(A),r.d(A,{SegformerFeatureExtractor:()=>N,SegformerImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_semantic_segmentation(...j){return(0,g.post_process_semantic_segmentation)(...j)}}class N extends ${}},"./src/models/siglip/image_processing_siglip.js":(ke,A,r)=>{r.r(A),r.d(A,{SiglipImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}},"./src/models/speecht5/feature_extraction_speecht5.js":(ke,A,r)=>{r.r(A),r.d(A,{SpeechT5FeatureExtractor:()=>$});var g=r("./src/base/feature_extraction_utils.js");class $ extends g.FeatureExtractor{}},"./src/models/speecht5/processing_speecht5.js":(ke,A,r)=>{r.r(A),r.d(A,{SpeechT5Processor:()=>Z});var g=r("./src/base/processing_utils.js"),$=r("./src/tokenizers.js"),N=r("./src/models/auto/feature_extraction_auto.js");class Z extends g.Processor{static tokenizer_class=$.AutoTokenizer;static feature_extractor_class=N.AutoFeatureExtractor;async _call(y){return await this.feature_extractor(y)}}},"./src/models/swin2sr/image_processing_swin2sr.js":(ke,A,r)=>{r.r(A),r.d(A,{Swin2SRImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{pad_image(Z,j,y,T={}){const[b,x,v]=j;return super.pad_image(Z,j,{width:x+(y-x%y)%y,height:b+(y-b%y)%y},{mode:"symmetric",center:!1,constant_values:-1,...T})}}},"./src/models/vit/image_processing_vit.js":(ke,A,r)=>{r.r(A),r.d(A,{ViTFeatureExtractor:()=>N,ViTImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{}class N extends ${}},"./src/models/vitmatte/image_processing_vitmatte.js":(ke,A,r)=>{r.r(A),r.d(A,{VitMatteImageProcessor:()=>N});var g=r("./src/base/image_processors_utils.js"),$=r("./src/utils/tensor.js");class N extends g.ImageProcessor{async _call(j,y){Array.isArray(j)||(j=[j]),Array.isArray(y)||(y=[y]);const T=await Promise.all(j.map(v=>this.preprocess(v))),b=await Promise.all(y.map(v=>this.preprocess(v,{do_normalize:!1,do_convert_rgb:!1,do_convert_grayscale:!0})));return{pixel_values:(0,$.stack)(T.map((v,L)=>(0,$.cat)([v.pixel_values,b[L].pixel_values],0)),0),original_sizes:T.map(v=>v.original_size),reshaped_input_sizes:T.map(v=>v.reshaped_input_size)}}}},"./src/models/vitpose/image_processing_vitpose.js":(ke,A,r)=>{r.r(A),r.d(A,{VitPoseImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_pose_estimation(Z,j,{threshold:y=null}={}){const T=Z.tolist(),[b,x,v,L]=Z.dims,K=[];for(let se=0;se{r.r(A),r.d(A,{Wav2Vec2FeatureExtractor:()=>N});var g=r("./src/base/feature_extraction_utils.js"),$=r("./src/utils/tensor.js");class N extends g.FeatureExtractor{_zero_mean_unit_var_norm(j){const T=j.reduce((x,v)=>x+v,0)/j.length,b=j.reduce((x,v)=>x+(v-T)**2,0)/j.length;return j.map(x=>(x-T)/Math.sqrt(b+1e-7))}async _call(j){(0,g.validate_audio_inputs)(j,"Wav2Vec2FeatureExtractor"),j instanceof Float64Array&&(j=new Float32Array(j));let y=j;this.config.do_normalize&&(y=this._zero_mean_unit_var_norm(y));const T=[1,y.length];return{input_values:new $.Tensor("float32",y,T),attention_mask:new $.Tensor("int64",new BigInt64Array(y.length).fill(1n),T)}}}},"./src/models/wav2vec2/processing_wav2vec2.js":(ke,A,r)=>{r.r(A),r.d(A,{Wav2Vec2ProcessorWithLM:()=>N});var g=r("./src/base/processing_utils.js"),$=r("./src/models/auto/feature_extraction_auto.js");class N extends g.Processor{static feature_extractor_class=$.AutoFeatureExtractor;async _call(j){return await this.feature_extractor(j)}}},"./src/models/wespeaker/feature_extraction_wespeaker.js":(ke,A,r)=>{r.r(A),r.d(A,{WeSpeakerFeatureExtractor:()=>N});var g=r("./src/base/feature_extraction_utils.js");r("./src/utils/tensor.js");var $=r("./src/utils/audio.js");class N extends g.FeatureExtractor{constructor(j){super(j);const y=this.config.sampling_rate,T=(0,$.mel_filter_bank)(256,this.config.num_mel_bins,20,Math.floor(y/2),y,null,"kaldi",!0);for(let b=0;by*32768),(0,$.spectrogram)(j,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,transpose:!0,min_num_frames:this.min_num_frames})}async _call(j){(0,g.validate_audio_inputs)(j,"WeSpeakerFeatureExtractor");const y=(await this._extract_fbank_features(j)).unsqueeze_(0);if(this.config.fbank_centering_span===null){const T=y.mean(1).data,b=y.data,[x,v,L]=y.dims;for(let K=0;K{r.r(A),r.d(A,{WHISPER_LANGUAGE_MAPPING:()=>$,WHISPER_TO_LANGUAGE_CODE_MAPPING:()=>N,whisper_language_to_code:()=>Z});const g=[["en","english"],["zh","chinese"],["de","german"],["es","spanish"],["ru","russian"],["ko","korean"],["fr","french"],["ja","japanese"],["pt","portuguese"],["tr","turkish"],["pl","polish"],["ca","catalan"],["nl","dutch"],["ar","arabic"],["sv","swedish"],["it","italian"],["id","indonesian"],["hi","hindi"],["fi","finnish"],["vi","vietnamese"],["he","hebrew"],["uk","ukrainian"],["el","greek"],["ms","malay"],["cs","czech"],["ro","romanian"],["da","danish"],["hu","hungarian"],["ta","tamil"],["no","norwegian"],["th","thai"],["ur","urdu"],["hr","croatian"],["bg","bulgarian"],["lt","lithuanian"],["la","latin"],["mi","maori"],["ml","malayalam"],["cy","welsh"],["sk","slovak"],["te","telugu"],["fa","persian"],["lv","latvian"],["bn","bengali"],["sr","serbian"],["az","azerbaijani"],["sl","slovenian"],["kn","kannada"],["et","estonian"],["mk","macedonian"],["br","breton"],["eu","basque"],["is","icelandic"],["hy","armenian"],["ne","nepali"],["mn","mongolian"],["bs","bosnian"],["kk","kazakh"],["sq","albanian"],["sw","swahili"],["gl","galician"],["mr","marathi"],["pa","punjabi"],["si","sinhala"],["km","khmer"],["sn","shona"],["yo","yoruba"],["so","somali"],["af","afrikaans"],["oc","occitan"],["ka","georgian"],["be","belarusian"],["tg","tajik"],["sd","sindhi"],["gu","gujarati"],["am","amharic"],["yi","yiddish"],["lo","lao"],["uz","uzbek"],["fo","faroese"],["ht","haitian creole"],["ps","pashto"],["tk","turkmen"],["nn","nynorsk"],["mt","maltese"],["sa","sanskrit"],["lb","luxembourgish"],["my","myanmar"],["bo","tibetan"],["tl","tagalog"],["mg","malagasy"],["as","assamese"],["tt","tatar"],["haw","hawaiian"],["ln","lingala"],["ha","hausa"],["ba","bashkir"],["jw","javanese"],["su","sundanese"]],$=new Map(g),N=new Map([...g.map(([j,y])=>[y,j]),["burmese","my"],["valencian","ca"],["flemish","nl"],["haitian","ht"],["letzeburgesch","lb"],["pushto","ps"],["panjabi","pa"],["moldavian","ro"],["moldovan","ro"],["sinhalese","si"],["castilian","es"]]);function Z(j){j=j.toLowerCase();let y=N.get(j);if(y===void 0)if($.has(j))y=j;else{const b=j.length===2?$.keys():$.values();throw new Error(`Language "${j}" is not supported. Must be one of: ${JSON.stringify(b)}`)}return y}},"./src/models/whisper/feature_extraction_whisper.js":(ke,A,r)=>{r.r(A),r.d(A,{WhisperFeatureExtractor:()=>Z});var g=r("./src/base/feature_extraction_utils.js");r("./src/utils/tensor.js");var $=r("./src/utils/audio.js"),N=r("./src/utils/maths.js");class Z extends g.FeatureExtractor{constructor(y){super(y),this.config.mel_filters??=(0,$.mel_filter_bank)(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,8e3,this.config.sampling_rate,"slaney","slaney"),this.window=(0,$.window_function)(this.config.n_fft,"hann")}async _extract_fbank_features(y){const T=await(0,$.spectrogram)(y,this.window,this.config.n_fft,this.config.hop_length,{power:2,mel_filters:this.config.mel_filters,log_mel:"log10",max_num_frames:this.config.nb_max_frames}),b=T.data,x=(0,N.max)(b)[0];for(let v=0;vthis.config.n_samples?(console.warn("Attempting to extract features for audio longer than 30 seconds. If using a pipeline to extract transcript from a long audio clip, remember to specify `chunk_length_s` and/or `stride_length_s`."),T=y.slice(0,this.config.n_samples)):(T=new Float32Array(this.config.n_samples),T.set(y)),{input_features:(await this._extract_fbank_features(T)).unsqueeze_(0)}}}},"./src/models/whisper/generation_whisper.js":(ke,A,r)=>{r.r(A),r.d(A,{WhisperGenerationConfig:()=>$});var g=r("./src/generation/configuration_utils.js");class $ extends g.GenerationConfig{return_timestamps=null;return_token_timestamps=null;num_frames=null;alignment_heads=null;task=null;language=null;no_timestamps_token_id=null;prompt_ids=null;is_multilingual=null;lang_to_id=null;task_to_id=null;max_initial_timestamp_index=1}},"./src/models/whisper/processing_whisper.js":(ke,A,r)=>{r.r(A),r.d(A,{WhisperProcessor:()=>Z});var g=r("./src/models/auto/feature_extraction_auto.js"),$=r("./src/tokenizers.js"),N=r("./src/base/processing_utils.js");class Z extends N.Processor{static tokenizer_class=$.AutoTokenizer;static feature_extractor_class=g.AutoFeatureExtractor;async _call(y){return await this.feature_extractor(y)}}},"./src/models/yolos/image_processing_yolos.js":(ke,A,r)=>{r.r(A),r.d(A,{YolosFeatureExtractor:()=>N,YolosImageProcessor:()=>$});var g=r("./src/base/image_processors_utils.js");class $ extends g.ImageProcessor{post_process_object_detection(...j){return(0,g.post_process_object_detection)(...j)}}class N extends ${}},"./src/ops/registry.js":(ke,A,r)=>{r.r(A),r.d(A,{TensorOpRegistry:()=>Z});var g=r("./src/backends/onnx.js"),$=r("./src/utils/tensor.js");const N=async(j,y,T)=>{const b=await(0,g.createInferenceSession)(new Uint8Array(j),y);return async x=>{const v=(0,g.isONNXProxy)(),L=Object.fromEntries(Object.entries(x).map(([se,oe])=>[se,(v?oe.clone():oe).ort_tensor])),K=await b.run(L);return Array.isArray(T)?T.map(se=>new $.Tensor(K[se])):new $.Tensor(K[T])}};class Z{static session_options={};static get nearest_interpolate_4d(){return this._nearest_interpolate_4d||(this._nearest_interpolate_4d=N([8,10,18,0,58,129,1,10,41,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,18,10,4,109,111,100,101,34,7,110,101,97,114,101,115,116,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,21],this.session_options,"y")),this._nearest_interpolate_4d}static get bilinear_interpolate_4d(){return this._bilinear_interpolate_4d||(this._bilinear_interpolate_4d=N([8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bilinear_interpolate_4d}static get bicubic_interpolate_4d(){return this._bicubic_interpolate_4d||(this._bicubic_interpolate_4d=N([8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bicubic_interpolate_4d}static get matmul(){return this._matmul||(this._matmul=N([8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20],this.session_options,"c")),this._matmul}static get stft(){return this._stft||(this._stft=N([8,7,18,0,58,148,1,10,38,10,1,115,10,1,106,10,1,119,10,1,108,18,1,111,34,4,83,84,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,115,90,26,10,1,115,18,21,10,19,8,1,18,15,10,3,18,1,98,10,3,18,1,115,10,3,18,1,99,90,11,10,1,106,18,6,10,4,8,7,18,0,90,16,10,1,119,18,11,10,9,8,1,18,5,10,3,18,1,119,90,11,10,1,108,18,6,10,4,8,7,18,0,98,31,10,1,111,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,102,10,3,18,1,100,10,3,18,1,99,66,2,16,17],this.session_options,"o")),this._stft}static get rfft(){return this._rfft||(this._rfft=N([8,9,18,0,58,97,10,33,10,1,120,10,0,10,1,97,18,1,121,34,3,68,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,100,90,21,10,1,120,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,90,11,10,1,97,18,6,10,4,8,7,18,0,98,21,10,1,121,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,66,2,16,20],this.session_options,"y")),this._rfft}static get top_k(){return this._top_k||(this._top_k=N([8,10,18,0,58,73,10,18,10,1,120,10,1,107,18,1,118,18,1,105,34,4,84,111,112,75,18,1,116,90,9,10,1,120,18,4,10,2,8,1,90,15,10,1,107,18,10,10,8,8,7,18,4,10,2,8,1,98,9,10,1,118,18,4,10,2,8,1,98,9,10,1,105,18,4,10,2,8,7,66,2,16,21],this.session_options,["v","i"])),this._top_k}static get slice(){return this._slice||(this._slice=N([8,7,18,0,58,96,10,25,10,1,120,10,1,115,10,1,101,10,1,97,10,1,116,18,1,121,34,5,83,108,105,99,101,18,1,114,90,9,10,1,120,18,4,10,2,8,1,90,9,10,1,115,18,4,10,2,8,7,90,9,10,1,101,18,4,10,2,8,7,90,9,10,1,97,18,4,10,2,8,7,90,9,10,1,116,18,4,10,2,8,7,98,9,10,1,121,18,4,10,2,8,1,66,2,16,13],this.session_options,"y")),this._slice}}},"./src/pipelines.js":(ke,A,r)=>{r.r(A),r.d(A,{AudioClassificationPipeline:()=>ge,AutomaticSpeechRecognitionPipeline:()=>Me,DepthEstimationPipeline:()=>Ee,DocumentQuestionAnsweringPipeline:()=>_e,FeatureExtractionPipeline:()=>ie,FillMaskPipeline:()=>H,ImageClassificationPipeline:()=>Ce,ImageFeatureExtractionPipeline:()=>ye,ImageSegmentationPipeline:()=>Ae,ImageToImagePipeline:()=>de,ImageToTextPipeline:()=>pe,ObjectDetectionPipeline:()=>Je,Pipeline:()=>se,QuestionAnsweringPipeline:()=>U,SummarizationPipeline:()=>S,Text2TextGenerationPipeline:()=>I,TextClassificationPipeline:()=>oe,TextGenerationPipeline:()=>F,TextToAudioPipeline:()=>X,TokenClassificationPipeline:()=>V,TranslationPipeline:()=>w,ZeroShotAudioClassificationPipeline:()=>re,ZeroShotClassificationPipeline:()=>ae,ZeroShotImageClassificationPipeline:()=>Pe,ZeroShotObjectDetectionPipeline:()=>je,pipeline:()=>ee});var g=r("./src/tokenizers.js"),$=r("./src/models.js"),N=r("./src/models/auto/processing_auto.js");r("./src/base/processing_utils.js");var Z=r("./src/utils/generic.js"),j=r("./src/utils/core.js"),y=r("./src/utils/maths.js"),T=r("./src/utils/audio.js"),b=r("./src/utils/tensor.js"),x=r("./src/utils/image.js");async function v(Re){return Array.isArray(Re)||(Re=[Re]),await Promise.all(Re.map(te=>x.RawImage.read(te)))}async function L(Re,te){return Array.isArray(Re)||(Re=[Re]),await Promise.all(Re.map(ve=>typeof ve=="string"||ve instanceof URL?(0,T.read_audio)(ve,te):ve instanceof Float64Array?new Float32Array(ve):ve))}function K(Re,te){te&&(Re=Re.map(ze=>ze|0));const[ve,Ke,Ne,Ue]=Re;return{xmin:ve,ymin:Ke,xmax:Ne,ymax:Ue}}class se extends Z.Callable{constructor({task:te,model:ve,tokenizer:Ke=null,processor:Ne=null}){super(),this.task=te,this.model=ve,this.tokenizer=Ke,this.processor=Ne}async dispose(){await this.model.dispose()}}class oe extends se{constructor(te){super(te)}async _call(te,{top_k:ve=1}={}){const Ke=this.tokenizer(te,{padding:!0,truncation:!0}),Ne=await this.model(Ke),Ue=this.model.config.problem_type==="multi_label_classification"?at=>at.sigmoid():at=>new b.Tensor("float32",(0,y.softmax)(at.data),at.dims),ze=this.model.config.id2label,Ze=[];for(const at of Ne.logits){const mt=Ue(at),lt=await(0,b.topk)(mt,ve),ct=lt[0].tolist(),le=lt[1].tolist().map((Q,we)=>({label:ze?ze[Q]:`LABEL_${Q}`,score:ct[we]}));ve===1?Ze.push(...le):Ze.push(le)}return Array.isArray(te)||ve===1?Ze:Ze[0]}}class V extends se{constructor(te){super(te)}async _call(te,{ignore_labels:ve=["O"]}={}){const Ke=Array.isArray(te),Ne=this.tokenizer(Ke?te:[te],{padding:!0,truncation:!0}),ze=(await this.model(Ne)).logits,Ze=this.model.config.id2label,at=[];for(let mt=0;mttt==this.tokenizer.sep_token_id);at[ct].map((tt,st)=>tt==1&&(st===0||st>le&&mt.findIndex(ft=>ft==O[st])===-1));const Q=Ue[ct].tolist(),we=ze[ct].tolist();for(let tt=1;ttst==O[tt])!==-1)&&(Q[tt]=-1/0,we[tt]=-1/0);const Se=(0,y.softmax)(Q).map((tt,st)=>[tt,st]),We=(0,y.softmax)(we).map((tt,st)=>[tt,st]);Se[0][0]=0,We[0][0]=0;const qe=(0,j.product)(Se,We).filter(tt=>tt[0][1]<=tt[1][1]).map(tt=>[tt[0][1],tt[1][1],tt[0][0]*tt[1][0]]).sort((tt,st)=>st[2]-tt[2]);for(let tt=0;ttQ==this.tokenizer.mask_token_id);if(mt===-1)throw Error(`Mask token (${this.tokenizer.mask_token}) not found in text.`);const lt=Ne[Ze][mt],ct=await(0,b.topk)(new b.Tensor("float32",(0,y.softmax)(lt.data),lt.dims),ve),O=ct[0].tolist(),le=ct[1].tolist();Ue.push(le.map((Q,we)=>{const Se=at.slice();return Se[mt]=Q,{score:O[we],token:Number(Q),token_str:this.tokenizer.decode([Q]),sequence:this.tokenizer.decode(Se,{skip_special_tokens:!0})}}))}return Array.isArray(te)?Ue:Ue[0]}}class I extends se{_key="generated_text";constructor(te){super(te)}async _call(te,ve={}){Array.isArray(te)||(te=[te]),this.model.config.prefix&&(te=te.map(at=>this.model.config.prefix+at));const Ke=this.model.config.task_specific_params;Ke&&Ke[this.task]&&Ke[this.task].prefix&&(te=te.map(at=>Ke[this.task].prefix+at));const Ne=this.tokenizer,Ue={padding:!0,truncation:!0};let ze;this instanceof w&&"_build_translation_inputs"in Ne?ze=Ne._build_translation_inputs(te,Ue,ve):ze=Ne(te,Ue);const Ze=await this.model.generate({...ze,...ve});return Ne.batch_decode(Ze,{skip_special_tokens:!0}).map(at=>({[this._key]:at}))}}class S extends I{_key="summary_text";constructor(te){super(te)}}class w extends I{_key="translation_text";constructor(te){super(te)}}function P(Re){return Array.isArray(Re)&&Re.every(te=>"role"in te&&"content"in te)}class F extends se{constructor(te){super(te)}async _call(te,ve={}){let Ke=!1,Ne=!1,Ue;if(typeof te=="string")Ue=te=[te];else if(Array.isArray(te)&&te.every(le=>typeof le=="string"))Ke=!0,Ue=te;else{if(P(te))te=[te];else if(Array.isArray(te)&&te.every(P))Ke=!0;else throw new Error("Input must be a string, an array of strings, a Chat, or an array of Chats");Ne=!0,Ue=te.map(le=>this.tokenizer.apply_chat_template(le,{tokenize:!1,add_generation_prompt:!0}))}const ze=ve.add_special_tokens??!1,Ze=Ne?!1:ve.return_full_text??!0;this.tokenizer.padding_side="left";const at=this.tokenizer(Ue,{add_special_tokens:ze,padding:!0,truncation:!0}),mt=await this.model.generate({...at,...ve}),lt=this.tokenizer.batch_decode(mt,{skip_special_tokens:!0});let ct;!Ze&&at.input_ids.dims.at(-1)>0&&(ct=this.tokenizer.batch_decode(at.input_ids,{skip_special_tokens:!0}).map(le=>le.length));const O=Array.from({length:te.length},le=>[]);for(let le=0;le[ve.toLowerCase(),Ke])),this.entailment_id=this.label2id.entailment,this.entailment_id===void 0&&(console.warn("Could not find 'entailment' in label2id mapping. Using 2 as entailment_id."),this.entailment_id=2),this.contradiction_id=this.label2id.contradiction??this.label2id.not_entailment,this.contradiction_id===void 0&&(console.warn("Could not find 'contradiction' in label2id mapping. Using 0 as contradiction_id."),this.contradiction_id=0)}async _call(te,ve,{hypothesis_template:Ke="This example is {}.",multi_label:Ne=!1}={}){const Ue=Array.isArray(te);Ue||(te=[te]),Array.isArray(ve)||(ve=[ve]);const ze=ve.map(mt=>Ke.replace("{}",mt)),Ze=Ne||ve.length===1,at=[];for(const mt of te){const lt=[];for(const le of ze){const Q=this.tokenizer(mt,{text_pair:le,padding:!0,truncation:!0}),we=await this.model(Q);Ze?lt.push([we.logits.data[this.contradiction_id],we.logits.data[this.entailment_id]]):lt.push(we.logits.data[this.entailment_id])}const O=(Ze?lt.map(le=>(0,y.softmax)(le)[1]):(0,y.softmax)(lt)).map((le,Q)=>[le,Q]).sort((le,Q)=>Q[0]-le[0]);at.push({sequence:mt,labels:O.map(le=>ve[le[1]]),scores:O.map(le=>le[0])})}return Ue?at:at[0]}}class ie extends se{constructor(te){super(te)}async _call(te,{pooling:ve="none",normalize:Ke=!1,quantize:Ne=!1,precision:Ue="binary"}={}){const ze=this.tokenizer(te,{padding:!0,truncation:!0}),Ze=await this.model(ze);let at=Ze.last_hidden_state??Ze.logits??Ze.token_embeddings;if(ve!=="none")if(ve==="mean")at=(0,b.mean_pooling)(at,ze.attention_mask);else if(ve==="cls")at=at.slice(null,0);else throw Error(`Pooling method '${ve}' not supported.`);return Ke&&(at=at.normalize(2,-1)),Ne&&(at=(0,b.quantize_embeddings)(at,Ue)),at}}class ye extends se{constructor(te){super(te)}async _call(te,{pool:ve=null}={}){const Ke=await v(te),{pixel_values:Ne}=await this.processor(Ke),Ue=await this.model({pixel_values:Ne});let ze;if(ve){if(!("pooler_output"in Ue))throw Error("No pooled output was returned. Make sure the model has a 'pooler' layer when using the 'pool' option.");ze=Ue.pooler_output}else ze=Ue.last_hidden_state??Ue.logits??Ue.image_embeds;return ze}}class ge extends se{constructor(te){super(te)}async _call(te,{top_k:ve=5}={}){const Ke=this.processor.feature_extractor.config.sampling_rate,Ne=await L(te,Ke),Ue=this.model.config.id2label,ze=[];for(const Ze of Ne){const at=await this.processor(Ze),lt=(await this.model(at)).logits[0],ct=await(0,b.topk)(new b.Tensor("float32",(0,y.softmax)(lt.data),lt.dims),ve),O=ct[0].tolist(),Q=ct[1].tolist().map((we,Se)=>({label:Ue?Ue[we]:`LABEL_${we}`,score:O[Se]}));ze.push(Q)}return Array.isArray(te)?ze:ze[0]}}class re extends se{constructor(te){super(te)}async _call(te,ve,{hypothesis_template:Ke="This is a sound of {}."}={}){const Ne=!Array.isArray(te);Ne&&(te=[te]);const Ue=ve.map(lt=>Ke.replace("{}",lt)),ze=this.tokenizer(Ue,{padding:!0,truncation:!0}),Ze=this.processor.feature_extractor.config.sampling_rate,at=await L(te,Ze),mt=[];for(const lt of at){const ct=await this.processor(lt),O=await this.model({...ze,...ct}),le=(0,y.softmax)(O.logits_per_audio.data);mt.push([...le].map((Q,we)=>({score:Q,label:ve[we]})))}return Ne?mt[0]:mt}}class Me extends se{constructor(te){super(te)}async _call(te,ve={}){switch(this.model.config.model_type){case"whisper":return this._call_whisper(te,ve);case"wav2vec2":case"wav2vec2-bert":case"unispeech":case"unispeech-sat":case"hubert":return this._call_wav2vec2(te,ve);case"moonshine":return this._call_moonshine(te,ve);default:throw new Error(`AutomaticSpeechRecognitionPipeline does not support model type '${this.model.config.model_type}'.`)}}async _call_wav2vec2(te,ve){ve.language&&console.warn('`language` parameter is not yet supported for `wav2vec2` models, defaulting to "English".'),ve.task&&console.warn('`task` parameter is not yet supported for `wav2vec2` models, defaulting to "transcribe".');const Ke=!Array.isArray(te);Ke&&(te=[te]);const Ne=this.processor.feature_extractor.config.sampling_rate,Ue=await L(te,Ne),ze=[];for(const Ze of Ue){const at=await this.processor(Ze),lt=(await this.model(at)).logits[0],ct=[];for(const le of lt)ct.push((0,y.max)(le.data)[1]);const O=this.tokenizer.decode(ct);ze.push({text:O})}return Ke?ze[0]:ze}async _call_whisper(te,ve){const Ke=ve.return_timestamps??!1,Ne=ve.chunk_length_s??0,Ue=ve.force_full_sequences??!1;let ze=ve.stride_length_s??null;const Ze={...ve};Ke==="word"&&(Ze.return_token_timestamps=!0,Ze.return_timestamps=!1);const at=!Array.isArray(te);at&&(te=[te]);const mt=this.processor.feature_extractor.config.chunk_length/this.model.config.max_source_positions,lt=this.processor.feature_extractor.config.hop_length,ct=this.processor.feature_extractor.config.sampling_rate,O=await L(te,ct),le=[];for(const Q of O){let we=[];if(Ne>0){if(ze===null)ze=Ne/6;else if(Ne<=ze)throw Error("`chunk_length_s` must be larger than `stride_length_s`.");const qe=ct*Ne,tt=ct*ze,st=qe-2*tt;let ft=0;for(;;){const Nt=ft+qe,ss=Q.subarray(ft,Nt),Ts=await this.processor(ss),ms=ft===0,Ps=Nt>=Q.length;if(we.push({stride:[ss.length,ms?0:tt,Ps?0:tt],input_features:Ts.input_features,is_last:Ps}),Ps)break;ft+=st}}else we=[{stride:[Q.length,0,0],input_features:(await this.processor(Q)).input_features,is_last:!0}];for(const qe of we){Ze.num_frames=Math.floor(qe.stride[0]/lt);const tt=await this.model.generate({inputs:qe.input_features,...Ze});Ke==="word"?(qe.tokens=tt.sequences.tolist()[0],qe.token_timestamps=tt.token_timestamps.tolist()[0].map(st=>(0,y.round)(st,2))):qe.tokens=tt[0].tolist(),qe.stride=qe.stride.map(st=>st/ct)}const[Se,We]=this.tokenizer._decode_asr(we,{time_precision:mt,return_timestamps:Ke,force_full_sequences:Ue});le.push({text:Se,...We})}return at?le[0]:le}async _call_moonshine(te,ve){const Ke=!Array.isArray(te);Ke&&(te=[te]);const Ne=this.processor.feature_extractor.config.sampling_rate,Ue=await L(te,Ne),ze=[];for(const Ze of Ue){const at=await this.processor(Ze),mt=Math.floor(Ze.length/Ne)*6,lt=await this.model.generate({max_new_tokens:mt,...ve,...at}),ct=this.processor.batch_decode(lt,{skip_special_tokens:!0})[0];ze.push({text:ct})}return Ke?ze[0]:ze}}class pe extends se{constructor(te){super(te)}async _call(te,ve={}){const Ke=Array.isArray(te),Ne=await v(te),{pixel_values:Ue}=await this.processor(Ne),ze=[];for(const Ze of Ue){Ze.dims=[1,...Ze.dims];const at=await this.model.generate({inputs:Ze,...ve}),mt=this.tokenizer.batch_decode(at,{skip_special_tokens:!0}).map(lt=>({generated_text:lt.trim()}));ze.push(mt)}return Ke?ze:ze[0]}}class Ce extends se{constructor(te){super(te)}async _call(te,{top_k:ve=5}={}){const Ke=await v(te),{pixel_values:Ne}=await this.processor(Ke),Ue=await this.model({pixel_values:Ne}),ze=this.model.config.id2label,Ze=[];for(const at of Ue.logits){const mt=await(0,b.topk)(new b.Tensor("float32",(0,y.softmax)(at.data),at.dims),ve),lt=mt[0].tolist(),O=mt[1].tolist().map((le,Q)=>({label:ze?ze[le]:`LABEL_${le}`,score:lt[Q]}));Ze.push(O)}return Array.isArray(te)?Ze:Ze[0]}}class Ae extends se{constructor(te){super(te),this.subtasks_mapping={panoptic:"post_process_panoptic_segmentation",instance:"post_process_instance_segmentation",semantic:"post_process_semantic_segmentation"}}async _call(te,{threshold:ve=.5,mask_threshold:Ke=.5,overlap_mask_area_threshold:Ne=.8,label_ids_to_fuse:Ue=null,target_sizes:ze=null,subtask:Ze=null}={}){if(Array.isArray(te)&&te.length!==1)throw Error("Image segmentation pipeline currently only supports a batch size of 1.");const mt=await v(te),lt=mt.map(We=>[We.height,We.width]),{pixel_values:ct,pixel_mask:O}=await this.processor(mt),le=await this.model({pixel_values:ct,pixel_mask:O});let Q=null;if(Ze!==null)Q=this.subtasks_mapping[Ze];else for(let[We,qe]of Object.entries(this.subtasks_mapping))if(qe in this.processor.image_processor){Q=this.processor.image_processor[qe].bind(this.processor.image_processor),Ze=We;break}const we=this.model.config.id2label,Se=[];if(Ze==="panoptic"||Ze==="instance"){const We=Q(le,ve,Ke,Ne,Ue,ze??lt)[0],qe=We.segmentation;for(const tt of We.segments_info){const st=new Uint8ClampedArray(qe.data.length);for(let Nt=0;NtKe.replace("{}",O)),Ze=this.tokenizer(ze,{padding:this.model.config.model_type==="siglip"?"max_length":!0,truncation:!0}),{pixel_values:at}=await this.processor(Ue),mt=await this.model({...Ze,pixel_values:at}),lt=this.model.config.model_type==="siglip"?O=>O.sigmoid().data:O=>(0,y.softmax)(O.data),ct=[];for(const O of mt.logits_per_image){const Q=[...lt(O)].map((we,Se)=>({score:we,label:ve[Se]}));Q.sort((we,Se)=>Se.score-we.score),ct.push(Q)}return Ne?ct:ct[0]}}class Je extends se{constructor(te){super(te)}async _call(te,{threshold:ve=.9,percentage:Ke=!1}={}){const Ne=Array.isArray(te);if(Ne&&te.length!==1)throw Error("Object detection pipeline currently only supports a batch size of 1.");const Ue=await v(te),ze=Ke?null:Ue.map(le=>[le.height,le.width]),{pixel_values:Ze,pixel_mask:at}=await this.processor(Ue),mt=await this.model({pixel_values:Ze,pixel_mask:at}),lt=this.processor.image_processor.post_process_object_detection(mt,ve,ze),ct=this.model.config.id2label,O=lt.map(le=>le.boxes.map((Q,we)=>({score:le.scores[we],label:ct[le.classes[we]],box:K(Q,!Ke)})));return Ne?O:O[0]}}class je extends se{constructor(te){super(te)}async _call(te,ve,{threshold:Ke=.1,top_k:Ne=null,percentage:Ue=!1}={}){const ze=Array.isArray(te),Ze=await v(te),at=this.tokenizer(ve,{padding:!0,truncation:!0}),mt=await this.processor(Ze),lt=[];for(let ct=0;ct({score:We.scores[tt],label:We.labels[tt],box:K(qe,!Ue)}))}else{const We=this.processor.image_processor.post_process_object_detection(we,Ke,le,!0)[0];Se=We.boxes.map((qe,tt)=>({score:We.scores[tt],label:ve[We.classes[tt]],box:K(qe,!Ue)}))}Se.sort((We,qe)=>qe.score-We.score),Ne!==null&&(Se=Se.slice(0,Ne)),lt.push(Se)}return ze?lt:lt[0]}}class _e extends se{constructor(te){super(te)}async _call(te,ve,Ke={}){const Ne=(await v(te))[0],{pixel_values:Ue}=await this.processor(Ne),ze=`${ve}`,Ze=this.tokenizer(ze,{add_special_tokens:!1,padding:!0,truncation:!0}).input_ids,at=await this.model.generate({inputs:Ue,max_length:this.model.config.decoder.max_position_embeddings,decoder_input_ids:Ze,...Ke}),lt=this.tokenizer.batch_decode(at)[0].match(/(.*?)<\/s_answer>/);let ct=null;return lt&<.length>=2&&(ct=lt[1].trim()),[{answer:ct}]}}class X extends se{DEFAULT_VOCODER_ID="Xenova/speecht5_hifigan";constructor(te){super(te),this.vocoder=te.vocoder??null}async _call(te,{speaker_embeddings:ve=null}={}){return this.processor?this._call_text_to_spectrogram(te,{speaker_embeddings:ve}):this._call_text_to_waveform(te)}async _call_text_to_waveform(te){const ve=this.tokenizer(te,{padding:!0,truncation:!0}),{waveform:Ke}=await this.model(ve),Ne=this.model.config.sampling_rate;return new T.RawAudio(Ke.data,Ne)}async _call_text_to_spectrogram(te,{speaker_embeddings:ve}){if(this.vocoder||(console.log("No vocoder specified, using default HifiGan vocoder."),this.vocoder=await $.AutoModel.from_pretrained(this.DEFAULT_VOCODER_ID,{dtype:"fp32"})),(typeof ve=="string"||ve instanceof URL)&&(ve=new Float32Array(await(await fetch(ve)).arrayBuffer())),ve instanceof Float32Array)ve=new b.Tensor("float32",ve,[1,ve.length]);else if(!(ve instanceof b.Tensor))throw new Error("Speaker embeddings must be a `Tensor`, `Float32Array`, `string`, or `URL`.");const{input_ids:Ke}=this.tokenizer(te,{padding:!0,truncation:!0}),{waveform:Ne}=await this.model.generate_speech(Ke,ve,{vocoder:this.vocoder}),Ue=this.processor.feature_extractor.config.sampling_rate;return new T.RawAudio(Ne.data,Ue)}}class de extends se{constructor(te){super(te)}async _call(te){const ve=await v(te),Ke=await this.processor(ve),Ne=await this.model(Ke),Ue=[];for(const ze of Ne.reconstruction){const Ze=ze.squeeze().clamp_(0,1).mul_(255).round_().to("uint8");Ue.push(x.RawImage.fromTensor(Ze))}return Ue.length>1?Ue:Ue[0]}}class Ee extends se{constructor(te){super(te)}async _call(te){const ve=await v(te),Ke=await this.processor(ve),{predicted_depth:Ne}=await this.model(Ke),Ue=[];for(let ze=0;ze1?Ue:Ue[0]}}const Oe=Object.freeze({"text-classification":{tokenizer:g.AutoTokenizer,pipeline:oe,model:$.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-finetuned-sst-2-english"},type:"text"},"token-classification":{tokenizer:g.AutoTokenizer,pipeline:V,model:$.AutoModelForTokenClassification,default:{model:"Xenova/bert-base-multilingual-cased-ner-hrl"},type:"text"},"question-answering":{tokenizer:g.AutoTokenizer,pipeline:U,model:$.AutoModelForQuestionAnswering,default:{model:"Xenova/distilbert-base-cased-distilled-squad"},type:"text"},"fill-mask":{tokenizer:g.AutoTokenizer,pipeline:H,model:$.AutoModelForMaskedLM,default:{model:"Xenova/bert-base-uncased"},type:"text"},summarization:{tokenizer:g.AutoTokenizer,pipeline:S,model:$.AutoModelForSeq2SeqLM,default:{model:"Xenova/distilbart-cnn-6-6"},type:"text"},translation:{tokenizer:g.AutoTokenizer,pipeline:w,model:$.AutoModelForSeq2SeqLM,default:{model:"Xenova/t5-small"},type:"text"},"text2text-generation":{tokenizer:g.AutoTokenizer,pipeline:I,model:$.AutoModelForSeq2SeqLM,default:{model:"Xenova/flan-t5-small"},type:"text"},"text-generation":{tokenizer:g.AutoTokenizer,pipeline:F,model:$.AutoModelForCausalLM,default:{model:"Xenova/gpt2"},type:"text"},"zero-shot-classification":{tokenizer:g.AutoTokenizer,pipeline:ae,model:$.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-mnli"},type:"text"},"audio-classification":{pipeline:ge,model:$.AutoModelForAudioClassification,processor:N.AutoProcessor,default:{model:"Xenova/wav2vec2-base-superb-ks"},type:"audio"},"zero-shot-audio-classification":{tokenizer:g.AutoTokenizer,pipeline:re,model:$.AutoModel,processor:N.AutoProcessor,default:{model:"Xenova/clap-htsat-unfused"},type:"multimodal"},"automatic-speech-recognition":{tokenizer:g.AutoTokenizer,pipeline:Me,model:[$.AutoModelForSpeechSeq2Seq,$.AutoModelForCTC],processor:N.AutoProcessor,default:{model:"Xenova/whisper-tiny.en"},type:"multimodal"},"text-to-audio":{tokenizer:g.AutoTokenizer,pipeline:X,model:[$.AutoModelForTextToWaveform,$.AutoModelForTextToSpectrogram],processor:[N.AutoProcessor,null],default:{model:"Xenova/speecht5_tts"},type:"text"},"image-to-text":{tokenizer:g.AutoTokenizer,pipeline:pe,model:$.AutoModelForVision2Seq,processor:N.AutoProcessor,default:{model:"Xenova/vit-gpt2-image-captioning"},type:"multimodal"},"image-classification":{pipeline:Ce,model:$.AutoModelForImageClassification,processor:N.AutoProcessor,default:{model:"Xenova/vit-base-patch16-224"},type:"multimodal"},"image-segmentation":{pipeline:Ae,model:[$.AutoModelForImageSegmentation,$.AutoModelForSemanticSegmentation,$.AutoModelForUniversalSegmentation],processor:N.AutoProcessor,default:{model:"Xenova/detr-resnet-50-panoptic"},type:"multimodal"},"zero-shot-image-classification":{tokenizer:g.AutoTokenizer,pipeline:Pe,model:$.AutoModel,processor:N.AutoProcessor,default:{model:"Xenova/clip-vit-base-patch32"},type:"multimodal"},"object-detection":{pipeline:Je,model:$.AutoModelForObjectDetection,processor:N.AutoProcessor,default:{model:"Xenova/detr-resnet-50"},type:"multimodal"},"zero-shot-object-detection":{tokenizer:g.AutoTokenizer,pipeline:je,model:$.AutoModelForZeroShotObjectDetection,processor:N.AutoProcessor,default:{model:"Xenova/owlvit-base-patch32"},type:"multimodal"},"document-question-answering":{tokenizer:g.AutoTokenizer,pipeline:_e,model:$.AutoModelForDocumentQuestionAnswering,processor:N.AutoProcessor,default:{model:"Xenova/donut-base-finetuned-docvqa"},type:"multimodal"},"image-to-image":{pipeline:de,model:$.AutoModelForImageToImage,processor:N.AutoProcessor,default:{model:"Xenova/swin2SR-classical-sr-x2-64"},type:"image"},"depth-estimation":{pipeline:Ee,model:$.AutoModelForDepthEstimation,processor:N.AutoProcessor,default:{model:"Xenova/dpt-large"},type:"image"},"feature-extraction":{tokenizer:g.AutoTokenizer,pipeline:ie,model:$.AutoModel,default:{model:"Xenova/all-MiniLM-L6-v2"},type:"text"},"image-feature-extraction":{processor:N.AutoProcessor,pipeline:ye,model:[$.AutoModelForImageFeatureExtraction,$.AutoModel],default:{model:"Xenova/vit-base-patch16-224-in21k"},type:"image"}}),Xe=Object.freeze({"sentiment-analysis":"text-classification",ner:"token-classification",asr:"automatic-speech-recognition","text-to-speech":"text-to-audio",embeddings:"feature-extraction"});async function ee(Re,te=null,{progress_callback:ve=null,config:Ke=null,cache_dir:Ne=null,local_files_only:Ue=!1,revision:ze="main",device:Ze=null,dtype:at=null,model_file_name:mt=null,session_options:lt={}}={}){Re=Xe[Re]??Re;const ct=Oe[Re.split("_",1)[0]];if(!ct)throw Error(`Unsupported pipeline: ${Re}. Must be one of [${Object.keys(Oe)}]`);te||(te=ct.default.model,console.log(`No model specified. Using default model: "${te}".`));const O={progress_callback:ve,config:Ke,cache_dir:Ne,local_files_only:Ue,revision:ze,device:Ze,dtype:at,model_file_name:mt,session_options:lt},le=new Map([["tokenizer",ct.tokenizer],["model",ct.model],["processor",ct.processor]]),Q=await Ve(le,te,O);Q.task=Re,(0,j.dispatchCallback)(ve,{status:"ready",task:Re,model:te});const we=ct.pipeline;return new we(Q)}async function Ve(Re,te,ve){const Ke=Object.create(null),Ne=[];for(const[Ue,ze]of Re.entries()){if(!ze)continue;let Ze;Array.isArray(ze)?Ze=new Promise(async(at,mt)=>{let lt;for(const ct of ze){if(ct===null){at(null);return}try{at(await ct.from_pretrained(te,ve));return}catch(O){if(O.message?.includes("Unsupported model type"))lt=O;else if(O.message?.includes("Could not locate file"))lt=O;else{mt(O);return}}}mt(lt)}):Ze=ze.from_pretrained(te,ve),Ke[Ue]=Ze,Ne.push(Ze)}await Promise.all(Ne);for(const[Ue,ze]of Object.entries(Ke))Ke[Ue]=await ze;return Ke}},"./src/tokenizers.js":(ke,A,r)=>{r.r(A),r.d(A,{AlbertTokenizer:()=>Pr,AutoTokenizer:()=>as,BartTokenizer:()=>dn,BertTokenizer:()=>Kr,BlenderbotSmallTokenizer:()=>Fn,BlenderbotTokenizer:()=>In,BloomTokenizer:()=>Qr,CLIPTokenizer:()=>mn,CamembertTokenizer:()=>it,CodeGenTokenizer:()=>hn,CodeLlamaTokenizer:()=>zr,CohereTokenizer:()=>gn,ConvBertTokenizer:()=>Dr,DebertaTokenizer:()=>dr,DebertaV2Tokenizer:()=>qr,DistilBertTokenizer:()=>or,ElectraTokenizer:()=>Ft,EsmTokenizer:()=>Br,FalconTokenizer:()=>Sn,GPT2Tokenizer:()=>Cn,GPTNeoXTokenizer:()=>$n,GemmaTokenizer:()=>Zn,Grok1Tokenizer:()=>Rr,HerbertTokenizer:()=>Cr,LlamaTokenizer:()=>cn,M2M100Tokenizer:()=>pn,MBart50Tokenizer:()=>br,MBartTokenizer:()=>gs,MPNetTokenizer:()=>kn,MarianTokenizer:()=>Ot,MgpstrTokenizer:()=>Ln,MobileBertTokenizer:()=>Er,NllbTokenizer:()=>ar,NougatTokenizer:()=>Nr,PreTrainedTokenizer:()=>Lt,Qwen2Tokenizer:()=>An,RoFormerTokenizer:()=>Lr,RobertaTokenizer:()=>Ls,SiglipTokenizer:()=>fn,SpeechT5Tokenizer:()=>On,SqueezeBertTokenizer:()=>Hr,T5Tokenizer:()=>Ys,TokenizerModel:()=>ye,VitsTokenizer:()=>Dn,Wav2Vec2CTCTokenizer:()=>_n,WhisperTokenizer:()=>Xr,XLMRobertaTokenizer:()=>Jn,XLMTokenizer:()=>vt,is_chinese_char:()=>H});var g=r("./src/utils/generic.js"),$=r("./src/utils/core.js"),N=r("./src/utils/hub.js"),Z=r("./src/utils/maths.js"),j=r("./src/utils/tensor.js"),y=r("./src/utils/data-structures.js"),T=r("./node_modules/@huggingface/jinja/dist/index.js"),b=r("./src/models/whisper/common_whisper.js");async function x(Te,M){const Y=await Promise.all([(0,N.getModelJSON)(Te,"tokenizer.json",!0,M),(0,N.getModelJSON)(Te,"tokenizer_config.json",!0,M)]);return M.legacy!==null&&(Y[1].legacy=M.legacy),Y}function v(Te,M){const Y=[];let ce=0;for(const me of Te.matchAll(M)){const Fe=me[0];ce0&&Y.push(Fe),ce=me.index+Fe.length}return ce=19968&&Te<=40959||Te>=13312&&Te<=19903||Te>=131072&&Te<=173791||Te>=173824&&Te<=177983||Te>=177984&&Te<=178207||Te>=178208&&Te<=183983||Te>=63744&&Te<=64255||Te>=194560&&Te<=195103}function I(Te,M,Y){const ce=[];let me=0;for(;methis.tokens_to_ids.get(Y)??this.unk_token_id)}convert_ids_to_tokens(M){return M.map(Y=>this.vocab[Y]??this.unk_token)}}class ge extends ye{constructor(M){super(M),this.tokens_to_ids=K(M.vocab),this.unk_token_id=this.tokens_to_ids.get(M.unk_token),this.unk_token=M.unk_token,this.max_input_chars_per_word=M.max_input_chars_per_word??100,this.vocab=new Array(this.tokens_to_ids.size);for(const[Y,ce]of this.tokens_to_ids)this.vocab[ce]=Y}encode(M){const Y=[];for(const ce of M){const me=[...ce];if(me.length>this.max_input_chars_per_word){Y.push(this.unk_token);continue}let Fe=!1,Ye=0;const gt=[];for(;Ye0&&(pt=this.config.continuing_subword_prefix+pt),this.tokens_to_ids.has(pt)){yt=pt;break}--wt}if(yt===null){Fe=!0;break}gt.push(yt),Ye=wt}Fe?Y.push(this.unk_token):Y.push(...gt)}return Y}}class re extends ye{constructor(M,Y){super(M);const ce=M.vocab.length;this.vocab=new Array(ce),this.scores=new Array(ce);for(let me=0;me[me,Fe])),this.bos_token=" ",this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=Y.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.unk_token=this.vocab[this.unk_token_id],this.minScore=(0,Z.min)(this.scores)[0],this.unk_score=this.minScore-10,this.scores[this.unk_token_id]=this.unk_score,this.trie=new y.CharTrie,this.trie.extend(this.vocab),this.fuse_unk=!0}populateNodes(M){const Y=M.chars,ce=1;let me=0;for(;me{const Te=[...Array.from({length:94},(me,Fe)=>Fe+33),...Array.from({length:12},(me,Fe)=>Fe+161),...Array.from({length:82},(me,Fe)=>Fe+174)],M=Te.slice();let Y=0;for(let me=0;me<256;++me)Te.includes(me)||(Te.push(me),M.push(256+Y),Y+=1);const ce=M.map(me=>String.fromCharCode(me));return Object.fromEntries(Te.map((me,Fe)=>[me,ce[Fe]]))})(),pe=(0,$.reverseDictionary)(Me);class Ce extends ye{constructor(M){super(M),this.tokens_to_ids=K(M.vocab),this.unk_token_id=this.tokens_to_ids.get(M.unk_token),this.unk_token=M.unk_token,this.vocab=new Array(this.tokens_to_ids.size);for(const[ce,me]of this.tokens_to_ids)this.vocab[me]=ce;const Y=Array.isArray(M.merges[0]);this.merges=Y?M.merges:M.merges.map(ce=>ce.split(" ",2)),this.bpe_ranks=new Map(this.merges.map((ce,me)=>[JSON.stringify(ce),me])),this.end_of_word_suffix=M.end_of_word_suffix,this.continuing_subword_suffix=M.continuing_subword_suffix??null,this.byte_fallback=this.config.byte_fallback??!1,this.byte_fallback&&(this.text_encoder=new TextEncoder),this.ignore_merges=this.config.ignore_merges??!1,this.cache=new Map}bpe(M){if(M.length===0)return[];const Y=this.cache.get(M);if(Y!==void 0)return Y;const ce=Array.from(M);this.end_of_word_suffix&&(ce[ce.length-1]+=this.end_of_word_suffix);let me=[];if(ce.length>1){const Fe=new y.PriorityQueue((wt,yt)=>wt.score`<0x${gt.toString(16).toUpperCase().padStart(2,"0")}>`);Ye.every(gt=>this.tokens_to_ids.has(gt))?Y.push(...Ye):Y.push(this.unk_token)}else Y.push(this.unk_token)}return Y}}class Ae extends ye{constructor(M,Y){super(M),this.tokens_to_ids=K(Y.target_lang?M.vocab[Y.target_lang]:M.vocab),this.bos_token=Y.bos_token,this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=Y.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.pad_token=Y.pad_token,this.pad_token_id=this.tokens_to_ids.get(this.pad_token),this.unk_token=Y.unk_token,this.unk_token_id=this.tokens_to_ids.get(this.unk_token),this.vocab=new Array(this.tokens_to_ids.size);for(const[ce,me]of this.tokens_to_ids)this.vocab[me]=ce}encode(M){return M}}class Pe extends g.Callable{constructor(M){super(),this.config=M}static fromConfig(M){if(M===null)return null;switch(M.type){case"BertNormalizer":return new Ve(M);case"Precompiled":return new ms(M);case"Sequence":return new ee(M);case"Replace":return new Je(M);case"NFC":return new je(M);case"NFKC":return new _e(M);case"NFKD":return new X(M);case"Strip":return new de(M);case"StripAccents":return new Ee(M);case"Lowercase":return new Oe(M);case"Prepend":return new Xe(M);default:throw new Error(`Unknown Normalizer type: ${M.type}`)}}normalize(M){throw Error("normalize should be implemented in subclass.")}_call(M){return this.normalize(M)}}class Je extends Pe{normalize(M){const Y=L(this.config.pattern);return Y===null?M:M.replaceAll(Y,this.config.content)}}class je extends Pe{normalize(M){return M=M.normalize("NFC"),M}}class _e extends Pe{normalize(M){return M=M.normalize("NFKC"),M}}class X extends Pe{normalize(M){return M=M.normalize("NFKD"),M}}class de extends Pe{normalize(M){return this.config.strip_left&&this.config.strip_right?M=M.trim():(this.config.strip_left&&(M=M.trimStart()),this.config.strip_right&&(M=M.trimEnd())),M}}class Ee extends Pe{normalize(M){return M=V(M),M}}class Oe extends Pe{normalize(M){return M=M.toLowerCase(),M}}class Xe extends Pe{normalize(M){return M=this.config.prepend+M,M}}class ee extends Pe{constructor(M){super(M),this.normalizers=M.normalizers.map(Y=>Pe.fromConfig(Y))}normalize(M){return this.normalizers.reduce((Y,ce)=>ce.normalize(Y),M)}}class Ve extends Pe{_tokenize_chinese_chars(M){const Y=[];for(let ce=0;cethis.pre_tokenize_text(ce,Y)):this.pre_tokenize_text(M,Y)).flat()}_call(M,Y){return this.pre_tokenize(M,Y)}}class te extends Re{constructor(M){super(),this.pattern=new RegExp(`[^\\s${w}]+|[${w}]`,"gu")}pre_tokenize_text(M,Y){return M.trim().match(this.pattern)||[]}}class ve extends Re{constructor(M){super(),this.config=M,this.add_prefix_space=this.config.add_prefix_space,this.trim_offsets=this.config.trim_offsets,this.use_regex=this.config.use_regex??!0,this.pattern=/'s|'t|'re|'ve|'m|'ll|'d| ?\p{L}+| ?\p{N}+| ?[^\s\p{L}\p{N}]+|\s+(?!\S)|\s+/gu,this.byte_encoder=Me,this.text_encoder=new TextEncoder}pre_tokenize_text(M,Y){return this.add_prefix_space&&!M.startsWith(" ")&&(M=" "+M),(this.use_regex?M.match(this.pattern)||[]:[M]).map(me=>Array.from(this.text_encoder.encode(me),Fe=>this.byte_encoder[Fe]).join(""))}}class Ke extends Re{constructor(M){super(),this.config=M,this.pattern=L(this.config.pattern,this.config.invert)}pre_tokenize_text(M,Y){return this.pattern===null?[]:this.config.invert?M.match(this.pattern)||[]:this.config.behavior?.toLowerCase()==="removed"?M.split(this.pattern).filter(ce=>ce):v(M,this.pattern)}}class Ne extends Re{constructor(M){super(),this.config=M,this.pattern=new RegExp(`[^${w}]+|[${w}]+`,"gu")}pre_tokenize_text(M,Y){return M.match(this.pattern)||[]}}class Ue extends Re{constructor(M){super(),this.config=M;const Y=`[^\\d]+|\\d${this.config.individual_digits?"":"+"}`;this.pattern=new RegExp(Y,"gu")}pre_tokenize_text(M,Y){return M.match(this.pattern)||[]}}class ze extends g.Callable{constructor(M){super(),this.config=M}static fromConfig(M){if(M===null)return null;switch(M.type){case"TemplateProcessing":return new mt(M);case"ByteLevel":return new lt(M);case"RobertaProcessing":return new at(M);case"BertProcessing":return new Ze(M);case"Sequence":return new ct(M);default:throw new Error(`Unknown PostProcessor type: ${M.type}`)}}post_process(M,...Y){throw Error("post_process should be implemented in subclass.")}_call(M,...Y){return this.post_process(M,...Y)}}class Ze extends ze{constructor(M){super(M),this.cls=M.cls[0],this.sep=M.sep[0]}post_process(M,Y=null,{add_special_tokens:ce=!0}={}){ce&&(M=(0,$.mergeArrays)([this.cls],M,[this.sep]));let me=new Array(M.length).fill(0);if(Y!==null){const Fe=ce&&this instanceof at?[this.sep]:[],Ye=ce?[this.sep]:[];M=(0,$.mergeArrays)(M,Fe,Y,Ye),me=(0,$.mergeArrays)(me,new Array(Y.length+Fe.length+Ye.length).fill(1))}return{tokens:M,token_type_ids:me}}}class at extends Ze{}class mt extends ze{constructor(M){super(M),this.single=M.single,this.pair=M.pair}post_process(M,Y=null,{add_special_tokens:ce=!0}={}){const me=Y===null?this.single:this.pair;let Fe=[],Ye=[];for(const gt of me)"SpecialToken"in gt?ce&&(Fe.push(gt.SpecialToken.id),Ye.push(gt.SpecialToken.type_id)):"Sequence"in gt&&(gt.Sequence.id==="A"?(Fe=(0,$.mergeArrays)(Fe,M),Ye=(0,$.mergeArrays)(Ye,new Array(M.length).fill(gt.Sequence.type_id))):gt.Sequence.id==="B"&&(Fe=(0,$.mergeArrays)(Fe,Y),Ye=(0,$.mergeArrays)(Ye,new Array(Y.length).fill(gt.Sequence.type_id))));return{tokens:Fe,token_type_ids:Ye}}}class lt extends ze{post_process(M,Y=null){return Y&&(M=(0,$.mergeArrays)(M,Y)),{tokens:M}}}class ct extends ze{constructor(M){super(M),this.processors=M.processors.map(Y=>ze.fromConfig(Y))}post_process(M,Y=null,ce={}){let me;for(const Fe of this.processors)if(Fe instanceof lt)M=Fe.post_process(M).tokens,Y&&(Y=Fe.post_process(Y).tokens);else{const Ye=Fe.post_process(M,Y,ce);M=Ye.tokens,me=Ye.token_type_ids}return{tokens:M,token_type_ids:me}}}class O extends g.Callable{constructor(M){super(),this.config=M,this.added_tokens=[],this.end_of_word_suffix=null,this.trim_offsets=M.trim_offsets}static fromConfig(M){if(M===null)return null;switch(M.type){case"WordPiece":return new We(M);case"Metaspace":return new Ts(M);case"ByteLevel":return new qe(M);case"Replace":return new le(M);case"ByteFallback":return new Q(M);case"Fuse":return new we(M);case"Strip":return new Se(M);case"Sequence":return new st(M);case"CTC":return new tt(M);case"BPEDecoder":return new ft(M);default:throw new Error(`Unknown Decoder type: ${M.type}`)}}_call(M){return this.decode(M)}decode(M){return this.decode_chain(M).join("")}decode_chain(M){throw Error("`decode_chain` should be implemented in subclass.")}}class le extends O{decode_chain(M){const Y=L(this.config.pattern);return Y===null?M:M.map(ce=>ce.replaceAll(Y,this.config.content))}}class Q extends O{constructor(M){super(M),this.text_decoder=new TextDecoder}decode_chain(M){const Y=[];let ce=[];for(const me of M){let Fe=null;if(me.length===6&&me.startsWith("<0x")&&me.endsWith(">")){const Ye=parseInt(me.slice(3,5),16);isNaN(Ye)||(Fe=Ye)}if(Fe!==null)ce.push(Fe);else{if(ce.length>0){const Ye=this.text_decoder.decode(Uint8Array.from(ce));Y.push(Ye),ce=[]}Y.push(me)}}if(ce.length>0){const me=this.text_decoder.decode(Uint8Array.from(ce));Y.push(me),ce=[]}return Y}}class we extends O{decode_chain(M){return[M.join("")]}}class Se extends O{constructor(M){super(M),this.content=this.config.content,this.start=this.config.start,this.stop=this.config.stop}decode_chain(M){return M.map(Y=>{let ce=0;for(let Fe=0;Fe(ce!==0&&(Y.startsWith(this.config.prefix)?Y=Y.replace(this.config.prefix,""):Y=" "+Y),this.cleanup&&(Y=oe(Y)),Y))}}class qe extends O{constructor(M){super(M),this.byte_decoder=pe,this.text_decoder=new TextDecoder("utf-8",{fatal:!1,ignoreBOM:!0}),this.end_of_word_suffix=null}convert_tokens_to_string(M){const Y=M.join(""),ce=new Uint8Array([...Y].map(Fe=>this.byte_decoder[Fe]));return this.text_decoder.decode(ce)}decode_chain(M){const Y=[];let ce=[];for(const me of M)this.added_tokens.find(Fe=>Fe.content===me)!==void 0?(ce.length>0&&(Y.push(this.convert_tokens_to_string(ce)),ce=[]),Y.push(me)):ce.push(me);return ce.length>0&&Y.push(this.convert_tokens_to_string(ce)),Y}}class tt extends O{constructor(M){super(M),this.pad_token=this.config.pad_token,this.word_delimiter_token=this.config.word_delimiter_token,this.cleanup=this.config.cleanup}convert_tokens_to_string(M){if(M.length===0)return"";const Y=[M[0]];for(let Fe=1;FeFe!==this.pad_token).join("");return this.cleanup&&(me=oe(me).replaceAll(this.word_delimiter_token," ").trim()),me}decode_chain(M){return[this.convert_tokens_to_string(M)]}}class st extends O{constructor(M){super(M),this.decoders=M.decoders.map(Y=>O.fromConfig(Y))}decode_chain(M){return this.decoders.reduce((Y,ce)=>ce.decode_chain(Y),M)}}class ft extends O{constructor(M){super(M),this.suffix=this.config.suffix}decode_chain(M){return M.map((Y,ce)=>Y.replaceAll(this.suffix,ce===M.length-1?"":" "))}}class Nt extends O{decode_chain(M){let Y="";for(let ce=1;cece.normalize("NFKC")).join("~"):M=M.normalize("NFKC"),M}}class Ps extends Re{constructor(M){super(),this.tokenizers=M.pretokenizers.map(Y=>Re.fromConfig(Y))}pre_tokenize_text(M,Y){return this.tokenizers.reduce((ce,me)=>me.pre_tokenize(ce,Y),[M])}}class As extends Re{constructor(M){super()}pre_tokenize_text(M,Y){return M.match(/\w+|[^\w\s]+/g)||[]}}class tr extends Re{constructor(M){super()}pre_tokenize_text(M,Y){return S(M)}}class Tr extends Re{constructor(M){super(),this.config=M,this.pattern=L(this.config.pattern),this.content=this.config.content}pre_tokenize_text(M,Y){return this.pattern===null?[M]:[M.replaceAll(this.pattern,this.config.content)]}}const Gr=["bos_token","eos_token","unk_token","sep_token","pad_token","cls_token","mask_token"];function Ns(Te,M,Y,ce){for(const me of Object.keys(Te)){const Fe=M-Te[me].length,Ye=Y(me),gt=new Array(Fe).fill(Ye);Te[me]=ce==="right"?(0,$.mergeArrays)(Te[me],gt):(0,$.mergeArrays)(gt,Te[me])}}function Mr(Te,M){for(const Y of Object.keys(Te))Te[Y].length=M}class Lt extends g.Callable{return_token_type_ids=!1;padding_side="right";constructor(M,Y){super(),this._tokenizer_config=Y,this.normalizer=Pe.fromConfig(M.normalizer),this.pre_tokenizer=Re.fromConfig(M.pre_tokenizer),this.model=ye.fromConfig(M.model,Y),this.post_processor=ze.fromConfig(M.post_processor),this.decoder=O.fromConfig(M.decoder),this.special_tokens=[],this.all_special_ids=[],this.added_tokens=[];for(const ce of M.added_tokens){const me=new ie(ce);this.added_tokens.push(me),this.model.tokens_to_ids.set(me.content,me.id),this.model.vocab[me.id]=me.content,me.special&&(this.special_tokens.push(me.content),this.all_special_ids.push(me.id))}if(this.additional_special_tokens=Y.additional_special_tokens??[],this.special_tokens.push(...this.additional_special_tokens),this.special_tokens=[...new Set(this.special_tokens)],this.decoder&&(this.decoder.added_tokens=this.added_tokens,this.decoder.end_of_word_suffix=this.model.end_of_word_suffix),this.added_tokens_regex=this.added_tokens.length>0?new RegExp(this.added_tokens.slice().sort((ce,me)=>me.content.length-ce.content.length).map(ce=>`${ce.lstrip?"\\s*":""}(${(0,$.escapeRegExp)(ce.content)})${ce.rstrip?"\\s*":""}`).join("|")):null,this.mask_token=this.getToken("mask_token"),this.mask_token_id=this.model.tokens_to_ids.get(this.mask_token),this.pad_token=this.getToken("pad_token","eos_token"),this.pad_token_id=this.model.tokens_to_ids.get(this.pad_token),this.sep_token=this.getToken("sep_token"),this.sep_token_id=this.model.tokens_to_ids.get(this.sep_token),this.unk_token=this.getToken("unk_token"),this.unk_token_id=this.model.tokens_to_ids.get(this.unk_token),this.bos_token=this.getToken("bos_token"),this.bos_token_id=this.model.tokens_to_ids.get(this.bos_token),this.eos_token=this.getToken("eos_token"),this.eos_token_id=this.model.tokens_to_ids.get(this.eos_token),this.model_max_length=Y.model_max_length,this.remove_space=Y.remove_space,this.clean_up_tokenization_spaces=Y.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=Y.do_lowercase_and_remove_accent??!1,Y.padding_side&&(this.padding_side=Y.padding_side),this.legacy=!1,this.chat_template=Y.chat_template??null,Array.isArray(this.chat_template)){const ce=Object.create(null);for(const{name:me,template:Fe}of this.chat_template){if(typeof me!="string"||typeof Fe!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');ce[me]=Fe}this.chat_template=ce}this._compiled_template_cache=new Map}getToken(...M){for(const Y of M){const ce=this._tokenizer_config[Y];if(ce)if(typeof ce=="object"){if(ce.__type==="AddedToken")return ce.content;throw Error(`Unknown token: ${ce}`)}else return ce}return null}static async from_pretrained(M,{progress_callback:Y=null,config:ce=null,cache_dir:me=null,local_files_only:Fe=!1,revision:Ye="main",legacy:gt=null}={}){const wt=await x(M,{progress_callback:Y,config:ce,cache_dir:me,local_files_only:Fe,revision:Ye,legacy:gt});return new this(...wt)}_call(M,{text_pair:Y=null,add_special_tokens:ce=!0,padding:me=!1,truncation:Fe=null,max_length:Ye=null,return_tensor:gt=!0,return_token_type_ids:wt=null}={}){const yt=Array.isArray(M);let pt;if(yt){if(M.length===0)throw Error("text array must be non-empty");if(Y!==null){if(Array.isArray(Y)){if(M.length!==Y.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");pt=M.map((Yt,Ms)=>this._encode_plus(Yt,{text_pair:Y[Ms],add_special_tokens:ce,return_token_type_ids:wt}))}else pt=M.map(Yt=>this._encode_plus(Yt,{add_special_tokens:ce,return_token_type_ids:wt}))}else{if(M==null)throw Error("text may not be null or undefined");if(Array.isArray(Y))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");pt=[this._encode_plus(M,{text_pair:Y,add_special_tokens:ce,return_token_type_ids:wt})]}if(Ye===null?me==="max_length"?Ye=this.model_max_length:Ye=(0,Z.max)(pt.map(Yt=>Yt.input_ids.length))[0]:Fe||console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation=true` to explicitly truncate examples to max length."),Ye=Math.min(Ye,this.model_max_length??1/0),me||Fe)for(let Yt=0;YtYe?Fe&&Mr(pt[Yt],Ye):me&&Ns(pt[Yt],Ye,Ms=>Ms==="input_ids"?this.pad_token_id:0,this.padding_side));const rs={};if(gt){if(!(me&&Fe)&&pt.some(Ms=>{for(const Gs of Object.keys(Ms))if(Ms[Gs].length!==pt[0][Gs]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");const Yt=[pt.length,pt[0].input_ids.length];for(const Ms of Object.keys(pt[0]))rs[Ms]=new j.Tensor("int64",BigInt64Array.from(pt.flatMap(Gs=>Gs[Ms]).map(BigInt)),Yt)}else{for(const Yt of Object.keys(pt[0]))rs[Yt]=pt.map(Ms=>Ms[Yt]);if(!yt)for(const Yt of Object.keys(rs))rs[Yt]=rs[Yt][0]}return rs}_encode_text(M){return M===null?null:(this.added_tokens_regex?M.split(this.added_tokens_regex).filter(me=>me):[M]).map((me,Fe)=>{if(this.added_tokens.find(gt=>gt.content===me)!==void 0)return me;{if(this.remove_space===!0&&(me=me.trim().split(/\s+/).join(" ")),this.do_lowercase_and_remove_accent&&(me=U(me)),this.normalizer!==null&&(me=this.normalizer(me)),me.length===0)return[];const gt=this.pre_tokenizer!==null?this.pre_tokenizer(me,{section_index:Fe}):[me];return this.model(gt)}}).flat()}_encode_plus(M,{text_pair:Y=null,add_special_tokens:ce=!0,return_token_type_ids:me=null}={}){const{tokens:Fe,token_type_ids:Ye}=this._tokenize_helper(M,{pair:Y,add_special_tokens:ce}),gt=this.model.convert_tokens_to_ids(Fe),wt={input_ids:gt,attention_mask:new Array(gt.length).fill(1)};return(me??this.return_token_type_ids)&&Ye&&(wt.token_type_ids=Ye),wt}_tokenize_helper(M,{pair:Y=null,add_special_tokens:ce=!1}={}){const me=this._encode_text(M),Fe=this._encode_text(Y);return this.post_processor?this.post_processor(me,Fe,{add_special_tokens:ce}):{tokens:(0,$.mergeArrays)(me??[],Fe??[])}}tokenize(M,{pair:Y=null,add_special_tokens:ce=!1}={}){return this._tokenize_helper(M,{pair:Y,add_special_tokens:ce}).tokens}encode(M,{text_pair:Y=null,add_special_tokens:ce=!0,return_token_type_ids:me=null}={}){return this._encode_plus(M,{text_pair:Y,add_special_tokens:ce,return_token_type_ids:me}).input_ids}batch_decode(M,Y={}){return M instanceof j.Tensor&&(M=M.tolist()),M.map(ce=>this.decode(ce,Y))}decode(M,Y={}){if(M instanceof j.Tensor&&(M=se(M)),!Array.isArray(M)||M.length===0||!(0,$.isIntegralNumber)(M[0]))throw Error("token_ids must be a non-empty array of integers.");return this.decode_single(M,Y)}decode_single(M,{skip_special_tokens:Y=!1,clean_up_tokenization_spaces:ce=null}){let me=this.model.convert_ids_to_tokens(M);Y&&(me=me.filter(Ye=>!this.special_tokens.includes(Ye)));let Fe=this.decoder?this.decoder(me):me.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(Fe=Fe.replaceAll(this.decoder.end_of_word_suffix," "),Y&&(Fe=Fe.trim())),(ce??this.clean_up_tokenization_spaces)&&(Fe=oe(Fe)),Fe}get_chat_template({chat_template:M=null,tools:Y=null}={}){if(this.chat_template&&typeof this.chat_template=="object"){const ce=this.chat_template;if(M!==null&&Object.hasOwn(ce,M))M=ce[M];else if(M===null)if(Y!==null&&"tool_use"in ce)M=ce.tool_use;else if("default"in ce)M=ce.default;else throw Error(`This model has multiple chat templates with no default specified! Please either pass a chat template or the name of the template you wish to use to the 'chat_template' argument. Available template names are ${Object.keys(ce).sort()}.`)}else if(M===null)if(this.chat_template)M=this.chat_template;else throw Error("Cannot use apply_chat_template() because tokenizer.chat_template is not set and no template argument was passed! For information about writing templates and setting the tokenizer.chat_template attribute, please see the documentation at https://huggingface.co/docs/transformers/main/en/chat_templating");return M}apply_chat_template(M,{tools:Y=null,documents:ce=null,chat_template:me=null,add_generation_prompt:Fe=!1,tokenize:Ye=!0,padding:gt=!1,truncation:wt=!1,max_length:yt=null,return_tensor:pt=!0,return_dict:rs=!1,tokenizer_kwargs:Yt={},...Ms}={}){if(me=this.get_chat_template({chat_template:me,tools:Y}),typeof me!="string")throw Error(`chat_template must be a string, but got ${typeof me}`);let Gs=this._compiled_template_cache.get(me);Gs===void 0&&(Gs=new T.Template(me),this._compiled_template_cache.set(me,Gs));const jt=Object.create(null);for(const Ks of Gr){const Js=this.getToken(Ks);Js&&(jt[Ks]=Js)}const is=Gs.render({messages:M,add_generation_prompt:Fe,tools:Y,documents:ce,...jt,...Ms});if(Ye){const Ks=this._call(is,{add_special_tokens:!1,padding:gt,truncation:wt,max_length:yt,return_tensor:pt,...Yt});return rs?Ks:Ks.input_ids}return is}}class Kr extends Lt{return_token_type_ids=!0}class Pr extends Lt{return_token_type_ids=!0}class Er extends Lt{return_token_type_ids=!0}class Hr extends Lt{return_token_type_ids=!0}class dr extends Lt{return_token_type_ids=!0}class qr extends Lt{return_token_type_ids=!0}class Cr extends Lt{return_token_type_ids=!0}class Dr extends Lt{return_token_type_ids=!0}class Lr extends Lt{return_token_type_ids=!0}class or extends Lt{}class it extends Lt{}class vt extends Lt{return_token_type_ids=!0;constructor(M,Y){super(M,Y),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}}class Ft extends Lt{return_token_type_ids=!0}class Ys extends Lt{}class Cn extends Lt{}class dn extends Lt{}class gs extends Lt{constructor(M,Y){super(M,Y),this.languageRegex=/^[a-z]{2}_[A-Z]{2}$/,this.language_codes=this.special_tokens.filter(ce=>this.languageRegex.test(ce)),this.lang_to_token=ce=>ce}_build_translation_inputs(M,Y,ce){return fr(this,M,Y,ce)}}class br extends gs{}class Ls extends Lt{}class Qr extends Lt{}const ns="▁";class cn extends Lt{padding_side="left";constructor(M,Y){super(M,Y),this.legacy=Y.legacy??!0,this.legacy||(this.normalizer=null,this.pre_tokenizer=new ss({replacement:ns,add_prefix_space:!0,prepend_scheme:"first"}))}_encode_text(M){if(M===null)return null;if(this.legacy||M.length===0)return super._encode_text(M);let Y=super._encode_text(ns+M.replaceAll(ns," "));return Y.length>1&&Y[0]===ns&&this.special_tokens.includes(Y[1])&&(Y=Y.slice(1)),Y}}class zr extends Lt{}class Jn extends Lt{}class kn extends Lt{}class Sn extends Lt{}class $n extends Lt{}class Br extends Lt{}class An extends Lt{}class Zn extends Lt{}class Rr extends Lt{}function fr(Te,M,Y,ce){if(!("language_codes"in Te)||!Array.isArray(Te.language_codes))throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");if(!("languageRegex"in Te)||!(Te.languageRegex instanceof RegExp))throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");if(!("lang_to_token"in Te)||typeof Te.lang_to_token!="function")throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");const me=ce.src_lang,Fe=ce.tgt_lang;if(!Te.language_codes.includes(Fe))throw new Error(`Target language code "${Fe}" is not valid. Must be one of: {${Te.language_codes.join(", ")}}`);if(me!==void 0){if(!Te.language_codes.includes(me))throw new Error(`Source language code "${me}" is not valid. Must be one of: {${Te.language_codes.join(", ")}}`);for(const Ye of Te.post_processor.config.single)if("SpecialToken"in Ye&&Te.languageRegex.test(Ye.SpecialToken.id)){Ye.SpecialToken.id=Te.lang_to_token(me);break}}return ce.forced_bos_token_id=Te.model.convert_tokens_to_ids([Te.lang_to_token(Fe)])[0],Te._call(M,Y)}class ar extends Lt{constructor(M,Y){super(M,Y),this.languageRegex=/^[a-z]{3}_[A-Z][a-z]{3}$/,this.language_codes=this.special_tokens.filter(ce=>this.languageRegex.test(ce)),this.lang_to_token=ce=>ce}_build_translation_inputs(M,Y,ce){return fr(this,M,Y,ce)}}class pn extends Lt{constructor(M,Y){super(M,Y),this.languageRegex=/^__[a-z]{2,3}__$/,this.language_codes=this.special_tokens.filter(ce=>this.languageRegex.test(ce)).map(ce=>ce.slice(2,-2)),this.lang_to_token=ce=>`__${ce}__`}_build_translation_inputs(M,Y,ce){return fr(this,M,Y,ce)}}class Xr extends Lt{get timestamp_begin(){return this.model.convert_tokens_to_ids(["<|notimestamps|>"])[0]+1}_decode_asr(M,{return_timestamps:Y=!1,return_language:ce=!1,time_precision:me=null,force_full_sequences:Fe=!0}={}){if(me===null)throw Error("Must specify time_precision");let Ye=null;const gt=Y==="word";function wt(){return{language:Ye,timestamp:[null,null],text:""}}const yt=[];let pt=wt(),rs=0;const Yt=this.timestamp_begin,Gs=Yt+1500;let jt=[],is=[],Ks=!1,Js=null;const De=new Set(this.all_special_ids);for(const Es of M){const Hs=Es.tokens,$t=gt?Es.token_timestamps:null;let sr=null,_r=Yt;if("stride"in Es){const[Mt,Gt,Is]=Es.stride;if(rs-=Gt,Js=Mt-Is,Gt&&(_r=Gt/me+Yt),Is)for(let ks=Hs.length-1;ks>=0;--ks){const js=Number(Hs[ks]);if(js>=Yt){if(sr!==null&&(js-Yt)*me=Yt&&Gt<=Gs){const Is=(Gt-Yt)*me+rs,ks=(0,Z.round)(Is,2);if(sr!==null&&Gt>=sr)Ks=!0;else if(Ks||jt.length>0&&Gt<_r)Ks=!1;else if(pt.timestamp[0]===null)pt.timestamp[0]=ks;else if(ks!==pt.timestamp[0]){pt.timestamp[1]=ks,jt.push(ds),gt&&is.push(Cs);const[js,Tt]=this.findLongestCommonSequence(jt,is),Yr=this.decode(js);pt.text=Yr,gt&&(pt.words=this.collateWordTimestamps(js,Tt,Ye)),yt.push(pt),jt=[],ds=[],is=[],Cs=[],pt=wt()}}else if(ds.push(Gt),gt){let Is=(0,Z.round)($t[Mt]+rs,2),ks;if(Mt+1<$t.length){ks=(0,Z.round)($t[Mt+1]+rs,2);const js=this.decode([Gt]);P.test(js)&&(ks=(0,Z.round)(Math.min(Is+me,ks),2))}else ks=null;Cs.push([Is,ks])}}if("stride"in Es){const[Mt,Gt,Is]=Es.stride;rs+=Mt-Is}ds.length>0?(jt.push(ds),gt&&is.push(Cs)):jt.every(Mt=>Mt.length===0)&&(pt=wt(),jt=[],ds=[],is=[],Cs=[])}if(jt.length>0){if(Fe&&Y)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");const[Es,Hs]=this.findLongestCommonSequence(jt,is),$t=this.decode(Es);pt.text=$t,gt&&(pt.words=this.collateWordTimestamps(Es,Hs,Ye)),yt.push(pt)}let Xs=Object.create(null);const kr=yt.map(Es=>Es.text).join("");if(Y||ce){for(let Es=0;Es0;let gt=Ye?[]:null,wt=Ye?Y[0]:null;for(let yt=1;ytGt===_r[Is]&&wt[kr+Is]<=Y[yt][$t+Is]).length:ds=Hs.filter((Gt,Is)=>Gt===_r[Is]).length;const Cs=Xs/1e4,Mt=ds/Xs+Cs;ds>1&&Mt>rs&&(rs=Mt,Yt=[kr,Es,$t,sr])}const[Gs,jt,is,Ks]=Yt,Js=Math.floor((jt+Gs)/2),De=Math.floor((Ks+is)/2);Fe.push(...ce.slice(0,Js)),ce=pt.slice(De),me=ce.length,Ye&&(gt.push(...wt.slice(0,Js)),wt=Y[yt].slice(De))}return Fe.push(...ce),Ye?(gt.push(...wt),[Fe,gt]):[Fe,[]]}collateWordTimestamps(M,Y,ce){const[me,Fe,Ye]=this.combineTokensIntoWords(M,ce),gt=[];for(let wt=0;wt=me){const gt=((Ye-me)*ce).toFixed(2);Fe.push(`<|${gt}|>`),Fe.push([])}else Fe[Fe.length-1].push(Ye);return Fe=Fe.map(Ye=>typeof Ye=="string"?Ye:super.decode(Ye,Y)),Fe.join("")}splitTokensOnUnicode(M){const Y=this.decode(M,{decode_with_timestamps:!0}),ce="�",me=[],Fe=[],Ye=[];let gt=[],wt=[],yt=0;for(let pt=0;pt=this.model.tokens_to_ids.get("<|endoftext|>"),Gs=pt.startsWith(" "),jt=pt.trim(),is=wt.test(jt);if(Ms||Gs||is||Fe.length===0)Fe.push(pt),Ye.push(rs),gt.push(Yt);else{const Ks=Fe.length-1;Fe[Ks]+=pt,Ye[Ks].push(...rs),gt[Ks].push(...Yt)}}return[Fe,Ye,gt]}mergePunctuations(M,Y,ce,me,Fe){const Ye=structuredClone(M),gt=structuredClone(Y),wt=structuredClone(ce);let yt=Ye.length-2,pt=Ye.length-1;for(;yt>=0;)Ye[yt].startsWith(" ")&&me.includes(Ye[yt].trim())?(Ye[pt]=Ye[yt]+Ye[pt],gt[pt]=(0,$.mergeArrays)(gt[yt],gt[pt]),wt[pt]=(0,$.mergeArrays)(wt[yt],wt[pt]),Ye[yt]="",gt[yt]=[],wt[yt]=[]):pt=yt,--yt;for(yt=0,pt=1;ptrs),gt.filter(rs=>rs.length>0),wt.filter(rs=>rs.length>0)]}}class hn extends Lt{}class mn extends Lt{}class fn extends Lt{}class Ot extends Lt{constructor(M,Y){super(M,Y),this.languageRegex=/^(>>\w+<<)\s*/g,this.supported_language_codes=this.model.vocab.filter(ce=>this.languageRegex.test(ce)),console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}_encode_text(M){if(M===null)return null;const[Y,...ce]=M.trim().split(this.languageRegex);if(ce.length===0)return super._encode_text(Y);if(ce.length===2){const[me,Fe]=ce;return this.supported_language_codes.includes(me)||console.warn(`Unsupported language code "${me}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`),(0,$.mergeArrays)([me],super._encode_text(Fe))}}}class _n extends Lt{}class In extends Lt{}class Fn extends Lt{}class On extends Lt{}class Nr extends Lt{}class Dn extends Lt{constructor(M,Y){super(M,Y),this.decoder=new Nt({})}}class gn extends Lt{}class Ln extends Lt{}class as{static TOKENIZER_CLASS_MAPPING={T5Tokenizer:Ys,DistilBertTokenizer:or,CamembertTokenizer:it,DebertaTokenizer:dr,DebertaV2Tokenizer:qr,BertTokenizer:Kr,HerbertTokenizer:Cr,ConvBertTokenizer:Dr,RoFormerTokenizer:Lr,XLMTokenizer:vt,ElectraTokenizer:Ft,MobileBertTokenizer:Er,SqueezeBertTokenizer:Hr,AlbertTokenizer:Pr,GPT2Tokenizer:Cn,BartTokenizer:dn,MBartTokenizer:gs,MBart50Tokenizer:br,RobertaTokenizer:Ls,WhisperTokenizer:Xr,CodeGenTokenizer:hn,CLIPTokenizer:mn,SiglipTokenizer:fn,MarianTokenizer:Ot,BloomTokenizer:Qr,NllbTokenizer:ar,M2M100Tokenizer:pn,LlamaTokenizer:cn,CodeLlamaTokenizer:zr,XLMRobertaTokenizer:Jn,MPNetTokenizer:kn,FalconTokenizer:Sn,GPTNeoXTokenizer:$n,EsmTokenizer:Br,Wav2Vec2CTCTokenizer:_n,BlenderbotTokenizer:In,BlenderbotSmallTokenizer:Fn,SpeechT5Tokenizer:On,NougatTokenizer:Nr,VitsTokenizer:Dn,Qwen2Tokenizer:An,GemmaTokenizer:Zn,Grok1Tokenizer:Rr,CohereTokenizer:gn,MgpstrTokenizer:Ln,PreTrainedTokenizer:Lt};static async from_pretrained(M,{progress_callback:Y=null,config:ce=null,cache_dir:me=null,local_files_only:Fe=!1,revision:Ye="main",legacy:gt=null}={}){const[wt,yt]=await x(M,{progress_callback:Y,config:ce,cache_dir:me,local_files_only:Fe,revision:Ye,legacy:gt}),pt=yt.tokenizer_class?.replace(/Fast$/,"")??"PreTrainedTokenizer";let rs=this.TOKENIZER_CLASS_MAPPING[pt];return rs||(console.warn(`Unknown tokenizer class "${pt}", attempting to construct from base class.`),rs=Lt),new rs(wt,yt)}}},"./src/utils/audio.js":(ke,A,r)=>{r.r(A),r.d(A,{RawAudio:()=>ge,hamming:()=>v,hanning:()=>x,mel_filter_bank:()=>H,read_audio:()=>T,spectrogram:()=>F,window_function:()=>ae});var g=r("./src/utils/hub.js"),$=r("./src/utils/maths.js"),N=r("./src/utils/core.js"),Z=r("./src/env.js"),j=r("?7a2c"),y=r("./src/utils/tensor.js");async function T(re,Me){if(typeof AudioContext>"u")throw Error("Unable to load audio from path/URL since `AudioContext` is not available in your environment. Instead, audio data should be passed directly to the pipeline/processor. For more information and some example code, see https://huggingface.co/docs/transformers.js/guides/node-audio-processing.");const pe=await(await(0,g.getFile)(re)).arrayBuffer(),Ce=new AudioContext({sampleRate:Me});typeof Me>"u"&&console.warn(`No sampling rate provided, using default of ${Ce.sampleRate}Hz.`);const Ae=await Ce.decodeAudioData(pe);let Pe;if(Ae.numberOfChannels===2){const Je=Math.sqrt(2),je=Ae.getChannelData(0),_e=Ae.getChannelData(1);Pe=new Float32Array(je.length);for(let X=0;X2595*Math.log10(1+re/700),kaldi:re=>1127*Math.log(1+re/700),slaney:(re,Me=1e3,pe=15,Ce=27/Math.log(6.4))=>re>=Me?pe+Math.log(re/Me)*Ce:3*re/200};function K(re,Me="htk"){const pe=L[Me];if(!pe)throw new Error('mel_scale should be one of "htk", "slaney" or "kaldi".');return typeof re=="number"?pe(re):re.map(Ce=>pe(Ce))}const se={htk:re=>700*(10**(re/2595)-1),kaldi:re=>700*(Math.exp(re/1127)-1),slaney:(re,Me=1e3,pe=15,Ce=Math.log(6.4)/27)=>re>=pe?Me*Math.exp(Ce*(re-pe)):200*re/3};function oe(re,Me="htk"){const pe=se[Me];if(!pe)throw new Error('mel_scale should be one of "htk", "slaney" or "kaldi".');return typeof re=="number"?pe(re):re.map(Ce=>pe(Ce))}function V(re,Me){const pe=Float64Array.from({length:Me.length-1},(Je,je)=>Me[je+1]-Me[je]),Ce=Array.from({length:re.length},()=>new Array(Me.length));for(let Je=0;Jenew Array(re.length));for(let Je=0;Jere+Ce*Pe)}function H(re,Me,pe,Ce,Ae,Pe=null,Je="htk",je=!1){if(Pe!==null&&Pe!=="slaney")throw new Error('norm must be one of null or "slaney"');const _e=K(pe,Je),X=K(Ce,Je),de=U(_e,X,Me+2);let Ee=oe(de,Je),Oe;if(je){const ee=Ae/(re*2);Oe=K(Float64Array.from({length:re},(Ve,Re)=>Re*ee),Je),Ee=de}else Oe=U(0,Math.floor(Ae/2),re);const Xe=V(Oe,Ee);if(Pe!==null&&Pe==="slaney")for(let ee=0;eeAe)throw Error(`frame_length (${pe}) may not be larger than fft_length (${Ae})`);if(Ue!==pe)throw new Error(`Length of the window (${Ue}) must equal frame_length (${pe})`);if(Ce<=0)throw new Error("hop_length must be greater than zero");if(Pe===null&&de!==null)throw new Error("You have provided `mel_filters` but `power` is `None`. Mel spectrogram computation is not yet supported for complex-valued spectrogram. Specify `power` to fix this issue.");if(Je){if(je!=="reflect")throw new Error(`pad_mode="${je}" not implemented yet.`);const We=Math.floor((Ae-1)/2)+1;re=I(re,We,We)}let ze=Math.floor(1+Math.floor((re.length-pe)/Ce));te!==null&&zeze?Ke&&(mt=ve):mt=at=ve);const lt=new $.FFT(Ae),ct=new Float64Array(Ae),O=new Float64Array(lt.outputBufferSize),le=new Float32Array(Ze*mt);for(let We=0;We=1;--st)ct[st]-=X*ct[st-1];ct[0]*=1-X}for(let st=0;stMath.pow(je,.85));break;default:throw new Error(`Unknown window type ${Me}.`)}if(pe&&(Je=Je.subarray(0,re)),Ce===null)return Je;if(re>Ce)throw new Error(`Length of the window (${re}) may not be larger than frame_length (${Ce})`);return Je}function ie(re,Me){let pe=44;const Ce=new ArrayBuffer(pe+re.length*4),Ae=new DataView(Ce);ye(Ae,0,"RIFF"),Ae.setUint32(4,36+re.length*4,!0),ye(Ae,8,"WAVE"),ye(Ae,12,"fmt "),Ae.setUint32(16,16,!0),Ae.setUint16(20,3,!0),Ae.setUint16(22,1,!0),Ae.setUint32(24,Me,!0),Ae.setUint32(28,Me*4,!0),Ae.setUint16(32,4,!0),Ae.setUint16(34,32,!0),ye(Ae,36,"data"),Ae.setUint32(40,re.length*4,!0);for(let Pe=0;Pe{let Pe=await Ae.arrayBuffer();j.writeFileSync(Ce,Buffer.from(Pe))};else throw new Error("Unable to save because filesystem is disabled in this environment.");await pe(Me,this.toBlob())}}},"./src/utils/constants.js":(ke,A,r)=>{r.r(A),r.d(A,{CHAT_TEMPLATE_NAME:()=>y,CONFIG_NAME:()=>$,FEATURE_EXTRACTOR_NAME:()=>N,GENERATION_CONFIG_NAME:()=>T,GITHUB_ISSUE_URL:()=>g,IMAGE_PROCESSOR_NAME:()=>Z,PROCESSOR_NAME:()=>j});const g="https://github.com/huggingface/transformers.js/issues/new/choose",$="config.json",N="preprocessor_config.json",Z=N,j="processor_config.json",y="chat_template.json",T="generation_config.json"},"./src/utils/core.js":(ke,A,r)=>{r.r(A),r.d(A,{calculateDimensions:()=>T,calculateReflectOffset:()=>L,count:()=>V,dispatchCallback:()=>g,escapeRegExp:()=>N,isIntegralNumber:()=>j,isNullishDimension:()=>y,isTypedArray:()=>Z,len:()=>oe,mergeArrays:()=>x,pick:()=>se,pop:()=>b,product:()=>v,reverseDictionary:()=>$,saveBlob:()=>K});function g(U,H){U&&U(H)}function $(U){return Object.fromEntries(Object.entries(U).map(([H,I])=>[I,H]))}function N(U){return U.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function Z(U){return U?.prototype?.__proto__?.constructor?.name==="TypedArray"}function j(U){return Number.isInteger(U)||typeof U=="bigint"}function y(U){return U==null||U===-1}function T(U){const H=[];let I=U;for(;Array.isArray(I);)H.push(I.length),I=I[0];return H}function b(U,H,I=void 0){const S=U[H];if(S!==void 0)return delete U[H],S;if(I===void 0)throw Error(`Key ${H} does not exist in object.`);return I}function x(...U){return Array.prototype.concat.apply([],U)}function v(...U){return U.reduce((H,I)=>H.flatMap(S=>I.map(w=>[S,w])))}function L(U,H){return Math.abs((U+H)%(2*H)-H)}function K(U,H){const I=URL.createObjectURL(H),S=document.createElement("a");S.href=I,S.download=U,S.click(),S.remove(),URL.revokeObjectURL(I)}function se(U,H){return Object.assign({},...H.map(I=>{if(U[I]!==void 0)return{[I]:U[I]}}))}function oe(U){let H=0;for(const I of U)++H;return H}function V(U,H){let I=0;for(const S of U)S===H&&++I;return I}},"./src/utils/data-structures.js":(ke,A,r)=>{r.r(A),r.d(A,{CharTrie:()=>$,PriorityQueue:()=>g,TokenLattice:()=>Z});class g{constructor(T=(x,v)=>x>v,b=1/0){this._heap=[],this._comparator=T,this._maxSize=b}get size(){return this._heap.length}isEmpty(){return this.size===0}peek(){return this._heap[0]}push(...T){return this.extend(T)}extend(T){for(const b of T)if(this.size0&&this._swap(0,b),this._heap.pop(),this._siftDown(),T}replace(T){const b=this.peek();return this._heap[0]=T,this._siftDown(),b}_parent(T){return(T+1>>>1)-1}_left(T){return(T<<1)+1}_right(T){return T+1<<1}_greater(T,b){return this._comparator(this._heap[T],this._heap[b])}_swap(T,b){const x=this._heap[T];this._heap[T]=this._heap[b],this._heap[b]=x}_siftUp(){this._siftUpFrom(this.size-1)}_siftUpFrom(T){for(;T>0&&this._greater(T,this._parent(T));)this._swap(T,this._parent(T)),T=this._parent(T)}_siftDown(){let T=0;for(;this._left(T)[]),this.endNodes=Array.from({length:this.len+1},()=>[]);const v=new j(this.bosTokenId,0,0,0,0),L=new j(this.eosTokenId,1,this.len,0,0);this.nodes.push(v.clone()),this.nodes.push(L.clone()),this.beginNodes[this.len].push(L),this.endNodes[0].push(v)}insert(T,b,x,v){const L=this.nodes.length,K=new j(v,L,T,b,x);this.beginNodes[T].push(K),this.endNodes[T+b].push(K),this.nodes.push(K)}viterbi(){const T=this.len;let b=0;for(;b<=T;){if(this.beginNodes[b].length==0)return[];for(let se of this.beginNodes[b]){se.prev=null;let oe=0,V=null;for(let U of this.endNodes[b]){const H=U.backtraceScore+se.score;(V===null||H>oe)&&(V=U.clone(),oe=H)}if(V!==null)se.prev=V,se.backtraceScore=oe;else return[]}++b}const x=[],L=this.beginNodes[T][0].prev;if(L===null)return[];let K=L.clone();for(;K.prev!==null;)x.push(K.clone()),K=K.clone().prev.clone();return x.reverse(),x}piece(T){return this.chars.slice(T.pos,T.pos+T.length).join("")}tokens(){return this.viterbi().map(b=>this.piece(b))}tokenIds(){return this.viterbi().map(b=>b.tokenId)}}class j{constructor(T,b,x,v,L){this.tokenId=T,this.nodeId=b,this.pos=x,this.length=v,this.score=L,this.prev=null,this.backtraceScore=0}clone(){const T=new j(this.tokenId,this.nodeId,this.pos,this.length,this.score);return T.prev=this.prev,T.backtraceScore=this.backtraceScore,T}}},"./src/utils/devices.js":(ke,A,r)=>{r.r(A),r.d(A,{DEVICE_TYPES:()=>g});const g=Object.freeze({auto:"auto",gpu:"gpu",cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",webnn:"webnn","webnn-npu":"webnn-npu","webnn-gpu":"webnn-gpu","webnn-cpu":"webnn-cpu"})},"./src/utils/dtypes.js":(ke,A,r)=>{r.r(A),r.d(A,{DATA_TYPES:()=>Z,DEFAULT_DEVICE_DTYPE_MAPPING:()=>j,DEFAULT_DTYPE_SUFFIX_MAPPING:()=>y,isWebGpuFp16Supported:()=>N});var g=r("./src/env.js"),$=r("./src/utils/devices.js");const N=function(){let T;return async function(){if(T===void 0)if(!g.apis.IS_WEBGPU_AVAILABLE)T=!1;else try{T=(await navigator.gpu.requestAdapter()).features.has("shader-f16")}catch{T=!1}return T}}(),Z=Object.freeze({auto:"auto",fp32:"fp32",fp16:"fp16",q8:"q8",int8:"int8",uint8:"uint8",q4:"q4",bnb4:"bnb4",q4f16:"q4f16"}),j=Object.freeze({[$.DEVICE_TYPES.wasm]:Z.q8}),y=Object.freeze({[Z.fp32]:"",[Z.fp16]:"_fp16",[Z.int8]:"_int8",[Z.uint8]:"_uint8",[Z.q8]:"_quantized",[Z.q4]:"_q4",[Z.q4f16]:"_q4f16",[Z.bnb4]:"_bnb4"})},"./src/utils/generic.js":(ke,A,r)=>{r.r(A),r.d(A,{Callable:()=>g});const g=class{constructor(){let $=function(...N){return $._call(...N)};return Object.setPrototypeOf($,new.target.prototype)}_call(...$){throw Error("Must implement _call method in subclass")}}},"./src/utils/hub.js":(ke,A,r)=>{r.r(A),r.d(A,{getFile:()=>b,getModelFile:()=>se,getModelJSON:()=>oe});var g=r("?7a2c"),$=r("?a42a"),N=r("./src/env.js"),Z=r("./src/utils/core.js");const j={txt:"text/plain",html:"text/html",css:"text/css",js:"text/javascript",json:"application/json",png:"image/png",jpg:"image/jpeg",jpeg:"image/jpeg",gif:"image/gif"};class y{constructor(I){if(this.filePath=I,this.headers=new Headers,this.exists=g.existsSync(I),this.exists){this.status=200,this.statusText="OK";let S=g.statSync(I);this.headers.set("content-length",S.size.toString()),this.updateContentType();let w=this;this.body=new ReadableStream({start(P){w.arrayBuffer().then(F=>{P.enqueue(new Uint8Array(F)),P.close()})}})}else this.status=404,this.statusText="Not Found",this.body=null}updateContentType(){const I=this.filePath.toString().split(".").pop().toLowerCase();this.headers.set("content-type",j[I]??"application/octet-stream")}clone(){let I=new y(this.filePath);return I.exists=this.exists,I.status=this.status,I.statusText=this.statusText,I.headers=new Headers(this.headers),I}async arrayBuffer(){return(await g.promises.readFile(this.filePath)).buffer}async blob(){const I=await g.promises.readFile(this.filePath);return new Blob([I],{type:this.headers.get("content-type")})}async text(){return await g.promises.readFile(this.filePath,"utf8")}async json(){return JSON.parse(await this.text())}}function T(H,I=null,S=null){let w;try{w=new URL(H)}catch{return!1}return!(I&&!I.includes(w.protocol)||S&&!S.includes(w.hostname))}async function b(H){if(N.env.useFS&&!T(H,["http:","https:","blob:"]))return new y(H);if(typeof process<"u"&&process?.release?.name==="node"){const I=!!bh?.TESTING_REMOTELY,S=N.env.version,w=new Headers;if(w.set("User-Agent",`transformers.js/${S}; is_ci/${I};`),T(H,["http:","https:"],["huggingface.co","hf.co"])){const F=bh?.HF_TOKEN??bh?.HF_ACCESS_TOKEN;F&&w.set("Authorization",`Bearer ${F}`)}return fetch(H,{headers:w})}else return fetch(H)}const x={400:"Bad request error occurred while trying to load file",401:"Unauthorized access to file",403:"Forbidden access to file",404:"Could not locate file",408:"Request timeout error occurred while trying to load file",500:"Internal server error error occurred while trying to load file",502:"Bad gateway error occurred while trying to load file",503:"Service unavailable error occurred while trying to load file",504:"Gateway timeout error occurred while trying to load file"};function v(H,I,S){if(!S)return null;const w=x[H]??`Error (${H}) occurred while trying to load file`;throw Error(`${w}: "${I}".`)}class L{constructor(I){this.path=I}async match(I){let S=$.join(this.path,I),w=new y(S);if(w.exists)return w}async put(I,S){const w=Buffer.from(await S.arrayBuffer());let P=$.join(this.path,I);try{await g.promises.mkdir($.dirname(P),{recursive:!0}),await g.promises.writeFile(P,w)}catch(F){console.warn("An error occurred while writing the file to cache:",F)}}}async function K(H,...I){for(let S of I)try{let w=await H.match(S);if(w)return w}catch{continue}}async function se(H,I,S=!0,w={}){if(!N.env.allowLocalModels){if(w.local_files_only)throw Error("Invalid configuration detected: local models are disabled (`env.allowLocalModels=false`) but you have requested to only use local models (`local_files_only=true`).");if(!N.env.allowRemoteModels)throw Error("Invalid configuration detected: both local and remote models are disabled. Fix by setting `env.allowLocalModels` or `env.allowRemoteModels` to `true`.")}(0,Z.dispatchCallback)(w.progress_callback,{status:"initiate",name:H,file:I});let P;if(!P&&N.env.useBrowserCache){if(typeof caches>"u")throw Error("Browser cache is not available in this environment.");try{P=await caches.open("transformers-cache")}catch(Je){console.warn("An error occurred while opening the browser cache:",Je)}}if(!P&&N.env.useFSCache&&(P=new L(w.cache_dir??N.env.cacheDir)),!P&&N.env.useCustomCache){if(!N.env.customCache)throw Error("`env.useCustomCache=true`, but `env.customCache` is not defined.");if(!N.env.customCache.match||!N.env.customCache.put)throw new Error("`env.customCache` must be an object which implements the `match` and `put` functions of the Web Cache API. For more information, see https://developer.mozilla.org/en-US/docs/Web/API/Cache");P=N.env.customCache}const F=w.revision??"main";let ae=U(H,I),ie=U(N.env.localModelPath,ae),ye=U(N.env.remoteHost,N.env.remotePathTemplate.replaceAll("{model}",H).replaceAll("{revision}",encodeURIComponent(F)),I),ge=F==="main"?ae:U(H,F,I),re,Me=P instanceof L?ge:ye,pe=!1,Ce;P&&(Ce=await K(P,ie,Me));const Ae=Ce!==void 0;if(Ce===void 0){if(N.env.allowLocalModels)if(T(ae,["http:","https:"])){if(w.local_files_only)throw new Error(`\`local_files_only=true\`, but attempted to load a remote file from: ${ae}.`);if(!N.env.allowRemoteModels)throw new Error(`\`env.allowRemoteModels=false\`, but attempted to load a remote file from: ${ae}.`)}else try{Ce=await b(ie),re=ie}catch(je){console.warn(`Unable to load from local path "${ie}": "${je}"`)}if(Ce===void 0||Ce.status===404){if(w.local_files_only||!N.env.allowRemoteModels){if(S)throw Error(`\`local_files_only=true\` or \`env.allowRemoteModels=false\` and file was not found locally at "${ie}".`);return null}if(Ce=await b(ye),Ce.status!==200)return v(Ce.status,ye,S);re=Me}pe=P&&typeof Response<"u"&&Ce instanceof Response&&Ce.status===200}(0,Z.dispatchCallback)(w.progress_callback,{status:"download",name:H,file:I});let Pe;return w.progress_callback?Ae&&typeof navigator<"u"&&/firefox/i.test(navigator.userAgent)?(Pe=new Uint8Array(await Ce.arrayBuffer()),(0,Z.dispatchCallback)(w.progress_callback,{status:"progress",name:H,file:I,progress:100,loaded:Pe.length,total:Pe.length})):Pe=await V(Ce,Je=>{(0,Z.dispatchCallback)(w.progress_callback,{status:"progress",name:H,file:I,...Je})}):Pe=new Uint8Array(await Ce.arrayBuffer()),pe&&re&&await P.match(re)===void 0&&await P.put(re,new Response(Pe,{headers:Ce.headers})).catch(Je=>{console.warn(`Unable to add response to browser cache: ${Je}.`)}),(0,Z.dispatchCallback)(w.progress_callback,{status:"done",name:H,file:I}),Pe}async function oe(H,I,S=!0,w={}){let P=await se(H,I,S,w);if(P===null)return{};let ae=new TextDecoder("utf-8").decode(P);return JSON.parse(ae)}async function V(H,I){const S=H.headers.get("Content-Length");S===null&&console.warn("Unable to determine content-length from response headers. Will expand buffer when needed.");let w=parseInt(S??"0"),P=new Uint8Array(w),F=0;const ae=H.body.getReader();async function ie(){const{done:ye,value:ge}=await ae.read();if(ye)return;let re=F+ge.length;if(re>w){w=re;let pe=new Uint8Array(w);pe.set(P),P=pe}P.set(ge,F),F=re;const Me=F/w*100;return I({progress:Me,loaded:F,total:w}),ie()}return await ie(),P}function U(...H){return H=H.map((I,S)=>(S&&(I=I.replace(new RegExp("^/"),"")),S!==H.length-1&&(I=I.replace(new RegExp("/$"),"")),I)),H.join("/")}},"./src/utils/image.js":(ke,A,r)=>{r.r(A),r.d(A,{RawImage:()=>K,load_image:()=>se});var g=r("./src/utils/core.js"),$=r("./src/utils/hub.js"),N=r("./src/env.js"),Z=r("./src/utils/tensor.js"),j=r("?2b25");let y,T,b;const x=N.apis.IS_BROWSER_ENV||N.apis.IS_WEBWORKER_ENV;if(x)y=(oe,V)=>{if(!self.OffscreenCanvas)throw new Error("OffscreenCanvas not supported by this browser.");return new self.OffscreenCanvas(oe,V)},b=self.createImageBitmap,T=self.ImageData;else if(j)b=async oe=>{const U=(await oe.metadata()).channels,{data:H,info:I}=await oe.rotate().raw().toBuffer({resolveWithObject:!0}),S=new K(new Uint8ClampedArray(H),I.width,I.height,I.channels);return U!==void 0&&U!==I.channels&&S.convert(U),S};else throw new Error("Unable to load image processing library.");const v={0:"nearest",1:"lanczos",2:"bilinear",3:"bicubic",4:"box",5:"hamming"},L=new Map([["png","image/png"],["jpg","image/jpeg"],["jpeg","image/jpeg"],["gif","image/gif"]]);class K{constructor(V,U,H,I){this.data=V,this.width=U,this.height=H,this.channels=I}get size(){return[this.width,this.height]}static async read(V){if(V instanceof K)return V;if(typeof V=="string"||V instanceof URL)return await this.fromURL(V);throw new Error(`Unsupported input type: ${typeof V}`)}static fromCanvas(V){if(!x)throw new Error("fromCanvas() is only supported in browser environments.");const H=V.getContext("2d").getImageData(0,0,V.width,V.height).data;return new K(H,V.width,V.height,4)}static async fromURL(V){const U=await(0,$.getFile)(V);if(U.status!==200)throw new Error(`Unable to read image from "${V}" (${U.status} ${U.statusText})`);const H=await U.blob();return this.fromBlob(H)}static async fromBlob(V){if(x){const U=await b(V),H=y(U.width,U.height).getContext("2d");return H.drawImage(U,0,0),new this(H.getImageData(0,0,U.width,U.height).data,U.width,U.height,4)}else{const U=j(await V.arrayBuffer());return await b(U)}}static fromTensor(V,U="CHW"){if(V.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${V.dims.length} dimensions.`);if(U==="CHW")V=V.transpose(1,2,0);else if(U!=="HWC")throw new Error(`Unsupported channel format: ${U}`);if(!(V.data instanceof Uint8ClampedArray||V.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${V.type}`);switch(V.dims[2]){case 1:case 2:case 3:case 4:return new K(V.data,V.dims[1],V.dims[0],V.dims[2]);default:throw new Error(`Unsupported number of channels: ${V.dims[2]}`)}}grayscale(){if(this.channels===1)return this;const V=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let U=0,H=0;U=0?F=H:ie=-H,I>=0?ae=I:ye=-I,P.drawImage(w,F,ae,V,U,ie,ye,V,U),new K(P.getImageData(0,0,V,U).data,V,U,4).convert(S)}else{let S=this.toSharp();if(H>=0&&I>=0)S=S.extract({left:Math.floor(H),top:Math.floor(I),width:V,height:U});else if(H<=0&&I<=0){const w=Math.floor(-I),P=Math.floor(-H);S=S.extend({top:w,left:P,right:V-this.width-P,bottom:U-this.height-w})}else{let w=[0,0],P=0;I<0?(w[0]=Math.floor(-I),w[1]=U-this.height-w[0]):P=Math.floor(I);let F=[0,0],ae=0;H<0?(F[0]=Math.floor(-H),F[1]=V-this.width-F[0]):ae=Math.floor(H),S=S.extend({top:w[0],bottom:w[1],left:F[0],right:F[1]}).extract({left:ae,top:P,width:V,height:U})}return await b(S)}}async toBlob(V="image/png",U=1){if(!x)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:V,quality:U})}toTensor(V="CHW"){let U=new Z.Tensor("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(V!=="HWC")if(V==="CHW")U=U.permute(2,0,1);else throw new Error(`Unsupported channel format: ${V}`);return U}toCanvas(){if(!x)throw new Error("toCanvas() is only supported in browser environments.");const V=this.clone().rgba(),U=y(V.width,V.height),H=new T(V.data,V.width,V.height);return U.getContext("2d").putImageData(H,0,0),U}split(){const{data:V,width:U,height:H,channels:I}=this,S=V.constructor,w=V.length/I,P=Array.from({length:I},()=>new S(w));for(let F=0;Fnew K(F,U,H,1))}_update(V,U,H,I=null){return this.data=V,this.width=U,this.height=H,I!==null&&(this.channels=I),this}clone(){return new K(this.data.slice(),this.width,this.height,this.channels)}convert(V){if(this.channels===V)return this;switch(V){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(V){if(x){if(N.apis.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");const U=V.split(".").pop().toLowerCase(),H=L.get(U)??"image/png",I=await this.toBlob(H);(0,g.saveBlob)(V,I)}else{if(N.apis.IS_FS_AVAILABLE)return await this.toSharp().toFile(V);throw new Error("Unable to save the image because filesystem is disabled in this environment.")}}toSharp(){if(x)throw new Error("toSharp() is only supported in server-side environments.");return j(this.data,{raw:{width:this.width,height:this.height,channels:this.channels}})}}const se=K.read.bind(K)},"./src/utils/maths.js":(ke,A,r)=>{r.r(A),r.d(A,{FFT:()=>se,bankers_round:()=>U,cos_sim:()=>y,dot:()=>j,dynamic_time_warping:()=>H,interpolate_data:()=>g,log_softmax:()=>Z,magnitude:()=>T,max:()=>x,medianFilter:()=>oe,min:()=>b,permute_data:()=>$,round:()=>V,softmax:()=>N});function g(I,[S,w,P],[F,ae],ie="bilinear",ye=!1){const ge=ae/P,re=F/w,Me=new I.constructor(F*ae*S),pe=w*P,Ce=F*ae;for(let Ae=0;Ae=0;--ye)F[ye]=ge,P[ye]=S[w[ye]],ge*=P[ye];const ae=w.map((ye,ge)=>F[w.indexOf(ge)]),ie=new I.constructor(I.length);for(let ye=0;ye=0;--re)ge+=Me%S[re]*ae[re],Me=Math.floor(Me/S[re]);ie[ge]=I[ye]}return[ie,P]}function N(I){const S=x(I)[0],w=I.map(ae=>Math.exp(ae-S)),P=w.reduce((ae,ie)=>ae+ie,0);return w.map(ae=>ae/P)}function Z(I){const S=x(I)[0];let w=0;for(let ae=0;aeae-S-P)}function j(I,S){let w=0;for(let P=0;PS+w*w,0))}function b(I){if(I.length===0)throw Error("Array must not be empty");let S=I[0],w=0;for(let P=1;PS&&(S=I[P],w=P);return[S,w]}function v(I){return I>0&&(I&I-1)===0}class L{constructor(S){if(this.size=S|0,this.size<=1||!v(this.size))throw new Error("FFT size must be a power of two larger than 1");this._csize=S<<1,this.table=new Float64Array(this.size*2);for(let P=0;PP;P<<=1)++w;this._width=w%2===0?w-1:w,this._bitrev=new Int32Array(1<>>F&3)<>>1);for(let F=0;F>>1]=S[F];return P}toComplexArray(S,w){const P=w||this.createComplexArray();for(let F=0;F>>1],P[F+1]=0;return P}transform(S,w){if(S===w)throw new Error("Input and output buffers must be different");this._transform4(S,w,1)}realTransform(S,w){if(S===w)throw new Error("Input and output buffers must be different");this._realTransform4(S,w,1)}inverseTransform(S,w){if(S===w)throw new Error("Input and output buffers must be different");this._transform4(S,w,-1);for(let P=0;P>=2;ie>=2;ie>>=2){ye=F/ie<<1;const Ce=ye>>>2;for(ge=0;ge>>1,ie>>>1)}else for(ge=0,re=0;ge>>1,ie>>>1,P)}const pe=this.table;for(ie>>=2;ie>=2;ie>>=2){ye=F/ie<<1;const Ae=ye>>>1,Pe=Ae>>>1,Je=Pe>>>1;for(ge=0;ge>>1;for(let Ae=2;Ae>1;++Me){const pe=(Me+1-S)**2/2,Ce=Math.sqrt(ge**2+re**2)**pe,Ae=pe*Math.atan2(re,ge),Pe=2*Me;ae[Pe]=Ce*Math.cos(Ae),ae[Pe+1]=Ce*Math.sin(Ae),ie[Pe]=ae[Pe],ie[Pe+1]=-ae[Pe+1]}this._slicedChirpBuffer=ae.subarray(w,P),this._f=new L(F>>1),this._f.transform(this._chirpBuffer,ie)}_transform(S,w,P){const F=this._buffer1,ae=this._buffer2,ie=this._outBuffer1,ye=this._outBuffer2,ge=this._chirpBuffer,re=this._slicedChirpBuffer,Me=this._a;if(P)for(let pe=0;pe>1,Pe=w[Ae];F[pe]=Pe*re[pe],F[Ce]=Pe*re[Ce]}else for(let pe=0;pe=I.length&&(ge=2*(I.length-1)-ge),P[ie++]=I[ge]}P.sort(),w[ae]=P[F]}return w}function V(I,S){const w=Math.pow(10,S);return Math.round(I*w)/w}function U(I){const S=Math.round(I);return Math.abs(I)%1===.5?S%2===0?S:S-1:S}function H(I){const S=I.length,w=I[0].length,P=[S+1,w+1],F=Array.from({length:P[0]},()=>Array(P[1]).fill(1/0));F[0][0]=0;const ae=Array.from({length:P[0]},()=>Array(P[1]).fill(-1));for(let Me=1;Me0||ye>0;)switch(ge.push(ie-1),re.push(ye-1),ae[ie][ye]){case 0:--ie,--ye;break;case 1:--ie;break;case 2:--ye;break;default:throw new Error(`Internal error in dynamic time warping. Unexpected trace[${ie}, ${ye}]. Please file a bug report.`)}return ge.reverse(),re.reverse(),[ge,re]}},"./src/utils/tensor.js":(ke,A,r)=>{r.r(A),r.d(A,{Tensor:()=>j,cat:()=>w,full:()=>re,full_like:()=>Me,interpolate:()=>b,interpolate_4d:()=>x,layer_norm:()=>U,matmul:()=>v,mean:()=>ie,mean_pooling:()=>V,ones:()=>pe,ones_like:()=>Ce,permute:()=>T,quantize_embeddings:()=>je,rand:()=>Je,rfft:()=>L,slice:()=>oe,stack:()=>P,std_mean:()=>ae,topk:()=>K,zeros:()=>Ae,zeros_like:()=>Pe});var g=r("./src/utils/maths.js"),$=r("./src/backends/onnx.js"),N=r("./src/ops/registry.js");const Z=Object.freeze({float32:Float32Array,float16:Uint16Array,float64:Float64Array,string:Array,int8:Int8Array,uint8:Uint8Array,int16:Int16Array,uint16:Uint16Array,int32:Int32Array,uint32:Uint32Array,int64:BigInt64Array,uint64:BigUint64Array,bool:Uint8Array,uint4:Uint8Array,int4:Int8Array});class j{get dims(){return this.ort_tensor.dims}set dims(X){this.ort_tensor.dims=X}get type(){return this.ort_tensor.type}get data(){return this.ort_tensor.data}get size(){return this.ort_tensor.size}get location(){return this.ort_tensor.location}ort_tensor;constructor(...X){return(0,$.isONNXTensor)(X[0])?this.ort_tensor=X[0]:this.ort_tensor=new $.Tensor(X[0],X[1],X[2]),new Proxy(this,{get:(de,Ee)=>{if(typeof Ee=="string"){let Oe=Number(Ee);if(Number.isInteger(Oe))return de._getitem(Oe)}return de[Ee]},set:(de,Ee,Oe)=>de[Ee]=Oe})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){const[X,...de]=this.dims;if(de.length>0){const Ee=de.reduce((Oe,Xe)=>Oe*Xe);for(let Oe=0;Oe0){const Oe=Ee.reduce((Xe,ee)=>Xe*ee);return this._subarray(X,Oe,Ee)}else return new j(this.type,[this.data[X]],Ee)}indexOf(X){const de=this.data;for(let Ee=0;EeNe)throw new Error(`Invalid slice: ${ve}`);const Ue=[Math.max(Ke,0),Math.min(Ne,this.dims[te])];Ee.push(Ue),de.push(Ue[1]-Ue[0])}else throw new Error(`Invalid slice: ${ve}`)}const Oe=Ee.map(([te,ve])=>ve-te),Xe=Oe.reduce((te,ve)=>te*ve),ee=this.data,Ve=new ee.constructor(Xe),Re=this.stride();for(let te=0;te=0;--Ke){const Ue=Oe[Ke];ve+=(Ne%Ue+Ee[Ke][0])*Re[Ke],Ne=Math.floor(Ne/Ue)}Ve[te]=ee[ve]}return new j(this.type,Ve,de)}permute(...X){return T(this,X)}transpose(...X){return this.permute(...X)}sum(X=null,de=!1){return this.norm(1,X,de)}norm(X="fro",de=null,Ee=!1){if(X==="fro")X=2;else if(typeof X=="string")throw Error(`Unsupported norm: ${X}`);const Oe=this.data,Xe=(te,ve)=>te+ve**X;if(de===null){const te=Oe.reduce(Xe,0)**(1/X);return new j(this.type,[te],[])}const[ee,Ve,Re]=F(Xe,this,de,Ee);if(X!==1)for(let te=0;te=0;--Re){const Ke=this.dims[Re];if(Re!==de){const Ne=te%Ke;Ve+=Ne*ve,ve*=this.dims[Re]}te=Math.floor(te/Ke)}Oe[ee]/=Xe[Ve]}return this}normalize(X=2,de=1){return this.clone().normalize_(X,de)}stride(){return ye(this.dims)}squeeze(X=null){return new j(this.type,this.data,H(this.dims,X))}squeeze_(X=null){return this.dims=H(this.dims,X),this}unsqueeze(X=null){return new j(this.type,this.data,I(this.dims,X))}unsqueeze_(X=null){return this.dims=I(this.dims,X),this}flatten_(X=0,de=-1){de=(de+this.dims.length)%this.dims.length;let Ee=this.dims.slice(0,X),Oe=this.dims.slice(X,de+1),Xe=this.dims.slice(de+1);return this.dims=[...Ee,Oe.reduce((ee,Ve)=>ee*Ve,1),...Xe],this}flatten(X=0,de=-1){return this.clone().flatten_(X,de)}view(...X){let de=-1;for(let Oe=0;OeVe!==de?Xe*ee:Xe,1);X[de]=Ee.length/Oe}return new j(this.type,Ee,X)}neg_(){const X=this.data;for(let de=0;deX?1:0;return new j("bool",de,this.dims)}lt(X){const de=new Uint8Array(this.data.length),Ee=this.data;for(let Oe=0;OeMath.min(ee,Ve),this,X,de,1/0);return new j(Ee,Oe,Xe)}max(X=null,de=!1){if(X===null){const ee=(0,g.max)(this.data)[0];return new j(this.type,[ee],[])}const[Ee,Oe,Xe]=F((ee,Ve)=>Math.max(ee,Ve),this,X,de,-1/0);return new j(Ee,Oe,Xe)}argmin(X=null,de=!1){if(X!==null)throw new Error("`dim !== null` not yet implemented.");const Ee=(0,g.min)(this.data)[1];return new j("int64",[BigInt(Ee)],[])}argmax(X=null,de=!1){if(X!==null)throw new Error("`dim !== null` not yet implemented.");const Ee=(0,g.max)(this.data)[1];return new j("int64",[BigInt(Ee)],[])}to(X){if(this.type===X)return this;if(!Z.hasOwnProperty(X))throw new Error(`Unsupported type: ${X}`);let de;const Ee=["int64","uint64"].includes(this.type),Oe=["int64","uint64"].includes(X);return Ee&&!Oe?de=Number:!Ee&&Oe&&(de=BigInt),new j(X,Z[X].from(this.data,de),this.dims)}}function y(_e,X){const de=_e.length,Ee=X.reduce((Xe,ee)=>Xe*ee);if(de!==Ee)throw Error(`cannot reshape array of size ${de} into shape (${X})`);let Oe=_e;for(let Xe=X.length-1;Xe>=0;Xe--)Oe=Oe.reduce((ee,Ve)=>{let Re=ee[ee.length-1];return Re.lengthnew j("int64",_e,[_e.length]);async function oe(_e,X,de,Ee,Oe){return await(await N.TensorOpRegistry.slice)({x:_e,s:se(X),e:se(de),a:se(Ee),t:se(Oe??new Array(Ee.length).fill(1))})}function V(_e,X){const de=_e.data,Ee=X.data,Oe=[_e.dims[0],_e.dims[2]],Xe=new de.constructor(Oe[0]*Oe[1]),[ee,Ve,Re]=_e.dims;let te=0;for(let ve=0;vede!==1):typeof X=="number"?_e[X]===1&&_e.splice(X,1):Array.isArray(X)&&(_e=_e.filter((de,Ee)=>de!==1||!X.includes(Ee))),_e}function I(_e,X){return X=S(X,_e.length+1),_e=_e.slice(),_e.splice(X,0,1),_e}function S(_e,X,de=null,Ee=!0){if(Ee&&(_e<-X||_e>=X))throw new Error(`IndexError: index ${_e} is out of bounds for dimension${de===null?"":" "+de} with size ${X}`);return _e<0&&(_e=(_e%X+X)%X),_e}function w(_e,X=0){X=S(X,_e[0].dims.length);const de=_e[0].dims.slice();de[X]=_e.reduce((ee,Ve)=>ee+Ve.dims[X],0);const Ee=de.reduce((ee,Ve)=>ee*Ve,1),Oe=new _e[0].data.constructor(Ee),Xe=_e[0].type;if(X===0){let ee=0;for(const Ve of _e){const Re=Ve.data;Oe.set(Re,ee),ee+=Re.length}}else{let ee=0;for(let Ve=0;Ve<_e.length;++Ve){const{data:Re,dims:te}=_e[Ve];for(let ve=0;ve=0;--Ne){const Ze=te[Ne];let at=Ue%Ze;Ne===X&&(at+=ee),Ke+=at*ze,ze*=de[Ne],Ue=Math.floor(Ue/Ze)}Oe[Ke]=Re[ve]}ee+=te[X]}}return new j(Xe,Oe,de)}function P(_e,X=0){return w(_e.map(de=>de.unsqueeze(X)),X)}function F(_e,X,de=null,Ee=!1,Oe=null){const Xe=X.data,ee=X.dims;de=S(de,ee.length);const Ve=ee.slice();Ve[de]=1;const Re=new Xe.constructor(Xe.length/ee[de]);Oe!==null&&Re.fill(Oe);for(let te=0;te=0;--Ke){const ze=ee[Ke];if(Ke!==de){const Ze=Ne%ze;ve+=Ze*Ue,Ue*=Ve[Ke]}Ne=Math.floor(Ne/ze)}Re[ve]=_e(Re[ve],Xe[te],te,ve)}return Ee||Ve.splice(de,1),[X.type,Re,Ve]}function ae(_e,X=null,de=1,Ee=!1){const Oe=_e.data,Xe=_e.dims;if(X===null){const Ue=Oe.reduce((mt,lt)=>mt+lt,0)/Oe.length,ze=Math.sqrt(Oe.reduce((mt,lt)=>mt+(lt-Ue)**2,0)/(Oe.length-de)),Ze=new j(_e.type,[Ue],[]);return[new j(_e.type,[ze],[]),Ze]}X=S(X,Xe.length);const ee=ie(_e,X,Ee),Ve=ee.data,[Re,te,ve]=F((Ne,Ue,ze,Ze)=>Ne+(Ue-Ve[Ze])**2,_e,X,Ee);for(let Ne=0;Nete+ve,0);return new j(_e.type,[Re/Oe.length],[])}X=S(X,Ee.length);const[Xe,ee,Ve]=F((Re,te)=>Re+te,_e,X,de);if(Ee[X]!==1)for(let Re=0;Re=0;--de)X[de]=Ee,Ee*=_e[de];return X}function ge(_e,X,de,Ee){const Oe=_e.reduce((Xe,ee)=>Xe*ee,1);return new j(de,new Ee(Oe).fill(X),_e)}function re(_e,X){let de,Ee;if(typeof X=="number")de="float32",Ee=Float32Array;else if(typeof X=="bigint")de="int64",Ee=BigInt64Array;else if(typeof X=="boolean")de="bool",Ee=Uint8Array;else throw new Error(`Unsupported data type: ${typeof X}`);return ge(_e,X,de,Ee)}function Me(_e,X){return re(_e.dims,X)}function pe(_e){return ge(_e,1n,"int64",BigInt64Array)}function Ce(_e){return pe(_e.dims)}function Ae(_e){return ge(_e,0n,"int64",BigInt64Array)}function Pe(_e){return Ae(_e.dims)}function Je(_e){const X=_e.reduce((de,Ee)=>de*Ee,1);return new j("float32",Float32Array.from({length:X},()=>Math.random()),_e)}function je(_e,X){if(_e.dims.length!==2)throw new Error("The tensor must have 2 dimensions");if(_e.dims.at(-1)%8!==0)throw new Error("The last dimension of the tensor must be a multiple of 8");if(!["binary","ubinary"].includes(X))throw new Error("The precision must be either 'binary' or 'ubinary'");const de=X==="binary",Ee=de?"int8":"uint8",Oe=de?Int8Array:Uint8Array,Xe=_e.data,ee=new Oe(Xe.length/8);for(let Ve=0;Ve0?1:0,te=Math.floor(Ve/8),ve=Ve%8;ee[te]|=Re<<7-ve,de&&ve===0&&(ee[te]-=128)}return new j(Ee,ee,[_e.dims[0],_e.dims[1]/8])}}},af={};function cs(ke){var A=af[ke];if(A!==void 0)return A.exports;var r=af[ke]={exports:{}};return pf[ke](r,r.exports,cs),r.exports}cs.m=pf;(()=>{var ke=Object.getPrototypeOf?r=>Object.getPrototypeOf(r):r=>r.__proto__,A;cs.t=function(r,g){if(g&1&&(r=this(r)),g&8||typeof r=="object"&&r&&(g&4&&r.__esModule||g&16&&typeof r.then=="function"))return r;var $=Object.create(null);cs.r($);var N={};A=A||[null,ke({}),ke([]),ke(ke)];for(var Z=g&2&&r;typeof Z=="object"&&!~A.indexOf(Z);Z=ke(Z))Object.getOwnPropertyNames(Z).forEach(j=>N[j]=()=>r[j]);return N.default=()=>r,cs.d($,N),$}})();cs.d=(ke,A)=>{for(var r in A)cs.o(A,r)&&!cs.o(ke,r)&&Object.defineProperty(ke,r,{enumerable:!0,get:A[r]})};cs.o=(ke,A)=>Object.prototype.hasOwnProperty.call(ke,A);cs.r=ke=>{typeof Symbol<"u"&&Symbol.toStringTag&&Object.defineProperty(ke,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(ke,"__esModule",{value:!0})};(()=>{var ke;if(typeof import.meta.url=="string"&&(ke=import.meta.url),!ke)throw new Error("Automatic publicPath is not supported in this browser");ke=ke.replace(/#.*$/,"").replace(/\?.*$/,"").replace(/\/[^\/]+$/,"/"),cs.p=ke})();cs.b=new URL("./",import.meta.url);var d={};(()=>{/*!*****************************!*\ + !*** ./src/transformers.js ***! + \*****************************/cs.r(d),cs.d(d,{ASTFeatureExtractor:()=>b.ASTFeatureExtractor,ASTForAudioClassification:()=>r.ASTForAudioClassification,ASTModel:()=>r.ASTModel,ASTPreTrainedModel:()=>r.ASTPreTrainedModel,AlbertForMaskedLM:()=>r.AlbertForMaskedLM,AlbertForQuestionAnswering:()=>r.AlbertForQuestionAnswering,AlbertForSequenceClassification:()=>r.AlbertForSequenceClassification,AlbertModel:()=>r.AlbertModel,AlbertPreTrainedModel:()=>r.AlbertPreTrainedModel,AlbertTokenizer:()=>g.AlbertTokenizer,AudioClassificationPipeline:()=>A.AudioClassificationPipeline,AutoConfig:()=>$.AutoConfig,AutoFeatureExtractor:()=>x.AutoFeatureExtractor,AutoImageProcessor:()=>K.AutoImageProcessor,AutoModel:()=>r.AutoModel,AutoModelForAudioClassification:()=>r.AutoModelForAudioClassification,AutoModelForAudioFrameClassification:()=>r.AutoModelForAudioFrameClassification,AutoModelForCTC:()=>r.AutoModelForCTC,AutoModelForCausalLM:()=>r.AutoModelForCausalLM,AutoModelForDepthEstimation:()=>r.AutoModelForDepthEstimation,AutoModelForDocumentQuestionAnswering:()=>r.AutoModelForDocumentQuestionAnswering,AutoModelForImageClassification:()=>r.AutoModelForImageClassification,AutoModelForImageFeatureExtraction:()=>r.AutoModelForImageFeatureExtraction,AutoModelForImageMatting:()=>r.AutoModelForImageMatting,AutoModelForImageSegmentation:()=>r.AutoModelForImageSegmentation,AutoModelForImageToImage:()=>r.AutoModelForImageToImage,AutoModelForMaskGeneration:()=>r.AutoModelForMaskGeneration,AutoModelForMaskedLM:()=>r.AutoModelForMaskedLM,AutoModelForNormalEstimation:()=>r.AutoModelForNormalEstimation,AutoModelForObjectDetection:()=>r.AutoModelForObjectDetection,AutoModelForPoseEstimation:()=>r.AutoModelForPoseEstimation,AutoModelForQuestionAnswering:()=>r.AutoModelForQuestionAnswering,AutoModelForSemanticSegmentation:()=>r.AutoModelForSemanticSegmentation,AutoModelForSeq2SeqLM:()=>r.AutoModelForSeq2SeqLM,AutoModelForSequenceClassification:()=>r.AutoModelForSequenceClassification,AutoModelForSpeechSeq2Seq:()=>r.AutoModelForSpeechSeq2Seq,AutoModelForTextToSpectrogram:()=>r.AutoModelForTextToSpectrogram,AutoModelForTextToWaveform:()=>r.AutoModelForTextToWaveform,AutoModelForTokenClassification:()=>r.AutoModelForTokenClassification,AutoModelForUniversalSegmentation:()=>r.AutoModelForUniversalSegmentation,AutoModelForVision2Seq:()=>r.AutoModelForVision2Seq,AutoModelForXVector:()=>r.AutoModelForXVector,AutoModelForZeroShotObjectDetection:()=>r.AutoModelForZeroShotObjectDetection,AutoProcessor:()=>V.AutoProcessor,AutoTokenizer:()=>g.AutoTokenizer,AutomaticSpeechRecognitionPipeline:()=>A.AutomaticSpeechRecognitionPipeline,BartForConditionalGeneration:()=>r.BartForConditionalGeneration,BartForSequenceClassification:()=>r.BartForSequenceClassification,BartModel:()=>r.BartModel,BartPretrainedModel:()=>r.BartPretrainedModel,BartTokenizer:()=>g.BartTokenizer,BaseModelOutput:()=>r.BaseModelOutput,BaseStreamer:()=>U.BaseStreamer,BeitFeatureExtractor:()=>L.BeitFeatureExtractor,BeitForImageClassification:()=>r.BeitForImageClassification,BeitModel:()=>r.BeitModel,BeitPreTrainedModel:()=>r.BeitPreTrainedModel,BertForMaskedLM:()=>r.BertForMaskedLM,BertForQuestionAnswering:()=>r.BertForQuestionAnswering,BertForSequenceClassification:()=>r.BertForSequenceClassification,BertForTokenClassification:()=>r.BertForTokenClassification,BertModel:()=>r.BertModel,BertPreTrainedModel:()=>r.BertPreTrainedModel,BertTokenizer:()=>g.BertTokenizer,BitImageProcessor:()=>L.BitImageProcessor,BlenderbotForConditionalGeneration:()=>r.BlenderbotForConditionalGeneration,BlenderbotModel:()=>r.BlenderbotModel,BlenderbotPreTrainedModel:()=>r.BlenderbotPreTrainedModel,BlenderbotSmallForConditionalGeneration:()=>r.BlenderbotSmallForConditionalGeneration,BlenderbotSmallModel:()=>r.BlenderbotSmallModel,BlenderbotSmallPreTrainedModel:()=>r.BlenderbotSmallPreTrainedModel,BlenderbotSmallTokenizer:()=>g.BlenderbotSmallTokenizer,BlenderbotTokenizer:()=>g.BlenderbotTokenizer,BloomForCausalLM:()=>r.BloomForCausalLM,BloomModel:()=>r.BloomModel,BloomPreTrainedModel:()=>r.BloomPreTrainedModel,BloomTokenizer:()=>g.BloomTokenizer,CLIPFeatureExtractor:()=>L.CLIPFeatureExtractor,CLIPImageProcessor:()=>L.CLIPImageProcessor,CLIPModel:()=>r.CLIPModel,CLIPPreTrainedModel:()=>r.CLIPPreTrainedModel,CLIPSegForImageSegmentation:()=>r.CLIPSegForImageSegmentation,CLIPSegModel:()=>r.CLIPSegModel,CLIPSegPreTrainedModel:()=>r.CLIPSegPreTrainedModel,CLIPTextModel:()=>r.CLIPTextModel,CLIPTextModelWithProjection:()=>r.CLIPTextModelWithProjection,CLIPTokenizer:()=>g.CLIPTokenizer,CLIPVisionModel:()=>r.CLIPVisionModel,CLIPVisionModelWithProjection:()=>r.CLIPVisionModelWithProjection,CamembertForMaskedLM:()=>r.CamembertForMaskedLM,CamembertForQuestionAnswering:()=>r.CamembertForQuestionAnswering,CamembertForSequenceClassification:()=>r.CamembertForSequenceClassification,CamembertForTokenClassification:()=>r.CamembertForTokenClassification,CamembertModel:()=>r.CamembertModel,CamembertPreTrainedModel:()=>r.CamembertPreTrainedModel,CamembertTokenizer:()=>g.CamembertTokenizer,CausalLMOutput:()=>r.CausalLMOutput,CausalLMOutputWithPast:()=>r.CausalLMOutputWithPast,ChineseCLIPFeatureExtractor:()=>L.ChineseCLIPFeatureExtractor,ChineseCLIPModel:()=>r.ChineseCLIPModel,ChineseCLIPPreTrainedModel:()=>r.ChineseCLIPPreTrainedModel,ClapAudioModelWithProjection:()=>r.ClapAudioModelWithProjection,ClapFeatureExtractor:()=>b.ClapFeatureExtractor,ClapModel:()=>r.ClapModel,ClapPreTrainedModel:()=>r.ClapPreTrainedModel,ClapTextModelWithProjection:()=>r.ClapTextModelWithProjection,ClassifierFreeGuidanceLogitsProcessor:()=>I.ClassifierFreeGuidanceLogitsProcessor,CodeGenForCausalLM:()=>r.CodeGenForCausalLM,CodeGenModel:()=>r.CodeGenModel,CodeGenPreTrainedModel:()=>r.CodeGenPreTrainedModel,CodeGenTokenizer:()=>g.CodeGenTokenizer,CodeLlamaTokenizer:()=>g.CodeLlamaTokenizer,CohereForCausalLM:()=>r.CohereForCausalLM,CohereModel:()=>r.CohereModel,CoherePreTrainedModel:()=>r.CoherePreTrainedModel,CohereTokenizer:()=>g.CohereTokenizer,ConvBertForMaskedLM:()=>r.ConvBertForMaskedLM,ConvBertForQuestionAnswering:()=>r.ConvBertForQuestionAnswering,ConvBertForSequenceClassification:()=>r.ConvBertForSequenceClassification,ConvBertForTokenClassification:()=>r.ConvBertForTokenClassification,ConvBertModel:()=>r.ConvBertModel,ConvBertPreTrainedModel:()=>r.ConvBertPreTrainedModel,ConvBertTokenizer:()=>g.ConvBertTokenizer,ConvNextFeatureExtractor:()=>L.ConvNextFeatureExtractor,ConvNextForImageClassification:()=>r.ConvNextForImageClassification,ConvNextImageProcessor:()=>L.ConvNextImageProcessor,ConvNextModel:()=>r.ConvNextModel,ConvNextPreTrainedModel:()=>r.ConvNextPreTrainedModel,ConvNextV2ForImageClassification:()=>r.ConvNextV2ForImageClassification,ConvNextV2Model:()=>r.ConvNextV2Model,ConvNextV2PreTrainedModel:()=>r.ConvNextV2PreTrainedModel,DPTFeatureExtractor:()=>L.DPTFeatureExtractor,DPTForDepthEstimation:()=>r.DPTForDepthEstimation,DPTImageProcessor:()=>L.DPTImageProcessor,DPTModel:()=>r.DPTModel,DPTPreTrainedModel:()=>r.DPTPreTrainedModel,DebertaForMaskedLM:()=>r.DebertaForMaskedLM,DebertaForQuestionAnswering:()=>r.DebertaForQuestionAnswering,DebertaForSequenceClassification:()=>r.DebertaForSequenceClassification,DebertaForTokenClassification:()=>r.DebertaForTokenClassification,DebertaModel:()=>r.DebertaModel,DebertaPreTrainedModel:()=>r.DebertaPreTrainedModel,DebertaTokenizer:()=>g.DebertaTokenizer,DebertaV2ForMaskedLM:()=>r.DebertaV2ForMaskedLM,DebertaV2ForQuestionAnswering:()=>r.DebertaV2ForQuestionAnswering,DebertaV2ForSequenceClassification:()=>r.DebertaV2ForSequenceClassification,DebertaV2ForTokenClassification:()=>r.DebertaV2ForTokenClassification,DebertaV2Model:()=>r.DebertaV2Model,DebertaV2PreTrainedModel:()=>r.DebertaV2PreTrainedModel,DebertaV2Tokenizer:()=>g.DebertaV2Tokenizer,DecisionTransformerModel:()=>r.DecisionTransformerModel,DecisionTransformerPreTrainedModel:()=>r.DecisionTransformerPreTrainedModel,DeiTFeatureExtractor:()=>L.DeiTFeatureExtractor,DeiTForImageClassification:()=>r.DeiTForImageClassification,DeiTImageProcessor:()=>L.DeiTImageProcessor,DeiTModel:()=>r.DeiTModel,DeiTPreTrainedModel:()=>r.DeiTPreTrainedModel,DepthAnythingForDepthEstimation:()=>r.DepthAnythingForDepthEstimation,DepthAnythingPreTrainedModel:()=>r.DepthAnythingPreTrainedModel,DepthEstimationPipeline:()=>A.DepthEstimationPipeline,DepthProForDepthEstimation:()=>r.DepthProForDepthEstimation,DepthProPreTrainedModel:()=>r.DepthProPreTrainedModel,DetrFeatureExtractor:()=>L.DetrFeatureExtractor,DetrForObjectDetection:()=>r.DetrForObjectDetection,DetrForSegmentation:()=>r.DetrForSegmentation,DetrImageProcessor:()=>L.DetrImageProcessor,DetrModel:()=>r.DetrModel,DetrObjectDetectionOutput:()=>r.DetrObjectDetectionOutput,DetrPreTrainedModel:()=>r.DetrPreTrainedModel,DetrSegmentationOutput:()=>r.DetrSegmentationOutput,Dinov2ForImageClassification:()=>r.Dinov2ForImageClassification,Dinov2Model:()=>r.Dinov2Model,Dinov2PreTrainedModel:()=>r.Dinov2PreTrainedModel,Dinov2WithRegistersForImageClassification:()=>r.Dinov2WithRegistersForImageClassification,Dinov2WithRegistersModel:()=>r.Dinov2WithRegistersModel,Dinov2WithRegistersPreTrainedModel:()=>r.Dinov2WithRegistersPreTrainedModel,DistilBertForMaskedLM:()=>r.DistilBertForMaskedLM,DistilBertForQuestionAnswering:()=>r.DistilBertForQuestionAnswering,DistilBertForSequenceClassification:()=>r.DistilBertForSequenceClassification,DistilBertForTokenClassification:()=>r.DistilBertForTokenClassification,DistilBertModel:()=>r.DistilBertModel,DistilBertPreTrainedModel:()=>r.DistilBertPreTrainedModel,DistilBertTokenizer:()=>g.DistilBertTokenizer,DocumentQuestionAnsweringPipeline:()=>A.DocumentQuestionAnsweringPipeline,DonutFeatureExtractor:()=>L.DonutFeatureExtractor,DonutImageProcessor:()=>L.DonutImageProcessor,DonutSwinModel:()=>r.DonutSwinModel,DonutSwinPreTrainedModel:()=>r.DonutSwinPreTrainedModel,EfficientNetForImageClassification:()=>r.EfficientNetForImageClassification,EfficientNetImageProcessor:()=>L.EfficientNetImageProcessor,EfficientNetModel:()=>r.EfficientNetModel,EfficientNetPreTrainedModel:()=>r.EfficientNetPreTrainedModel,ElectraForMaskedLM:()=>r.ElectraForMaskedLM,ElectraForQuestionAnswering:()=>r.ElectraForQuestionAnswering,ElectraForSequenceClassification:()=>r.ElectraForSequenceClassification,ElectraForTokenClassification:()=>r.ElectraForTokenClassification,ElectraModel:()=>r.ElectraModel,ElectraPreTrainedModel:()=>r.ElectraPreTrainedModel,ElectraTokenizer:()=>g.ElectraTokenizer,EosTokenCriteria:()=>H.EosTokenCriteria,EsmForMaskedLM:()=>r.EsmForMaskedLM,EsmForSequenceClassification:()=>r.EsmForSequenceClassification,EsmForTokenClassification:()=>r.EsmForTokenClassification,EsmModel:()=>r.EsmModel,EsmPreTrainedModel:()=>r.EsmPreTrainedModel,EsmTokenizer:()=>g.EsmTokenizer,ExaoneForCausalLM:()=>r.ExaoneForCausalLM,ExaoneModel:()=>r.ExaoneModel,ExaonePreTrainedModel:()=>r.ExaonePreTrainedModel,FFT:()=>y.FFT,FalconForCausalLM:()=>r.FalconForCausalLM,FalconModel:()=>r.FalconModel,FalconPreTrainedModel:()=>r.FalconPreTrainedModel,FalconTokenizer:()=>g.FalconTokenizer,FastViTForImageClassification:()=>r.FastViTForImageClassification,FastViTModel:()=>r.FastViTModel,FastViTPreTrainedModel:()=>r.FastViTPreTrainedModel,FeatureExtractionPipeline:()=>A.FeatureExtractionPipeline,FeatureExtractor:()=>T.FeatureExtractor,FillMaskPipeline:()=>A.FillMaskPipeline,Florence2ForConditionalGeneration:()=>r.Florence2ForConditionalGeneration,Florence2PreTrainedModel:()=>r.Florence2PreTrainedModel,Florence2Processor:()=>oe.Florence2Processor,ForcedBOSTokenLogitsProcessor:()=>I.ForcedBOSTokenLogitsProcessor,ForcedEOSTokenLogitsProcessor:()=>I.ForcedEOSTokenLogitsProcessor,GLPNFeatureExtractor:()=>L.GLPNFeatureExtractor,GLPNForDepthEstimation:()=>r.GLPNForDepthEstimation,GLPNModel:()=>r.GLPNModel,GLPNPreTrainedModel:()=>r.GLPNPreTrainedModel,GPT2LMHeadModel:()=>r.GPT2LMHeadModel,GPT2Model:()=>r.GPT2Model,GPT2PreTrainedModel:()=>r.GPT2PreTrainedModel,GPT2Tokenizer:()=>g.GPT2Tokenizer,GPTBigCodeForCausalLM:()=>r.GPTBigCodeForCausalLM,GPTBigCodeModel:()=>r.GPTBigCodeModel,GPTBigCodePreTrainedModel:()=>r.GPTBigCodePreTrainedModel,GPTJForCausalLM:()=>r.GPTJForCausalLM,GPTJModel:()=>r.GPTJModel,GPTJPreTrainedModel:()=>r.GPTJPreTrainedModel,GPTNeoForCausalLM:()=>r.GPTNeoForCausalLM,GPTNeoModel:()=>r.GPTNeoModel,GPTNeoPreTrainedModel:()=>r.GPTNeoPreTrainedModel,GPTNeoXForCausalLM:()=>r.GPTNeoXForCausalLM,GPTNeoXModel:()=>r.GPTNeoXModel,GPTNeoXPreTrainedModel:()=>r.GPTNeoXPreTrainedModel,GPTNeoXTokenizer:()=>g.GPTNeoXTokenizer,Gemma2ForCausalLM:()=>r.Gemma2ForCausalLM,Gemma2Model:()=>r.Gemma2Model,Gemma2PreTrainedModel:()=>r.Gemma2PreTrainedModel,GemmaForCausalLM:()=>r.GemmaForCausalLM,GemmaModel:()=>r.GemmaModel,GemmaPreTrainedModel:()=>r.GemmaPreTrainedModel,GemmaTokenizer:()=>g.GemmaTokenizer,GraniteForCausalLM:()=>r.GraniteForCausalLM,GraniteModel:()=>r.GraniteModel,GranitePreTrainedModel:()=>r.GranitePreTrainedModel,Grok1Tokenizer:()=>g.Grok1Tokenizer,GroundingDinoForObjectDetection:()=>r.GroundingDinoForObjectDetection,GroundingDinoImageProcessor:()=>L.GroundingDinoImageProcessor,GroundingDinoPreTrainedModel:()=>r.GroundingDinoPreTrainedModel,GroundingDinoProcessor:()=>oe.GroundingDinoProcessor,GroupViTModel:()=>r.GroupViTModel,GroupViTPreTrainedModel:()=>r.GroupViTPreTrainedModel,HerbertTokenizer:()=>g.HerbertTokenizer,HieraForImageClassification:()=>r.HieraForImageClassification,HieraModel:()=>r.HieraModel,HieraPreTrainedModel:()=>r.HieraPreTrainedModel,HubertForCTC:()=>r.HubertForCTC,HubertForSequenceClassification:()=>r.HubertForSequenceClassification,HubertModel:()=>r.HubertModel,HubertPreTrainedModel:()=>r.HubertPreTrainedModel,IJepaForImageClassification:()=>r.IJepaForImageClassification,IJepaModel:()=>r.IJepaModel,IJepaPreTrainedModel:()=>r.IJepaPreTrainedModel,Idefics3ForConditionalGeneration:()=>r.Idefics3ForConditionalGeneration,Idefics3ImageProcessor:()=>L.Idefics3ImageProcessor,Idefics3PreTrainedModel:()=>r.Idefics3PreTrainedModel,Idefics3Processor:()=>oe.Idefics3Processor,ImageClassificationPipeline:()=>A.ImageClassificationPipeline,ImageFeatureExtractionPipeline:()=>A.ImageFeatureExtractionPipeline,ImageFeatureExtractor:()=>b.ImageFeatureExtractor,ImageMattingOutput:()=>r.ImageMattingOutput,ImageProcessor:()=>v.ImageProcessor,ImageSegmentationPipeline:()=>A.ImageSegmentationPipeline,ImageToImagePipeline:()=>A.ImageToImagePipeline,ImageToTextPipeline:()=>A.ImageToTextPipeline,InterruptableStoppingCriteria:()=>H.InterruptableStoppingCriteria,JAISLMHeadModel:()=>r.JAISLMHeadModel,JAISModel:()=>r.JAISModel,JAISPreTrainedModel:()=>r.JAISPreTrainedModel,JinaCLIPImageProcessor:()=>L.JinaCLIPImageProcessor,JinaCLIPModel:()=>r.JinaCLIPModel,JinaCLIPPreTrainedModel:()=>r.JinaCLIPPreTrainedModel,JinaCLIPProcessor:()=>oe.JinaCLIPProcessor,JinaCLIPTextModel:()=>r.JinaCLIPTextModel,JinaCLIPVisionModel:()=>r.JinaCLIPVisionModel,LlamaForCausalLM:()=>r.LlamaForCausalLM,LlamaModel:()=>r.LlamaModel,LlamaPreTrainedModel:()=>r.LlamaPreTrainedModel,LlamaTokenizer:()=>g.LlamaTokenizer,LlavaForConditionalGeneration:()=>r.LlavaForConditionalGeneration,LlavaOnevisionForConditionalGeneration:()=>r.LlavaOnevisionForConditionalGeneration,LlavaOnevisionImageProcessor:()=>L.LlavaOnevisionImageProcessor,LlavaPreTrainedModel:()=>r.LlavaPreTrainedModel,LogitsProcessor:()=>I.LogitsProcessor,LogitsProcessorList:()=>I.LogitsProcessorList,LogitsWarper:()=>I.LogitsWarper,LongT5ForConditionalGeneration:()=>r.LongT5ForConditionalGeneration,LongT5Model:()=>r.LongT5Model,LongT5PreTrainedModel:()=>r.LongT5PreTrainedModel,M2M100ForConditionalGeneration:()=>r.M2M100ForConditionalGeneration,M2M100Model:()=>r.M2M100Model,M2M100PreTrainedModel:()=>r.M2M100PreTrainedModel,M2M100Tokenizer:()=>g.M2M100Tokenizer,MBart50Tokenizer:()=>g.MBart50Tokenizer,MBartForCausalLM:()=>r.MBartForCausalLM,MBartForConditionalGeneration:()=>r.MBartForConditionalGeneration,MBartForSequenceClassification:()=>r.MBartForSequenceClassification,MBartModel:()=>r.MBartModel,MBartPreTrainedModel:()=>r.MBartPreTrainedModel,MBartTokenizer:()=>g.MBartTokenizer,MPNetForMaskedLM:()=>r.MPNetForMaskedLM,MPNetForQuestionAnswering:()=>r.MPNetForQuestionAnswering,MPNetForSequenceClassification:()=>r.MPNetForSequenceClassification,MPNetForTokenClassification:()=>r.MPNetForTokenClassification,MPNetModel:()=>r.MPNetModel,MPNetPreTrainedModel:()=>r.MPNetPreTrainedModel,MPNetTokenizer:()=>g.MPNetTokenizer,MT5ForConditionalGeneration:()=>r.MT5ForConditionalGeneration,MT5Model:()=>r.MT5Model,MT5PreTrainedModel:()=>r.MT5PreTrainedModel,MarianMTModel:()=>r.MarianMTModel,MarianModel:()=>r.MarianModel,MarianPreTrainedModel:()=>r.MarianPreTrainedModel,MarianTokenizer:()=>g.MarianTokenizer,Mask2FormerImageProcessor:()=>L.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>L.MaskFormerFeatureExtractor,MaskFormerForInstanceSegmentation:()=>r.MaskFormerForInstanceSegmentation,MaskFormerImageProcessor:()=>L.MaskFormerImageProcessor,MaskFormerModel:()=>r.MaskFormerModel,MaskFormerPreTrainedModel:()=>r.MaskFormerPreTrainedModel,MaskedLMOutput:()=>r.MaskedLMOutput,MaxLengthCriteria:()=>H.MaxLengthCriteria,MgpstrForSceneTextRecognition:()=>r.MgpstrForSceneTextRecognition,MgpstrModelOutput:()=>r.MgpstrModelOutput,MgpstrPreTrainedModel:()=>r.MgpstrPreTrainedModel,MgpstrProcessor:()=>oe.MgpstrProcessor,MgpstrTokenizer:()=>g.MgpstrTokenizer,MinLengthLogitsProcessor:()=>I.MinLengthLogitsProcessor,MinNewTokensLengthLogitsProcessor:()=>I.MinNewTokensLengthLogitsProcessor,MistralForCausalLM:()=>r.MistralForCausalLM,MistralModel:()=>r.MistralModel,MistralPreTrainedModel:()=>r.MistralPreTrainedModel,MobileBertForMaskedLM:()=>r.MobileBertForMaskedLM,MobileBertForQuestionAnswering:()=>r.MobileBertForQuestionAnswering,MobileBertForSequenceClassification:()=>r.MobileBertForSequenceClassification,MobileBertModel:()=>r.MobileBertModel,MobileBertPreTrainedModel:()=>r.MobileBertPreTrainedModel,MobileBertTokenizer:()=>g.MobileBertTokenizer,MobileLLMForCausalLM:()=>r.MobileLLMForCausalLM,MobileLLMModel:()=>r.MobileLLMModel,MobileLLMPreTrainedModel:()=>r.MobileLLMPreTrainedModel,MobileNetV1FeatureExtractor:()=>L.MobileNetV1FeatureExtractor,MobileNetV1ForImageClassification:()=>r.MobileNetV1ForImageClassification,MobileNetV1ImageProcessor:()=>L.MobileNetV1ImageProcessor,MobileNetV1Model:()=>r.MobileNetV1Model,MobileNetV1PreTrainedModel:()=>r.MobileNetV1PreTrainedModel,MobileNetV2FeatureExtractor:()=>L.MobileNetV2FeatureExtractor,MobileNetV2ForImageClassification:()=>r.MobileNetV2ForImageClassification,MobileNetV2ImageProcessor:()=>L.MobileNetV2ImageProcessor,MobileNetV2Model:()=>r.MobileNetV2Model,MobileNetV2PreTrainedModel:()=>r.MobileNetV2PreTrainedModel,MobileNetV3FeatureExtractor:()=>L.MobileNetV3FeatureExtractor,MobileNetV3ForImageClassification:()=>r.MobileNetV3ForImageClassification,MobileNetV3ImageProcessor:()=>L.MobileNetV3ImageProcessor,MobileNetV3Model:()=>r.MobileNetV3Model,MobileNetV3PreTrainedModel:()=>r.MobileNetV3PreTrainedModel,MobileNetV4FeatureExtractor:()=>L.MobileNetV4FeatureExtractor,MobileNetV4ForImageClassification:()=>r.MobileNetV4ForImageClassification,MobileNetV4ImageProcessor:()=>L.MobileNetV4ImageProcessor,MobileNetV4Model:()=>r.MobileNetV4Model,MobileNetV4PreTrainedModel:()=>r.MobileNetV4PreTrainedModel,MobileViTFeatureExtractor:()=>L.MobileViTFeatureExtractor,MobileViTForImageClassification:()=>r.MobileViTForImageClassification,MobileViTImageProcessor:()=>L.MobileViTImageProcessor,MobileViTModel:()=>r.MobileViTModel,MobileViTPreTrainedModel:()=>r.MobileViTPreTrainedModel,MobileViTV2ForImageClassification:()=>r.MobileViTV2ForImageClassification,MobileViTV2Model:()=>r.MobileViTV2Model,MobileViTV2PreTrainedModel:()=>r.MobileViTV2PreTrainedModel,ModelOutput:()=>r.ModelOutput,ModernBertForMaskedLM:()=>r.ModernBertForMaskedLM,ModernBertForSequenceClassification:()=>r.ModernBertForSequenceClassification,ModernBertForTokenClassification:()=>r.ModernBertForTokenClassification,ModernBertModel:()=>r.ModernBertModel,ModernBertPreTrainedModel:()=>r.ModernBertPreTrainedModel,Moondream1ForConditionalGeneration:()=>r.Moondream1ForConditionalGeneration,MoonshineFeatureExtractor:()=>b.MoonshineFeatureExtractor,MoonshineForConditionalGeneration:()=>r.MoonshineForConditionalGeneration,MoonshineModel:()=>r.MoonshineModel,MoonshinePreTrainedModel:()=>r.MoonshinePreTrainedModel,MoonshineProcessor:()=>oe.MoonshineProcessor,MptForCausalLM:()=>r.MptForCausalLM,MptModel:()=>r.MptModel,MptPreTrainedModel:()=>r.MptPreTrainedModel,MultiModalityCausalLM:()=>r.MultiModalityCausalLM,MultiModalityPreTrainedModel:()=>r.MultiModalityPreTrainedModel,MusicgenForCausalLM:()=>r.MusicgenForCausalLM,MusicgenForConditionalGeneration:()=>r.MusicgenForConditionalGeneration,MusicgenModel:()=>r.MusicgenModel,MusicgenPreTrainedModel:()=>r.MusicgenPreTrainedModel,NllbTokenizer:()=>g.NllbTokenizer,NoBadWordsLogitsProcessor:()=>I.NoBadWordsLogitsProcessor,NoRepeatNGramLogitsProcessor:()=>I.NoRepeatNGramLogitsProcessor,NomicBertModel:()=>r.NomicBertModel,NomicBertPreTrainedModel:()=>r.NomicBertPreTrainedModel,NougatImageProcessor:()=>L.NougatImageProcessor,NougatTokenizer:()=>g.NougatTokenizer,OPTForCausalLM:()=>r.OPTForCausalLM,OPTModel:()=>r.OPTModel,OPTPreTrainedModel:()=>r.OPTPreTrainedModel,ObjectDetectionPipeline:()=>A.ObjectDetectionPipeline,Olmo2ForCausalLM:()=>r.Olmo2ForCausalLM,Olmo2Model:()=>r.Olmo2Model,Olmo2PreTrainedModel:()=>r.Olmo2PreTrainedModel,OlmoForCausalLM:()=>r.OlmoForCausalLM,OlmoModel:()=>r.OlmoModel,OlmoPreTrainedModel:()=>r.OlmoPreTrainedModel,OpenELMForCausalLM:()=>r.OpenELMForCausalLM,OpenELMModel:()=>r.OpenELMModel,OpenELMPreTrainedModel:()=>r.OpenELMPreTrainedModel,OwlViTFeatureExtractor:()=>L.OwlViTFeatureExtractor,OwlViTForObjectDetection:()=>r.OwlViTForObjectDetection,OwlViTImageProcessor:()=>L.OwlViTImageProcessor,OwlViTModel:()=>r.OwlViTModel,OwlViTPreTrainedModel:()=>r.OwlViTPreTrainedModel,OwlViTProcessor:()=>oe.OwlViTProcessor,Owlv2ForObjectDetection:()=>r.Owlv2ForObjectDetection,Owlv2ImageProcessor:()=>L.Owlv2ImageProcessor,Owlv2Model:()=>r.Owlv2Model,Owlv2PreTrainedModel:()=>r.Owlv2PreTrainedModel,PaliGemmaForConditionalGeneration:()=>r.PaliGemmaForConditionalGeneration,PaliGemmaPreTrainedModel:()=>r.PaliGemmaPreTrainedModel,PaliGemmaProcessor:()=>oe.PaliGemmaProcessor,PatchTSMixerForPrediction:()=>r.PatchTSMixerForPrediction,PatchTSMixerModel:()=>r.PatchTSMixerModel,PatchTSMixerPreTrainedModel:()=>r.PatchTSMixerPreTrainedModel,PatchTSTForPrediction:()=>r.PatchTSTForPrediction,PatchTSTModel:()=>r.PatchTSTModel,PatchTSTPreTrainedModel:()=>r.PatchTSTPreTrainedModel,Phi3ForCausalLM:()=>r.Phi3ForCausalLM,Phi3Model:()=>r.Phi3Model,Phi3PreTrainedModel:()=>r.Phi3PreTrainedModel,Phi3VForCausalLM:()=>r.Phi3VForCausalLM,Phi3VImageProcessor:()=>L.Phi3VImageProcessor,Phi3VPreTrainedModel:()=>r.Phi3VPreTrainedModel,Phi3VProcessor:()=>oe.Phi3VProcessor,PhiForCausalLM:()=>r.PhiForCausalLM,PhiModel:()=>r.PhiModel,PhiPreTrainedModel:()=>r.PhiPreTrainedModel,Pipeline:()=>A.Pipeline,PreTrainedModel:()=>r.PreTrainedModel,PreTrainedTokenizer:()=>g.PreTrainedTokenizer,PretrainedConfig:()=>$.PretrainedConfig,PretrainedMixin:()=>r.PretrainedMixin,Processor:()=>se.Processor,PvtForImageClassification:()=>r.PvtForImageClassification,PvtImageProcessor:()=>L.PvtImageProcessor,PvtModel:()=>r.PvtModel,PvtPreTrainedModel:()=>r.PvtPreTrainedModel,PyAnnoteFeatureExtractor:()=>b.PyAnnoteFeatureExtractor,PyAnnoteForAudioFrameClassification:()=>r.PyAnnoteForAudioFrameClassification,PyAnnoteModel:()=>r.PyAnnoteModel,PyAnnotePreTrainedModel:()=>r.PyAnnotePreTrainedModel,PyAnnoteProcessor:()=>oe.PyAnnoteProcessor,QuestionAnsweringModelOutput:()=>r.QuestionAnsweringModelOutput,QuestionAnsweringPipeline:()=>A.QuestionAnsweringPipeline,Qwen2ForCausalLM:()=>r.Qwen2ForCausalLM,Qwen2Model:()=>r.Qwen2Model,Qwen2PreTrainedModel:()=>r.Qwen2PreTrainedModel,Qwen2Tokenizer:()=>g.Qwen2Tokenizer,Qwen2VLForConditionalGeneration:()=>r.Qwen2VLForConditionalGeneration,Qwen2VLImageProcessor:()=>L.Qwen2VLImageProcessor,Qwen2VLPreTrainedModel:()=>r.Qwen2VLPreTrainedModel,Qwen2VLProcessor:()=>oe.Qwen2VLProcessor,RTDetrForObjectDetection:()=>r.RTDetrForObjectDetection,RTDetrImageProcessor:()=>L.RTDetrImageProcessor,RTDetrModel:()=>r.RTDetrModel,RTDetrObjectDetectionOutput:()=>r.RTDetrObjectDetectionOutput,RTDetrPreTrainedModel:()=>r.RTDetrPreTrainedModel,RawAudio:()=>N.RawAudio,RawImage:()=>Z.RawImage,RepetitionPenaltyLogitsProcessor:()=>I.RepetitionPenaltyLogitsProcessor,ResNetForImageClassification:()=>r.ResNetForImageClassification,ResNetModel:()=>r.ResNetModel,ResNetPreTrainedModel:()=>r.ResNetPreTrainedModel,RoFormerForMaskedLM:()=>r.RoFormerForMaskedLM,RoFormerForQuestionAnswering:()=>r.RoFormerForQuestionAnswering,RoFormerForSequenceClassification:()=>r.RoFormerForSequenceClassification,RoFormerForTokenClassification:()=>r.RoFormerForTokenClassification,RoFormerModel:()=>r.RoFormerModel,RoFormerPreTrainedModel:()=>r.RoFormerPreTrainedModel,RoFormerTokenizer:()=>g.RoFormerTokenizer,RobertaForMaskedLM:()=>r.RobertaForMaskedLM,RobertaForQuestionAnswering:()=>r.RobertaForQuestionAnswering,RobertaForSequenceClassification:()=>r.RobertaForSequenceClassification,RobertaForTokenClassification:()=>r.RobertaForTokenClassification,RobertaModel:()=>r.RobertaModel,RobertaPreTrainedModel:()=>r.RobertaPreTrainedModel,RobertaTokenizer:()=>g.RobertaTokenizer,SamImageProcessor:()=>L.SamImageProcessor,SamImageSegmentationOutput:()=>r.SamImageSegmentationOutput,SamModel:()=>r.SamModel,SamPreTrainedModel:()=>r.SamPreTrainedModel,SamProcessor:()=>oe.SamProcessor,SapiensForDepthEstimation:()=>r.SapiensForDepthEstimation,SapiensForNormalEstimation:()=>r.SapiensForNormalEstimation,SapiensForSemanticSegmentation:()=>r.SapiensForSemanticSegmentation,SapiensPreTrainedModel:()=>r.SapiensPreTrainedModel,SeamlessM4TFeatureExtractor:()=>b.SeamlessM4TFeatureExtractor,SegformerFeatureExtractor:()=>L.SegformerFeatureExtractor,SegformerForImageClassification:()=>r.SegformerForImageClassification,SegformerForSemanticSegmentation:()=>r.SegformerForSemanticSegmentation,SegformerImageProcessor:()=>L.SegformerImageProcessor,SegformerModel:()=>r.SegformerModel,SegformerPreTrainedModel:()=>r.SegformerPreTrainedModel,Seq2SeqLMOutput:()=>r.Seq2SeqLMOutput,SequenceClassifierOutput:()=>r.SequenceClassifierOutput,SiglipImageProcessor:()=>L.SiglipImageProcessor,SiglipModel:()=>r.SiglipModel,SiglipPreTrainedModel:()=>r.SiglipPreTrainedModel,SiglipTextModel:()=>r.SiglipTextModel,SiglipTokenizer:()=>g.SiglipTokenizer,SiglipVisionModel:()=>r.SiglipVisionModel,SpeechT5FeatureExtractor:()=>b.SpeechT5FeatureExtractor,SpeechT5ForSpeechToText:()=>r.SpeechT5ForSpeechToText,SpeechT5ForTextToSpeech:()=>r.SpeechT5ForTextToSpeech,SpeechT5HifiGan:()=>r.SpeechT5HifiGan,SpeechT5Model:()=>r.SpeechT5Model,SpeechT5PreTrainedModel:()=>r.SpeechT5PreTrainedModel,SpeechT5Processor:()=>oe.SpeechT5Processor,SpeechT5Tokenizer:()=>g.SpeechT5Tokenizer,SqueezeBertForMaskedLM:()=>r.SqueezeBertForMaskedLM,SqueezeBertForQuestionAnswering:()=>r.SqueezeBertForQuestionAnswering,SqueezeBertForSequenceClassification:()=>r.SqueezeBertForSequenceClassification,SqueezeBertModel:()=>r.SqueezeBertModel,SqueezeBertPreTrainedModel:()=>r.SqueezeBertPreTrainedModel,SqueezeBertTokenizer:()=>g.SqueezeBertTokenizer,StableLmForCausalLM:()=>r.StableLmForCausalLM,StableLmModel:()=>r.StableLmModel,StableLmPreTrainedModel:()=>r.StableLmPreTrainedModel,Starcoder2ForCausalLM:()=>r.Starcoder2ForCausalLM,Starcoder2Model:()=>r.Starcoder2Model,Starcoder2PreTrainedModel:()=>r.Starcoder2PreTrainedModel,StoppingCriteria:()=>H.StoppingCriteria,StoppingCriteriaList:()=>H.StoppingCriteriaList,StyleTextToSpeech2Model:()=>r.StyleTextToSpeech2Model,StyleTextToSpeech2PreTrainedModel:()=>r.StyleTextToSpeech2PreTrainedModel,SummarizationPipeline:()=>A.SummarizationPipeline,SuppressTokensAtBeginLogitsProcessor:()=>I.SuppressTokensAtBeginLogitsProcessor,Swin2SRForImageSuperResolution:()=>r.Swin2SRForImageSuperResolution,Swin2SRImageProcessor:()=>L.Swin2SRImageProcessor,Swin2SRModel:()=>r.Swin2SRModel,Swin2SRPreTrainedModel:()=>r.Swin2SRPreTrainedModel,SwinForImageClassification:()=>r.SwinForImageClassification,SwinModel:()=>r.SwinModel,SwinPreTrainedModel:()=>r.SwinPreTrainedModel,T5ForConditionalGeneration:()=>r.T5ForConditionalGeneration,T5Model:()=>r.T5Model,T5PreTrainedModel:()=>r.T5PreTrainedModel,T5Tokenizer:()=>g.T5Tokenizer,TableTransformerForObjectDetection:()=>r.TableTransformerForObjectDetection,TableTransformerModel:()=>r.TableTransformerModel,TableTransformerObjectDetectionOutput:()=>r.TableTransformerObjectDetectionOutput,TableTransformerPreTrainedModel:()=>r.TableTransformerPreTrainedModel,TemperatureLogitsWarper:()=>I.TemperatureLogitsWarper,Tensor:()=>j.Tensor,Text2TextGenerationPipeline:()=>A.Text2TextGenerationPipeline,TextClassificationPipeline:()=>A.TextClassificationPipeline,TextGenerationPipeline:()=>A.TextGenerationPipeline,TextStreamer:()=>U.TextStreamer,TextToAudioPipeline:()=>A.TextToAudioPipeline,TokenClassificationPipeline:()=>A.TokenClassificationPipeline,TokenClassifierOutput:()=>r.TokenClassifierOutput,TokenizerModel:()=>g.TokenizerModel,TopKLogitsWarper:()=>I.TopKLogitsWarper,TopPLogitsWarper:()=>I.TopPLogitsWarper,TrOCRForCausalLM:()=>r.TrOCRForCausalLM,TrOCRPreTrainedModel:()=>r.TrOCRPreTrainedModel,TranslationPipeline:()=>A.TranslationPipeline,UniSpeechForCTC:()=>r.UniSpeechForCTC,UniSpeechForSequenceClassification:()=>r.UniSpeechForSequenceClassification,UniSpeechModel:()=>r.UniSpeechModel,UniSpeechPreTrainedModel:()=>r.UniSpeechPreTrainedModel,UniSpeechSatForAudioFrameClassification:()=>r.UniSpeechSatForAudioFrameClassification,UniSpeechSatForCTC:()=>r.UniSpeechSatForCTC,UniSpeechSatForSequenceClassification:()=>r.UniSpeechSatForSequenceClassification,UniSpeechSatModel:()=>r.UniSpeechSatModel,UniSpeechSatPreTrainedModel:()=>r.UniSpeechSatPreTrainedModel,VLChatProcessor:()=>oe.VLChatProcessor,VLMImageProcessor:()=>L.VLMImageProcessor,ViTFeatureExtractor:()=>L.ViTFeatureExtractor,ViTForImageClassification:()=>r.ViTForImageClassification,ViTImageProcessor:()=>L.ViTImageProcessor,ViTMAEModel:()=>r.ViTMAEModel,ViTMAEPreTrainedModel:()=>r.ViTMAEPreTrainedModel,ViTMSNForImageClassification:()=>r.ViTMSNForImageClassification,ViTMSNModel:()=>r.ViTMSNModel,ViTMSNPreTrainedModel:()=>r.ViTMSNPreTrainedModel,ViTModel:()=>r.ViTModel,ViTPreTrainedModel:()=>r.ViTPreTrainedModel,VisionEncoderDecoderModel:()=>r.VisionEncoderDecoderModel,VitMatteForImageMatting:()=>r.VitMatteForImageMatting,VitMatteImageProcessor:()=>L.VitMatteImageProcessor,VitMattePreTrainedModel:()=>r.VitMattePreTrainedModel,VitPoseForPoseEstimation:()=>r.VitPoseForPoseEstimation,VitPoseImageProcessor:()=>L.VitPoseImageProcessor,VitPosePreTrainedModel:()=>r.VitPosePreTrainedModel,VitsModel:()=>r.VitsModel,VitsModelOutput:()=>r.VitsModelOutput,VitsPreTrainedModel:()=>r.VitsPreTrainedModel,VitsTokenizer:()=>g.VitsTokenizer,Wav2Vec2BertForCTC:()=>r.Wav2Vec2BertForCTC,Wav2Vec2BertForSequenceClassification:()=>r.Wav2Vec2BertForSequenceClassification,Wav2Vec2BertModel:()=>r.Wav2Vec2BertModel,Wav2Vec2BertPreTrainedModel:()=>r.Wav2Vec2BertPreTrainedModel,Wav2Vec2CTCTokenizer:()=>g.Wav2Vec2CTCTokenizer,Wav2Vec2FeatureExtractor:()=>b.Wav2Vec2FeatureExtractor,Wav2Vec2ForAudioFrameClassification:()=>r.Wav2Vec2ForAudioFrameClassification,Wav2Vec2ForCTC:()=>r.Wav2Vec2ForCTC,Wav2Vec2ForSequenceClassification:()=>r.Wav2Vec2ForSequenceClassification,Wav2Vec2Model:()=>r.Wav2Vec2Model,Wav2Vec2PreTrainedModel:()=>r.Wav2Vec2PreTrainedModel,Wav2Vec2ProcessorWithLM:()=>oe.Wav2Vec2ProcessorWithLM,WavLMForAudioFrameClassification:()=>r.WavLMForAudioFrameClassification,WavLMForCTC:()=>r.WavLMForCTC,WavLMForSequenceClassification:()=>r.WavLMForSequenceClassification,WavLMForXVector:()=>r.WavLMForXVector,WavLMModel:()=>r.WavLMModel,WavLMPreTrainedModel:()=>r.WavLMPreTrainedModel,WeSpeakerFeatureExtractor:()=>b.WeSpeakerFeatureExtractor,WeSpeakerResNetModel:()=>r.WeSpeakerResNetModel,WeSpeakerResNetPreTrainedModel:()=>r.WeSpeakerResNetPreTrainedModel,WhisperFeatureExtractor:()=>b.WhisperFeatureExtractor,WhisperForConditionalGeneration:()=>r.WhisperForConditionalGeneration,WhisperModel:()=>r.WhisperModel,WhisperPreTrainedModel:()=>r.WhisperPreTrainedModel,WhisperProcessor:()=>oe.WhisperProcessor,WhisperTextStreamer:()=>U.WhisperTextStreamer,WhisperTimeStampLogitsProcessor:()=>I.WhisperTimeStampLogitsProcessor,WhisperTokenizer:()=>g.WhisperTokenizer,XLMForQuestionAnswering:()=>r.XLMForQuestionAnswering,XLMForSequenceClassification:()=>r.XLMForSequenceClassification,XLMForTokenClassification:()=>r.XLMForTokenClassification,XLMModel:()=>r.XLMModel,XLMPreTrainedModel:()=>r.XLMPreTrainedModel,XLMRobertaForMaskedLM:()=>r.XLMRobertaForMaskedLM,XLMRobertaForQuestionAnswering:()=>r.XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification:()=>r.XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification:()=>r.XLMRobertaForTokenClassification,XLMRobertaModel:()=>r.XLMRobertaModel,XLMRobertaPreTrainedModel:()=>r.XLMRobertaPreTrainedModel,XLMRobertaTokenizer:()=>g.XLMRobertaTokenizer,XLMTokenizer:()=>g.XLMTokenizer,XLMWithLMHeadModel:()=>r.XLMWithLMHeadModel,XVectorOutput:()=>r.XVectorOutput,YolosFeatureExtractor:()=>L.YolosFeatureExtractor,YolosForObjectDetection:()=>r.YolosForObjectDetection,YolosImageProcessor:()=>L.YolosImageProcessor,YolosModel:()=>r.YolosModel,YolosObjectDetectionOutput:()=>r.YolosObjectDetectionOutput,YolosPreTrainedModel:()=>r.YolosPreTrainedModel,ZeroShotAudioClassificationPipeline:()=>A.ZeroShotAudioClassificationPipeline,ZeroShotClassificationPipeline:()=>A.ZeroShotClassificationPipeline,ZeroShotImageClassificationPipeline:()=>A.ZeroShotImageClassificationPipeline,ZeroShotObjectDetectionPipeline:()=>A.ZeroShotObjectDetectionPipeline,bankers_round:()=>y.bankers_round,cat:()=>j.cat,cos_sim:()=>y.cos_sim,dot:()=>y.dot,dynamic_time_warping:()=>y.dynamic_time_warping,env:()=>ke.env,full:()=>j.full,full_like:()=>j.full_like,getKeyValueShapes:()=>$.getKeyValueShapes,hamming:()=>N.hamming,hanning:()=>N.hanning,interpolate:()=>j.interpolate,interpolate_4d:()=>j.interpolate_4d,interpolate_data:()=>y.interpolate_data,is_chinese_char:()=>g.is_chinese_char,layer_norm:()=>j.layer_norm,load_image:()=>Z.load_image,log_softmax:()=>y.log_softmax,magnitude:()=>y.magnitude,matmul:()=>j.matmul,max:()=>y.max,mean:()=>j.mean,mean_pooling:()=>j.mean_pooling,medianFilter:()=>y.medianFilter,mel_filter_bank:()=>N.mel_filter_bank,min:()=>y.min,ones:()=>j.ones,ones_like:()=>j.ones_like,permute:()=>j.permute,permute_data:()=>y.permute_data,pipeline:()=>A.pipeline,quantize_embeddings:()=>j.quantize_embeddings,rand:()=>j.rand,read_audio:()=>N.read_audio,rfft:()=>j.rfft,round:()=>y.round,slice:()=>j.slice,softmax:()=>y.softmax,spectrogram:()=>N.spectrogram,stack:()=>j.stack,std_mean:()=>j.std_mean,topk:()=>j.topk,window_function:()=>N.window_function,zeros:()=>j.zeros,zeros_like:()=>j.zeros_like});var ke=cs("./src/env.js"),A=cs("./src/pipelines.js"),r=cs("./src/models.js"),g=cs("./src/tokenizers.js"),$=cs("./src/configs.js"),N=cs("./src/utils/audio.js"),Z=cs("./src/utils/image.js"),j=cs("./src/utils/tensor.js"),y=cs("./src/utils/maths.js"),T=cs("./src/base/feature_extraction_utils.js"),b=cs("./src/models/feature_extractors.js"),x=cs("./src/models/auto/feature_extraction_auto.js"),v=cs("./src/base/image_processors_utils.js"),L=cs("./src/models/image_processors.js"),K=cs("./src/models/auto/image_processing_auto.js"),se=cs("./src/base/processing_utils.js"),oe=cs("./src/models/processors.js"),V=cs("./src/models/auto/processing_auto.js"),U=cs("./src/generation/streamers.js"),H=cs("./src/generation/stopping_criteria.js"),I=cs("./src/generation/logits_process.js")})();d.ASTFeatureExtractor;d.ASTForAudioClassification;d.ASTModel;d.ASTPreTrainedModel;d.AlbertForMaskedLM;d.AlbertForQuestionAnswering;d.AlbertForSequenceClassification;d.AlbertModel;d.AlbertPreTrainedModel;d.AlbertTokenizer;d.AudioClassificationPipeline;d.AutoConfig;d.AutoFeatureExtractor;d.AutoImageProcessor;var lf=d.AutoModel;d.AutoModelForAudioClassification;d.AutoModelForAudioFrameClassification;d.AutoModelForCTC;d.AutoModelForCausalLM;d.AutoModelForDepthEstimation;d.AutoModelForDocumentQuestionAnswering;d.AutoModelForImageClassification;d.AutoModelForImageFeatureExtraction;d.AutoModelForImageMatting;d.AutoModelForImageSegmentation;d.AutoModelForImageToImage;d.AutoModelForMaskGeneration;d.AutoModelForMaskedLM;d.AutoModelForNormalEstimation;d.AutoModelForObjectDetection;d.AutoModelForPoseEstimation;d.AutoModelForQuestionAnswering;d.AutoModelForSemanticSegmentation;d.AutoModelForSeq2SeqLM;d.AutoModelForSequenceClassification;d.AutoModelForSpeechSeq2Seq;d.AutoModelForTextToSpectrogram;d.AutoModelForTextToWaveform;d.AutoModelForTokenClassification;d.AutoModelForUniversalSegmentation;d.AutoModelForVision2Seq;d.AutoModelForXVector;d.AutoModelForZeroShotObjectDetection;var U_=d.AutoProcessor,W_=d.AutoTokenizer;d.AutomaticSpeechRecognitionPipeline;d.BartForConditionalGeneration;d.BartForSequenceClassification;d.BartModel;d.BartPretrainedModel;d.BartTokenizer;d.BaseModelOutput;d.BaseStreamer;d.BeitFeatureExtractor;d.BeitForImageClassification;d.BeitModel;d.BeitPreTrainedModel;d.BertForMaskedLM;d.BertForQuestionAnswering;d.BertForSequenceClassification;d.BertForTokenClassification;d.BertModel;d.BertPreTrainedModel;d.BertTokenizer;d.BitImageProcessor;d.BlenderbotForConditionalGeneration;d.BlenderbotModel;d.BlenderbotPreTrainedModel;d.BlenderbotSmallForConditionalGeneration;d.BlenderbotSmallModel;d.BlenderbotSmallPreTrainedModel;d.BlenderbotSmallTokenizer;d.BlenderbotTokenizer;d.BloomForCausalLM;d.BloomModel;d.BloomPreTrainedModel;d.BloomTokenizer;d.CLIPFeatureExtractor;d.CLIPImageProcessor;d.CLIPModel;d.CLIPPreTrainedModel;d.CLIPSegForImageSegmentation;d.CLIPSegModel;d.CLIPSegPreTrainedModel;d.CLIPTextModel;d.CLIPTextModelWithProjection;d.CLIPTokenizer;d.CLIPVisionModel;d.CLIPVisionModelWithProjection;d.CamembertForMaskedLM;d.CamembertForQuestionAnswering;d.CamembertForSequenceClassification;d.CamembertForTokenClassification;d.CamembertModel;d.CamembertPreTrainedModel;d.CamembertTokenizer;d.CausalLMOutput;d.CausalLMOutputWithPast;d.ChineseCLIPFeatureExtractor;d.ChineseCLIPModel;d.ChineseCLIPPreTrainedModel;d.ClapAudioModelWithProjection;d.ClapFeatureExtractor;d.ClapModel;d.ClapPreTrainedModel;d.ClapTextModelWithProjection;d.ClassifierFreeGuidanceLogitsProcessor;d.CodeGenForCausalLM;d.CodeGenModel;d.CodeGenPreTrainedModel;d.CodeGenTokenizer;d.CodeLlamaTokenizer;d.CohereForCausalLM;d.CohereModel;d.CoherePreTrainedModel;d.CohereTokenizer;d.ConvBertForMaskedLM;d.ConvBertForQuestionAnswering;d.ConvBertForSequenceClassification;d.ConvBertForTokenClassification;d.ConvBertModel;d.ConvBertPreTrainedModel;d.ConvBertTokenizer;d.ConvNextFeatureExtractor;d.ConvNextForImageClassification;d.ConvNextImageProcessor;d.ConvNextModel;d.ConvNextPreTrainedModel;d.ConvNextV2ForImageClassification;d.ConvNextV2Model;d.ConvNextV2PreTrainedModel;d.DPTFeatureExtractor;d.DPTForDepthEstimation;d.DPTImageProcessor;d.DPTModel;d.DPTPreTrainedModel;d.DebertaForMaskedLM;d.DebertaForQuestionAnswering;d.DebertaForSequenceClassification;d.DebertaForTokenClassification;d.DebertaModel;d.DebertaPreTrainedModel;d.DebertaTokenizer;d.DebertaV2ForMaskedLM;d.DebertaV2ForQuestionAnswering;d.DebertaV2ForSequenceClassification;d.DebertaV2ForTokenClassification;d.DebertaV2Model;d.DebertaV2PreTrainedModel;d.DebertaV2Tokenizer;d.DecisionTransformerModel;d.DecisionTransformerPreTrainedModel;d.DeiTFeatureExtractor;d.DeiTForImageClassification;d.DeiTImageProcessor;d.DeiTModel;d.DeiTPreTrainedModel;d.DepthAnythingForDepthEstimation;d.DepthAnythingPreTrainedModel;d.DepthEstimationPipeline;d.DepthProForDepthEstimation;d.DepthProPreTrainedModel;d.DetrFeatureExtractor;d.DetrForObjectDetection;d.DetrForSegmentation;d.DetrImageProcessor;d.DetrModel;d.DetrObjectDetectionOutput;d.DetrPreTrainedModel;d.DetrSegmentationOutput;d.Dinov2ForImageClassification;d.Dinov2Model;d.Dinov2PreTrainedModel;d.Dinov2WithRegistersForImageClassification;d.Dinov2WithRegistersModel;d.Dinov2WithRegistersPreTrainedModel;d.DistilBertForMaskedLM;d.DistilBertForQuestionAnswering;d.DistilBertForSequenceClassification;d.DistilBertForTokenClassification;d.DistilBertModel;d.DistilBertPreTrainedModel;d.DistilBertTokenizer;d.DocumentQuestionAnsweringPipeline;d.DonutFeatureExtractor;d.DonutImageProcessor;d.DonutSwinModel;d.DonutSwinPreTrainedModel;d.EfficientNetForImageClassification;d.EfficientNetImageProcessor;d.EfficientNetModel;d.EfficientNetPreTrainedModel;d.ElectraForMaskedLM;d.ElectraForQuestionAnswering;d.ElectraForSequenceClassification;d.ElectraForTokenClassification;d.ElectraModel;d.ElectraPreTrainedModel;d.ElectraTokenizer;d.EosTokenCriteria;d.EsmForMaskedLM;d.EsmForSequenceClassification;d.EsmForTokenClassification;d.EsmModel;d.EsmPreTrainedModel;d.EsmTokenizer;d.ExaoneForCausalLM;d.ExaoneModel;d.ExaonePreTrainedModel;d.FFT;d.FalconForCausalLM;d.FalconModel;d.FalconPreTrainedModel;d.FalconTokenizer;d.FastViTForImageClassification;d.FastViTModel;d.FastViTPreTrainedModel;d.FeatureExtractionPipeline;d.FeatureExtractor;d.FillMaskPipeline;d.Florence2ForConditionalGeneration;d.Florence2PreTrainedModel;d.Florence2Processor;d.ForcedBOSTokenLogitsProcessor;d.ForcedEOSTokenLogitsProcessor;d.GLPNFeatureExtractor;d.GLPNForDepthEstimation;d.GLPNModel;d.GLPNPreTrainedModel;d.GPT2LMHeadModel;d.GPT2Model;d.GPT2PreTrainedModel;d.GPT2Tokenizer;d.GPTBigCodeForCausalLM;d.GPTBigCodeModel;d.GPTBigCodePreTrainedModel;d.GPTJForCausalLM;d.GPTJModel;d.GPTJPreTrainedModel;d.GPTNeoForCausalLM;d.GPTNeoModel;d.GPTNeoPreTrainedModel;d.GPTNeoXForCausalLM;d.GPTNeoXModel;d.GPTNeoXPreTrainedModel;d.GPTNeoXTokenizer;d.Gemma2ForCausalLM;d.Gemma2Model;d.Gemma2PreTrainedModel;d.GemmaForCausalLM;d.GemmaModel;d.GemmaPreTrainedModel;d.GemmaTokenizer;d.GraniteForCausalLM;d.GraniteModel;d.GranitePreTrainedModel;d.Grok1Tokenizer;d.GroundingDinoForObjectDetection;d.GroundingDinoImageProcessor;d.GroundingDinoPreTrainedModel;d.GroundingDinoProcessor;d.GroupViTModel;d.GroupViTPreTrainedModel;d.HerbertTokenizer;d.HieraForImageClassification;d.HieraModel;d.HieraPreTrainedModel;d.HubertForCTC;d.HubertForSequenceClassification;d.HubertModel;d.HubertPreTrainedModel;d.IJepaForImageClassification;d.IJepaModel;d.IJepaPreTrainedModel;d.Idefics3ForConditionalGeneration;d.Idefics3ImageProcessor;d.Idefics3PreTrainedModel;d.Idefics3Processor;d.ImageClassificationPipeline;d.ImageFeatureExtractionPipeline;d.ImageFeatureExtractor;d.ImageMattingOutput;d.ImageProcessor;d.ImageSegmentationPipeline;d.ImageToImagePipeline;d.ImageToTextPipeline;d.InterruptableStoppingCriteria;d.JAISLMHeadModel;d.JAISModel;d.JAISPreTrainedModel;d.JinaCLIPImageProcessor;d.JinaCLIPModel;d.JinaCLIPPreTrainedModel;d.JinaCLIPProcessor;d.JinaCLIPTextModel;d.JinaCLIPVisionModel;d.LlamaForCausalLM;d.LlamaModel;d.LlamaPreTrainedModel;d.LlamaTokenizer;d.LlavaForConditionalGeneration;d.LlavaOnevisionForConditionalGeneration;d.LlavaOnevisionImageProcessor;d.LlavaPreTrainedModel;d.LogitsProcessor;d.LogitsProcessorList;d.LogitsWarper;d.LongT5ForConditionalGeneration;d.LongT5Model;d.LongT5PreTrainedModel;d.M2M100ForConditionalGeneration;d.M2M100Model;d.M2M100PreTrainedModel;d.M2M100Tokenizer;d.MBart50Tokenizer;d.MBartForCausalLM;d.MBartForConditionalGeneration;d.MBartForSequenceClassification;d.MBartModel;d.MBartPreTrainedModel;d.MBartTokenizer;d.MPNetForMaskedLM;d.MPNetForQuestionAnswering;d.MPNetForSequenceClassification;d.MPNetForTokenClassification;d.MPNetModel;d.MPNetPreTrainedModel;d.MPNetTokenizer;d.MT5ForConditionalGeneration;d.MT5Model;d.MT5PreTrainedModel;d.MarianMTModel;d.MarianModel;d.MarianPreTrainedModel;d.MarianTokenizer;d.Mask2FormerImageProcessor;d.MaskFormerFeatureExtractor;d.MaskFormerForInstanceSegmentation;d.MaskFormerImageProcessor;d.MaskFormerModel;d.MaskFormerPreTrainedModel;d.MaskedLMOutput;d.MaxLengthCriteria;d.MgpstrForSceneTextRecognition;d.MgpstrModelOutput;d.MgpstrPreTrainedModel;d.MgpstrProcessor;d.MgpstrTokenizer;d.MinLengthLogitsProcessor;d.MinNewTokensLengthLogitsProcessor;d.MistralForCausalLM;d.MistralModel;d.MistralPreTrainedModel;d.MobileBertForMaskedLM;d.MobileBertForQuestionAnswering;d.MobileBertForSequenceClassification;d.MobileBertModel;d.MobileBertPreTrainedModel;d.MobileBertTokenizer;d.MobileLLMForCausalLM;d.MobileLLMModel;d.MobileLLMPreTrainedModel;d.MobileNetV1FeatureExtractor;d.MobileNetV1ForImageClassification;d.MobileNetV1ImageProcessor;d.MobileNetV1Model;d.MobileNetV1PreTrainedModel;d.MobileNetV2FeatureExtractor;d.MobileNetV2ForImageClassification;d.MobileNetV2ImageProcessor;d.MobileNetV2Model;d.MobileNetV2PreTrainedModel;d.MobileNetV3FeatureExtractor;d.MobileNetV3ForImageClassification;d.MobileNetV3ImageProcessor;d.MobileNetV3Model;d.MobileNetV3PreTrainedModel;d.MobileNetV4FeatureExtractor;d.MobileNetV4ForImageClassification;d.MobileNetV4ImageProcessor;d.MobileNetV4Model;d.MobileNetV4PreTrainedModel;d.MobileViTFeatureExtractor;d.MobileViTForImageClassification;d.MobileViTImageProcessor;d.MobileViTModel;d.MobileViTPreTrainedModel;d.MobileViTV2ForImageClassification;d.MobileViTV2Model;d.MobileViTV2PreTrainedModel;d.ModelOutput;d.ModernBertForMaskedLM;d.ModernBertForSequenceClassification;d.ModernBertForTokenClassification;d.ModernBertModel;d.ModernBertPreTrainedModel;d.Moondream1ForConditionalGeneration;d.MoonshineFeatureExtractor;d.MoonshineForConditionalGeneration;d.MoonshineModel;d.MoonshinePreTrainedModel;d.MoonshineProcessor;d.MptForCausalLM;d.MptModel;d.MptPreTrainedModel;d.MultiModalityCausalLM;d.MultiModalityPreTrainedModel;d.MusicgenForCausalLM;d.MusicgenForConditionalGeneration;d.MusicgenModel;d.MusicgenPreTrainedModel;d.NllbTokenizer;d.NoBadWordsLogitsProcessor;d.NoRepeatNGramLogitsProcessor;d.NomicBertModel;d.NomicBertPreTrainedModel;d.NougatImageProcessor;d.NougatTokenizer;d.OPTForCausalLM;d.OPTModel;d.OPTPreTrainedModel;d.ObjectDetectionPipeline;d.Olmo2ForCausalLM;d.Olmo2Model;d.Olmo2PreTrainedModel;d.OlmoForCausalLM;d.OlmoModel;d.OlmoPreTrainedModel;d.OpenELMForCausalLM;d.OpenELMModel;d.OpenELMPreTrainedModel;d.OwlViTFeatureExtractor;d.OwlViTForObjectDetection;d.OwlViTImageProcessor;d.OwlViTModel;d.OwlViTPreTrainedModel;d.OwlViTProcessor;d.Owlv2ForObjectDetection;d.Owlv2ImageProcessor;d.Owlv2Model;d.Owlv2PreTrainedModel;d.PaliGemmaForConditionalGeneration;d.PaliGemmaPreTrainedModel;d.PaliGemmaProcessor;d.PatchTSMixerForPrediction;d.PatchTSMixerModel;d.PatchTSMixerPreTrainedModel;d.PatchTSTForPrediction;d.PatchTSTModel;d.PatchTSTPreTrainedModel;d.Phi3ForCausalLM;d.Phi3Model;d.Phi3PreTrainedModel;d.Phi3VForCausalLM;d.Phi3VImageProcessor;d.Phi3VPreTrainedModel;d.Phi3VProcessor;d.PhiForCausalLM;d.PhiModel;d.PhiPreTrainedModel;d.Pipeline;d.PreTrainedModel;d.PreTrainedTokenizer;d.PretrainedConfig;d.PretrainedMixin;d.Processor;d.PvtForImageClassification;d.PvtImageProcessor;d.PvtModel;d.PvtPreTrainedModel;d.PyAnnoteFeatureExtractor;d.PyAnnoteForAudioFrameClassification;d.PyAnnoteModel;d.PyAnnotePreTrainedModel;d.PyAnnoteProcessor;d.QuestionAnsweringModelOutput;d.QuestionAnsweringPipeline;d.Qwen2ForCausalLM;d.Qwen2Model;d.Qwen2PreTrainedModel;d.Qwen2Tokenizer;d.Qwen2VLForConditionalGeneration;d.Qwen2VLImageProcessor;d.Qwen2VLPreTrainedModel;d.Qwen2VLProcessor;d.RTDetrForObjectDetection;d.RTDetrImageProcessor;d.RTDetrModel;d.RTDetrObjectDetectionOutput;d.RTDetrPreTrainedModel;d.RawAudio;var G_=d.RawImage;d.RepetitionPenaltyLogitsProcessor;d.ResNetForImageClassification;d.ResNetModel;d.ResNetPreTrainedModel;d.RoFormerForMaskedLM;d.RoFormerForQuestionAnswering;d.RoFormerForSequenceClassification;d.RoFormerForTokenClassification;d.RoFormerModel;d.RoFormerPreTrainedModel;d.RoFormerTokenizer;d.RobertaForMaskedLM;d.RobertaForQuestionAnswering;d.RobertaForSequenceClassification;d.RobertaForTokenClassification;d.RobertaModel;d.RobertaPreTrainedModel;d.RobertaTokenizer;d.SamImageProcessor;d.SamImageSegmentationOutput;d.SamModel;d.SamPreTrainedModel;d.SamProcessor;d.SapiensForDepthEstimation;d.SapiensForNormalEstimation;d.SapiensForSemanticSegmentation;d.SapiensPreTrainedModel;d.SeamlessM4TFeatureExtractor;d.SegformerFeatureExtractor;d.SegformerForImageClassification;d.SegformerForSemanticSegmentation;d.SegformerImageProcessor;d.SegformerModel;d.SegformerPreTrainedModel;d.Seq2SeqLMOutput;d.SequenceClassifierOutput;d.SiglipImageProcessor;d.SiglipModel;d.SiglipPreTrainedModel;d.SiglipTextModel;d.SiglipTokenizer;d.SiglipVisionModel;d.SpeechT5FeatureExtractor;d.SpeechT5ForSpeechToText;d.SpeechT5ForTextToSpeech;d.SpeechT5HifiGan;d.SpeechT5Model;d.SpeechT5PreTrainedModel;d.SpeechT5Processor;d.SpeechT5Tokenizer;d.SqueezeBertForMaskedLM;d.SqueezeBertForQuestionAnswering;d.SqueezeBertForSequenceClassification;d.SqueezeBertModel;d.SqueezeBertPreTrainedModel;d.SqueezeBertTokenizer;d.StableLmForCausalLM;d.StableLmModel;d.StableLmPreTrainedModel;d.Starcoder2ForCausalLM;d.Starcoder2Model;d.Starcoder2PreTrainedModel;d.StoppingCriteria;d.StoppingCriteriaList;d.StyleTextToSpeech2Model;d.StyleTextToSpeech2PreTrainedModel;d.SummarizationPipeline;d.SuppressTokensAtBeginLogitsProcessor;d.Swin2SRForImageSuperResolution;d.Swin2SRImageProcessor;d.Swin2SRModel;d.Swin2SRPreTrainedModel;d.SwinForImageClassification;d.SwinModel;d.SwinPreTrainedModel;d.T5ForConditionalGeneration;d.T5Model;d.T5PreTrainedModel;d.T5Tokenizer;d.TableTransformerForObjectDetection;d.TableTransformerModel;d.TableTransformerObjectDetectionOutput;d.TableTransformerPreTrainedModel;d.TemperatureLogitsWarper;d.Tensor;d.Text2TextGenerationPipeline;d.TextClassificationPipeline;d.TextGenerationPipeline;d.TextStreamer;d.TextToAudioPipeline;d.TokenClassificationPipeline;d.TokenClassifierOutput;d.TokenizerModel;d.TopKLogitsWarper;d.TopPLogitsWarper;d.TrOCRForCausalLM;d.TrOCRPreTrainedModel;d.TranslationPipeline;d.UniSpeechForCTC;d.UniSpeechForSequenceClassification;d.UniSpeechModel;d.UniSpeechPreTrainedModel;d.UniSpeechSatForAudioFrameClassification;d.UniSpeechSatForCTC;d.UniSpeechSatForSequenceClassification;d.UniSpeechSatModel;d.UniSpeechSatPreTrainedModel;d.VLChatProcessor;d.VLMImageProcessor;d.ViTFeatureExtractor;d.ViTForImageClassification;d.ViTImageProcessor;d.ViTMAEModel;d.ViTMAEPreTrainedModel;d.ViTMSNForImageClassification;d.ViTMSNModel;d.ViTMSNPreTrainedModel;d.ViTModel;d.ViTPreTrainedModel;d.VisionEncoderDecoderModel;d.VitMatteForImageMatting;d.VitMatteImageProcessor;d.VitMattePreTrainedModel;d.VitPoseForPoseEstimation;d.VitPoseImageProcessor;d.VitPosePreTrainedModel;d.VitsModel;d.VitsModelOutput;d.VitsPreTrainedModel;d.VitsTokenizer;d.Wav2Vec2BertForCTC;d.Wav2Vec2BertForSequenceClassification;d.Wav2Vec2BertModel;d.Wav2Vec2BertPreTrainedModel;d.Wav2Vec2CTCTokenizer;d.Wav2Vec2FeatureExtractor;d.Wav2Vec2ForAudioFrameClassification;d.Wav2Vec2ForCTC;d.Wav2Vec2ForSequenceClassification;d.Wav2Vec2Model;d.Wav2Vec2PreTrainedModel;d.Wav2Vec2ProcessorWithLM;d.WavLMForAudioFrameClassification;d.WavLMForCTC;d.WavLMForSequenceClassification;d.WavLMForXVector;d.WavLMModel;d.WavLMPreTrainedModel;d.WeSpeakerFeatureExtractor;d.WeSpeakerResNetModel;d.WeSpeakerResNetPreTrainedModel;d.WhisperFeatureExtractor;d.WhisperForConditionalGeneration;d.WhisperModel;d.WhisperPreTrainedModel;d.WhisperProcessor;d.WhisperTextStreamer;d.WhisperTimeStampLogitsProcessor;d.WhisperTokenizer;d.XLMForQuestionAnswering;d.XLMForSequenceClassification;d.XLMForTokenClassification;d.XLMModel;d.XLMPreTrainedModel;d.XLMRobertaForMaskedLM;d.XLMRobertaForQuestionAnswering;d.XLMRobertaForSequenceClassification;d.XLMRobertaForTokenClassification;d.XLMRobertaModel;d.XLMRobertaPreTrainedModel;d.XLMRobertaTokenizer;d.XLMTokenizer;d.XLMWithLMHeadModel;d.XVectorOutput;d.YolosFeatureExtractor;d.YolosForObjectDetection;d.YolosImageProcessor;d.YolosModel;d.YolosObjectDetectionOutput;d.YolosPreTrainedModel;d.ZeroShotAudioClassificationPipeline;d.ZeroShotClassificationPipeline;d.ZeroShotImageClassificationPipeline;d.ZeroShotObjectDetectionPipeline;d.bankers_round;d.cat;d.cos_sim;var K_=d.dot;d.dynamic_time_warping;d.env;d.full;d.full_like;d.getKeyValueShapes;d.hamming;d.hanning;d.interpolate;d.interpolate_4d;d.interpolate_data;d.is_chinese_char;var H_=d.layer_norm;d.load_image;d.log_softmax;d.magnitude;d.matmul;d.max;d.mean;var q_=d.mean_pooling;d.medianFilter;d.mel_filter_bank;d.min;d.ones;d.ones_like;d.permute;d.permute_data;d.pipeline;d.quantize_embeddings;d.rand;d.read_audio;d.rfft;d.round;d.slice;var Q_=d.softmax;d.spectrogram;d.stack;d.std_mean;d.topk;d.window_function;d.zeros;d.zeros_like;const zp=document.getElementById("status"),uf=document.getElementById("container"),lc=document.getElementById("video"),Ph=document.getElementById("labels"),Lp=document.getElementById("template"),Fp=document.getElementById("overlay");zp.textContent="Loading model (300MB)...";async function X_(){try{return(await navigator.gpu.requestAdapter()).features.has("shader-f16")}catch{return!1}}await X_();let ff,_f,gf,wf;try{const ke="nomic-ai/nomic-embed-text-v1.5";ff=await W_.from_pretrained(ke),_f=await lf.from_pretrained(ke,{device:"webgpu",dtype:"q4"});const A="nomic-ai/nomic-embed-vision-v1.5";gf=await U_.from_pretrained(A),wf=await lf.from_pretrained(A,{device:"webgpu",dtype:"fp32"})}catch(ke){throw zp.textContent=ke.message,alert(ke.message),ke}Ph.disabled=!1;Lp.disabled=!1;zp.textContent="Ready";const Y_=Math.exp(4.6052),Ai=224,Eh=document.createElement("canvas");Eh.width=Eh.height=Ai;const df=Eh.getContext("2d",{willReadFrequently:!0});let vh=!1,xh,En,Th,cf,Op;function yf(){vh||(vh=!0,async function(){if(Th!==Ph.value||cf!==Lp.value)if(En=null,Th=Ph.value,cf=Lp.value,Op=Th.split(/\s*,\s*/).filter(ke=>ke),Op.length>0){const ke=Op.map(g=>Lp.value.replaceAll("{}",g)),A=ff(ke,{padding:!0,truncation:!0}),{last_hidden_state:r}=await _f(A);En=q_(r,A.attention_mask),En=H_(En,[En.dims[1]]),En=En.normalize(2,-1).tolist()}else Fp.innerHTML="";if(En){df.drawImage(lc,0,0,Ai,Ai);const ke=df.getImageData(0,0,Ai,Ai).data,A=new G_(ke,Ai,Ai,4),r=await gf(A),{last_hidden_state:g}=await wf(r),$=g.mean(1).normalize(2,-1).tolist()[0],N=En.map(j=>K_(j,$)*Y_),Z=Q_(N).map((j,y)=>[j,y]).sort((j,y)=>y[0]-j[0]);Fp.innerHTML="";for(const[j,y]of Z)Fp.appendChild(document.createTextNode(`${Op[y]}: ${j.toFixed(2)}`)),Fp.appendChild(document.createElement("br"))}if(xh!==void 0){const ke=1e3/(performance.now()-xh);zp.textContent=`FPS: ${ke.toFixed(2)}`}xh=performance.now(),vh=!1}()),window.requestAnimationFrame(yf)}navigator.mediaDevices.getUserMedia({video:!0}).then(ke=>{lc.srcObject=ke,lc.play();const A=ke.getVideoTracks()[0],{width:r,height:g}=A.getSettings();lc.width=r,lc.height=g;const $=r/g,[N,Z]=$>720/405?[720,720/$]:[405*$,405];uf.style.width=`${N}px`,uf.style.height=`${Z}px`,window.requestAnimationFrame(yf)}).catch(ke=>{alert(ke)}); diff --git a/assets/index-DrEDm3et.js b/assets/index-DrEDm3et.js deleted file mode 100644 index 1a8e4bb04cf40807f51debf86a63ea39a26ea53d..0000000000000000000000000000000000000000 --- a/assets/index-DrEDm3et.js +++ /dev/null @@ -1,2373 +0,0 @@ -(function(){const e=document.createElement("link").relList;if(e&&e.supports&&e.supports("modulepreload"))return;for(const a of document.querySelectorAll('link[rel="modulepreload"]'))n(a);new MutationObserver(a=>{for(const i of a)if(i.type==="childList")for(const s of i.addedNodes)s.tagName==="LINK"&&s.rel==="modulepreload"&&n(s)}).observe(document,{childList:!0,subtree:!0});function r(a){const i={};return a.integrity&&(i.integrity=a.integrity),a.referrerPolicy&&(i.referrerPolicy=a.referrerPolicy),a.crossOrigin==="use-credentials"?i.credentials="include":a.crossOrigin==="anonymous"?i.credentials="omit":i.credentials="same-origin",i}function n(a){if(a.ep)return;a.ep=!0;const i=r(a);fetch(a.href,i)}})();const Ze={},n_=Object.freeze(Object.defineProperty({__proto__:null,default:Ze},Symbol.toStringTag,{value:"Module"})),a_="3.0.0-alpha.0",Ki=typeof self<"u",i_=Ki&&self.constructor.name==="DedicatedWorkerGlobalScope",kp=Ki&&"caches"in self,s_=typeof navigator<"u"&&"gpu"in navigator,Ep=typeof process<"u",o_=Ep&&process?.release?.name==="node",Pi=!Ip(Ze),Cp=!Ip(Ze),Zr=Object.freeze({IS_BROWSER_ENV:Ki,IS_WEBWORKER_ENV:i_,IS_WEB_CACHE_AVAILABLE:kp,IS_WEBGPU_AVAILABLE:s_,IS_PROCESS_AVAILABLE:Ep,IS_NODE_ENV:o_,IS_FS_AVAILABLE:Pi,IS_PATH_AVAILABLE:Cp}),Oo=Pi&&Cp,Tp=Oo?Ze.dirname(Ze.dirname(Ze.fileURLToPath(import.meta.url))):"./",u_=Oo?Ze.join(Tp,"/.cache/"):null,Hu="/models/",l_=Oo?Ze.join(Tp,Hu):Hu,Ct={version:a_,backends:{onnx:{},tfjs:{}},allowRemoteModels:!0,remoteHost:"https://huggingface.co/",remotePathTemplate:"{model}/resolve/{revision}/",allowLocalModels:!Ki,localModelPath:l_,useFS:Pi,useBrowserCache:kp,useFSCache:Pi,cacheDir:u_,useCustomCache:!1,customCache:null};function Ip(t){return Object.keys(t).length===0}const vt=class{constructor(){let t=function(...e){return t._call(...e)};return Object.setPrototypeOf(t,new.target.prototype)}_call(...t){throw Error("Must implement _call method in subclass")}};function Jn(t,e){t&&t(e)}function d_(t){return Object.fromEntries(Object.entries(t).map(([e,r])=>[r,e]))}function Ap(t){return t.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function c_(t){return Number.isInteger(t)||typeof t=="bigint"}function ju(t){const e=[];let r=t;for(;Array.isArray(r);)e.push(r.length),r=r[0];return e}function ct(...t){return Array.prototype.concat.apply([],t)}function Ri(t,e){return Math.abs((t+e)%(2*e)-e)}function Qr(t,e){return Object.assign({},...e.map(r=>{if(t[r]!==void 0)return{[r]:t[r]}}))}var xs={};class Yi{_CONTENT_TYPE_MAP={txt:"text/plain",html:"text/html",css:"text/css",js:"text/javascript",json:"application/json",png:"image/png",jpg:"image/jpeg",jpeg:"image/jpeg",gif:"image/gif"};constructor(e){if(this.filePath=e,this.headers=new Headers,this.exists=Ze.existsSync(e),this.exists){this.status=200,this.statusText="OK";let r=Ze.statSync(e);this.headers.set("content-length",r.size.toString()),this.updateContentType();let n=this;this.body=new ReadableStream({start(a){n.arrayBuffer().then(i=>{a.enqueue(new Uint8Array(i)),a.close()})}})}else this.status=404,this.statusText="Not Found",this.body=null}updateContentType(){const e=this.filePath.toString().split(".").pop().toLowerCase();this.headers.set("content-type",this._CONTENT_TYPE_MAP[e]??"application/octet-stream")}clone(){let e=new Yi(this.filePath);return e.exists=this.exists,e.status=this.status,e.statusText=this.statusText,e.headers=new Headers(this.headers),e}async arrayBuffer(){return(await Ze.promises.readFile(this.filePath)).buffer}async blob(){const e=await Ze.promises.readFile(this.filePath);return new Blob([e],{type:this.headers.get("content-type")})}async text(){return await Ze.promises.readFile(this.filePath,"utf8")}async json(){return JSON.parse(await this.text())}}function po(t,e=null,r=null){let n;try{n=new URL(t)}catch{return!1}return!(e&&!e.includes(n.protocol)||r&&!r.includes(n.hostname))}async function ho(t){if(Ct.useFS&&!po(t,["http:","https:","blob:"]))return new Yi(t);if(typeof process<"u"&&process?.release?.name==="node"){const e=!!xs?.TESTING_REMOTELY,r=Ct.version,n=new Headers;if(n.set("User-Agent",`transformers.js/${r}; is_ci/${e};`),po(t,["http:","https:"],["huggingface.co","hf.co"])){const i=xs?.HF_TOKEN??xs?.HF_ACCESS_TOKEN;i&&n.set("Authorization",`Bearer ${i}`)}return fetch(t,{headers:n})}else return fetch(t)}const p_={400:"Bad request error occurred while trying to load file",401:"Unauthorized access to file",403:"Forbidden access to file",404:"Could not locate file",408:"Request timeout error occurred while trying to load file",500:"Internal server error error occurred while trying to load file",502:"Bad gateway error occurred while trying to load file",503:"Service unavailable error occurred while trying to load file",504:"Gateway timeout error occurred while trying to load file"};function h_(t,e,r){if(!r)return null;const n=p_[t]??`Error (${t}) occurred while trying to load file`;throw Error(`${n}: "${e}".`)}class qu{constructor(e){this.path=e}async match(e){let r=Ze.join(this.path,e),n=new Yi(r);if(n.exists)return n}async put(e,r){const n=Buffer.from(await r.arrayBuffer());let a=Ze.join(this.path,e);try{await Ze.promises.mkdir(Ze.dirname(a),{recursive:!0}),await Ze.promises.writeFile(a,n)}catch(i){console.warn("An error occurred while writing the file to cache:",i)}}}async function f_(t,...e){for(let r of e)try{let n=await t.match(r);if(n)return n}catch{continue}}async function ki(t,e,r=!0,n={}){if(!Ct.allowLocalModels&&n.local_files_only)throw Error("Invalid configuration detected: local models are disabled (`env.allowLocalModels=false`) but you have requested to only use local models (`local_files_only=true`).");Jn(n.progress_callback,{status:"initiate",name:t,file:e});let a;if(!a&&Ct.useBrowserCache){if(typeof caches>"u")throw Error("Browser cache is not available in this environment.");try{a=await caches.open("transformers-cache")}catch(k){console.warn("An error occurred while opening the browser cache:",k)}}if(!a&&Ct.useFSCache&&(a=new qu(n.cache_dir??Ct.cacheDir)),!a&&Ct.useCustomCache)throw Error("`env.useCustomCache=true`, but `env.customCache` is not defined.");const i=n.revision??"main";let s=li(t,e),o=li(Ct.localModelPath,s),u=li(Ct.remoteHost,Ct.remotePathTemplate.replaceAll("{model}",t).replaceAll("{revision}",encodeURIComponent(i)),e),l=i==="main"?s:li(t,i,e),p,f=a instanceof qu?l:u,m=!1,c;a&&(c=await f_(a,o,f));const y=c!==void 0;if(c===void 0){if(Ct.allowLocalModels)if(po(s,["http:","https:"])){if(n.local_files_only)throw new Error(`\`local_files_only=true\`, but attempted to load a remote file from: ${s}.`)}else try{c=await ho(o),p=o}catch($){console.warn(`Unable to load from local path "${o}": "${$}"`)}if(c===void 0||c.status===404){if(n.local_files_only||!Ct.allowRemoteModels){if(r)throw Error(`\`local_files_only=true\` or \`env.allowRemoteModels=false\` and file was not found locally at "${o}".`);return null}if(c=await ho(u),c.status!==200)return h_(c.status,u,r);p=f}m=a&&typeof Response<"u"&&c instanceof Response&&c.status===200}Jn(n.progress_callback,{status:"download",name:t,file:e});const w={status:"progress",name:t,file:e};let v;return n.progress_callback?y&&typeof navigator<"u"&&/firefox/i.test(navigator.userAgent)?(v=new Uint8Array(await c.arrayBuffer()),Jn(n.progress_callback,{...w,progress:100,loaded:v.length,total:v.length})):v=await m_(c,k=>{Jn(n.progress_callback,{...w,...k})}):v=new Uint8Array(await c.arrayBuffer()),m&&p&&await a.match(p)===void 0&&await a.put(p,new Response(v,{headers:c.headers})).catch(k=>{console.warn(`Unable to add response to browser cache: ${k}.`)}),Jn(n.progress_callback,{status:"done",name:t,file:e}),v}async function Mr(t,e,r=!0,n={}){let a=await ki(t,e,r,n);if(a===null)return{};let s=new TextDecoder("utf-8").decode(a);return JSON.parse(s)}async function m_(t,e){const r=t.headers.get("Content-Length");r===null&&console.warn("Unable to determine content-length from response headers. Will expand buffer when needed.");let n=parseInt(r??"0"),a=new Uint8Array(n),i=0;const s=t.body.getReader();async function o(){const{done:u,value:l}=await s.read();if(u)return;let p=i+l.length;if(p>n){n=p;let m=new Uint8Array(n);m.set(a),a=m}a.set(l,i),i=p;const f=i/n*100;return e({progress:f,loaded:i,total:n}),o()}return await o(),a}function li(...t){return t=t.map((e,r)=>(r&&(e=e.replace(new RegExp("^/"),"")),r!==t.length-1&&(e=e.replace(new RegExp("/$"),"")),e)),t.join("/")}function g_(t,[e,r,n],[a,i],s="bilinear",o=!1){const u=i/n,l=a/r,p=new t.constructor(a*i*e),f=r*n,m=a*i;for(let c=0;c=0;--o)a[o]=u,n[o]=e[r[o]],u*=n[o];const i=r.map((o,u)=>a[r.indexOf(u)]),s=new t.constructor(t.length);for(let o=0;o=0;--l)u+=p%e[l]*i[l],p=Math.floor(p/e[l]);s[u]=t[o]}return[s,n]}function In(t){const e=$r(t)[0],r=t.map(i=>Math.exp(i-e)),n=r.reduce((i,s)=>i+s,0);return r.map(i=>i/n)}function y_(t){return In(t).map(n=>Math.log(n))}function w_(t,e){let r=0;for(let n=0;n[n,r]).sort((r,n)=>n[1]-r[1]),e!==null&&e>0&&(t=t.slice(0,e)),t}function Op(t){if(t.length===0)throw Error("Array must not be empty");let e=t[0],r=0;for(let n=1;ne&&(e=t[n],r=n);return[Number(e),r]}function zp(t){return t>0&&(t&t-1)===0}class Pp{constructor(e){if(this.size=e|0,this.size<=1||!zp(this.size))throw new Error("FFT size must be a power of two larger than 1");this._csize=e<<1,this.table=new Float64Array(this.size*2);for(let n=0;nn;n<<=1)++r;this._width=r%2===0?r-1:r,this._bitrev=new Int32Array(1<>>a&3)<>>1);for(let a=0;a>>1]=e[a];return n}toComplexArray(e,r){const n=r||this.createComplexArray();for(let a=0;a>>1],n[a+1]=0;return n}transform(e,r){if(e===r)throw new Error("Input and output buffers must be different");this._transform4(e,r,1)}realTransform(e,r){if(e===r)throw new Error("Input and output buffers must be different");this._realTransform4(e,r,1)}inverseTransform(e,r){if(e===r)throw new Error("Input and output buffers must be different");this._transform4(e,r,-1);for(let n=0;n>=2;s>=2;s>>=2){o=a/s<<1;const m=o>>>2;for(u=0;u>>1,s>>>1)}else for(u=0,l=0;u>>1,s>>>1,n)}const f=this.table;for(s>>=2;s>=2;s>>=2){o=a/s<<1;const c=o>>>1,y=c>>>1,w=y>>>1;for(u=0;u>>1;for(let c=2;c>1;++p){const f=(p+1-e)**2/2,m=Math.sqrt(u**2+l**2)**f,c=f*Math.atan2(l,u),y=2*p;i[y]=m*Math.cos(c),i[y+1]=m*Math.sin(c),s[y]=i[y],s[y+1]=-i[y+1]}this._slicedChirpBuffer=i.subarray(r,n),this._f=new Pp(a>>1),this._f.transform(this._chirpBuffer,s)}_transform(e,r,n){const a=this._buffer1,i=this._buffer2,s=this._outBuffer1,o=this._outBuffer2,u=this._chirpBuffer,l=this._slicedChirpBuffer,p=this._a;if(n)for(let f=0;f>1,y=r[c];a[f]=y*l[f],a[m]=y*l[m]}else for(let f=0;f=t.length&&(u=2*(t.length-1)-u),n[s++]=t[u]}n.sort(),r[i]=n[a]}return r}function Ss(t,e){const r=Math.pow(10,e);return Math.round(t*r)/r}function x_(t){const e=Math.round(t);return Math.abs(t)%1===.5?e%2===0?e:e-1:e}/*! - * ONNX Runtime Web v1.18.0 - * Copyright (c) Microsoft Corporation. All rights reserved. - * Licensed under the MIT License. - */var zo=Object.defineProperty,S_=Object.getOwnPropertyDescriptor,k_=Object.getOwnPropertyNames,E_=Object.prototype.hasOwnProperty,Z=(t,e)=>()=>(t&&(e=t(t=0)),e),An=(t,e)=>()=>(e||t((e={exports:{}}).exports,e),e.exports),Mn=(t,e)=>{for(var r in e)zo(t,r,{get:e[r],enumerable:!0})},C_=(t,e,r,n)=>{if(e&&typeof e=="object"||typeof e=="function")for(let a of k_(e))!E_.call(t,a)&&a!==r&&zo(t,a,{get:()=>e[a],enumerable:!(n=S_(e,a))||n.enumerable});return t},Jr=t=>C_(zo({},"__esModule",{value:!0}),t),Zn,Cr,Xr,Ku,Po,Ro=Z(()=>{Zn=new Map,Cr=[],Xr=(t,e,r)=>{if(e&&typeof e.init=="function"&&typeof e.createInferenceSessionHandler=="function"){let n=Zn.get(t);if(n===void 0)Zn.set(t,{backend:e,priority:r});else{if(n.priority>r)return;if(n.priority===r&&n.backend!==e)throw new Error(`cannot register backend "${t}" using priority ${r}`)}if(r>=0){let a=Cr.indexOf(t);a!==-1&&Cr.splice(a,1);for(let i=0;i{let e=Zn.get(t);if(!e)return"backend not found.";if(e.initialized)return e.backend;if(e.aborted)return e.error;{let r=!!e.initPromise;try{return r||(e.initPromise=e.backend.init(t)),await e.initPromise,e.initialized=!0,e.backend}catch(n){return r||(e.error=`${n}`,e.aborted=!0),e.error}finally{delete e.initPromise}}},Po=async t=>{let e=t.executionProviders||[],r=e.map(u=>typeof u=="string"?u:u.name),n=r.length===0?Cr:r,a,i=[],s=new Set;for(let u of n){let l=await Ku(u);typeof l=="string"?i.push({name:u,err:l}):(a||(a=l),a===l&&s.add(u))}if(!a)throw new Error(`no available backend found. ERR: ${i.map(u=>`[${u.name}] ${u.err}`).join(", ")}`);for(let{name:u,err:l}of i)r.includes(u)&&console.warn(`removing requested execution provider "${u}" from session options because it is not available: ${l}`);let o=e.filter(u=>s.has(typeof u=="string"?u:u.name));return[a,new Proxy(t,{get:(u,l)=>l==="executionProviders"?o:Reflect.get(u,l)})]}}),T_=Z(()=>{Ro()}),Rp,I_=Z(()=>{Rp="1.18.0"}),ks,Ft,Bp=Z(()=>{I_(),ks="warning",Ft={wasm:{},webgl:{},webgpu:{},versions:{common:Rp},set logLevel(t){if(t!==void 0){if(typeof t!="string"||["verbose","info","warning","error","fatal"].indexOf(t)===-1)throw new Error(`Unsupported logging level: ${t}`);ks=t}},get logLevel(){return ks}},Object.defineProperty(Ft,"logLevel",{enumerable:!0})}),Ue,A_=Z(()=>{Bp(),Ue=Ft}),Dp,Np,M_=Z(()=>{Dp=(t,e)=>{let r=typeof document<"u"?document.createElement("canvas"):new OffscreenCanvas(1,1);r.width=t.dims[3],r.height=t.dims[2];let n=r.getContext("2d");if(n!=null){let a,i;e?.tensorLayout!==void 0&&e.tensorLayout==="NHWC"?(a=t.dims[2],i=t.dims[3]):(a=t.dims[3],i=t.dims[2]);let s=e?.format!==void 0?e.format:"RGB",o=e?.norm,u,l;o===void 0||o.mean===void 0?u=[255,255,255,255]:typeof o.mean=="number"?u=[o.mean,o.mean,o.mean,o.mean]:(u=[o.mean[0],o.mean[1],o.mean[2],0],o.mean[3]!==void 0&&(u[3]=o.mean[3])),o===void 0||o.bias===void 0?l=[0,0,0,0]:typeof o.bias=="number"?l=[o.bias,o.bias,o.bias,o.bias]:(l=[o.bias[0],o.bias[1],o.bias[2],0],o.bias[3]!==void 0&&(l[3]=o.bias[3]));let p=i*a,f=0,m=p,c=p*2,y=-1;s==="RGBA"?(f=0,m=p,c=p*2,y=p*3):s==="RGB"?(f=0,m=p,c=p*2):s==="RBG"&&(f=0,c=p,m=p*2);for(let w=0;w{let r=typeof document<"u"?document.createElement("canvas").getContext("2d"):new OffscreenCanvas(1,1).getContext("2d"),n;if(r!=null){let a,i,s;e?.tensorLayout!==void 0&&e.tensorLayout==="NHWC"?(a=t.dims[2],i=t.dims[1],s=t.dims[3]):(a=t.dims[3],i=t.dims[2],s=t.dims[1]);let o=e!==void 0&&e.format!==void 0?e.format:"RGB",u=e?.norm,l,p;u===void 0||u.mean===void 0?l=[255,255,255,255]:typeof u.mean=="number"?l=[u.mean,u.mean,u.mean,u.mean]:(l=[u.mean[0],u.mean[1],u.mean[2],255],u.mean[3]!==void 0&&(l[3]=u.mean[3])),u===void 0||u.bias===void 0?p=[0,0,0,0]:typeof u.bias=="number"?p=[u.bias,u.bias,u.bias,u.bias]:(p=[u.bias[0],u.bias[1],u.bias[2],0],u.bias[3]!==void 0&&(p[3]=u.bias[3]));let f=i*a;if(e!==void 0&&(e.format!==void 0&&s===4&&e.format!=="RGBA"||s===3&&e.format!=="RGB"&&e.format!=="BGR"))throw new Error("Tensor format doesn't match input tensor dims");let m=4,c=0,y=1,w=2,v=3,k=0,$=f,C=f*2,T=-1;o==="RGBA"?(k=0,$=f,C=f*2,T=f*3):o==="RGB"?(k=0,$=f,C=f*2):o==="RBG"&&(k=0,C=f,$=f*2),n=r.createImageData(a,i);for(let A=0;A{Bo(),di=(t,e)=>{if(t===void 0)throw new Error("Image buffer must be defined");if(e.height===void 0||e.width===void 0)throw new Error("Image height and width must be defined");if(e.tensorLayout==="NHWC")throw new Error("NHWC Tensor layout is not supported yet");let{height:r,width:n}=e,a=e.norm??{mean:255,bias:0},i,s;typeof a.mean=="number"?i=[a.mean,a.mean,a.mean,a.mean]:i=[a.mean[0],a.mean[1],a.mean[2],a.mean[3]??255],typeof a.bias=="number"?s=[a.bias,a.bias,a.bias,a.bias]:s=[a.bias[0],a.bias[1],a.bias[2],a.bias[3]??0];let o=e.format!==void 0?e.format:"RGBA",u=e.tensorFormat!==void 0&&e.tensorFormat!==void 0?e.tensorFormat:"RGB",l=r*n,p=u==="RGBA"?new Float32Array(l*4):new Float32Array(l*3),f=4,m=0,c=1,y=2,w=3,v=0,k=l,$=l*2,C=-1;o==="RGB"&&(f=3,m=0,c=1,y=2,w=-1),u==="RGBA"?C=l*3:u==="RBG"?(v=0,$=l,k=l*2):u==="BGR"&&($=0,k=l,v=l*2);for(let T=0;T{let r=typeof HTMLImageElement<"u"&&t instanceof HTMLImageElement,n=typeof ImageData<"u"&&t instanceof ImageData,a=typeof ImageBitmap<"u"&&t instanceof ImageBitmap,i=typeof t=="string",s,o=e??{},u=()=>{if(typeof document<"u")return document.createElement("canvas");if(typeof OffscreenCanvas<"u")return new OffscreenCanvas(1,1);throw new Error("Canvas is not supported")},l=p=>p instanceof HTMLCanvasElement||p instanceof OffscreenCanvas?p.getContext("2d"):null;if(r){let p=u();p.width=t.width,p.height=t.height;let f=l(p);if(f!=null){let m=t.height,c=t.width;if(e!==void 0&&e.resizedHeight!==void 0&&e.resizedWidth!==void 0&&(m=e.resizedHeight,c=e.resizedWidth),e!==void 0){if(o=e,e.tensorFormat!==void 0)throw new Error("Image input config format must be RGBA for HTMLImageElement");o.tensorFormat="RGBA",o.height=m,o.width=c}else o.tensorFormat="RGBA",o.height=m,o.width=c;f.drawImage(t,0,0),s=f.getImageData(0,0,c,m).data}else throw new Error("Can not access image data")}else if(n){let p,f;if(e!==void 0&&e.resizedWidth!==void 0&&e.resizedHeight!==void 0?(p=e.resizedHeight,f=e.resizedWidth):(p=t.height,f=t.width),e!==void 0&&(o=e),o.format="RGBA",o.height=p,o.width=f,e!==void 0){let m=u();m.width=f,m.height=p;let c=l(m);if(c!=null)c.putImageData(t,0,0),s=c.getImageData(0,0,f,p).data;else throw new Error("Can not access image data")}else s=t.data}else if(a){if(e===void 0)throw new Error("Please provide image config with format for Imagebitmap");let p=u();p.width=t.width,p.height=t.height;let f=l(p);if(f!=null){let m=t.height,c=t.width;return f.drawImage(t,0,0,c,m),s=f.getImageData(0,0,c,m).data,o.height=m,o.width=c,di(s,o)}else throw new Error("Can not access image data")}else{if(i)return new Promise((p,f)=>{let m=u(),c=l(m);if(!t||!c)return f();let y=new Image;y.crossOrigin="Anonymous",y.src=t,y.onload=()=>{m.width=y.width,m.height=y.height,c.drawImage(y,0,0,m.width,m.height);let w=c.getImageData(0,0,m.width,m.height);o.height=m.height,o.width=m.width,p(di(w.data,o))}});throw new Error("Input data provided is not supported - aborted tensor creation")}if(s!==void 0)return di(s,o);throw new Error("Input data provided is not supported - aborted tensor creation")},Lp=(t,e)=>{let{width:r,height:n,download:a,dispose:i}=e,s=[1,n,r,4];return new rr({location:"texture",type:"float32",texture:t,dims:s,download:a,dispose:i})},Up=(t,e)=>{let{dataType:r,dims:n,download:a,dispose:i}=e;return new rr({location:"gpu-buffer",type:r??"float32",gpuBuffer:t,dims:n,download:a,dispose:i})},Wp=(t,e,r)=>new rr({location:"cpu-pinned",type:t,data:e,dims:r??[e.length]})}),qr,ua,Es,Vp,z_=Z(()=>{qr=new Map([["float32",Float32Array],["uint8",Uint8Array],["int8",Int8Array],["uint16",Uint16Array],["int16",Int16Array],["int32",Int32Array],["bool",Uint8Array],["float64",Float64Array],["uint32",Uint32Array]]),ua=new Map([[Float32Array,"float32"],[Uint8Array,"uint8"],[Int8Array,"int8"],[Uint16Array,"uint16"],[Int16Array,"int16"],[Int32Array,"int32"],[Float64Array,"float64"],[Uint32Array,"uint32"]]),Es=!1,Vp=()=>{if(!Es){Es=!0;let t=typeof BigInt64Array<"u"&&BigInt64Array.from,e=typeof BigUint64Array<"u"&&BigUint64Array.from,r=typeof Float16Array<"u"&&Float16Array.from;t&&(qr.set("int64",BigInt64Array),ua.set(BigInt64Array,"int64")),e&&(qr.set("uint64",BigUint64Array),ua.set(BigUint64Array,"uint64")),r?(qr.set("float16",Float16Array),ua.set(Float16Array,"float16")):qr.set("float16",Uint16Array)}}}),Gp,Hp,P_=Z(()=>{Bo(),Gp=t=>{let e=1;for(let r=0;r{switch(t.location){case"cpu":return new rr(t.type,t.data,e);case"cpu-pinned":return new rr({location:"cpu-pinned",data:t.data,type:t.type,dims:e});case"texture":return new rr({location:"texture",texture:t.texture,type:t.type,dims:e});case"gpu-buffer":return new rr({location:"gpu-buffer",gpuBuffer:t.gpuBuffer,type:t.type,dims:e});default:throw new Error(`tensorReshape: tensor location ${t.location} is not supported`)}}}),rr,Bo=Z(()=>{M_(),O_(),z_(),P_(),rr=class{constructor(t,e,r){Vp();let n,a;if(typeof t=="object"&&"location"in t)switch(this.dataLocation=t.location,n=t.type,a=t.dims,t.location){case"cpu-pinned":{let s=qr.get(n);if(!s)throw new TypeError(`unsupported type "${n}" to create tensor from pinned buffer`);if(!(t.data instanceof s))throw new TypeError(`buffer should be of type ${s.name}`);this.cpuData=t.data;break}case"texture":{if(n!=="float32")throw new TypeError(`unsupported type "${n}" to create tensor from texture`);this.gpuTextureData=t.texture,this.downloader=t.download,this.disposer=t.dispose;break}case"gpu-buffer":{if(n!=="float32"&&n!=="float16"&&n!=="int32"&&n!=="int64"&&n!=="uint32"&&n!=="uint8"&&n!=="bool")throw new TypeError(`unsupported type "${n}" to create tensor from gpu buffer`);this.gpuBufferData=t.gpuBuffer,this.downloader=t.download,this.disposer=t.dispose;break}default:throw new Error(`Tensor constructor: unsupported location '${this.dataLocation}'`)}else{let s,o;if(typeof t=="string")if(n=t,o=r,t==="string"){if(!Array.isArray(e))throw new TypeError("A string tensor's data must be a string array.");s=e}else{let u=qr.get(t);if(u===void 0)throw new TypeError(`Unsupported tensor type: ${t}.`);if(Array.isArray(e)){if(t==="float16"&&u===Uint16Array)throw new TypeError("Creating a float16 tensor from number array is not supported. Please use Uint16Array as data.");t==="uint64"||t==="int64"?s=u.from(e,BigInt):s=u.from(e)}else if(e instanceof u)s=e;else throw new TypeError(`A ${n} tensor's data must be type of ${u}`)}else if(o=e,Array.isArray(t)){if(t.length===0)throw new TypeError("Tensor type cannot be inferred from an empty array.");let u=typeof t[0];if(u==="string")n="string",s=t;else if(u==="boolean")n="bool",s=Uint8Array.from(t);else throw new TypeError(`Invalid element type of data array: ${u}.`)}else{let u=ua.get(t.constructor);if(u===void 0)throw new TypeError(`Unsupported type for tensor data: ${t.constructor}.`);n=u,s=t}if(o===void 0)o=[s.length];else if(!Array.isArray(o))throw new TypeError("A tensor's dims must be a number array");a=o,this.cpuData=s,this.dataLocation="cpu"}let i=Gp(a);if(this.cpuData&&i!==this.cpuData.length)throw new Error(`Tensor's size(${i}) does not match data length(${this.cpuData.length}).`);this.type=n,this.dims=a,this.size=i}static async fromImage(t,e){return Fp(t,e)}static fromTexture(t,e){return Lp(t,e)}static fromGpuBuffer(t,e){return Up(t,e)}static fromPinnedBuffer(t,e,r){return Wp(t,e,r)}toDataURL(t){return Dp(this,t)}toImageData(t){return Np(this,t)}get data(){if(this.ensureValid(),!this.cpuData)throw new Error("The data is not on CPU. Use `getData()` to download GPU data to CPU, or use `texture` or `gpuBuffer` property to access the GPU data directly.");return this.cpuData}get location(){return this.dataLocation}get texture(){if(this.ensureValid(),!this.gpuTextureData)throw new Error("The data is not stored as a WebGL texture.");return this.gpuTextureData}get gpuBuffer(){if(this.ensureValid(),!this.gpuBufferData)throw new Error("The data is not stored as a WebGPU buffer.");return this.gpuBufferData}async getData(t){switch(this.ensureValid(),this.dataLocation){case"cpu":case"cpu-pinned":return this.data;case"texture":case"gpu-buffer":{if(!this.downloader)throw new Error("The current tensor is not created with a specified data downloader.");if(this.isDownloading)throw new Error("The current tensor is being downloaded.");try{this.isDownloading=!0;let e=await this.downloader();return this.downloader=void 0,this.dataLocation="cpu",this.cpuData=e,t&&this.disposer&&(this.disposer(),this.disposer=void 0),e}finally{this.isDownloading=!1}}default:throw new Error(`cannot get data from location: ${this.dataLocation}`)}}dispose(){if(this.isDownloading)throw new Error("The current tensor is being downloaded.");this.disposer&&(this.disposer(),this.disposer=void 0),this.cpuData=void 0,this.gpuTextureData=void 0,this.gpuBufferData=void 0,this.downloader=void 0,this.isDownloading=void 0,this.dataLocation="none"}ensureValid(){if(this.dataLocation==="none")throw new Error("The tensor is disposed.")}reshape(t){if(this.ensureValid(),this.downloader||this.disposer)throw new Error("Cannot reshape a tensor that owns GPU resource.");return Hp(this,t)}}}),bt,Do=Z(()=>{Bo(),bt=rr}),ma,Cs,nr,Lt,jp=Z(()=>{Bp(),ma=(t,e)=>{(typeof Ft.trace>"u"?!Ft.wasm.trace:!Ft.trace)||console.timeStamp(`${t}::ORT::${e}`)},Cs=(t,e)=>{let r=new Error().stack?.split(/\r\n|\r|\n/g)||[],n=!1;for(let a=0;a{(typeof Ft.trace>"u"?!Ft.wasm.trace:!Ft.trace)||Cs("BEGIN",t)},Lt=t=>{(typeof Ft.trace>"u"?!Ft.wasm.trace:!Ft.trace)||Cs("END",t)}}),qp,R_=Z(()=>{Ro(),Do(),jp(),qp=class Kp{constructor(e){this.handler=e}async run(e,r,n){nr();let a={},i={};if(typeof e!="object"||e===null||e instanceof bt||Array.isArray(e))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let s=!0;if(typeof r=="object"){if(r===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(r instanceof bt)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(r)){if(r.length===0)throw new TypeError("'fetches' cannot be an empty array.");s=!1;for(let l of r){if(typeof l!="string")throw new TypeError("'fetches' must be a string array or an object.");if(this.outputNames.indexOf(l)===-1)throw new RangeError(`'fetches' contains invalid output name: ${l}.`);a[l]=null}if(typeof n=="object"&&n!==null)i=n;else if(typeof n<"u")throw new TypeError("'options' must be an object.")}else{let l=!1,p=Object.getOwnPropertyNames(r);for(let f of this.outputNames)if(p.indexOf(f)!==-1){let m=r[f];(m===null||m instanceof bt)&&(l=!0,s=!1,a[f]=m)}if(l){if(typeof n=="object"&&n!==null)i=n;else if(typeof n<"u")throw new TypeError("'options' must be an object.")}else i=r}}else if(typeof r<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(let l of this.inputNames)if(typeof e[l]>"u")throw new Error(`input '${l}' is missing in 'feeds'.`);if(s)for(let l of this.outputNames)a[l]=null;let o=await this.handler.run(e,a,i),u={};for(let l in o)if(Object.hasOwnProperty.call(o,l)){let p=o[l];p instanceof bt?u[l]=p:u[l]=new bt(p.type,p.data,p.dims)}return Lt(),u}async release(){return this.handler.dispose()}static async create(e,r,n,a){nr();let i,s={};if(typeof e=="string"){if(i=e,typeof r=="object"&&r!==null)s=r;else if(typeof r<"u")throw new TypeError("'options' must be an object.")}else if(e instanceof Uint8Array){if(i=e,typeof r=="object"&&r!==null)s=r;else if(typeof r<"u")throw new TypeError("'options' must be an object.")}else if(e instanceof ArrayBuffer||typeof SharedArrayBuffer<"u"&&e instanceof SharedArrayBuffer){let p=e,f=0,m=e.byteLength;if(typeof r=="object"&&r!==null)s=r;else if(typeof r=="number"){if(f=r,!Number.isSafeInteger(f))throw new RangeError("'byteOffset' must be an integer.");if(f<0||f>=p.byteLength)throw new RangeError(`'byteOffset' is out of range [0, ${p.byteLength}).`);if(m=e.byteLength-f,typeof n=="number"){if(m=n,!Number.isSafeInteger(m))throw new RangeError("'byteLength' must be an integer.");if(m<=0||f+m>p.byteLength)throw new RangeError(`'byteLength' is out of range (0, ${p.byteLength-f}].`);if(typeof a=="object"&&a!==null)s=a;else if(typeof a<"u")throw new TypeError("'options' must be an object.")}else if(typeof n<"u")throw new TypeError("'byteLength' must be a number.")}else if(typeof r<"u")throw new TypeError("'options' must be an object.");i=new Uint8Array(p,f,m)}else throw new TypeError("Unexpected argument[0]: must be 'path' or 'buffer'.");let[o,u]=await Po(s),l=await o.createInferenceSessionHandler(i,u);return Lt(),new Kp(l)}startProfiling(){this.handler.startProfiling()}endProfiling(){this.handler.endProfiling()}get inputNames(){return this.handler.inputNames}get outputNames(){return this.handler.outputNames}}}),No,B_=Z(()=>{R_(),No=qp}),D_=Z(()=>{}),N_=Z(()=>{}),F_=Z(()=>{}),L_=Z(()=>{}),Yu,Yp,U_=Z(()=>{Ro(),Do(),Yu="Training backend could not be resolved. Make sure you're using the correct configuration & WebAssembly files.",Yp=class Xp{constructor(e,r,n){this.handler=e,this.hasOptimizerModel=r,this.hasEvalModel=n}get trainingInputNames(){return this.handler.inputNames}get trainingOutputNames(){return this.handler.outputNames}get evalInputNames(){if(this.hasEvalModel)return this.handler.evalInputNames;throw new Error("This training session has no evalModel loaded.")}get evalOutputNames(){if(this.hasEvalModel)return this.handler.evalOutputNames;throw new Error("This training session has no evalModel loaded.")}static async create(e,r){let n=e.evalModel||"",a=e.optimizerModel||"",i=r||{},[s,o]=await Po(i);if(s.createTrainingSessionHandler){let u=await s.createTrainingSessionHandler(e.checkpointState,e.trainModel,n,a,o);return new Xp(u,!!e.optimizerModel,!!e.evalModel)}else throw new Error(Yu)}typeNarrowingForRunStep(e,r,n,a,i){let s={},o={};if(typeof n!="object"||n===null||n instanceof bt||Array.isArray(n))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let u=!0;if(typeof a=="object"){if(a===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(a instanceof bt)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(a)){if(a.length===0)throw new TypeError("'fetches' cannot be an empty array.");u=!1;for(let l of a){if(typeof l!="string")throw new TypeError("'fetches' must be a string array or an object.");if(r.indexOf(l)===-1)throw new RangeError(`'fetches' contains invalid output name: ${l}.`);s[l]=null}if(typeof i=="object"&&i!==null)o=i;else if(typeof i<"u")throw new TypeError("'options' must be an object.")}else{let l=!1,p=Object.getOwnPropertyNames(a);for(let f of r)if(p.indexOf(f)!==-1){let m=a[f];(m===null||m instanceof bt)&&(l=!0,u=!1,s[f]=m)}if(l){if(typeof i=="object"&&i!==null)o=i;else if(typeof i<"u")throw new TypeError("'options' must be an object.")}else o=a}}else if(typeof a<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(let l of e)if(typeof n[l]>"u")throw new Error(`input '${l}' is missing in 'feeds'.`);if(u)for(let l of r)s[l]=null;return[s,o]}convertHandlerReturnTypeToMapOfTensors(e){let r={};for(let n in e)if(Object.hasOwnProperty.call(e,n)){let a=e[n];a instanceof bt?r[n]=a:r[n]=new bt(a.type,a.data,a.dims)}return r}async lazyResetGrad(){await this.handler.lazyResetGrad()}async runTrainStep(e,r,n){let[a,i]=this.typeNarrowingForRunStep(this.trainingInputNames,this.trainingOutputNames,e,r,n),s=await this.handler.runTrainStep(e,a,i);return this.convertHandlerReturnTypeToMapOfTensors(s)}async runOptimizerStep(e){if(this.hasOptimizerModel)await this.handler.runOptimizerStep(e||{});else throw new Error("This TrainingSession has no OptimizerModel loaded.")}async runEvalStep(e,r,n){if(this.hasEvalModel){let[a,i]=this.typeNarrowingForRunStep(this.evalInputNames,this.evalOutputNames,e,r,n),s=await this.handler.runEvalStep(e,a,i);return this.convertHandlerReturnTypeToMapOfTensors(s)}else throw new Error("This TrainingSession has no EvalModel loaded.")}async getParametersSize(e=!0){return this.handler.getParametersSize(e)}async loadParametersBuffer(e,r=!0){let n=await this.getParametersSize(r);if(e.length!==4*n)throw new Error("Size of the buffer passed into loadParametersBuffer must match the number of parameters in the model. Please use getParametersSize method to check.");return this.handler.loadParametersBuffer(e,r)}async getContiguousParameters(e=!0){return this.handler.getContiguousParameters(e)}async release(){return this.handler.dispose()}}}),Fo,W_=Z(()=>{U_(),Fo=Yp}),Qp={};Mn(Qp,{InferenceSession:()=>No,TRACE:()=>ma,TRACE_FUNC_BEGIN:()=>nr,TRACE_FUNC_END:()=>Lt,Tensor:()=>bt,TrainingSession:()=>Fo,env:()=>Ue,registerBackend:()=>Xr});var ar=Z(()=>{T_(),A_(),B_(),Do(),D_(),N_(),jp(),F_(),L_(),W_()}),Lo={};Mn(Lo,{createReadStream:()=>eh,readFile:()=>Jp,readFileSync:()=>Zp});var Jp,Zp,eh,th=Z(()=>{Jp=void 0,Zp=void 0,eh=void 0}),Uo={};Mn(Uo,{join:()=>rh});var rh,nh=Z(()=>{rh=void 0}),V_=An((t,e)=>{var r=(()=>{var n=typeof document<"u"?document.currentScript?.src:void 0;return typeof __filename<"u"&&(n||=__filename),function(a={}){var i=a,s,o,u=new Promise((h,_)=>{s=h,o=_});i.mountExternalData=(h,_)=>{(i.eb||(i.eb=new Map)).set(h,_)},i.unmountExternalData=()=>{delete i.eb};let l=()=>{let h=(x,E,O)=>(...F)=>{let q=kt,J=E?.();F=x(...F);let de=E?.();return J!==de&&(x=de,O(J),E=O=null),kt!=q?Ya():F},_=x=>async(...E)=>{try{if(i.cb)throw Error("Session already started");let O=i.cb={xb:E[0],errors:[]},F=await x(...E);if(i.cb!==O)throw Error("Session mismatch");i.kb?.flush();let q=O.errors;if(0de),0i._OrtCreateSession,x=>i._OrtCreateSession=x),i._OrtRun=_(h(i._OrtRun,()=>i._OrtRun,x=>i._OrtRun=x)),i._OrtRunWithBinding=_(h(i._OrtRunWithBinding,()=>i._OrtRunWithBinding,x=>i._OrtRunWithBinding=x)),i._OrtBindInput=h(i._OrtBindInput,()=>i._OrtBindInput,x=>i._OrtBindInput=x),l=void 0};i.jsepInit=(h,_)=>{if(l?.(),h==="webgpu"){[i.kb,i.pb,i.tb,i.lb,i.sb,i.Ra,i.ub,i.wb,i.qb,i.rb,i.vb]=_;let x=i.kb;i.jsepRegisterBuffer=(E,O,F,q)=>x.registerBuffer(E,O,F,q),i.jsepGetBuffer=E=>x.getBuffer(E),i.jsepCreateDownloader=(E,O,F)=>x.createDownloader(E,O,F),i.jsepOnReleaseSession=E=>{x.onReleaseSession(E)},i.jsepOnRunStart=E=>x.onRunStart(E)}};var p=Object.assign({},i),f="./this.program",m=(h,_)=>{throw _},c=typeof window=="object",y=typeof importScripts=="function",w=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string",v="",k,$,C;if(w){var T=(th(),Jr(Lo)),A=(nh(),Jr(Uo));v=y?A.dirname(v)+"/":__dirname+"/",k=(h,_)=>(h=dt(h)?new URL(h):A.normalize(h),T.readFileSync(h,_?void 0:"utf8")),C=h=>(h=k(h,!0),h.buffer||(h=new Uint8Array(h)),h),$=(h,_,x,E=!0)=>{h=dt(h)?new URL(h):A.normalize(h),T.readFile(h,E?void 0:"utf8",(O,F)=>{O?x(O):_(E?F.buffer:F)})},!i.thisProgram&&1{throw process.exitCode=h,_}}else(c||y)&&(y?v=self.location.href:typeof document<"u"&&document.currentScript&&(v=document.currentScript.src),n&&(v=n),v.startsWith("blob:")?v="":v=v.substr(0,v.replace(/[?#].*/,"").lastIndexOf("/")+1),k=h=>{var _=new XMLHttpRequest;return _.open("GET",h,!1),_.send(null),_.responseText},y&&(C=h=>{var _=new XMLHttpRequest;return _.open("GET",h,!1),_.responseType="arraybuffer",_.send(null),new Uint8Array(_.response)}),$=(h,_,x)=>{var E=new XMLHttpRequest;E.open("GET",h,!0),E.responseType="arraybuffer",E.onload=()=>{E.status==200||E.status==0&&E.response?_(E.response):x()},E.onerror=x,E.send(null)});var B=console.log.bind(console),R=console.error.bind(console);Object.assign(i,p),p=null;var D,K=!1,j,ie,te,oe,re,M,P,H,le,G,ne;function N(){var h=D.buffer;i.HEAP8=ie=new Int8Array(h),i.HEAP16=oe=new Int16Array(h),i.HEAPU8=te=new Uint8Array(h),i.HEAPU16=re=new Uint16Array(h),i.HEAP32=M=new Int32Array(h),i.HEAPU32=P=new Uint32Array(h),i.HEAPF32=H=new Float32Array(h),i.HEAPF64=ne=new Float64Array(h),i.HEAP64=le=new BigInt64Array(h),i.HEAPU64=G=new BigUint64Array(h)}var ae=[],fe=[],Ce=[],Be=0,Ke=null;function Qe(h){throw h="Aborted("+h+")",R(h),K=!0,j=1,h=new WebAssembly.RuntimeError(h+". Build with -sASSERTIONS for more info."),o(h),h}var We=h=>h.startsWith("data:application/octet-stream;base64,"),dt=h=>h.startsWith("file://"),Ve;if(Ve="ort-wasm-simd.wasm",!We(Ve)){var Ne=Ve;Ve=i.locateFile?i.locateFile(Ne,v):v+Ne}function ht(h){if(C)return C(h);throw"both async and sync fetching of the wasm failed"}function Vt(h){if(c||y){if(typeof fetch=="function"&&!dt(h))return fetch(h,{credentials:"same-origin"}).then(_=>{if(!_.ok)throw`failed to load wasm binary file at '${h}'`;return _.arrayBuffer()}).catch(()=>ht(h));if($)return new Promise((_,x)=>{$(h,E=>_(new Uint8Array(E)),x)})}return Promise.resolve().then(()=>ht(h))}function st(h,_,x){return Vt(h).then(E=>WebAssembly.instantiate(E,_)).then(x,E=>{R(`failed to asynchronously prepare wasm: ${E}`),Qe(E)})}function Pr(h,_){var x=Ve;return typeof WebAssembly.instantiateStreaming!="function"||We(x)||dt(x)||w||typeof fetch!="function"?st(x,h,_):fetch(x,{credentials:"same-origin"}).then(E=>WebAssembly.instantiateStreaming(E,h).then(_,function(O){return R(`wasm streaming compile failed: ${O}`),R("falling back to ArrayBuffer instantiation"),st(x,h,_)}))}var hr={824920:(h,_,x,E)=>{if(typeof i>"u"||!i.eb)return 1;if(h=Ye(h>>>0),h.startsWith("./")&&(h=h.substring(2)),h=i.eb.get(h),!h)return 2;if(_>>>=0,x>>>=0,_+x>h.byteLength)return 3;try{return te.set(h.subarray(_,_+x),E>>>0>>>0),0}catch{return 4}},825421:()=>{i.qb()},825452:()=>{i.rb()},825481:()=>{i.vb()},825506:h=>i.pb(h),825539:h=>i.tb(h),825571:(h,_,x)=>{i.lb(h,_,x,!0)},825610:(h,_,x)=>{i.lb(h,_,x)},825643:h=>{i.Ra("Abs",h,void 0)},825694:h=>{i.Ra("Neg",h,void 0)},825745:h=>{i.Ra("Floor",h,void 0)},825798:h=>{i.Ra("Ceil",h,void 0)},825850:h=>{i.Ra("Reciprocal",h,void 0)},825908:h=>{i.Ra("Sqrt",h,void 0)},825960:h=>{i.Ra("Exp",h,void 0)},826011:h=>{i.Ra("Erf",h,void 0)},826062:h=>{i.Ra("Sigmoid",h,void 0)},826117:(h,_,x)=>{i.Ra("HardSigmoid",h,{alpha:_,beta:x})},826196:h=>{i.Ra("Log",h,void 0)},826247:h=>{i.Ra("Sin",h,void 0)},826298:h=>{i.Ra("Cos",h,void 0)},826349:h=>{i.Ra("Tan",h,void 0)},826400:h=>{i.Ra("Asin",h,void 0)},826452:h=>{i.Ra("Acos",h,void 0)},826504:h=>{i.Ra("Atan",h,void 0)},826556:h=>{i.Ra("Sinh",h,void 0)},826608:h=>{i.Ra("Cosh",h,void 0)},826660:h=>{i.Ra("Asinh",h,void 0)},826713:h=>{i.Ra("Acosh",h,void 0)},826766:h=>{i.Ra("Atanh",h,void 0)},826819:h=>{i.Ra("Tanh",h,void 0)},826871:h=>{i.Ra("Not",h,void 0)},826922:(h,_,x)=>{i.Ra("Clip",h,{min:_,max:x})},826991:h=>{i.Ra("Clip",h,void 0)},827043:(h,_)=>{i.Ra("Elu",h,{alpha:_})},827101:h=>{i.Ra("Relu",h,void 0)},827153:(h,_)=>{i.Ra("LeakyRelu",h,{alpha:_})},827217:(h,_)=>{i.Ra("ThresholdedRelu",h,{alpha:_})},827287:(h,_)=>{i.Ra("Cast",h,{to:_})},827345:h=>{i.Ra("Add",h,void 0)},827396:h=>{i.Ra("Sub",h,void 0)},827447:h=>{i.Ra("Mul",h,void 0)},827498:h=>{i.Ra("Div",h,void 0)},827549:h=>{i.Ra("Pow",h,void 0)},827600:h=>{i.Ra("Equal",h,void 0)},827653:h=>{i.Ra("Greater",h,void 0)},827708:h=>{i.Ra("GreaterOrEqual",h,void 0)},827770:h=>{i.Ra("Less",h,void 0)},827822:h=>{i.Ra("LessOrEqual",h,void 0)},827881:(h,_,x,E,O)=>{i.Ra("ReduceMean",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828040:(h,_,x,E,O)=>{i.Ra("ReduceMax",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828198:(h,_,x,E,O)=>{i.Ra("ReduceMin",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828356:(h,_,x,E,O)=>{i.Ra("ReduceProd",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828515:(h,_,x,E,O)=>{i.Ra("ReduceSum",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828673:(h,_,x,E,O)=>{i.Ra("ReduceL1",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828830:(h,_,x,E,O)=>{i.Ra("ReduceL2",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},828987:(h,_,x,E,O)=>{i.Ra("ReduceLogSum",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},829148:(h,_,x,E,O)=>{i.Ra("ReduceSumSquare",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},829312:(h,_,x,E,O)=>{i.Ra("ReduceLogSumExp",h,{keepDims:!!_,noopWithEmptyAxes:!!x,axes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},829476:h=>{i.Ra("Where",h,void 0)},829529:(h,_,x)=>{i.Ra("Transpose",h,{perm:_?Array.from(M.subarray(_>>>0,x>>>0)):[]})},829637:(h,_,x,E)=>{i.Ra("DepthToSpace",h,{blocksize:_,mode:Ye(x),format:E?"NHWC":"NCHW"})},829770:(h,_,x,E)=>{i.Ra("DepthToSpace",h,{blocksize:_,mode:Ye(x),format:E?"NHWC":"NCHW"})},829903:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe)=>{i.Ra("ConvTranspose",h,{format:de?"NHWC":"NCHW",autoPad:_,dilations:[x],group:E,kernelShape:[O],pads:[F,q],strides:[J],wIsConst:()=>!!ie[se>>>0],outputPadding:me?Array.from(M.subarray(me>>>0,ze>>>0)):[],outputShape:Fe?Array.from(M.subarray(Fe>>>0,L>>>0)):[],activation:Ye(xe)})},830304:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L)=>{i.Ra("ConvTranspose",h,{format:J?"NHWC":"NCHW",autoPad:_,dilations:Array.from(M.subarray(x>>>0,(x>>>0)+2>>>0)),group:E,kernelShape:Array.from(M.subarray(O>>>0,(O>>>0)+2>>>0)),pads:Array.from(M.subarray(F>>>0,(F>>>0)+4>>>0)),strides:Array.from(M.subarray(q>>>0,(q>>>0)+2>>>0)),wIsConst:()=>!!ie[de>>>0],outputPadding:se?Array.from(M.subarray(se>>>0,me>>>0)):[],outputShape:ze?Array.from(M.subarray(ze>>>0,Fe>>>0)):[],activation:Ye(L)})},830869:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe)=>{i.Ra("ConvTranspose",h,{format:de?"NHWC":"NCHW",autoPad:_,dilations:[x],group:E,kernelShape:[O],pads:[F,q],strides:[J],wIsConst:()=>!!ie[se>>>0],outputPadding:me?Array.from(M.subarray(me>>>0,ze>>>0)):[],outputShape:Fe?Array.from(M.subarray(Fe>>>0,L>>>0)):[],activation:Ye(xe)})},831270:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L)=>{i.Ra("ConvTranspose",h,{format:J?"NHWC":"NCHW",autoPad:_,dilations:Array.from(M.subarray(x>>>0,(x>>>0)+2>>>0)),group:E,kernelShape:Array.from(M.subarray(O>>>0,(O>>>0)+2>>>0)),pads:Array.from(M.subarray(F>>>0,(F>>>0)+4>>>0)),strides:Array.from(M.subarray(q>>>0,(q>>>0)+2>>>0)),wIsConst:()=>!!ie[de>>>0],outputPadding:se?Array.from(M.subarray(se>>>0,me>>>0)):[],outputShape:ze?Array.from(M.subarray(ze>>>0,Fe>>>0)):[],activation:Ye(L)})},831835:(h,_)=>{i.Ra("GlobalAveragePool",h,{format:_?"NHWC":"NCHW"})},831926:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe,Oe)=>{i.Ra("AveragePool",h,{format:Oe?"NHWC":"NCHW",auto_pad:_,ceil_mode:x,count_include_pad:E,storage_order:O,dilations:[F,q],kernel_shape:[J,de],pads:[se,me,ze,Fe],strides:[L,xe]})},832210:(h,_)=>{i.Ra("GlobalAveragePool",h,{format:_?"NHWC":"NCHW"})},832301:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe,Oe)=>{i.Ra("AveragePool",h,{format:Oe?"NHWC":"NCHW",auto_pad:_,ceil_mode:x,count_include_pad:E,storage_order:O,dilations:[F,q],kernel_shape:[J,de],pads:[se,me,ze,Fe],strides:[L,xe]})},832585:(h,_)=>{i.Ra("GlobalMaxPool",h,{format:_?"NHWC":"NCHW"})},832672:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe,Oe)=>{i.Ra("MaxPool",h,{format:Oe?"NHWC":"NCHW",auto_pad:_,ceil_mode:x,count_include_pad:E,storage_order:O,dilations:[F,q],kernel_shape:[J,de],pads:[se,me,ze,Fe],strides:[L,xe]})},832952:(h,_)=>{i.Ra("GlobalMaxPool",h,{format:_?"NHWC":"NCHW"})},833039:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe,Oe)=>{i.Ra("MaxPool",h,{format:Oe?"NHWC":"NCHW",auto_pad:_,ceil_mode:x,count_include_pad:E,storage_order:O,dilations:[F,q],kernel_shape:[J,de],pads:[se,me,ze,Fe],strides:[L,xe]})},833319:(h,_,x,E,O)=>{i.Ra("Gemm",h,{alpha:_,beta:x,transA:E,transB:O})},833423:h=>{i.Ra("MatMul",h,void 0)},833477:(h,_,x,E)=>{i.Ra("ArgMax",h,{keepDims:!!_,selectLastIndex:!!x,axis:E})},833585:(h,_,x,E)=>{i.Ra("ArgMin",h,{keepDims:!!_,selectLastIndex:!!x,axis:E})},833693:(h,_)=>{i.Ra("Softmax",h,{axis:_})},833756:(h,_)=>{i.Ra("Concat",h,{axis:_})},833816:(h,_,x,E,O)=>{i.Ra("Split",h,{axis:_,numOutputs:x,splitSizes:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},833956:h=>{i.Ra("Expand",h,void 0)},834010:(h,_)=>{i.Ra("Gather",h,{axis:Number(_)})},834081:(h,_)=>{i.Ra("GatherElements",h,{axis:Number(_)})},834160:(h,_,x,E,O,F,q,J,de,se,me)=>{i.Ra("Resize",h,{antialias:_,axes:x?Array.from(M.subarray(x>>>0,E>>>0)):[],coordinateTransformMode:Ye(O),cubicCoeffA:F,excludeOutside:q,extrapolationValue:J,keepAspectRatioPolicy:Ye(de),mode:Ye(se),nearestMode:Ye(me)})},834506:(h,_,x,E,O,F,q)=>{i.Ra("Slice",h,{starts:_?Array.from(M.subarray(_>>>0,x>>>0)):[],ends:E?Array.from(M.subarray(E>>>0,O>>>0)):[],axes:F?Array.from(M.subarray(F>>>0,q>>>0)):[]})},834722:h=>{i.Ra("Tile",h,void 0)},834774:(h,_,x,E)=>{i.Ra("LayerNormalization",h,{axis:_,epsilon:x,simplified:!!E})},834885:(h,_,x)=>{i.Ra("InstanceNormalization",h,{epsilon:_,format:x?"NHWC":"NCHW"})},834999:(h,_,x)=>{i.Ra("InstanceNormalization",h,{epsilon:_,format:x?"NHWC":"NCHW"})},835113:h=>{i.Ra("Range",h,void 0)},835166:(h,_)=>{i.Ra("Einsum",h,{equation:Ye(_)})},835247:(h,_,x,E,O)=>{i.Ra("Pad",h,{mode:_,value:x,pads:E?Array.from(M.subarray(E>>>0,O>>>0)):[]})},835374:(h,_,x,E,O,F)=>{i.Ra("BatchNormalization",h,{epsilon:_,momentum:x,spatial:!!O,trainingMode:!!E,format:F?"NHWC":"NCHW"})},835543:(h,_,x,E,O,F)=>{i.Ra("BatchNormalization",h,{epsilon:_,momentum:x,spatial:!!O,trainingMode:!!E,format:F?"NHWC":"NCHW"})},835712:(h,_,x)=>{i.Ra("CumSum",h,{exclusive:Number(_),reverse:Number(x)})},835809:(h,_,x,E,O,F,q,J,de)=>{i.Ra("Attention",h,{numHeads:_,isUnidirectional:x,maskFilterValue:E,scale:O,doRotary:F,qkvHiddenSizes:q?Array.from(M.subarray(Number(J)>>>0,Number(J)+q>>>0)):[],pastPresentShareBuffer:!!de})},836081:h=>{i.Ra("BiasAdd",h,void 0)},836136:h=>{i.Ra("BiasSplitGelu",h,void 0)},836197:h=>{i.Ra("FastGelu",h,void 0)},836253:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe)=>{i.Ra("Conv",h,{format:de?"NHWC":"NCHW",auto_pad:_,dilations:[x],group:E,kernel_shape:[O],pads:F?Array.from(M.subarray(F>>>0,q>>>0)):[],strides:[J],w_is_const:()=>!!ie[se>>>0],activation:Ye(me),activation_params:ze?Array.from(H.subarray(ze>>>0,Fe>>>0)):[]})},836623:(h,_,x,E,O,F,q,J,de,se,me,ze,Fe,L,xe,Oe)=>{i.Ra("Conv",h,{format:ze?"NHWC":"NCHW",auto_pad:_,dilations:[x,E],group:O,kernel_shape:[F,q],pads:J?Array.from(M.subarray(J>>>0,de>>>0)):[],strides:[se,me],w_is_const:()=>!!ie[Fe>>>0],activation:Ye(L),activation_params:xe?Array.from(H.subarray(xe>>>0,Oe>>>0)):[]})},837014:h=>{i.Ra("Gelu",h,void 0)},837066:(h,_,x,E,O,F)=>{i.Ra("MatMulNBits",h,{k:_,n:x,accuracyLevel:E,bits:O,blockSize:F})},837193:(h,_,x,E,O,F)=>{i.Ra("MultiHeadAttention",h,{numHeads:_,isUnidirectional:x,maskFilterValue:E,scale:O,doRotary:F})},837352:(h,_,x,E,O)=>{i.Ra("RotaryEmbedding",h,{interleaved:!!_,numHeads:x,rotaryEmbeddingDim:E,scale:O})},837491:(h,_,x)=>{i.Ra("SkipLayerNormalization",h,{epsilon:_,simplified:!!x})},837593:(h,_,x)=>{i.Ra("SkipLayerNormalization",h,{epsilon:_,simplified:!!x})},837695:(h,_,x,E)=>{i.Ra("LayerNormalization",h,{axis:_,epsilon:x,simplified:!!E})},837806:h=>{i.ub(h)},837840:(h,_)=>i.wb(h,_,i.cb.xb,i.cb.errors)};function ir(h){this.name="ExitStatus",this.message=`Program terminated with exit(${h})`,this.status=h}class ls{constructor(_){this.hb=_-24}}var fr=0,Sr=typeof TextDecoder<"u"?new TextDecoder("utf8"):void 0,Bn=(h,_,x)=>{_>>>=0;var E=_+x;for(x=_;h[x]&&!(x>=E);)++x;if(16O?E+=String.fromCharCode(O):(O-=65536,E+=String.fromCharCode(55296|O>>10,56320|O&1023))}}else E+=String.fromCharCode(O)}return E},Ye=(h,_)=>(h>>>=0)?Bn(te,h,_):"",un=h=>{for(var _=0,x=0;x=E?_++:2047>=E?_+=2:55296<=E&&57343>=E?(_+=4,++x):_+=3}return _},Bt=(h,_,x,E)=>{if(x>>>=0,!(0=q){var J=h.charCodeAt(++F);q=65536+((q&1023)<<10)|J&1023}if(127>=q){if(x>=E)break;_[x++>>>0]=q}else{if(2047>=q){if(x+1>=E)break;_[x++>>>0]=192|q>>6}else{if(65535>=q){if(x+2>=E)break;_[x++>>>0]=224|q>>12}else{if(x+3>=E)break;_[x++>>>0]=240|q>>18,_[x++>>>0]=128|q>>12&63}_[x++>>>0]=128|q>>6&63}_[x++>>>0]=128|q&63}}return _[x>>>0]=0,x-O},kr,At=h=>{for(var _="";te[h>>>0];)_+=kr[te[h++>>>0]];return _},Dn={},ln={},sr;function Nn(h,_,x={}){var E=_.name;if(!h)throw new sr(`type "${E}" must have a positive integer typeid pointer`);if(ln.hasOwnProperty(h)){if(x.nb)return;throw new sr(`Cannot register type '${E}' twice`)}ln[h]=_,Dn.hasOwnProperty(h)&&(_=Dn[h],delete Dn[h],_.forEach(O=>O()))}function xt(h,_,x={}){if(!("argPackAdvance"in _))throw new TypeError("registerType registeredInstance requires argPackAdvance");return Nn(h,_,x)}var dn=(h,_,x)=>{switch(_){case 1:return x?E=>ie[E>>>0]:E=>te[E>>>0];case 2:return x?E=>oe[E>>>1>>>0]:E=>re[E>>>1>>>0];case 4:return x?E=>M[E>>>2>>>0]:E=>P[E>>>2>>>0];case 8:return x?E=>le[E>>>3]:E=>G[E>>>3];default:throw new TypeError(`invalid integer width (${_}): ${h}`)}},cn=[],ot=[];function Fn(h){h>>>=0,9{if(!h)throw new sr("Cannot use deleted val. handle = "+h);return ot[h]},St=h=>{switch(h){case void 0:return 2;case null:return 4;case!0:return 6;case!1:return 8;default:let _=cn.pop()||ot.length;return ot[_]=h,ot[_+1]=1,_}};function Rr(h){return this.fromWireType(P[h>>>2>>>0])}var ds={name:"emscripten::val",fromWireType:h=>{var _=Ie(h);return Fn(h),_},toWireType:(h,_)=>St(_),argPackAdvance:8,readValueFromPointer:Rr,bb:null},Ua=(h,_)=>{switch(_){case 4:return function(x){return this.fromWireType(H[x>>>2>>>0])};case 8:return function(x){return this.fromWireType(ne[x>>>3>>>0])};default:throw new TypeError(`invalid float width (${_}): ${h}`)}},Wa=typeof TextDecoder<"u"?new TextDecoder("utf-16le"):void 0,be=(h,_)=>{for(var x=h>>1,E=x+_/2;!(x>=E)&&re[x>>>0];)++x;if(x<<=1,32>>0,x>>>0));for(x="",E=0;!(E>=_/2);++E){var O=oe[h+2*E>>>1>>>0];if(O==0)break;x+=String.fromCharCode(O)}return x},pn=(h,_,x)=>{if(x??=2147483647,2>x)return 0;x-=2;var E=_;x=x<2*h.length?x/2:h.length;for(var O=0;O>>1>>>0]=h.charCodeAt(O),_+=2;return oe[_>>>1>>>0]=0,_-E},Va=h=>2*h.length,cs=(h,_)=>{for(var x=0,E="";!(x>=_/4);){var O=M[h+4*x>>>2>>>0];if(O==0)break;++x,65536<=O?(O-=65536,E+=String.fromCharCode(55296|O>>10,56320|O&1023)):E+=String.fromCharCode(O)}return E},Ga=(h,_,x)=>{if(_>>>=0,x??=2147483647,4>x)return 0;var E=_;x=E+x-4;for(var O=0;O=F){var q=h.charCodeAt(++O);F=65536+((F&1023)<<10)|q&1023}if(M[_>>>2>>>0]=F,_+=4,_+4>x)break}return M[_>>>2>>>0]=0,_-E},Ha=h=>{for(var _=0,x=0;x=E&&++x,_+=4}return _},hn=(h,_)=>{var x=ln[h];if(x===void 0)throw h=Yn(h),x=At(h),_t(h),new sr(`${_} has unknown type ${x}`);return x},Ln=(h,_,x)=>{var E=[];return h=h.toWireType(E,x),E.length&&(P[_>>>2>>>0]=St(E)),h},Br=h=>{try{h()}catch(_){Qe(_)}},nt=h=>{if(!K)try{h();try{j=j=h=j,i.onExit?.(h),K=!0,m(h,new ir(h))}catch(_){_ instanceof ir||_=="unwind"||m(1,_)}}catch(_){_ instanceof ir||_=="unwind"||m(1,_)}};function ja(){var h=we,_={};for(let[x,E]of Object.entries(h))_[x]=typeof E=="function"?(...O)=>{Ht.push(x);try{return E(...O)}finally{K||(Ht.pop(),kt&&Gt===1&&Ht.length===0&&(Gt=0,Br(ri),typeof Fibers<"u"&&Fibers.Db()))}}:E;return _}var Gt=0,kt=null,Un=0,Ht=[],Wn={},Vn={},qa=0,fn=null,Ka=[];function Ya(){return new Promise((h,_)=>{fn={resolve:h,reject:_}})}function Xa(){var h=Er(65548),_=h+12;P[h>>>2>>>0]=_,P[h+4>>>2>>>0]=_+65536,_=Ht[0];var x=Wn[_];return x===void 0&&(x=qa++,Wn[_]=x,Vn[x]=_),M[h+8>>>2>>>0]=x,h}function Qa(h){if(!K){if(Gt===0){var _=!1,x=!1;h((E=0)=>{if(!K&&(Un=E,_=!0,x)){Gt=2,Br(()=>qt(kt)),typeof Browser<"u"&&Browser.ib.mb&&Browser.ib.resume(),E=!1;try{var O=(0,we[Vn[M[kt+8>>>2>>>0]]])()}catch(J){O=J,E=!0}var F=!1;if(!kt){var q=fn;q&&(fn=null,(E?q.reject:q.resolve)(O),F=!0)}if(E&&!F)throw O}}),x=!0,_||(Gt=1,kt=Xa(),typeof Browser<"u"&&Browser.ib.mb&&Browser.ib.pause(),Br(()=>Fr(kt)))}else Gt===2?(Gt=0,Br(zt),_t(kt),kt=null,Ka.forEach(nt)):Qe(`invalid state: ${Gt}`);return Un}}function Gn(h){return Qa(_=>{h().then(_)})}var Dr=[],Ja={},mn=h=>{var _=Ja[h];return _===void 0?At(h):_},Mt=()=>typeof globalThis=="object"?globalThis:Function("return this")(),Hn=h=>{var _=Dr.length;return Dr.push(h),_},jn=(h,_)=>{for(var x=Array(h),E=0;E>>2>>>0],"parameter "+E);return x},jt=(h,_)=>Object.defineProperty(_,"name",{value:h});function ps(h){var _=Function;if(!(_ instanceof Function))throw new TypeError(`new_ called with constructor type ${typeof _} which is not a function`);var x=jt(_.name||"unknownFunctionName",function(){});return x.prototype=_.prototype,x=new x,h=_.apply(x,h),h instanceof Object?h:x}var ft=h=>h%4===0&&(h%100!==0||h%400===0),qn=[0,31,60,91,121,152,182,213,244,274,305,335],gn=[0,31,59,90,120,151,181,212,243,273,304,334],Ot=[],_n=(h,_)=>{Ot.length=0;for(var x;x=te[h++>>>0];){var E=x!=105;E&=x!=112,_+=E&&_%8?4:0,Ot.push(x==112?P[_>>>2>>>0]:x==106?le[_>>>3]:x==105?M[_>>>2>>>0]:ne[_>>>3>>>0]),_+=E?8:4}return Ot},ut={},Et=()=>{if(!Nr){var h={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(typeof navigator=="object"&&navigator.languages&&navigator.languages[0]||"C").replace("-","_")+".UTF-8",_:f||"./this.program"},_;for(_ in ut)ut[_]===void 0?delete h[_]:h[_]=ut[_];var x=[];for(_ in h)x.push(`${_}=${h[_]}`);Nr=x}return Nr},Nr,hs=[null,[],[]],Za=[31,29,31,30,31,30,31,31,30,31,30,31],Kn=[31,28,31,30,31,30,31,31,30,31,30,31];function fs(h){var _=Array(un(h)+1);return Bt(h,_,0,_.length),_}function ei(h,_,x,E){function O(L,xe,Oe){for(L=typeof L=="number"?L.toString():L||"";L.length_r?-1:0<_r?1:0}var gr;return(gr=Oe(L.getFullYear()-xe.getFullYear()))===0&&(gr=Oe(L.getMonth()-xe.getMonth()))===0&&(gr=Oe(L.getDate()-xe.getDate())),gr}function J(L){switch(L.getDay()){case 0:return new Date(L.getFullYear()-1,11,29);case 1:return L;case 2:return new Date(L.getFullYear(),0,3);case 3:return new Date(L.getFullYear(),0,2);case 4:return new Date(L.getFullYear(),0,1);case 5:return new Date(L.getFullYear()-1,11,31);case 6:return new Date(L.getFullYear()-1,11,30)}}function de(L){var xe=L.$a;for(L=new Date(new Date(L.ab+1900,0,1).getTime());0gr-L.getDate())xe-=gr-L.getDate()+1,L.setDate(1),11>Oe?L.setMonth(Oe+1):(L.setMonth(0),L.setFullYear(L.getFullYear()+1));else{L.setDate(L.getDate()+xe);break}}return Oe=new Date(L.getFullYear()+1,0,4),xe=J(new Date(L.getFullYear(),0,4)),Oe=J(Oe),0>=q(xe,L)?0>=q(Oe,L)?L.getFullYear()+1:L.getFullYear():L.getFullYear()-1}h>>>=0,_>>>=0,x>>>=0,E>>>=0;var se=P[E+40>>>2>>>0];E={Ab:M[E>>>2>>>0],zb:M[E+4>>>2>>>0],fb:M[E+8>>>2>>>0],jb:M[E+12>>>2>>>0],gb:M[E+16>>>2>>>0],ab:M[E+20>>>2>>>0],Va:M[E+24>>>2>>>0],$a:M[E+28>>>2>>>0],Cb:M[E+32>>>2>>>0],yb:M[E+36>>>2>>>0],Bb:se?Ye(se):""},x=Ye(x),se={"%c":"%a %b %d %H:%M:%S %Y","%D":"%m/%d/%y","%F":"%Y-%m-%d","%h":"%b","%r":"%I:%M:%S %p","%R":"%H:%M","%T":"%H:%M:%S","%x":"%m/%d/%y","%X":"%H:%M:%S","%Ec":"%c","%EC":"%C","%Ex":"%m/%d/%y","%EX":"%H:%M:%S","%Ey":"%y","%EY":"%Y","%Od":"%d","%Oe":"%e","%OH":"%H","%OI":"%I","%Om":"%m","%OM":"%M","%OS":"%S","%Ou":"%u","%OU":"%U","%OV":"%V","%Ow":"%w","%OW":"%W","%Oy":"%y"};for(var me in se)x=x.replace(new RegExp(me,"g"),se[me]);var ze="Sunday Monday Tuesday Wednesday Thursday Friday Saturday".split(" "),Fe="January February March April May June July August September October November December".split(" ");se={"%a":L=>ze[L.Va].substring(0,3),"%A":L=>ze[L.Va],"%b":L=>Fe[L.gb].substring(0,3),"%B":L=>Fe[L.gb],"%C":L=>F((L.ab+1900)/100|0,2),"%d":L=>F(L.jb,2),"%e":L=>O(L.jb,2," "),"%g":L=>de(L).toString().substring(2),"%G":de,"%H":L=>F(L.fb,2),"%I":L=>(L=L.fb,L==0?L=12:12{for(var xe=0,Oe=0;Oe<=L.gb-1;xe+=(ft(L.ab+1900)?Za:Kn)[Oe++]);return F(L.jb+xe,3)},"%m":L=>F(L.gb+1,2),"%M":L=>F(L.zb,2),"%n":()=>` -`,"%p":L=>0<=L.fb&&12>L.fb?"AM":"PM","%S":L=>F(L.Ab,2),"%t":()=>" ","%u":L=>L.Va||7,"%U":L=>F(Math.floor((L.$a+7-L.Va)/7),2),"%V":L=>{var xe=Math.floor((L.$a+7-(L.Va+6)%7)/7);if(2>=(L.Va+371-L.$a-2)%7&&xe++,xe)xe==53&&(Oe=(L.Va+371-L.$a)%7,Oe==4||Oe==3&&ft(L.ab)||(xe=1));else{xe=52;var Oe=(L.Va+7-L.$a-1)%7;(Oe==4||Oe==5&&ft(L.ab%400-1))&&xe++}return F(xe,2)},"%w":L=>L.Va,"%W":L=>F(Math.floor((L.$a+7-(L.Va+6)%7)/7),2),"%y":L=>(L.ab+1900).toString().substring(2),"%Y":L=>L.ab+1900,"%z":L=>{L=L.yb;var xe=0<=L;return L=Math.abs(L)/60,(xe?"+":"-")+("0000"+(L/60*100+L%60)).slice(-4)},"%Z":L=>L.Bb,"%%":()=>"%"},x=x.replace(/%%/g,"\0\0");for(me in se)x.includes(me)&&(x=x.replace(new RegExp(me,"g"),se[me](E)));return x=x.replace(/\0\0/g,"%"),me=fs(x),me.length>_?0:(ie.set(me,h>>>0),me.length-1)}for(var ti=Array(256),yn=0;256>yn;++yn)ti[yn]=String.fromCharCode(yn);kr=ti,sr=i.BindingError=class extends Error{constructor(h){super(h),this.name="BindingError"}},i.InternalError=class extends Error{constructor(h){super(h),this.name="InternalError"}},ot.push(0,1,void 0,1,null,1,!0,1,!1,1),i.count_emval_handles=()=>ot.length/2-5-cn.length;var ms={ia:function(h,_,x){return Gn(async()=>{await i.sb(h,_,x)})},a:function(h,_,x){h>>>=0;var E=new ls(h);throw P[E.hb+16>>>2>>>0]=0,P[E.hb+4>>>2>>>0]=_>>>0,P[E.hb+8>>>2>>>0]=x>>>0,fr=h,fr},y:function(){return 0},ea:function(){},R:function(){},T:function(){},ga:function(){return 0},ca:function(){},Z:function(){},ba:function(){},G:function(){},S:function(){},P:function(){},da:function(){},Q:function(){},C:function(h,_,x){_=At(_>>>0),xt(h>>>0,{name:_,fromWireType:E=>E,toWireType:function(E,O){if(typeof O!="bigint"&&typeof O!="number")throw O===null?O="null":(E=typeof O,O=E==="object"||E==="array"||E==="function"?O.toString():""+O),new TypeError(`Cannot convert "${O}" to ${this.name}`);return typeof O=="number"&&(O=BigInt(O)),O},argPackAdvance:8,readValueFromPointer:dn(_,x>>>0,_.indexOf("u")==-1),bb:null})},K:function(h,_,x,E){_=At(_>>>0),xt(h>>>0,{name:_,fromWireType:function(O){return!!O},toWireType:function(O,F){return F?x:E},argPackAdvance:8,readValueFromPointer:function(O){return this.fromWireType(te[O>>>0])},bb:null})},J:function(h){return xt(h>>>0,ds)},B:function(h,_,x){_=At(_>>>0),xt(h>>>0,{name:_,fromWireType:E=>E,toWireType:(E,O)=>O,argPackAdvance:8,readValueFromPointer:Ua(_,x>>>0),bb:null})},s:function(h,_,x,E,O){if(h>>>=0,x>>>=0,_=At(_>>>0),O===-1&&(O=4294967295),O=J=>J,E===0){var F=32-8*x;O=J=>J<>>F}var q=_.includes("unsigned")?function(J,de){return de>>>0}:function(J,de){return de};xt(h,{name:_,fromWireType:O,toWireType:q,argPackAdvance:8,readValueFromPointer:dn(_,x,E!==0),bb:null})},o:function(h,_,x){function E(F){return new O(ie.buffer,P[F+4>>>2>>>0],P[F>>>2>>>0])}var O=[Int8Array,Uint8Array,Int16Array,Uint16Array,Int32Array,Uint32Array,Float32Array,Float64Array,BigInt64Array,BigUint64Array][_];x=At(x>>>0),xt(h>>>0,{name:x,fromWireType:E,argPackAdvance:8,readValueFromPointer:E},{nb:!0})},D:function(h,_){_=At(_>>>0);var x=_==="std::string";xt(h>>>0,{name:_,fromWireType:function(E){var O=P[E>>>2>>>0],F=E+4;if(x)for(var q=F,J=0;J<=O;++J){var de=F+J;if(J==O||te[de>>>0]==0){if(q=Ye(q,de-q),se===void 0)var se=q;else se+="\0",se+=q;q=de+1}}else{for(se=Array(O),J=0;J>>0]);se=se.join("")}return _t(E),se},toWireType:function(E,O){O instanceof ArrayBuffer&&(O=new Uint8Array(O));var F=typeof O=="string";if(!(F||O instanceof Uint8Array||O instanceof Uint8ClampedArray||O instanceof Int8Array))throw new sr("Cannot pass non-string to std::string");var q=x&&F?un(O):O.length,J=Er(4+q+1),de=J+4;if(P[J>>>2>>>0]=q,x&&F)Bt(O,te,de,q+1);else if(F)for(F=0;F>>0]=se}else for(F=0;F>>0]=O[F];return E!==null&&E.push(_t,J),J},argPackAdvance:8,readValueFromPointer:Rr,bb(E){_t(E)}})},x:function(h,_,x){if(_>>>=0,x>>>=0,x=At(x),_===2)var E=be,O=pn,F=Va,q=J=>re[J>>>1>>>0];else _===4&&(E=cs,O=Ga,F=Ha,q=J=>P[J>>>2>>>0]);xt(h>>>0,{name:x,fromWireType:J=>{for(var de=P[J>>>2>>>0],se,me=J+4,ze=0;ze<=de;++ze){var Fe=J+4+ze*_;(ze==de||q(Fe)==0)&&(me=E(me,Fe-me),se===void 0?se=me:(se+="\0",se+=me),me=Fe+_)}return _t(J),se},toWireType:(J,de)=>{if(typeof de!="string")throw new sr(`Cannot pass non-string to C++ string type ${x}`);var se=F(de),me=Er(4+se+_);return P[me>>>2>>>0]=se/_,O(de,me+4,se+_),J!==null&&J.push(_t,me),me},argPackAdvance:8,readValueFromPointer:Rr,bb(J){_t(J)}})},L:function(h,_){_=At(_>>>0),xt(h>>>0,{ob:!0,name:_,argPackAdvance:0,fromWireType:()=>{},toWireType:()=>{}})},ha:()=>1,u:function(h,_,x){return _>>>=0,x>>>=0,h=Ie(h>>>0),_=hn(_,"emval::as"),Ln(_,x,h)},w:function(h){return h>>>=0,Gn(()=>(h=Ie(h),h.then(St)))},n:function(h,_,x,E){return x>>>=0,E>>>=0,h=Dr[h>>>0],_=Ie(_>>>0),h(null,_,x,E)},j:function(h,_,x,E,O){return x>>>=0,E>>>=0,O>>>=0,h=Dr[h>>>0],_=Ie(_>>>0),x=mn(x),h(_,_[x],E,O)},b:Fn,A:function(h,_){return _>>>=0,h=Ie(h>>>0),_=Ie(_),h==_},m:function(h){return h>>>=0,h===0?St(Mt()):(h=mn(h),St(Mt()[h]))},i:function(h,_,x){_=jn(h,_>>>0);var E=_.shift();h--;var O=`return function (obj, func, destructorsRef, args) { -`,F=0,q=[];x===0&&q.push("obj");for(var J=["retType"],de=[E],se=0;seme.name).join(", ")}) => ${E.name}>`,Hn(jt(x,h))},r:function(h,_){return _>>>=0,h=Ie(h>>>0),_=Ie(_),St(h[_])},e:function(h){h>>>=0,9>>0);for(var _=Array(h.length),x=0;x>>0))},k:function(){return St({})},h:function(h){h>>>=0;for(var _=Ie(h);_.length;){var x=_.pop();_.pop()(x)}Fn(h)},g:function(h,_,x){_>>>=0,x>>>=0,h=Ie(h>>>0),_=Ie(_),x=Ie(x),h[_]=x},c:function(h,_){return _>>>=0,h=hn(h>>>0,"_emval_take_value"),h=h.readValueFromPointer(_),St(h)},W:function(h,_){h=-9007199254740992>h||9007199254740992>>=0,h=new Date(1e3*h),M[_>>>2>>>0]=h.getUTCSeconds(),M[_+4>>>2>>>0]=h.getUTCMinutes(),M[_+8>>>2>>>0]=h.getUTCHours(),M[_+12>>>2>>>0]=h.getUTCDate(),M[_+16>>>2>>>0]=h.getUTCMonth(),M[_+20>>>2>>>0]=h.getUTCFullYear()-1900,M[_+24>>>2>>>0]=h.getUTCDay(),M[_+28>>>2>>>0]=(h.getTime()-Date.UTC(h.getUTCFullYear(),0,1,0,0,0,0))/864e5|0},X:function(h,_){h=-9007199254740992>h||9007199254740992>>=0,h=new Date(1e3*h),M[_>>>2>>>0]=h.getSeconds(),M[_+4>>>2>>>0]=h.getMinutes(),M[_+8>>>2>>>0]=h.getHours(),M[_+12>>>2>>>0]=h.getDate(),M[_+16>>>2>>>0]=h.getMonth(),M[_+20>>>2>>>0]=h.getFullYear()-1900,M[_+24>>>2>>>0]=h.getDay(),M[_+28>>>2>>>0]=(ft(h.getFullYear())?qn:gn)[h.getMonth()]+h.getDate()-1|0,M[_+36>>>2>>>0]=-(60*h.getTimezoneOffset());var x=new Date(h.getFullYear(),6,1).getTimezoneOffset(),E=new Date(h.getFullYear(),0,1).getTimezoneOffset();M[_+32>>>2>>>0]=(x!=E&&h.getTimezoneOffset()==Math.min(E,x))|0},Y:function(h){h>>>=0;var _=new Date(M[h+20>>>2>>>0]+1900,M[h+16>>>2>>>0],M[h+12>>>2>>>0],M[h+8>>>2>>>0],M[h+4>>>2>>>0],M[h>>>2>>>0],0),x=M[h+32>>>2>>>0],E=_.getTimezoneOffset(),O=new Date(_.getFullYear(),6,1).getTimezoneOffset(),F=new Date(_.getFullYear(),0,1).getTimezoneOffset(),q=Math.min(F,O);return 0>x?M[h+32>>>2>>>0]=+(O!=F&&q==E):0>>2>>>0]=_.getDay(),M[h+28>>>2>>>0]=(ft(_.getFullYear())?qn:gn)[_.getMonth()]+_.getDate()-1|0,M[h>>>2>>>0]=_.getSeconds(),M[h+4>>>2>>>0]=_.getMinutes(),M[h+8>>>2>>>0]=_.getHours(),M[h+12>>>2>>>0]=_.getDate(),M[h+16>>>2>>>0]=_.getMonth(),M[h+20>>>2>>>0]=_.getYear(),h=_.getTime(),BigInt(isNaN(h)?-1:h/1e3)},U:function(){return-52},V:function(){},N:function(h,_,x,E){x>>>=0,E>>>=0;var O=new Date().getFullYear(),F=new Date(O,0,1),q=new Date(O,6,1);O=F.getTimezoneOffset();var J=q.getTimezoneOffset();P[h>>>0>>>2>>>0]=60*Math.max(O,J),M[_>>>0>>>2>>>0]=+(O!=J),h=de=>de.toLocaleTimeString(void 0,{hour12:!1,timeZoneName:"short"}).split(" ")[1],F=h(F),q=h(q),J{Qe("")},d:function(h,_,x){return h>>>=0,_=_n(_>>>0,x>>>0),hr[h](..._)},I:function(h,_,x){return h>>>=0,_=_n(_>>>0,x>>>0),hr[h](..._)},H:()=>Date.now(),O:function(){return 4294901760},q:()=>performance.now(),M:function(h){h>>>=0;var _=te.length;if(4294901760=x;x*=2){var E=_*(1+.2/x);E=Math.min(E,h+100663296);var O=Math;E=Math.max(h,E);e:{O=(O.min.call(O,4294901760,E+(65536-E%65536)%65536)-D.buffer.byteLength+65535)/65536;try{D.grow(O),N();var F=1;break e}catch{}F=void 0}if(F)return!0}return!1},$:function(h,_){h>>>=0,_>>>=0;var x=0;return Et().forEach((E,O)=>{var F=_+x;for(O=P[h+4*O>>>2>>>0]=F,F=0;F>>0]=E.charCodeAt(F);ie[O>>>0]=0,x+=E.length+1}),0},aa:function(h,_){h>>>=0,_>>>=0;var x=Et();P[h>>>2>>>0]=x.length;var E=0;return x.forEach(O=>E+=O.length+1),P[_>>>2>>>0]=E,0},z:()=>52,F:function(){return 52},_:function(){return 70},E:function(h,_,x,E){_>>>=0,x>>>=0,E>>>=0;for(var O=0,F=0;F>>2>>>0],J=P[_+4>>>2>>>0];_+=8;for(var de=0;de>>0],me=hs[h];se===0||se===10?((h===1?B:R)(Bn(me,0)),me.length=0):me.push(se)}O+=J}return P[E>>>2>>>0]=O,0},fa:ei,p:function(h,_,x,E){return ei(h>>>0,_>>>0,x>>>0,E>>>0)}},we=function(){function h(x){return we=x.exports,we=ja(),we=ni(),D=we.ja,N(),fe.unshift(we.ka),Be--,Be==0&&Ke&&(x=Ke,Ke=null,x()),we}var _={a:ms};if(Be++,i.instantiateWasm)try{return i.instantiateWasm(_,h)}catch(x){R(`Module.instantiateWasm callback failed with error: ${x}`),o(x)}return Pr(_,function(x){h(x.instance)}).catch(o),{}}(),Yn=h=>(Yn=we.la)(h);i._OrtInit=(h,_)=>(i._OrtInit=we.ma)(h,_),i._OrtGetLastError=(h,_)=>(i._OrtGetLastError=we.na)(h,_),i._OrtCreateSessionOptions=(h,_,x,E,O,F,q,J,de,se)=>(i._OrtCreateSessionOptions=we.oa)(h,_,x,E,O,F,q,J,de,se),i._OrtAppendExecutionProvider=(h,_)=>(i._OrtAppendExecutionProvider=we.pa)(h,_),i._OrtAddFreeDimensionOverride=(h,_,x)=>(i._OrtAddFreeDimensionOverride=we.qa)(h,_,x),i._OrtAddSessionConfigEntry=(h,_,x)=>(i._OrtAddSessionConfigEntry=we.ra)(h,_,x),i._OrtReleaseSessionOptions=h=>(i._OrtReleaseSessionOptions=we.sa)(h),i._OrtCreateSession=(h,_,x)=>(i._OrtCreateSession=we.ta)(h,_,x),i._OrtReleaseSession=h=>(i._OrtReleaseSession=we.ua)(h),i._OrtGetInputOutputCount=(h,_,x)=>(i._OrtGetInputOutputCount=we.va)(h,_,x),i._OrtGetInputName=(h,_)=>(i._OrtGetInputName=we.wa)(h,_),i._OrtGetOutputName=(h,_)=>(i._OrtGetOutputName=we.xa)(h,_),i._OrtFree=h=>(i._OrtFree=we.ya)(h),i._OrtCreateTensor=(h,_,x,E,O,F)=>(i._OrtCreateTensor=we.za)(h,_,x,E,O,F),i._OrtGetTensorData=(h,_,x,E,O)=>(i._OrtGetTensorData=we.Aa)(h,_,x,E,O),i._OrtReleaseTensor=h=>(i._OrtReleaseTensor=we.Ba)(h),i._OrtCreateRunOptions=(h,_,x,E)=>(i._OrtCreateRunOptions=we.Ca)(h,_,x,E),i._OrtAddRunConfigEntry=(h,_,x)=>(i._OrtAddRunConfigEntry=we.Da)(h,_,x),i._OrtReleaseRunOptions=h=>(i._OrtReleaseRunOptions=we.Ea)(h),i._OrtCreateBinding=h=>(i._OrtCreateBinding=we.Fa)(h),i._OrtBindInput=(h,_,x)=>(i._OrtBindInput=we.Ga)(h,_,x),i._OrtBindOutput=(h,_,x,E)=>(i._OrtBindOutput=we.Ha)(h,_,x,E),i._OrtClearBoundOutputs=h=>(i._OrtClearBoundOutputs=we.Ia)(h),i._OrtReleaseBinding=h=>(i._OrtReleaseBinding=we.Ja)(h),i._OrtRunWithBinding=(h,_,x,E,O)=>(i._OrtRunWithBinding=we.Ka)(h,_,x,E,O),i._OrtRun=(h,_,x,E,O,F,q,J)=>(i._OrtRun=we.La)(h,_,x,E,O,F,q,J),i._OrtEndProfiling=h=>(i._OrtEndProfiling=we.Ma)(h),i._JsepOutput=(h,_,x)=>(i._JsepOutput=we.Na)(h,_,x),i._JsepGetNodeName=h=>(i._JsepGetNodeName=we.Oa)(h);var Er=i._malloc=h=>(Er=i._malloc=we.Pa)(h),_t=i._free=h=>(_t=i._free=we.Qa)(h),wn=h=>(wn=we.Sa)(h),bn=h=>(bn=we.Ta)(h),Xn=()=>(Xn=we.Ua)(),Fr=h=>(Fr=we.Wa)(h),ri=()=>(ri=we.Xa)(),qt=h=>(qt=we.Ya)(h),zt=()=>(zt=we.Za)();i.___start_em_js=837952,i.___stop_em_js=838113;function ni(){var h=we;h=Object.assign({},h);var _=x=>E=>x(E)>>>0;return h.la=_(h.la),h.Pa=_(h.Pa),h.Ta=_(h.Ta),h.Ua=(x=>()=>x()>>>0)(h.Ua),h}i.stackSave=()=>Xn(),i.stackRestore=h=>wn(h),i.stackAlloc=h=>bn(h),i.UTF8ToString=Ye,i.stringToUTF8=(h,_,x)=>Bt(h,te,_,x),i.lengthBytesUTF8=un;var mr;Ke=function h(){mr||Qn(),mr||(Ke=h)};function Qn(){if(!(0r)}),G_=An(()=>{}),H_=An(()=>{}),ah={};Mn(ah,{cpus:()=>ih});var ih,j_=Z(()=>{ih=void 0}),q_=An((t,e)=>{var r=(()=>{var n=typeof document<"u"?document.currentScript?.src:void 0;return typeof __filename<"u"&&(n||=__filename),function(a={}){function i(){return ne.buffer!=Ce.buffer&&st(),Ce}function s(){return ne.buffer!=Ce.buffer&&st(),Be}function o(){return ne.buffer!=Ce.buffer&&st(),Ke}function u(){return ne.buffer!=Ce.buffer&&st(),Qe}function l(){return ne.buffer!=Ce.buffer&&st(),We}function p(){return ne.buffer!=Ce.buffer&&st(),dt}function f(){return ne.buffer!=Ce.buffer&&st(),Ve}function m(){return ne.buffer!=Ce.buffer&&st(),Vt}var c=a,y,w,v=new Promise((d,g)=>{y=d,w=g});c.mountExternalData=(d,g)=>{(c.Db||(c.Db=new Map)).set(d,g)},c.unmountExternalData=()=>{delete c.Db};let k=()=>{let d=(b,S,I)=>(...z)=>{let V=zt,X=S?.();z=b(...z);let ce=S?.();return X!==ce&&(b=ce,I(X),S=I=null),zt!=V?O():z},g=b=>async(...S)=>{try{if(c.Cb)throw Error("Session already started");let I=c.Cb={ec:S[0],errors:[]},z=await b(...S);if(c.Cb!==I)throw Error("Session mismatch");c.Kb?.flush();let V=I.errors;if(0ce),0c._OrtCreateSession,b=>c._OrtCreateSession=b),c._OrtRun=g(d(c._OrtRun,()=>c._OrtRun,b=>c._OrtRun=b)),c._OrtRunWithBinding=g(d(c._OrtRunWithBinding,()=>c._OrtRunWithBinding,b=>c._OrtRunWithBinding=b)),c._OrtBindInput=d(c._OrtBindInput,()=>c._OrtBindInput,b=>c._OrtBindInput=b),k=void 0};c.jsepInit=(d,g)=>{if(k?.(),d==="webgpu"){[c.Kb,c.Wb,c.$b,c.Lb,c.Zb,c.ob,c.ac,c.cc,c.Xb,c.Yb,c.bc]=g;let b=c.Kb;c.jsepRegisterBuffer=(S,I,z,V)=>b.registerBuffer(S,I,z,V),c.jsepGetBuffer=S=>b.getBuffer(S),c.jsepCreateDownloader=(S,I,z)=>b.createDownloader(S,I,z),c.jsepOnReleaseSession=S=>{b.onReleaseSession(S)},c.jsepOnRunStart=S=>b.onRunStart(S)}};var $=Object.assign({},c),C="./this.program",T=(d,g)=>{throw g},A=typeof window=="object",B=typeof importScripts=="function",R=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string",D=c.ENVIRONMENT_IS_PTHREAD||!1,K="";function j(d){return c.locateFile?c.locateFile(d,K):K+d}var ie,te,oe;if(R){var re=(th(),Jr(Lo)),M=(nh(),Jr(Uo));K=B?M.dirname(K)+"/":__dirname+"/",ie=(d,g)=>(d=Bt(d)?new URL(d):M.normalize(d),re.readFileSync(d,g?void 0:"utf8")),oe=d=>(d=ie(d,!0),d.buffer||(d=new Uint8Array(d)),d),te=(d,g,b,S=!0)=>{d=Bt(d)?new URL(d):M.normalize(d),re.readFile(d,S?void 0:"utf8",(I,z)=>{I?b(I):g(S?z.buffer:z)})},!c.thisProgram&&1{throw process.exitCode=d,g},global.Worker=G_().Worker}else(A||B)&&(B?K=self.location.href:typeof document<"u"&&document.currentScript&&(K=document.currentScript.src),typeof n<"u"&&n&&(K=n),K.startsWith("blob:")?K="":K=K.substr(0,K.replace(/[?#].*/,"").lastIndexOf("/")+1),R||(ie=d=>{var g=new XMLHttpRequest;return g.open("GET",d,!1),g.send(null),g.responseText},B&&(oe=d=>{var g=new XMLHttpRequest;return g.open("GET",d,!1),g.responseType="arraybuffer",g.send(null),new Uint8Array(g.response)}),te=(d,g,b)=>{var S=new XMLHttpRequest;S.open("GET",d,!0),S.responseType="arraybuffer",S.onload=()=>{S.status==200||S.status==0&&S.response?g(S.response):b()},S.onerror=b,S.send(null)}));R&&typeof performance>"u"&&(global.performance=H_().performance);var P=console.log.bind(console),H=console.error.bind(console);R&&(P=(...d)=>re.writeSync(1,d.join(" ")+` -`),H=(...d)=>re.writeSync(2,d.join(" ")+` -`));var le=P,G=H;Object.assign(c,$),$=null;var ne,N,ae=!1,fe,Ce,Be,Ke,Qe,We,dt,Ve,Ne,ht,Vt;function st(){var d=ne.buffer;c.HEAP8=Ce=new Int8Array(d),c.HEAP16=Ke=new Int16Array(d),c.HEAPU8=Be=new Uint8Array(d),c.HEAPU16=Qe=new Uint16Array(d),c.HEAP32=We=new Int32Array(d),c.HEAPU32=dt=new Uint32Array(d),c.HEAPF32=Ve=new Float32Array(d),c.HEAPF64=Vt=new Float64Array(d),c.HEAP64=Ne=new BigInt64Array(d),c.HEAPU64=ht=new BigUint64Array(d)}var Pr=16777216;if(D)ne=c.wasmMemory;else if(c.wasmMemory)ne=c.wasmMemory;else if(ne=new WebAssembly.Memory({initial:Pr/65536,maximum:65536,shared:!0}),!(ne.buffer instanceof SharedArrayBuffer))throw G("requested a shared WebAssembly.Memory but the returned buffer is not a SharedArrayBuffer, indicating that while the browser has SharedArrayBuffer it does not have WebAssembly threads support - you may need to set a flag"),R&&G("(on node you may need: --experimental-wasm-threads --experimental-wasm-bulk-memory and/or recent version)"),Error("bad memory");st(),Pr=ne.buffer.byteLength;var hr=[],ir=[],ls=[],fr=0,Sr=null;function Bn(){if(fr--,fr==0&&Sr){var d=Sr;Sr=null,d()}}function Ye(d){throw d="Aborted("+d+")",G(d),ae=!0,fe=1,d=new WebAssembly.RuntimeError(d+". Build with -sASSERTIONS for more info."),w(d),d}var un=d=>d.startsWith("data:application/octet-stream;base64,"),Bt=d=>d.startsWith("file://"),kr;kr="ort-wasm-simd-threaded.wasm",un(kr)||(kr=j(kr));function At(d){if(oe)return oe(d);throw"both async and sync fetching of the wasm failed"}function Dn(d){if(A||B){if(typeof fetch=="function"&&!Bt(d))return fetch(d,{credentials:"same-origin"}).then(g=>{if(!g.ok)throw`failed to load wasm binary file at '${d}'`;return g.arrayBuffer()}).catch(()=>At(d));if(te)return new Promise((g,b)=>{te(d,S=>g(new Uint8Array(S)),b)})}return Promise.resolve().then(()=>At(d))}function ln(d,g,b){return Dn(d).then(S=>WebAssembly.instantiate(S,g)).then(b,S=>{G(`failed to asynchronously prepare wasm: ${S}`),Ye(S)})}function sr(d,g){var b=kr;return typeof WebAssembly.instantiateStreaming!="function"||un(b)||Bt(b)||R||typeof fetch!="function"?ln(b,d,g):fetch(b,{credentials:"same-origin"}).then(S=>WebAssembly.instantiateStreaming(S,d).then(g,function(I){return G(`wasm streaming compile failed: ${I}`),G("falling back to ArrayBuffer instantiation"),ln(b,d,g)}))}var Nn={826468:(d,g,b,S)=>{if(typeof c>"u"||!c.Db)return 1;if(d=nt(d>>>0),d.startsWith("./")&&(d=d.substring(2)),d=c.Db.get(d),!d)return 2;if(g>>>=0,b>>>=0,S>>>=0,g+b>d.byteLength)return 3;try{return s().set(d.subarray(g,g+b),S>>>0),0}catch{return 4}},826969:()=>{c.Xb()},827e3:()=>{c.Yb()},827029:()=>{c.bc()},827054:d=>c.Wb(d),827087:d=>c.$b(d),827119:(d,g,b)=>{c.Lb(d,g,b,!0)},827158:(d,g,b)=>{c.Lb(d,g,b)},827191:d=>{c.ob("Abs",d,void 0)},827242:d=>{c.ob("Neg",d,void 0)},827293:d=>{c.ob("Floor",d,void 0)},827346:d=>{c.ob("Ceil",d,void 0)},827398:d=>{c.ob("Reciprocal",d,void 0)},827456:d=>{c.ob("Sqrt",d,void 0)},827508:d=>{c.ob("Exp",d,void 0)},827559:d=>{c.ob("Erf",d,void 0)},827610:d=>{c.ob("Sigmoid",d,void 0)},827665:(d,g,b)=>{c.ob("HardSigmoid",d,{alpha:g,beta:b})},827744:d=>{c.ob("Log",d,void 0)},827795:d=>{c.ob("Sin",d,void 0)},827846:d=>{c.ob("Cos",d,void 0)},827897:d=>{c.ob("Tan",d,void 0)},827948:d=>{c.ob("Asin",d,void 0)},828e3:d=>{c.ob("Acos",d,void 0)},828052:d=>{c.ob("Atan",d,void 0)},828104:d=>{c.ob("Sinh",d,void 0)},828156:d=>{c.ob("Cosh",d,void 0)},828208:d=>{c.ob("Asinh",d,void 0)},828261:d=>{c.ob("Acosh",d,void 0)},828314:d=>{c.ob("Atanh",d,void 0)},828367:d=>{c.ob("Tanh",d,void 0)},828419:d=>{c.ob("Not",d,void 0)},828470:(d,g,b)=>{c.ob("Clip",d,{min:g,max:b})},828539:d=>{c.ob("Clip",d,void 0)},828591:(d,g)=>{c.ob("Elu",d,{alpha:g})},828649:d=>{c.ob("Relu",d,void 0)},828701:(d,g)=>{c.ob("LeakyRelu",d,{alpha:g})},828765:(d,g)=>{c.ob("ThresholdedRelu",d,{alpha:g})},828835:(d,g)=>{c.ob("Cast",d,{to:g})},828893:d=>{c.ob("Add",d,void 0)},828944:d=>{c.ob("Sub",d,void 0)},828995:d=>{c.ob("Mul",d,void 0)},829046:d=>{c.ob("Div",d,void 0)},829097:d=>{c.ob("Pow",d,void 0)},829148:d=>{c.ob("Equal",d,void 0)},829201:d=>{c.ob("Greater",d,void 0)},829256:d=>{c.ob("GreaterOrEqual",d,void 0)},829318:d=>{c.ob("Less",d,void 0)},829370:d=>{c.ob("LessOrEqual",d,void 0)},829429:(d,g,b,S,I)=>{c.ob("ReduceMean",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},829588:(d,g,b,S,I)=>{c.ob("ReduceMax",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},829746:(d,g,b,S,I)=>{c.ob("ReduceMin",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},829904:(d,g,b,S,I)=>{c.ob("ReduceProd",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830063:(d,g,b,S,I)=>{c.ob("ReduceSum",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830221:(d,g,b,S,I)=>{c.ob("ReduceL1",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830378:(d,g,b,S,I)=>{c.ob("ReduceL2",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830535:(d,g,b,S,I)=>{c.ob("ReduceLogSum",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830696:(d,g,b,S,I)=>{c.ob("ReduceSumSquare",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},830860:(d,g,b,S,I)=>{c.ob("ReduceLogSumExp",d,{keepDims:!!g,noopWithEmptyAxes:!!b,axes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},831024:d=>{c.ob("Where",d,void 0)},831077:(d,g,b)=>{c.ob("Transpose",d,{perm:g?Array.from(l().subarray(g>>>0,b>>>0)):[]})},831185:(d,g,b,S)=>{c.ob("DepthToSpace",d,{blocksize:g,mode:nt(b),format:S?"NHWC":"NCHW"})},831318:(d,g,b,S)=>{c.ob("DepthToSpace",d,{blocksize:g,mode:nt(b),format:S?"NHWC":"NCHW"})},831451:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke)=>{c.ob("ConvTranspose",d,{format:ce?"NHWC":"NCHW",autoPad:g,dilations:[b],group:S,kernelShape:[I],pads:[z,V],strides:[X],wIsConst:()=>!!i()[ue>>>0],outputPadding:_e?Array.from(l().subarray(_e>>>0,Le>>>0)):[],outputShape:Ge?Array.from(l().subarray(Ge>>>0,U>>>0)):[],activation:nt(ke)})},831852:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U)=>{c.ob("ConvTranspose",d,{format:X?"NHWC":"NCHW",autoPad:g,dilations:Array.from(l().subarray(b>>>0,(b>>>0)+2>>>0)),group:S,kernelShape:Array.from(l().subarray(I>>>0,(I>>>0)+2>>>0)),pads:Array.from(l().subarray(z>>>0,(z>>>0)+4>>>0)),strides:Array.from(l().subarray(V>>>0,(V>>>0)+2>>>0)),wIsConst:()=>!!i()[ce>>>0],outputPadding:ue?Array.from(l().subarray(ue>>>0,_e>>>0)):[],outputShape:Le?Array.from(l().subarray(Le>>>0,Ge>>>0)):[],activation:nt(U)})},832417:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke)=>{c.ob("ConvTranspose",d,{format:ce?"NHWC":"NCHW",autoPad:g,dilations:[b],group:S,kernelShape:[I],pads:[z,V],strides:[X],wIsConst:()=>!!i()[ue>>>0],outputPadding:_e?Array.from(l().subarray(_e>>>0,Le>>>0)):[],outputShape:Ge?Array.from(l().subarray(Ge>>>0,U>>>0)):[],activation:nt(ke)})},832818:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U)=>{c.ob("ConvTranspose",d,{format:X?"NHWC":"NCHW",autoPad:g,dilations:Array.from(l().subarray(b>>>0,(b>>>0)+2>>>0)),group:S,kernelShape:Array.from(l().subarray(I>>>0,(I>>>0)+2>>>0)),pads:Array.from(l().subarray(z>>>0,(z>>>0)+4>>>0)),strides:Array.from(l().subarray(V>>>0,(V>>>0)+2>>>0)),wIsConst:()=>!!i()[ce>>>0],outputPadding:ue?Array.from(l().subarray(ue>>>0,_e>>>0)):[],outputShape:Le?Array.from(l().subarray(Le>>>0,Ge>>>0)):[],activation:nt(U)})},833383:(d,g)=>{c.ob("GlobalAveragePool",d,{format:g?"NHWC":"NCHW"})},833474:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke,De)=>{c.ob("AveragePool",d,{format:De?"NHWC":"NCHW",auto_pad:g,ceil_mode:b,count_include_pad:S,storage_order:I,dilations:[z,V],kernel_shape:[X,ce],pads:[ue,_e,Le,Ge],strides:[U,ke]})},833758:(d,g)=>{c.ob("GlobalAveragePool",d,{format:g?"NHWC":"NCHW"})},833849:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke,De)=>{c.ob("AveragePool",d,{format:De?"NHWC":"NCHW",auto_pad:g,ceil_mode:b,count_include_pad:S,storage_order:I,dilations:[z,V],kernel_shape:[X,ce],pads:[ue,_e,Le,Ge],strides:[U,ke]})},834133:(d,g)=>{c.ob("GlobalMaxPool",d,{format:g?"NHWC":"NCHW"})},834220:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke,De)=>{c.ob("MaxPool",d,{format:De?"NHWC":"NCHW",auto_pad:g,ceil_mode:b,count_include_pad:S,storage_order:I,dilations:[z,V],kernel_shape:[X,ce],pads:[ue,_e,Le,Ge],strides:[U,ke]})},834500:(d,g)=>{c.ob("GlobalMaxPool",d,{format:g?"NHWC":"NCHW"})},834587:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke,De)=>{c.ob("MaxPool",d,{format:De?"NHWC":"NCHW",auto_pad:g,ceil_mode:b,count_include_pad:S,storage_order:I,dilations:[z,V],kernel_shape:[X,ce],pads:[ue,_e,Le,Ge],strides:[U,ke]})},834867:(d,g,b,S,I)=>{c.ob("Gemm",d,{alpha:g,beta:b,transA:S,transB:I})},834971:d=>{c.ob("MatMul",d,void 0)},835025:(d,g,b,S)=>{c.ob("ArgMax",d,{keepDims:!!g,selectLastIndex:!!b,axis:S})},835133:(d,g,b,S)=>{c.ob("ArgMin",d,{keepDims:!!g,selectLastIndex:!!b,axis:S})},835241:(d,g)=>{c.ob("Softmax",d,{axis:g})},835304:(d,g)=>{c.ob("Concat",d,{axis:g})},835364:(d,g,b,S,I)=>{c.ob("Split",d,{axis:g,numOutputs:b,splitSizes:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},835504:d=>{c.ob("Expand",d,void 0)},835558:(d,g)=>{c.ob("Gather",d,{axis:Number(g)})},835629:(d,g)=>{c.ob("GatherElements",d,{axis:Number(g)})},835708:(d,g,b,S,I,z,V,X,ce,ue,_e)=>{c.ob("Resize",d,{antialias:g,axes:b?Array.from(l().subarray(b>>>0,S>>>0)):[],coordinateTransformMode:nt(I),cubicCoeffA:z,excludeOutside:V,extrapolationValue:X,keepAspectRatioPolicy:nt(ce),mode:nt(ue),nearestMode:nt(_e)})},836054:(d,g,b,S,I,z,V)=>{c.ob("Slice",d,{starts:g?Array.from(l().subarray(g>>>0,b>>>0)):[],ends:S?Array.from(l().subarray(S>>>0,I>>>0)):[],axes:z?Array.from(l().subarray(z>>>0,V>>>0)):[]})},836270:d=>{c.ob("Tile",d,void 0)},836322:(d,g,b,S)=>{c.ob("LayerNormalization",d,{axis:g,epsilon:b,simplified:!!S})},836433:(d,g,b)=>{c.ob("InstanceNormalization",d,{epsilon:g,format:b?"NHWC":"NCHW"})},836547:(d,g,b)=>{c.ob("InstanceNormalization",d,{epsilon:g,format:b?"NHWC":"NCHW"})},836661:d=>{c.ob("Range",d,void 0)},836714:(d,g)=>{c.ob("Einsum",d,{equation:nt(g)})},836795:(d,g,b,S,I)=>{c.ob("Pad",d,{mode:g,value:b,pads:S?Array.from(l().subarray(S>>>0,I>>>0)):[]})},836922:(d,g,b,S,I,z)=>{c.ob("BatchNormalization",d,{epsilon:g,momentum:b,spatial:!!I,trainingMode:!!S,format:z?"NHWC":"NCHW"})},837091:(d,g,b,S,I,z)=>{c.ob("BatchNormalization",d,{epsilon:g,momentum:b,spatial:!!I,trainingMode:!!S,format:z?"NHWC":"NCHW"})},837260:(d,g,b)=>{c.ob("CumSum",d,{exclusive:Number(g),reverse:Number(b)})},837357:(d,g,b,S,I,z,V,X,ce)=>{c.ob("Attention",d,{numHeads:g,isUnidirectional:b,maskFilterValue:S,scale:I,doRotary:z,qkvHiddenSizes:V?Array.from(l().subarray(Number(X)>>>0,Number(X)+V>>>0)):[],pastPresentShareBuffer:!!ce})},837629:d=>{c.ob("BiasAdd",d,void 0)},837684:d=>{c.ob("BiasSplitGelu",d,void 0)},837745:d=>{c.ob("FastGelu",d,void 0)},837801:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge)=>{c.ob("Conv",d,{format:ce?"NHWC":"NCHW",auto_pad:g,dilations:[b],group:S,kernel_shape:[I],pads:z?Array.from(l().subarray(z>>>0,V>>>0)):[],strides:[X],w_is_const:()=>!!i()[ue>>>0],activation:nt(_e),activation_params:Le?Array.from(f().subarray(Le>>>0,Ge>>>0)):[]})},838171:(d,g,b,S,I,z,V,X,ce,ue,_e,Le,Ge,U,ke,De)=>{c.ob("Conv",d,{format:Le?"NHWC":"NCHW",auto_pad:g,dilations:[b,S],group:I,kernel_shape:[z,V],pads:X?Array.from(l().subarray(X>>>0,ce>>>0)):[],strides:[ue,_e],w_is_const:()=>!!i()[Ge>>>0],activation:nt(U),activation_params:ke?Array.from(f().subarray(ke>>>0,De>>>0)):[]})},838562:d=>{c.ob("Gelu",d,void 0)},838614:(d,g,b,S,I,z)=>{c.ob("MatMulNBits",d,{k:g,n:b,accuracyLevel:S,bits:I,blockSize:z})},838741:(d,g,b,S,I,z)=>{c.ob("MultiHeadAttention",d,{numHeads:g,isUnidirectional:b,maskFilterValue:S,scale:I,doRotary:z})},838900:(d,g,b,S,I)=>{c.ob("RotaryEmbedding",d,{interleaved:!!g,numHeads:b,rotaryEmbeddingDim:S,scale:I})},839039:(d,g,b)=>{c.ob("SkipLayerNormalization",d,{epsilon:g,simplified:!!b})},839141:(d,g,b)=>{c.ob("SkipLayerNormalization",d,{epsilon:g,simplified:!!b})},839243:(d,g,b,S)=>{c.ob("LayerNormalization",d,{axis:g,epsilon:b,simplified:!!S})},839354:d=>{c.ac(d)},839388:(d,g)=>c.cc(d,g,c.Cb.ec,c.Cb.errors)};function xt(d){this.name="ExitStatus",this.message=`Program terminated with exit(${d})`,this.status=d}var dn=d=>{d.terminate(),d.onmessage=()=>{}},cn=d=>{be.xb.length==0&&(Ua(),be.Mb(be.xb[0]));var g=be.xb.pop();if(!g)return 6;be.yb.push(g),be.ub[d.wb]=g,g.wb=d.wb;var b={cmd:"run",start_routine:d.fc,arg:d.Rb,pthread_ptr:d.wb};return R&&g.unref(),g.postMessage(b,d.mc),0},ot=0,Fn=d=>{var g=$s();return d=d(),oi(g),d},Ie=(d,g,...b)=>Fn(()=>{for(var S=2*b.length,I=vs(8*S),z=I>>>3,V=0;V>>0]=X)}return Ru(d,0,S,I,g)});function St(d){if(D)return Ie(0,1,d);fe=d,0{if(fe=d,D)throw Va(d),"unwind";St(d)};function ds(){for(var d=c.numThreads;d--;)Ua();hr.unshift(()=>{fr++,Wa(()=>Bn())})}function Ua(){var d=j("ort-wasm-simd-threaded.worker.js");d=new Worker(d),be.xb.push(d)}function Wa(d){D?d():Promise.all(be.xb.map(be.Mb)).then(d)}var be={xb:[],yb:[],Qb:[],ub:{},Gb(){D?(be.receiveObjectTransfer=be.dc,be.threadInitTLS=be.Pb,be.setExitStatus=be.Ob):ds()},Ob:d=>fe=d,pc:["$terminateWorker"],hc:()=>{for(var d of be.yb)dn(d);for(d of be.xb)dn(d);be.xb=[],be.yb=[],be.ub=[]},Nb:d=>{var g=d.wb;delete be.ub[g],be.xb.push(d),be.yb.splice(be.yb.indexOf(d),1),d.wb=0,ws(g)},dc(){},Pb(){be.Qb.forEach(d=>d())},Mb:d=>new Promise(g=>{d.onmessage=z=>{z=z.data;var V=z.cmd;if(z.targetThread&&z.targetThread!=ii()){var X=be.ub[z.targetThread];X?X.postMessage(z,z.transferList):G(`Internal error! Worker sent a message "${V}" to target pthread ${z.targetThread}, but that thread no longer exists!`)}else V==="checkMailbox"?_t():V==="spawnThread"?cn(z):V==="cleanupThread"?be.Nb(be.ub[z.thread]):V==="killThread"?(z=z.thread,V=be.ub[z],delete be.ub[z],dn(V),ws(z),be.yb.splice(be.yb.indexOf(V),1),V.wb=0):V==="cancelThread"?be.ub[z.thread].postMessage({cmd:"cancel"}):V==="loaded"?(d.loaded=!0,R&&!d.wb&&d.unref(),g(d)):V==="alert"?alert(`Thread ${z.threadId}: ${z.text}`):z.target==="setimmediate"?d.postMessage(z):V==="callHandler"?c[z.handler](...z.args):V&&G(`worker sent an unknown command ${V}`)},d.onerror=z=>{throw G(`worker sent an error! ${z.filename}:${z.lineno}: ${z.message}`),z},R&&(d.on("message",z=>d.onmessage({data:z})),d.on("error",z=>d.onerror(z)));var b=[],S=["onExit"],I;for(I of S)c.hasOwnProperty(I)&&b.push(I);d.postMessage({cmd:"load",handlers:b,urlOrBlob:c.mainScriptUrlOrBlob||n,wasmMemory:ne,wasmModule:N})})};c.PThread=be;var pn=d=>{for(;0{var d=ii(),g=p()[d+52>>>2>>>0];d=p()[d+56>>>2>>>0],Du(g,g-d),oi(g)};function Va(d){if(D)return Ie(1,0,d);Rr(d)}c.invokeEntryPoint=(d,g)=>{ot=0,d=Nu(d,g),0>>2>>>0]=0,p()[this.Ib+4>>>2>>>0]=g,p()[this.Ib+8>>>2>>>0]=b}}var Ga=0;function Ha(d,g,b,S){return D?Ie(2,1,d,g,b,S):hn(d,g,b,S)}function hn(d,g,b,S){if(d>>>=0,g>>>=0,b>>>=0,S>>>=0,typeof SharedArrayBuffer>"u")return G("Current environment does not support SharedArrayBuffer, pthreads are not available!"),6;var I=[];return D&&I.length===0?Ha(d,g,b,S):(d={fc:b,wb:d,Rb:S,mc:I},D?(d.oc="spawnThread",postMessage(d,I),0):cn(d))}var Ln=typeof TextDecoder<"u"?new TextDecoder("utf8"):void 0,Br=(d,g,b)=>{g>>>=0;var S=g+b;for(b=g;d[b]&&!(b>=S);)++b;if(16I?S+=String.fromCharCode(I):(I-=65536,S+=String.fromCharCode(55296|I>>10,56320|I&1023))}}else S+=String.fromCharCode(I)}return S},nt=(d,g)=>(d>>>=0)?Br(s(),d,g):"";function ja(d,g,b){return D?Ie(3,1,d,g,b):0}function Gt(d,g){if(D)return Ie(4,1,d,g)}var kt=d=>{for(var g=0,b=0;b=S?g++:2047>=S?g+=2:55296<=S&&57343>=S?(g+=4,++b):g+=3}return g},Un=(d,g,b,S)=>{if(b>>>=0,!(0=V){var X=d.charCodeAt(++z);V=65536+((V&1023)<<10)|X&1023}if(127>=V){if(b>=S)break;g[b++>>>0]=V}else{if(2047>=V){if(b+1>=S)break;g[b++>>>0]=192|V>>6}else{if(65535>=V){if(b+2>=S)break;g[b++>>>0]=224|V>>12}else{if(b+3>=S)break;g[b++>>>0]=240|V>>18,g[b++>>>0]=128|V>>12&63}g[b++>>>0]=128|V>>6&63}g[b++>>>0]=128|V&63}}return g[b>>>0]=0,b-I},Ht=(d,g,b)=>Un(d,s(),g,b);function Wn(d,g){if(D)return Ie(5,1,d,g)}function Vn(d,g,b){if(D)return Ie(6,1,d,g,b)}function qa(d,g,b){return D?Ie(7,1,d,g,b):0}function fn(d,g){if(D)return Ie(8,1,d,g)}function Ka(d,g,b){if(D)return Ie(9,1,d,g,b)}function Ya(d,g,b,S){if(D)return Ie(10,1,d,g,b,S)}function Xa(d,g,b,S){if(D)return Ie(11,1,d,g,b,S)}function Qa(d,g,b,S){if(D)return Ie(12,1,d,g,b,S)}function Gn(d){if(D)return Ie(13,1,d)}function Dr(d,g){if(D)return Ie(14,1,d,g)}function Ja(d,g,b){if(D)return Ie(15,1,d,g,b)}var mn,Mt=d=>{for(var g="";s()[d>>>0];)g+=mn[s()[d++>>>0]];return g},Hn={},jn={},jt;function ps(d,g,b={}){var S=g.name;if(!d)throw new jt(`type "${S}" must have a positive integer typeid pointer`);if(jn.hasOwnProperty(d)){if(b.Ub)return;throw new jt(`Cannot register type '${S}' twice`)}jn[d]=g,Hn.hasOwnProperty(d)&&(g=Hn[d],delete Hn[d],g.forEach(I=>I()))}function ft(d,g,b={}){if(!("argPackAdvance"in g))throw new TypeError("registerType registeredInstance requires argPackAdvance");return ps(d,g,b)}var qn=(d,g,b)=>{switch(g){case 1:return b?S=>i()[S>>>0]:S=>s()[S>>>0];case 2:return b?S=>o()[S>>>1>>>0]:S=>u()[S>>>1>>>0];case 4:return b?S=>l()[S>>>2>>>0]:S=>p()[S>>>2>>>0];case 8:return b?S=>Ne[S>>>3]:S=>ht[S>>>3];default:throw new TypeError(`invalid integer width (${g}): ${d}`)}},gn=[],Ot=[];function _n(d){d>>>=0,9{if(!d)throw new jt("Cannot use deleted val. handle = "+d);return Ot[d]},Et=d=>{switch(d){case void 0:return 2;case null:return 4;case!0:return 6;case!1:return 8;default:let g=gn.pop()||Ot.length;return Ot[g]=d,Ot[g+1]=1,g}};function Nr(d){return this.fromWireType(p()[d>>>2>>>0])}var hs={name:"emscripten::val",fromWireType:d=>{var g=ut(d);return _n(d),g},toWireType:(d,g)=>Et(g),argPackAdvance:8,readValueFromPointer:Nr,Bb:null},Za=(d,g)=>{switch(g){case 4:return function(b){return this.fromWireType(f()[b>>>2>>>0])};case 8:return function(b){return this.fromWireType(m()[b>>>3>>>0])};default:throw new TypeError(`invalid float width (${g}): ${d}`)}},Kn=typeof TextDecoder<"u"?new TextDecoder("utf-16le"):void 0,fs=(d,g)=>{for(var b=d>>1,S=b+g/2;!(b>=S)&&u()[b>>>0];)++b;if(b<<=1,32=g/2);++S){var I=o()[d+2*S>>>1>>>0];if(I==0)break;b+=String.fromCharCode(I)}return b},ei=(d,g,b)=>{if(b??=2147483647,2>b)return 0;b-=2;var S=g;b=b<2*d.length?b/2:d.length;for(var I=0;I>>1>>>0]=z,g+=2}return o()[g>>>1>>>0]=0,g-S},ti=d=>2*d.length,yn=(d,g)=>{for(var b=0,S="";!(b>=g/4);){var I=l()[d+4*b>>>2>>>0];if(I==0)break;++b,65536<=I?(I-=65536,S+=String.fromCharCode(55296|I>>10,56320|I&1023)):S+=String.fromCharCode(I)}return S},ms=(d,g,b)=>{if(g>>>=0,b??=2147483647,4>b)return 0;var S=g;b=S+b-4;for(var I=0;I=z){var V=d.charCodeAt(++I);z=65536+((z&1023)<<10)|V&1023}if(l()[g>>>2>>>0]=z,g+=4,g+4>b)break}return l()[g>>>2>>>0]=0,g-S},we=d=>{for(var g=0,b=0;b=S&&++b,g+=4}return g},Yn=d=>{if(!ae)try{if(d(),!(0>>=0,typeof Atomics.nc=="function"&&(Atomics.nc(l(),d>>>2,d).value.then(_t),d+=128,Atomics.store(l(),d>>>2,1))}c.__emscripten_thread_mailbox_await=Er;var _t=()=>{var d=ii();d&&(Er(d),Yn(Bu))};c.checkMailbox=_t;var wn=[],bn=(d,g)=>{var b=jn[d];if(b===void 0)throw d=zu(d),b=Mt(d),or(d),new jt(`${g} has unknown type ${b}`);return b},Xn=(d,g,b)=>{var S=[];return d=d.toWireType(S,b),S.length&&(p()[g>>>2>>>0]=Et(S)),d},Fr=d=>{try{d()}catch(g){Ye(g)}};function ri(){var d=he,g={};for(let[b,S]of Object.entries(d))g[b]=typeof S=="function"?(...I)=>{mr.push(b);try{return S(...I)}finally{ae||(mr.pop(),zt&&qt===1&&mr.length===0&&(qt=0,ot+=1,Fr(Lu),typeof Fibers<"u"&&Fibers.rc()))}}:S;return g}var qt=0,zt=null,ni=0,mr=[],Qn={},h={},_=0,x=null,E=[];function O(){return new Promise((d,g)=>{x={resolve:d,reject:g}})}function F(){var d=si(65548),g=d+12;p()[d>>>2>>>0]=g,p()[d+4>>>2>>>0]=g+65536,g=mr[0];var b=Qn[g];return b===void 0&&(b=_++,Qn[g]=b,h[b]=g),g=b,l()[d+8>>>2>>>0]=g,d}function q(){var d=l()[zt+8>>>2>>>0];return d=he[h[d]],--ot,d()}function J(d){if(!ae){if(qt===0){var g=!1,b=!1;d((S=0)=>{if(!ae&&(ni=S,g=!0,b)){qt=2,Fr(()=>Uu(zt)),typeof Browser<"u"&&Browser.Hb.Tb&&Browser.Hb.resume(),S=!1;try{var I=q()}catch(X){I=X,S=!0}var z=!1;if(!zt){var V=x;V&&(x=null,(S?V.reject:V.resolve)(I),z=!0)}if(S&&!z)throw I}}),b=!0,g||(qt=1,zt=F(),typeof Browser<"u"&&Browser.Hb.Tb&&Browser.Hb.pause(),Fr(()=>Fu(zt)))}else qt===2?(qt=0,Fr(Wu),or(zt),zt=null,E.forEach(Yn)):Ye(`invalid state: ${qt}`);return ni}}function de(d){return J(g=>{d().then(g)})}var se=[],me={},ze=d=>{var g=me[d];return g===void 0?Mt(d):g},Fe=()=>typeof globalThis=="object"?globalThis:Function("return this")(),L=d=>{var g=se.length;return se.push(d),g},xe=(d,g)=>{for(var b=Array(d),S=0;S>>2>>>0],"parameter "+S);return b},Oe=(d,g)=>Object.defineProperty(g,"name",{value:d});function gr(d){var g=Function;if(!(g instanceof Function))throw new TypeError(`new_ called with constructor type ${typeof g} which is not a function`);var b=Oe(g.name||"unknownFunctionName",function(){});return b.prototype=g.prototype,b=new b,d=g.apply(b,d),d instanceof Object?d:b}var _r=d=>d%4===0&&(d%100!==0||d%400===0),_u=[0,31,60,91,121,152,182,213,244,274,305,335],yu=[0,31,59,90,120,151,181,212,243,273,304,334];function wu(d,g,b,S,I,z,V){return D?Ie(16,1,d,g,b,S,I,z,V):-52}function bu(d,g,b,S,I,z){if(D)return Ie(17,1,d,g,b,S,I,z)}var gs=[],vu=(d,g)=>{gs.length=0;for(var b;b=s()[d++>>>0];){var S=b!=105;S&=b!=112,g+=S&&g%8?4:0,gs.push(b==112?p()[g>>>2>>>0]:b==106?Ne[g>>>3]:b==105?l()[g>>>2>>>0]:m()[g>>>3>>>0]),g+=S?8:4}return gs},_s={},$u=()=>{if(!ys){var d={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(typeof navigator=="object"&&navigator.languages&&navigator.languages[0]||"C").replace("-","_")+".UTF-8",_:C||"./this.program"},g;for(g in _s)_s[g]===void 0?delete d[g]:d[g]=_s[g];var b=[];for(g in d)b.push(`${g}=${d[g]}`);ys=b}return ys},ys;function xu(d,g){if(D)return Ie(18,1,d,g);d>>>=0,g>>>=0;var b=0;return $u().forEach((S,I)=>{var z=g+b;for(I=p()[d+4*I>>>2>>>0]=z,z=0;z>>0]=S.charCodeAt(z);i()[I>>>0]=0,b+=S.length+1}),0}function Su(d,g){if(D)return Ie(19,1,d,g);d>>>=0,g>>>=0;var b=$u();p()[d>>>2>>>0]=b.length;var S=0;return b.forEach(I=>S+=I.length+1),p()[g>>>2>>>0]=S,0}function ku(d){return D?Ie(20,1,d):52}function Eu(d,g,b,S){return D?Ie(21,1,d,g,b,S):52}function Cu(d,g,b,S){return D?Ie(22,1,d,g,b,S):70}var Q0=[null,[],[]];function Tu(d,g,b,S){if(D)return Ie(23,1,d,g,b,S);g>>>=0,b>>>=0,S>>>=0;for(var I=0,z=0;z>>2>>>0],X=p()[g+4>>>2>>>0];g+=8;for(var ce=0;ce>>0],_e=Q0[d];ue===0||ue===10?((d===1?le:G)(Br(_e,0)),_e.length=0):_e.push(ue)}I+=X}return p()[S>>>2>>>0]=I,0}var Iu=[31,29,31,30,31,30,31,31,30,31,30,31],Au=[31,28,31,30,31,30,31,31,30,31,30,31];function J0(d){var g=Array(kt(d)+1);return Un(d,g,0,g.length),g}var Z0=(d,g)=>{i().set(d,g>>>0)};function Mu(d,g,b,S){function I(U,ke,De){for(U=typeof U=="number"?U.toString():U||"";U.lengthGu?-1:0Lr-U.getDate())ke-=Lr-U.getDate()+1,U.setDate(1),11>De?U.setMonth(De+1):(U.setMonth(0),U.setFullYear(U.getFullYear()+1));else{U.setDate(U.getDate()+ke);break}}return De=new Date(U.getFullYear()+1,0,4),ke=X(new Date(U.getFullYear(),0,4)),De=X(De),0>=V(ke,U)?0>=V(De,U)?U.getFullYear()+1:U.getFullYear():U.getFullYear()-1}d>>>=0,g>>>=0,b>>>=0,S>>>=0;var ue=p()[S+40>>>2>>>0];S={kc:l()[S>>>2>>>0],jc:l()[S+4>>>2>>>0],Eb:l()[S+8>>>2>>>0],Jb:l()[S+12>>>2>>>0],Fb:l()[S+16>>>2>>>0],Ab:l()[S+20>>>2>>>0],vb:l()[S+24>>>2>>>0],zb:l()[S+28>>>2>>>0],qc:l()[S+32>>>2>>>0],ic:l()[S+36>>>2>>>0],lc:ue?nt(ue):""},b=nt(b),ue={"%c":"%a %b %d %H:%M:%S %Y","%D":"%m/%d/%y","%F":"%Y-%m-%d","%h":"%b","%r":"%I:%M:%S %p","%R":"%H:%M","%T":"%H:%M:%S","%x":"%m/%d/%y","%X":"%H:%M:%S","%Ec":"%c","%EC":"%C","%Ex":"%m/%d/%y","%EX":"%H:%M:%S","%Ey":"%y","%EY":"%Y","%Od":"%d","%Oe":"%e","%OH":"%H","%OI":"%I","%Om":"%m","%OM":"%M","%OS":"%S","%Ou":"%u","%OU":"%U","%OV":"%V","%Ow":"%w","%OW":"%W","%Oy":"%y"};for(var _e in ue)b=b.replace(new RegExp(_e,"g"),ue[_e]);var Le="Sunday Monday Tuesday Wednesday Thursday Friday Saturday".split(" "),Ge="January February March April May June July August September October November December".split(" ");ue={"%a":U=>Le[U.vb].substring(0,3),"%A":U=>Le[U.vb],"%b":U=>Ge[U.Fb].substring(0,3),"%B":U=>Ge[U.Fb],"%C":U=>z((U.Ab+1900)/100|0,2),"%d":U=>z(U.Jb,2),"%e":U=>I(U.Jb,2," "),"%g":U=>ce(U).toString().substring(2),"%G":ce,"%H":U=>z(U.Eb,2),"%I":U=>(U=U.Eb,U==0?U=12:12{for(var ke=0,De=0;De<=U.Fb-1;ke+=(_r(U.Ab+1900)?Iu:Au)[De++]);return z(U.Jb+ke,3)},"%m":U=>z(U.Fb+1,2),"%M":U=>z(U.jc,2),"%n":()=>` -`,"%p":U=>0<=U.Eb&&12>U.Eb?"AM":"PM","%S":U=>z(U.kc,2),"%t":()=>" ","%u":U=>U.vb||7,"%U":U=>z(Math.floor((U.zb+7-U.vb)/7),2),"%V":U=>{var ke=Math.floor((U.zb+7-(U.vb+6)%7)/7);if(2>=(U.vb+371-U.zb-2)%7&&ke++,ke)ke==53&&(De=(U.vb+371-U.zb)%7,De==4||De==3&&_r(U.Ab)||(ke=1));else{ke=52;var De=(U.vb+7-U.zb-1)%7;(De==4||De==5&&_r(U.Ab%400-1))&&ke++}return z(ke,2)},"%w":U=>U.vb,"%W":U=>z(Math.floor((U.zb+7-(U.vb+6)%7)/7),2),"%y":U=>(U.Ab+1900).toString().substring(2),"%Y":U=>U.Ab+1900,"%z":U=>{U=U.ic;var ke=0<=U;return U=Math.abs(U)/60,(ke?"+":"-")+("0000"+(U/60*100+U%60)).slice(-4)},"%Z":U=>U.lc,"%%":()=>"%"},b=b.replace(/%%/g,"\0\0");for(_e in ue)b.includes(_e)&&(b=b.replace(new RegExp(_e,"g"),ue[_e](S)));return b=b.replace(/\0\0/g,"%"),_e=J0(b),_e.length>g?0:(Z0(_e,d),_e.length-1)}be.Gb();for(var Ou=Array(256),ai=0;256>ai;++ai)Ou[ai]=String.fromCharCode(ai);mn=Ou,jt=c.BindingError=class extends Error{constructor(d){super(d),this.name="BindingError"}},c.InternalError=class extends Error{constructor(d){super(d),this.name="InternalError"}},Ot.push(0,1,void 0,1,null,1,!0,1,!1,1),c.count_emval_handles=()=>Ot.length/2-5-gn.length;var e_=[St,Va,Ha,ja,Gt,Wn,Vn,qa,fn,Ka,Ya,Xa,Qa,Gn,Dr,Ja,wu,bu,xu,Su,ku,Eu,Cu,Tu],t_={ua:function(d,g,b){return de(async()=>{await c.Zb(d,g,b)})},b:function(d,g,b){throw d>>>=0,new cs(d).Gb(g>>>0,b>>>0),Ga=d,Ga},ia:function(d){Pu(d>>>0,!B,1,!A,131072,!1),be.Pb()},G:function(d){d>>>=0,D?postMessage({cmd:"cleanupThread",thread:d}):be.Nb(be.ub[d])},_:hn,A:ja,pa:Gt,W:Wn,Y:Vn,qa,na:fn,fa:Ka,ma:Ya,K:Xa,X:Qa,U:Gn,oa:Dr,V:Ja,E:function(d,g,b){d>>>=0,b>>>=0,g=Mt(g>>>0),ft(d,{name:g,fromWireType:S=>S,toWireType:function(S,I){if(typeof I!="bigint"&&typeof I!="number")throw I===null?I="null":(S=typeof I,I=S==="object"||S==="array"||S==="function"?I.toString():""+I),new TypeError(`Cannot convert "${I}" to ${this.name}`);return typeof I=="number"&&(I=BigInt(I)),I},argPackAdvance:8,readValueFromPointer:qn(g,b,g.indexOf("u")==-1),Bb:null})},O:function(d,g,b,S){d>>>=0,g=Mt(g>>>0),ft(d,{name:g,fromWireType:function(I){return!!I},toWireType:function(I,z){return z?b:S},argPackAdvance:8,readValueFromPointer:function(I){return this.fromWireType(s()[I>>>0])},Bb:null})},N:function(d){return ft(d>>>0,hs)},D:function(d,g,b){d>>>=0,b>>>=0,g=Mt(g>>>0),ft(d,{name:g,fromWireType:S=>S,toWireType:(S,I)=>I,argPackAdvance:8,readValueFromPointer:Za(g,b),Bb:null})},t:function(d,g,b,S,I){if(d>>>=0,b>>>=0,g=Mt(g>>>0),I===-1&&(I=4294967295),I=X=>X,S===0){var z=32-8*b;I=X=>X<>>z}var V=g.includes("unsigned")?function(X,ce){return ce>>>0}:function(X,ce){return ce};ft(d,{name:g,fromWireType:I,toWireType:V,argPackAdvance:8,readValueFromPointer:qn(g,b,S!==0),Bb:null})},p:function(d,g,b){function S(z){var V=p()[z>>>2>>>0];return z=p()[z+4>>>2>>>0],new I(i().buffer,z,V)}d>>>=0;var I=[Int8Array,Uint8Array,Int16Array,Uint16Array,Int32Array,Uint32Array,Float32Array,Float64Array,BigInt64Array,BigUint64Array][g];b=Mt(b>>>0),ft(d,{name:b,fromWireType:S,argPackAdvance:8,readValueFromPointer:S},{Ub:!0})},F:function(d,g){d>>>=0,g=Mt(g>>>0);var b=g==="std::string";ft(d,{name:g,fromWireType:function(S){var I=p()[S>>>2>>>0],z=S+4;if(b)for(var V=z,X=0;X<=I;++X){var ce=z+X;if(X==I||s()[ce>>>0]==0){if(V=nt(V,ce-V),ue===void 0)var ue=V;else ue+="\0",ue+=V;V=ce+1}}else{for(ue=Array(I),X=0;X>>0]);ue=ue.join("")}return or(S),ue},toWireType:function(S,I){I instanceof ArrayBuffer&&(I=new Uint8Array(I));var z=typeof I=="string";if(!(z||I instanceof Uint8Array||I instanceof Uint8ClampedArray||I instanceof Int8Array))throw new jt("Cannot pass non-string to std::string");var V=b&&z?kt(I):I.length,X=si(4+V+1),ce=X+4;if(p()[X>>>2>>>0]=V,b&&z)Ht(I,ce,V+1);else if(z)for(z=0;z>>0]=ue}else for(z=0;z>>0]=I[z];return S!==null&&S.push(or,X),X},argPackAdvance:8,readValueFromPointer:Nr,Bb(S){or(S)}})},z:function(d,g,b){if(d>>>=0,g>>>=0,b>>>=0,b=Mt(b),g===2)var S=fs,I=ei,z=ti,V=X=>u()[X>>>1>>>0];else g===4&&(S=yn,I=ms,z=we,V=X=>p()[X>>>2>>>0]);ft(d,{name:b,fromWireType:X=>{for(var ce=p()[X>>>2>>>0],ue,_e=X+4,Le=0;Le<=ce;++Le){var Ge=X+4+Le*g;(Le==ce||V(Ge)==0)&&(_e=S(_e,Ge-_e),ue===void 0?ue=_e:(ue+="\0",ue+=_e),_e=Ge+g)}return or(X),ue},toWireType:(X,ce)=>{if(typeof ce!="string")throw new jt(`Cannot pass non-string to C++ string type ${b}`);var ue=z(ce),_e=si(4+ue+g);return p()[_e>>>2>>>0]=ue/g,I(ce,_e+4,ue+g),X!==null&&X.push(or,_e),_e},argPackAdvance:8,readValueFromPointer:Nr,Bb(X){or(X)}})},P:function(d,g){d>>>=0,g=Mt(g>>>0),ft(d,{Vb:!0,name:g,argPackAdvance:0,fromWireType:()=>{},toWireType:()=>{}})},ta:()=>1,S:function(d,g){d>>>=0,d==g>>>0?setTimeout(_t):D?postMessage({targetThread:d,cmd:"checkMailbox"}):(d=be.ub[d])&&d.postMessage({cmd:"checkMailbox"})},$:function(d,g,b,S,I){g>>>=0,b>>>=0,S/=2,wn.length=S,I=I>>>0>>>3;for(var z=0;z>>0];return d=g?Nn[g]:e_[d],be.Sb=b,b=d(...wn),be.Sb=0,b},ha:Er,sa:function(d){R&&be.ub[d>>>0].ref()},w:function(d,g,b){return g>>>=0,b>>>=0,d=ut(d>>>0),g=bn(g,"emval::as"),Xn(g,b,d)},y:function(d){return d>>>=0,de(()=>(d=ut(d),d.then(Et)))},o:function(d,g,b,S){return b>>>=0,S>>>=0,d=se[d>>>0],g=ut(g>>>0),d(null,g,b,S)},k:function(d,g,b,S,I){return b>>>=0,S>>>=0,I>>>=0,d=se[d>>>0],g=ut(g>>>0),b=ze(b),d(g,g[b],S,I)},c:_n,C:function(d,g){return g>>>=0,d=ut(d>>>0),g=ut(g),d==g},n:function(d){return d>>>=0,d===0?Et(Fe()):(d=ze(d),Et(Fe()[d]))},j:function(d,g,b){g=xe(d,g>>>0);var S=g.shift();d--;var I=`return function (obj, func, destructorsRef, args) { -`,z=0,V=[];b===0&&V.push("obj");for(var X=["retType"],ce=[S],ue=0;ue_e.name).join(", ")}) => ${S.name}>`,L(Oe(b,d))},s:function(d,g){return g>>>=0,d=ut(d>>>0),g=ut(g),Et(d[g])},d:function(d){d>>>=0,9>>0);for(var g=Array(d.length),b=0;b>>0))},l:function(){return Et({})},i:function(d){d>>>=0;for(var g=ut(d);g.length;){var b=g.pop();g.pop()(b)}_n(d)},h:function(d,g,b){g>>>=0,b>>>=0,d=ut(d>>>0),g=ut(g),b=ut(b),d[g]=b},e:function(d,g){return g>>>=0,d=bn(d>>>0,"_emval_take_value"),d=d.readValueFromPointer(g),Et(d)},ca:function(d,g){d=-9007199254740992>d||9007199254740992>>=0,d=new Date(1e3*d),l()[g>>>2>>>0]=d.getUTCSeconds(),l()[g+4>>>2>>>0]=d.getUTCMinutes(),l()[g+8>>>2>>>0]=d.getUTCHours(),l()[g+12>>>2>>>0]=d.getUTCDate(),l()[g+16>>>2>>>0]=d.getUTCMonth(),l()[g+20>>>2>>>0]=d.getUTCFullYear()-1900,l()[g+24>>>2>>>0]=d.getUTCDay(),d=(d.getTime()-Date.UTC(d.getUTCFullYear(),0,1,0,0,0,0))/864e5|0,l()[g+28>>>2>>>0]=d},da:function(d,g){d=-9007199254740992>d||9007199254740992>>=0,d=new Date(1e3*d),l()[g>>>2>>>0]=d.getSeconds(),l()[g+4>>>2>>>0]=d.getMinutes(),l()[g+8>>>2>>>0]=d.getHours(),l()[g+12>>>2>>>0]=d.getDate(),l()[g+16>>>2>>>0]=d.getMonth(),l()[g+20>>>2>>>0]=d.getFullYear()-1900,l()[g+24>>>2>>>0]=d.getDay();var b=(_r(d.getFullYear())?_u:yu)[d.getMonth()]+d.getDate()-1|0;l()[g+28>>>2>>>0]=b,l()[g+36>>>2>>>0]=-(60*d.getTimezoneOffset()),b=new Date(d.getFullYear(),6,1).getTimezoneOffset();var S=new Date(d.getFullYear(),0,1).getTimezoneOffset();d=(b!=S&&d.getTimezoneOffset()==Math.min(S,b))|0,l()[g+32>>>2>>>0]=d},ea:function(d){d>>>=0;var g=new Date(l()[d+20>>>2>>>0]+1900,l()[d+16>>>2>>>0],l()[d+12>>>2>>>0],l()[d+8>>>2>>>0],l()[d+4>>>2>>>0],l()[d>>>2>>>0],0),b=l()[d+32>>>2>>>0],S=g.getTimezoneOffset(),I=new Date(g.getFullYear(),6,1).getTimezoneOffset(),z=new Date(g.getFullYear(),0,1).getTimezoneOffset(),V=Math.min(z,I);return 0>b?l()[d+32>>>2>>>0]=+(I!=z&&V==S):0>>2>>>0]=g.getDay(),b=(_r(g.getFullYear())?_u:yu)[g.getMonth()]+g.getDate()-1|0,l()[d+28>>>2>>>0]=b,l()[d>>>2>>>0]=g.getSeconds(),l()[d+4>>>2>>>0]=g.getMinutes(),l()[d+8>>>2>>>0]=g.getHours(),l()[d+12>>>2>>>0]=g.getDate(),l()[d+16>>>2>>>0]=g.getMonth(),l()[d+20>>>2>>>0]=g.getYear(),d=g.getTime(),BigInt(isNaN(d)?-1:d/1e3)},aa:wu,ba:bu,R:function(d,g,b,S){d>>>=0,g>>>=0,b>>>=0,S>>>=0;var I=new Date().getFullYear(),z=new Date(I,0,1),V=new Date(I,6,1);I=z.getTimezoneOffset();var X=V.getTimezoneOffset(),ce=Math.max(I,X);p()[d>>>2>>>0]=60*ce,l()[g>>>2>>>0]=+(I!=X),d=ue=>ue.toLocaleTimeString(void 0,{hour12:!1,timeZoneName:"short"}).split(" ")[1],z=d(z),V=d(V),X{Ye("")},f:function(d,g,b){return d>>>=0,g=vu(g>>>0,b>>>0),Nn[d](...g)},M:function(d,g,b){return d>>>=0,g=vu(g>>>0,b>>>0),Nn[d](...g)},H:()=>{},L:()=>Date.now(),ra:()=>{throw ot+=1,"unwind"},T:function(){return 4294901760},u:()=>performance.timeOrigin+performance.now(),x:()=>R?(j_(),Jr(ah)).cpus().length:navigator.hardwareConcurrency,Q:function(d){d>>>=0;var g=s().length;if(d<=g||4294901760=b;b*=2){var S=g*(1+.2/b);S=Math.min(S,d+100663296);var I=Math;S=Math.max(d,S);e:{I=(I.min.call(I,4294901760,S+(65536-S%65536)%65536)-ne.buffer.byteLength+65535)/65536;try{ne.grow(I),st();var z=1;break e}catch{}z=void 0}if(z)return!0}return!1},ja:xu,la:Su,Z:Rr,B:ku,J:Eu,ga:Cu,I:Tu,a:ne||c.wasmMemory,ka:Mu,r:function(d,g,b,S){return Mu(d>>>0,g>>>0,b>>>0,S>>>0)}},he=function(){function d(b,S){return he=b.exports,he=ri(),he=r_(),be.Qb.push(he.cb),ir.unshift(he.va),N=S,Bn(),he}var g={a:t_};if(fr++,c.instantiateWasm)try{return c.instantiateWasm(g,d)}catch(b){G(`Module.instantiateWasm callback failed with error: ${b}`),w(b)}return sr(g,function(b){d(b.instance,b.module)}).catch(w),{}}(),zu=d=>(zu=he.wa)(d);c.__embind_initialize_bindings=()=>(c.__embind_initialize_bindings=he.xa)(),c._OrtInit=(d,g)=>(c._OrtInit=he.ya)(d,g),c._OrtGetLastError=(d,g)=>(c._OrtGetLastError=he.za)(d,g),c._OrtCreateSessionOptions=(d,g,b,S,I,z,V,X,ce,ue)=>(c._OrtCreateSessionOptions=he.Aa)(d,g,b,S,I,z,V,X,ce,ue),c._OrtAppendExecutionProvider=(d,g)=>(c._OrtAppendExecutionProvider=he.Ba)(d,g),c._OrtAddFreeDimensionOverride=(d,g,b)=>(c._OrtAddFreeDimensionOverride=he.Ca)(d,g,b),c._OrtAddSessionConfigEntry=(d,g,b)=>(c._OrtAddSessionConfigEntry=he.Da)(d,g,b),c._OrtReleaseSessionOptions=d=>(c._OrtReleaseSessionOptions=he.Ea)(d),c._OrtCreateSession=(d,g,b)=>(c._OrtCreateSession=he.Fa)(d,g,b),c._OrtReleaseSession=d=>(c._OrtReleaseSession=he.Ga)(d),c._OrtGetInputOutputCount=(d,g,b)=>(c._OrtGetInputOutputCount=he.Ha)(d,g,b),c._OrtGetInputName=(d,g)=>(c._OrtGetInputName=he.Ia)(d,g),c._OrtGetOutputName=(d,g)=>(c._OrtGetOutputName=he.Ja)(d,g),c._OrtFree=d=>(c._OrtFree=he.Ka)(d),c._OrtCreateTensor=(d,g,b,S,I,z)=>(c._OrtCreateTensor=he.La)(d,g,b,S,I,z),c._OrtGetTensorData=(d,g,b,S,I)=>(c._OrtGetTensorData=he.Ma)(d,g,b,S,I),c._OrtReleaseTensor=d=>(c._OrtReleaseTensor=he.Na)(d),c._OrtCreateRunOptions=(d,g,b,S)=>(c._OrtCreateRunOptions=he.Oa)(d,g,b,S),c._OrtAddRunConfigEntry=(d,g,b)=>(c._OrtAddRunConfigEntry=he.Pa)(d,g,b),c._OrtReleaseRunOptions=d=>(c._OrtReleaseRunOptions=he.Qa)(d),c._OrtCreateBinding=d=>(c._OrtCreateBinding=he.Ra)(d),c._OrtBindInput=(d,g,b)=>(c._OrtBindInput=he.Sa)(d,g,b),c._OrtBindOutput=(d,g,b,S)=>(c._OrtBindOutput=he.Ta)(d,g,b,S),c._OrtClearBoundOutputs=d=>(c._OrtClearBoundOutputs=he.Ua)(d),c._OrtReleaseBinding=d=>(c._OrtReleaseBinding=he.Va)(d),c._OrtRunWithBinding=(d,g,b,S,I)=>(c._OrtRunWithBinding=he.Wa)(d,g,b,S,I),c._OrtRun=(d,g,b,S,I,z,V,X)=>(c._OrtRun=he.Xa)(d,g,b,S,I,z,V,X),c._OrtEndProfiling=d=>(c._OrtEndProfiling=he.Ya)(d),c._JsepOutput=(d,g,b)=>(c._JsepOutput=he.Za)(d,g,b),c._JsepGetNodeName=d=>(c._JsepGetNodeName=he._a)(d);var ii=c._pthread_self=()=>(ii=c._pthread_self=he.$a)(),si=c._malloc=d=>(si=c._malloc=he.ab)(d),or=c._free=d=>(or=c._free=he.bb)(d);c.__emscripten_tls_init=()=>(c.__emscripten_tls_init=he.cb)();var Pu=c.__emscripten_thread_init=(d,g,b,S,I,z)=>(Pu=c.__emscripten_thread_init=he.eb)(d,g,b,S,I,z);c.__emscripten_thread_crashed=()=>(c.__emscripten_thread_crashed=he.fb)();var Ru=(d,g,b,S,I)=>(Ru=he.gb)(d,g,b,S,I),ws=d=>(ws=he.hb)(d),bs=c.__emscripten_thread_exit=d=>(bs=c.__emscripten_thread_exit=he.ib)(d),Bu=()=>(Bu=he.jb)(),Du=(d,g)=>(Du=he.kb)(d,g),oi=d=>(oi=he.lb)(d),vs=d=>(vs=he.mb)(d),$s=()=>($s=he.nb)(),Nu=c.dynCall_ii=(d,g)=>(Nu=c.dynCall_ii=he.pb)(d,g),Fu=d=>(Fu=he.qb)(d),Lu=()=>(Lu=he.rb)(),Uu=d=>(Uu=he.sb)(d),Wu=()=>(Wu=he.tb)();c.___start_em_js=839500,c.___stop_em_js=839661;function r_(){var d=he;d=Object.assign({},d);var g=S=>I=>S(I)>>>0,b=S=>()=>S()>>>0;return d.wa=g(d.wa),d.$a=b(d.$a),d.ab=g(d.ab),d.emscripten_main_runtime_thread_id=b(d.emscripten_main_runtime_thread_id),d.mb=g(d.mb),d.nb=b(d.nb),d}c.wasmMemory=ne,c.stackSave=()=>$s(),c.stackRestore=d=>oi(d),c.stackAlloc=d=>vs(d),c.keepRuntimeAlive=()=>0r)}),K_=An((t,e)=>{e.exports='"use strict";var Module={},ENVIRONMENT_IS_NODE=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string";if(ENVIRONMENT_IS_NODE){var nodeWorkerThreads=require("worker_threads"),parentPort=nodeWorkerThreads.parentPort;parentPort.on("message",e=>onmessage({data:e}));var fs=require("fs"),vm=require("vm");Object.assign(global,{self:global,require,Module,location:{href:__filename},Worker:nodeWorkerThreads.Worker,importScripts:e=>vm.runInThisContext(fs.readFileSync(e,"utf8"),{filename:e}),postMessage:e=>parentPort.postMessage(e),performance:global.performance||{now:Date.now}})}var initializedJS=!1;function threadPrintErr(...e){var a=e.join(" ");if(ENVIRONMENT_IS_NODE){fs.writeSync(2,a+`\n`);return}console.error(a)}function threadAlert(...e){var a=e.join(" ");postMessage({cmd:"alert",text:a,threadId:Module._pthread_self()})}var err=threadPrintErr;self.alert=threadAlert,Module.instantiateWasm=(e,a)=>{var r=Module.wasmModule;Module.wasmModule=null;var t=new WebAssembly.Instance(r,e);return a(t)},self.onunhandledrejection=e=>{throw e.reason||e};function handleMessage(e){try{if(e.data.cmd==="load"){let r=[];self.onmessage=t=>r.push(t),self.startWorker=t=>{Module=t,postMessage({cmd:"loaded"});for(let s of r)handleMessage(s);self.onmessage=handleMessage},Module.wasmModule=e.data.wasmModule;for(const t of e.data.handlers)Module[t]=(...s)=>{postMessage({cmd:"callHandler",handler:t,args:s})};if(Module.wasmMemory=e.data.wasmMemory,Module.buffer=Module.wasmMemory.buffer,Module.ENVIRONMENT_IS_PTHREAD=!0,typeof e.data.urlOrBlob=="string")importScripts(e.data.urlOrBlob);else{var a=URL.createObjectURL(e.data.urlOrBlob);importScripts(a),URL.revokeObjectURL(a)}ortWasmThreaded(Module)}else if(e.data.cmd==="run"){Module.__emscripten_thread_init(e.data.pthread_ptr,0,0,1),Module.__emscripten_thread_mailbox_await(e.data.pthread_ptr),Module.establishStackSpace(),Module.PThread.receiveObjectTransfer(e.data),Module.PThread.threadInitTLS(),initializedJS||(initializedJS=!0);try{Module.invokeEntryPoint(e.data.start_routine,e.data.arg)}catch(r){if(r!="unwind")throw r}}else e.data.cmd==="cancel"?Module._pthread_self()&&Module.__emscripten_thread_exit(-1):e.data.target==="setimmediate"||(e.data.cmd==="checkMailbox"?initializedJS&&Module.checkMailbox():e.data.cmd&&(err(`worker.js received unknown command ${e.data.cmd}`),err(e.data)))}catch(r){throw Module.__emscripten_thread_crashed?.(),r}}self.onmessage=handleMessage;\n'}),Xu,Qu,Ts,ci,ea,Is,Ju,Zu,el,sh,at,xa=Z(()=>{Xu=V_(),Qu=q_(),ci=!1,ea=!1,Is=!1,Ju=t=>{if(t===1)return!1;if(typeof SharedArrayBuffer>"u")return typeof self<"u"&&!self.crossOriginIsolated&&console.warn("env.wasm.numThreads is set to "+t+", but this will not work unless you enable crossOriginIsolated mode. See https://web.dev/cross-origin-isolation-guide/ for more info."),!1;typeof process<"u"&&process.versions&&process.versions.node&&console.warn("env.wasm.numThreads is set to "+t+", however, currently onnxruntime-web does not support multi-threads in Node.js. Please consider using onnxruntime-node for performance critical scenarios.");try{return typeof MessageChannel<"u"&&new MessageChannel().port1.postMessage(new SharedArrayBuffer(1)),WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,5,4,1,3,1,1,10,11,1,9,0,65,0,254,16,2,0,26,11]))}catch{return!1}},Zu=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,10,30,1,28,0,65,0,253,15,253,12,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,253,186,1,26,11]))}catch{return!1}},el=(t,e)=>t?e?"ort-wasm-simd-threaded.wasm":"ort-wasm-simd.wasm":e?"ort-wasm-threaded.wasm":"ort-wasm.wasm",sh=async t=>{if(ci)return Promise.resolve();if(ea)throw new Error("multiple calls to 'initializeWebAssembly()' detected.");if(Is)throw new Error("previous call to 'initializeWebAssembly()' failed.");ea=!0;let e=t.initTimeout,r=t.numThreads,n=t.simd,a=Ju(r),i=n&&Zu(),s=t.wasmPaths,o=typeof s=="string"?s:void 0,u=el(i,a),l=typeof s=="object"?s[u]:void 0,p=!1,f=[];if(e>0&&f.push(new Promise(m=>{setTimeout(()=>{p=!0,m()},e)})),f.push(new Promise((m,c)=>{let y=a?Qu:Xu,w={locateFile:(v,k)=>{if(a&&v.endsWith(".worker.js")&&typeof Blob<"u")return URL.createObjectURL(new Blob([K_()],{type:"text/javascript"}));if(v.endsWith(".wasm")){if(l)return l;let $=o??k;return u==="ort-wasm-simd.wasm"?$+"ort-wasm-simd.jsep.wasm":u==="ort-wasm-simd-threaded.wasm"?$+"ort-wasm-simd-threaded.jsep.wasm":$+u}return k+v}};if(a)if(w.numThreads=r,typeof Blob>"u")w.mainScriptUrlOrBlob=(void 0)(__dirname,"ort-wasm-threaded.js");else{let v=`var ortWasmThreaded=${y.toString()};`;w.mainScriptUrlOrBlob=new Blob([v],{type:"text/javascript"})}y(w).then(v=>{ea=!1,ci=!0,Ts=v,m()},v=>{ea=!1,Is=!0,c(v)})})),await Promise.race(f),p)throw new Error(`WebAssembly backend initializing failed due to timeout: ${e}ms`)},at=()=>{if(ci&&Ts)return Ts;throw new Error("WebAssembly is not initialized yet.")}}),tt,Bi,je,Wo=Z(()=>{xa(),tt=(t,e)=>{let r=at(),n=r.lengthBytesUTF8(t)+1,a=r._malloc(n);return r.stringToUTF8(t,a,n),e.push(a),a},Bi=(t,e,r,n)=>{if(typeof t=="object"&&t!==null){if(r.has(t))throw new Error("Circular reference in options");r.add(t)}Object.entries(t).forEach(([a,i])=>{let s=e?e+a:a;if(typeof i=="object")Bi(i,s+".",r,n);else if(typeof i=="string"||typeof i=="number")n(s,i.toString());else if(typeof i=="boolean")n(s,i?"1":"0");else throw new Error(`Can't handle extra config type: ${typeof i}`)})},je=t=>{let e=at(),r=e.stackSave();try{let n=e.stackAlloc(8);e._OrtGetLastError(n,n+4);let a=e.HEAP32[n/4],i=e.HEAPU32[n/4+1],s=i?e.UTF8ToString(i):"";throw new Error(`${t} ERROR_CODE: ${a}, ERROR_MESSAGE: ${s}`)}finally{e.stackRestore(r)}}}),oh,Y_=Z(()=>{xa(),Wo(),oh=t=>{let e=at(),r=0,n=[],a=t||{};try{if(t?.logSeverityLevel===void 0)a.logSeverityLevel=2;else if(typeof t.logSeverityLevel!="number"||!Number.isInteger(t.logSeverityLevel)||t.logSeverityLevel<0||t.logSeverityLevel>4)throw new Error(`log serverity level is not valid: ${t.logSeverityLevel}`);if(t?.logVerbosityLevel===void 0)a.logVerbosityLevel=0;else if(typeof t.logVerbosityLevel!="number"||!Number.isInteger(t.logVerbosityLevel))throw new Error(`log verbosity level is not valid: ${t.logVerbosityLevel}`);t?.terminate===void 0&&(a.terminate=!1);let i=0;return t?.tag!==void 0&&(i=tt(t.tag,n)),r=e._OrtCreateRunOptions(a.logSeverityLevel,a.logVerbosityLevel,!!a.terminate,i),r===0&&je("Can't create run options."),t?.extra!==void 0&&Bi(t.extra,"",new WeakSet,(s,o)=>{let u=tt(s,n),l=tt(o,n);e._OrtAddRunConfigEntry(r,u,l)!==0&&je(`Can't set a run config entry: ${s} - ${o}.`)}),[r,n]}catch(i){throw r!==0&&e._OrtReleaseRunOptions(r),n.forEach(s=>e._free(s)),i}}}),tl,rl,nl,al,uh,X_=Z(()=>{xa(),Wo(),tl=t=>{switch(t){case"disabled":return 0;case"basic":return 1;case"extended":return 2;case"all":return 99;default:throw new Error(`unsupported graph optimization level: ${t}`)}},rl=t=>{switch(t){case"sequential":return 0;case"parallel":return 1;default:throw new Error(`unsupported execution mode: ${t}`)}},nl=t=>{t.extra||(t.extra={}),t.extra.session||(t.extra.session={});let e=t.extra.session;e.use_ort_model_bytes_directly||(e.use_ort_model_bytes_directly="1"),t.executionProviders&&t.executionProviders.some(r=>(typeof r=="string"?r:r.name)==="webgpu")&&(t.enableMemPattern=!1)},al=(t,e,r)=>{for(let n of e){let a=typeof n=="string"?n:n.name;switch(a){case"webnn":if(a="WEBNN",typeof n!="string"){let s=n;if(s?.deviceType){let o=tt("deviceType",r),u=tt(s.deviceType,r);at()._OrtAddSessionConfigEntry(t,o,u)!==0&&je(`Can't set a session config entry: 'deviceType' - ${s.deviceType}.`)}if(s?.numThreads){let o=s.numThreads;(typeof o!="number"||!Number.isInteger(o)||o<0)&&(o=0);let u=tt("numThreads",r),l=tt(o.toString(),r);at()._OrtAddSessionConfigEntry(t,u,l)!==0&&je(`Can't set a session config entry: 'numThreads' - ${s.numThreads}.`)}if(s?.powerPreference){let o=tt("powerPreference",r),u=tt(s.powerPreference,r);at()._OrtAddSessionConfigEntry(t,o,u)!==0&&je(`Can't set a session config entry: 'powerPreference' - ${s.powerPreference}.`)}}break;case"webgpu":if(a="JS",typeof n!="string"){let s=n;if(s?.preferredLayout){if(s.preferredLayout!=="NCHW"&&s.preferredLayout!=="NHWC")throw new Error(`preferredLayout must be either 'NCHW' or 'NHWC': ${s.preferredLayout}`);let o=tt("preferredLayout",r),u=tt(s.preferredLayout,r);at()._OrtAddSessionConfigEntry(t,o,u)!==0&&je(`Can't set a session config entry: 'preferredLayout' - ${s.preferredLayout}.`)}}break;case"wasm":case"cpu":continue;default:throw new Error(`not supported execution provider: ${a}`)}let i=tt(a,r);at()._OrtAppendExecutionProvider(t,i)!==0&&je(`Can't append execution provider: ${a}.`)}},uh=t=>{let e=at(),r=0,n=[],a=t||{};nl(a);try{let i=tl(a.graphOptimizationLevel??"all"),s=rl(a.executionMode??"sequential"),o=typeof a.logId=="string"?tt(a.logId,n):0,u=a.logSeverityLevel??2;if(!Number.isInteger(u)||u<0||u>4)throw new Error(`log serverity level is not valid: ${u}`);let l=a.logVerbosityLevel??0;if(!Number.isInteger(l)||l<0||l>4)throw new Error(`log verbosity level is not valid: ${l}`);let p=typeof a.optimizedModelFilePath=="string"?tt(a.optimizedModelFilePath,n):0;if(r=e._OrtCreateSessionOptions(i,!!a.enableCpuMemArena,!!a.enableMemPattern,s,!!a.enableProfiling,0,o,u,l,p),r===0&&je("Can't create session options."),a.executionProviders&&al(r,a.executionProviders,n),a.enableGraphCapture!==void 0){if(typeof a.enableGraphCapture!="boolean")throw new Error(`enableGraphCapture must be a boolean value: ${a.enableGraphCapture}`);let f=tt("enableGraphCapture",n),m=tt(a.enableGraphCapture.toString(),n);e._OrtAddSessionConfigEntry(r,f,m)!==0&&je(`Can't set a session config entry: 'enableGraphCapture' - ${a.enableGraphCapture}.`)}if(a.freeDimensionOverrides)for(let[f,m]of Object.entries(a.freeDimensionOverrides)){if(typeof f!="string")throw new Error(`free dimension override name must be a string: ${f}`);if(typeof m!="number"||!Number.isInteger(m)||m<0)throw new Error(`free dimension override value must be a non-negative integer: ${m}`);let c=tt(f,n);e._OrtAddFreeDimensionOverride(r,c,m)!==0&&je(`Can't set a free dimension override: ${f} - ${m}.`)}return a.extra!==void 0&&Bi(a.extra,"",new WeakSet,(f,m)=>{let c=tt(f,n),y=tt(m,n);e._OrtAddSessionConfigEntry(r,c,y)!==0&&je(`Can't set a session config entry: ${f} - ${m}.`)}),[r,n]}catch(i){throw r!==0&&e._OrtReleaseSessionOptions(r),n.forEach(s=>e._free(s)),i}}}),fo,Kr,ga,Vo,Di,Go,mo,$e=Z(()=>{fo=t=>{switch(t){case"int8":return 3;case"uint8":return 2;case"bool":return 9;case"int16":return 5;case"uint16":return 4;case"int32":return 6;case"uint32":return 12;case"float16":return 10;case"float32":return 1;case"float64":return 11;case"string":return 8;case"int64":return 7;case"uint64":return 13;default:throw new Error(`unsupported data type: ${t}`)}},Kr=t=>{switch(t){case 3:return"int8";case 2:return"uint8";case 9:return"bool";case 5:return"int16";case 4:return"uint16";case 6:return"int32";case 12:return"uint32";case 10:return"float16";case 1:return"float32";case 11:return"float64";case 8:return"string";case 7:return"int64";case 13:return"uint64";default:throw new Error(`unsupported data type: ${t}`)}},ga=t=>[void 0,4,1,1,2,2,4,8,void 0,1,2,8,4,8,void 0,void 0,void 0][t],Vo=t=>{switch(t){case"float16":return typeof Float16Array<"u"&&Float16Array.from?Float16Array:Uint16Array;case"float32":return Float32Array;case"uint8":return Uint8Array;case"int8":return Int8Array;case"uint16":return Uint16Array;case"int16":return Int16Array;case"int32":return Int32Array;case"bool":return Uint8Array;case"float64":return Float64Array;case"uint32":return Uint32Array;case"int64":return BigInt64Array;case"uint64":return BigUint64Array;default:throw new Error(`unsupported type: ${t}`)}},Di=t=>{switch(t){case"verbose":return 0;case"info":return 1;case"warning":return 2;case"error":return 3;case"fatal":return 4;default:throw new Error(`unsupported logging level: ${t}`)}},Go=t=>t==="float32"||t==="float16"||t==="int32"||t==="int64"||t==="uint32"||t==="uint8"||t==="bool",mo=t=>{switch(t){case"none":return 0;case"cpu":return 1;case"cpu-pinned":return 2;case"texture":return 3;case"gpu-buffer":return 4;default:throw new Error(`unsupported data location: ${t}`)}}}),Ni,lh=Z(()=>{Ni=async t=>{if(typeof t=="string")if(typeof process<"u"&&process.versions&&process.versions.node)try{return new Uint8Array(await(void 0)(t))}catch(e){if(e.code==="ERR_FS_FILE_TOO_LARGE"){let r=(void 0)(t),n=[];for await(let a of r)n.push(a);return new Uint8Array(Buffer.concat(n))}throw e}else{let e=await fetch(t);if(!e.ok)throw new Error(`failed to load external data file: ${t}`);let r=e.headers.get("Content-Length"),n=r?parseInt(r,10):0;if(n<1073741824)return new Uint8Array(await e.arrayBuffer());{if(!e.body)throw new Error(`failed to load external data file: ${t}, no response body.`);let a=e.body.getReader(),i;try{i=new ArrayBuffer(n)}catch(o){if(o instanceof RangeError){let u=Math.ceil(n/65536);i=new WebAssembly.Memory({initial:u,maximum:u}).buffer}else throw o}let s=0;for(;;){let{done:o,value:u}=await a.read();if(o)break;let l=u.byteLength;new Uint8Array(i,s,l).set(u),s+=l}return new Uint8Array(i,0,n)}}else return t instanceof Blob?new Uint8Array(await t.arrayBuffer()):t instanceof Uint8Array?t:new Uint8Array(t)}}),il,sl,ol,ul,dh,ll,rt,nn=Z(()=>{$e(),il=["V","I","W","E","F"],sl=(t,e)=>{console.log(`[${il[t]},${new Date().toISOString()}]${e}`)},dh=(t,e)=>{ol=t,ul=e},ll=(t,e)=>{let r=Di(t),n=Di(ol);r>=n&&sl(r,typeof e=="function"?e():e)},rt=(...t)=>{ul&&ll(...t)}}),ch,Q_=Z(()=>{$e(),ch=(t,e)=>new(Vo(e))(t)}),Ho=Z(()=>{}),As,pi,hi,dl,cl,Ms,go,pl,ph,J_=Z(()=>{nn(),Ho(),As=new Map([[64,250],[128,200],[256,200],[512,200],[2048,230],[4096,200],[8192,50],[16384,50],[32768,50],[65536,50],[131072,50],[262144,50],[524288,50],[1048576,50],[2097152,30],[4194304,20],[8388608,10],[12582912,10],[16777216,10],[26214400,15],[33554432,22],[44236800,2],[58982400,6],[67108864,6],[134217728,6],[167772160,6]]),pi=[],hi=t=>Math.ceil(t/16)*16,dl=t=>{for(let e=0;ecl++,go=async(t,e,r,n)=>{let a=hi(r),i=t.device.createBuffer({size:a,usage:GPUBufferUsage.COPY_DST|GPUBufferUsage.MAP_READ});try{let s=t.getCommandEncoder();t.endComputePass(),s.copyBufferToBuffer(e,0,i,0,a),t.flush(),await i.mapAsync(GPUMapMode.READ);let o=i.getMappedRange();if(n){let u=n();return u.set(new Uint8Array(o,0,r)),u}else return new Uint8Array(o.slice(0,r))}finally{i.destroy()}},pl=class{constructor(t){this.backend=t,this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.buffersForUploadingPending=[],this.buffersPending=[],this.externalBuffers=new Map,this.capturedPendingBuffers=new Map;for(let[e]of As)pi.push(e),this.freeBuffers.set(e,[]),this.freeUniformBuffers.set(e,[])}upload(t,e){let r=e.buffer,n=e.byteOffset,a=e.byteLength,i=hi(a),s=this.storageCache.get(t);if(!s)throw new Error("gpu data for uploading does not exist");if(s.originalSize!==a)throw new Error(`inconsistent data size. gpu data size=${s.originalSize}, data size=${a}`);let o=this.backend.device.createBuffer({mappedAtCreation:!0,size:i,usage:GPUBufferUsage.MAP_WRITE|GPUBufferUsage.COPY_SRC}),u=o.getMappedRange();new Uint8Array(u).set(new Uint8Array(r,n,a)),o.unmap();let l=this.backend.getCommandEncoder();this.backend.endComputePass(),l.copyBufferToBuffer(o,0,s.gpuData.buffer,0,i),rt("verbose",()=>`[WebGPU] GpuDataManager.upload(id=${t})`),this.buffersForUploadingPending.push(o)}memcpy(t,e){let r=this.storageCache.get(t);if(!r)throw new Error("source gpu data for memcpy does not exist");let n=this.storageCache.get(e);if(!n)throw new Error("destination gpu data for memcpy does not exist");if(r.originalSize!==n.originalSize)throw new Error("inconsistent source and destination gpu data size");let a=hi(r.originalSize),i=this.backend.getCommandEncoder();this.backend.endComputePass(),i.copyBufferToBuffer(r.gpuData.buffer,0,n.gpuData.buffer,0,a)}registerExternalBuffer(t,e,r){let n;if(r){if(n=this.externalBuffers.get(r),n===void 0)throw new Error("previous buffer is not registered");if(t===r)return rt("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${e}) => id=${n}, buffer is the same, skip.`),n;if(this.backend.capturedCommandList.has(this.backend.currentSessionId))throw new Error(`Registering a different external buffer under graph capture mode is not supported yet. - Please use the previous external buffer!`);this.externalBuffers.delete(r)}else n=Ms();return this.storageCache.set(n,{gpuData:{id:n,type:0,buffer:t},originalSize:e}),this.externalBuffers.set(t,n),rt("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${e}) => id=${n}, registered.`),n}unregisterExternalBuffer(t){let e=this.externalBuffers.get(t);e!==void 0&&(this.storageCache.delete(e),this.externalBuffers.delete(t),rt("verbose",()=>`[WebGPU] GpuDataManager.unregisterExternalBuffer() => id=${e}`))}create(t,e=GPUBufferUsage.STORAGE|GPUBufferUsage.COPY_SRC|GPUBufferUsage.COPY_DST){let r=dl(t),n,a=(e&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE,i=(e&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM;if(a||i){let o=(a?this.freeBuffers:this.freeUniformBuffers).get(r);o?o.length>0?n=o.pop():n=this.backend.device.createBuffer({size:r,usage:e}):n=this.backend.device.createBuffer({size:r,usage:e})}else n=this.backend.device.createBuffer({size:r,usage:e});let s={id:Ms(),type:0,buffer:n};return this.storageCache.set(s.id,{gpuData:s,originalSize:t}),rt("verbose",()=>`[WebGPU] GpuDataManager.create(size=${t}) => id=${s.id}`),s}get(t){return this.storageCache.get(t)?.gpuData}release(t){let e=this.storageCache.get(t);if(!e)throw new Error("releasing data does not exist");return rt("verbose",()=>`[WebGPU] GpuDataManager.release(id=${t}), gpuDataId=${e.gpuData.id}`),this.storageCache.delete(t),this.buffersPending.push(e.gpuData.buffer),e.originalSize}async download(t,e){let r=this.storageCache.get(t);if(!r)throw new Error("data does not exist");await go(this.backend,r.gpuData.buffer,r.originalSize,e)}refreshPendingBuffers(){for(let t of this.buffersForUploadingPending)t.destroy();if(this.buffersForUploadingPending=[],this.buffersPending.length!==0)if(this.backend.sessionStatus==="default"){for(let t of this.buffersPending){let e=As.get(t.size);if((t.usage&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE){let r=this.freeBuffers.get(t.size)||[];e===void 0||r.length>=e?t.destroy():r.push(t)}else if((t.usage&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM){let r=this.freeUniformBuffers.get(t.size)||[];e===void 0||r.length>=e?t.destroy():r.push(t)}else t.destroy()}this.buffersPending=[]}else{let t=this.capturedPendingBuffers.get(this.backend.currentSessionId);t||(t=[],this.capturedPendingBuffers.set(this.backend.currentSessionId,t));for(let e of this.buffersPending)t.push(e);this.buffersPending=[]}}dispose(){this.freeBuffers.forEach(t=>{t.forEach(e=>{e.destroy()})}),this.freeUniformBuffers.forEach(t=>{t.forEach(e=>{e.destroy()})}),this.storageCache.forEach(t=>{t.gpuData.buffer.destroy()}),this.capturedPendingBuffers.forEach(t=>{t.forEach(e=>{e.destroy()})}),this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.capturedPendingBuffers=new Map}onReleaseSession(t){let e=this.capturedPendingBuffers.get(t);e&&(e.forEach(r=>{r.destroy()}),this.capturedPendingBuffers.delete(t))}},ph=(...t)=>new pl(...t)}),hl,qe,lt=Z(()=>{hl=class{constructor(t){Object.assign(this,t)}get cacheKey(){return this.key||(this.key=Object.getOwnPropertyNames(this).sort().map(t=>`${this[t]}`).join(";")),this.key}},qe=t=>new hl(t)}),fl,En,Y,Fi,hh,jo,qo,Ae=Z(()=>{fl=class{static calcMatMulShape(t,e){return t[1]!==e[0]?void 0:[t[0],e[1]]}},En=class{static calcShape(t,e,r=!1){let n=t.length,a=e.length;if(n===0)return e;if(a===0)return t;let i=Math.max(t.length,e.length),s=new Array(i);if(r){if(n<2||a<2)return;let o=fl.calcMatMulShape([t[n-2],t[n-1]],[e[a-2],e[a-1]]);if(o===void 0)return;[s[i-2],s[i-1]]=o}for(let o=r?3:1;o<=i;o++){let u=n-o<0?1:t[n-o],l=a-o<0?1:e[a-o];if(u!==l&&u>1&&l>1)return;let p=Math.max(u,l);if(u&&l)s[i-o]=Math.max(u,l);else{if(p>1)return;s[i-o]=0}}return s}static isValidBroadcast(t,e){let r=t.length,n=e.length;if(r>n)return!1;for(let a=1;a<=r;a++)if(t[r-a]!==1&&t[r-a]!==e[n-a])return!1;return!0}},Y=class Ei{static size(e){return Ei.getSizeFromDimensionRange(e,0,e.length)}static convertShape(e,r=4){let n=e.length;if(n===0)return[];let a=new Array(n),i=n-1;for(;i>=0;){if(e[i]%r===0){a[i]=e[i]/r;break}if(r%e[i]!==0)throw new Error("cannot convert shape");a[i]=1,r/=e[i],i--}for(i--;i>=0;i--)a[i]=e[i];return a}static sizeFromDimension(e,r){if(r<0||r>e.length)throw new Error(`invalid dimension of ${r} for sizeFromDimension as Tensor has ${e.length} dimensions.`);return Ei.getSizeFromDimensionRange(e,r,e.length)}static sizeToDimension(e,r){if(r<0||r>e.length)throw new Error(`invalid dimension of ${r} for sizeToDimension as Tensor has ${e.length} dimensions.`);return Ei.getSizeFromDimensionRange(e,0,r)}static getSizeFromDimensionRange(e,r,n){let a=1;for(let i=r;i=0;--a)n[a]=n[a+1]*e[a+1];return n}static normalizeAxis(e,r){if(e<-r&&e>=r)throw new Error("unsupported axis for this operation.");return e<0?e+r:e}static normalizeAxes(e,r){return e.map(n=>this.normalizeAxis(n,r??e.length))}static sortBasedOnPerm(e,r){return r?r.map(n=>e[n]):e.slice().reverse()}static padShape(e,r){let n=e.length;return e.map((a,i)=>a+r[i]+r[i+n])}static areEqual(e,r){return e.length!==r.length?!1:e.every((n,a)=>n===r[a])}},Fi=class la{static adjustPoolAttributes(e,r,n,a,i,s){if(!e&&n.length!==r.length-2)throw new Error("length of specified kernel shapes should be 2 less than length of input dimensions");if(e)for(let o=0;o=n.length?n.push(r[o+2]):n[o]=r[o+2];for(let o=0;o=n[o]||s[o+n.length]>=n[o])throw new Error("pads should be smaller than kernel")}}static adjustPadsBasedOnAutoPad(e,r,n,a,i,s,o){if(o){if(i.length!==2*(e.length-2))throw new Error("length of pads should be twice the length of data dimensions");if(r.length!==e.length-2)throw new Error("length of strides should be the length of data dimensions");if(a.length!==e.length-2)throw new Error("length of kernel shapes should be the length of data dimensions");for(let u=0;u{$e(),Ae(),Cn=64,fi=(t,e)=>{if(e===3)throw new Error("vec3 has same alignment as vec4, use vec4 instead");switch(t){case 10:return e>1?`vec${e}`:"f16";case 1:return e>1?`vec${e}`:"f32";case 6:return e>1?`vec${e}`:"i32";case 12:return e>1?`vec${e}`:"u32";case 7:if(e>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","i32"];case 13:if(e>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","u32"];case 9:if(e!==4)throw new Error("bool must be vec4");return["u32","vec4"];default:throw new Error(`Unknown data type: ${t}`)}},pt=(t,e=1)=>{let r=fi(t,e);return typeof r=="string"?r:r[0]},Tt=(t,e=1)=>{let r=fi(t,e);return typeof r=="string"?r:r[1]},ye=(...t)=>{let e=[];return t.forEach(r=>{r.length!==0&&e.push({type:12,data:r},{type:12,data:Y.computeStrides(r)})}),e},it=t=>t%4===0?4:t%2===0?2:1,wr=(t="f32",e,r="0")=>!e||e===1?`${t}(${r})`:`vec${e}<${t}>(${r})`,Sn=(t,e,r)=>t==="f32"?r:e===1?`f32(${r})`:`vec${e}(${r})`,Or=(t,e)=>e===4?`(${t}.x + ${t}.y + ${t}.z + ${t}.w)`:e===2?`(${t}.x + ${t}.y)`:e===3?`(${t}.x + ${t}.y + ${t}.z)`:t,Se=(t,e,r,n)=>t.startsWith("uniforms.")&&r>4?typeof e=="string"?n==="f16"?`${t}[(${e}) / 8][(${e}) % 8 / 4][(${e}) % 8 % 4]`:`${t}[(${e}) / 4][(${e}) % 4]`:n==="f16"?`${t}[${Math.floor(e/8)}][${Math.floor(e%8/4)}][${e%8%4}]`:`${t}[${Math.floor(e/4)}][${e%4}]`:r>1?`${t}[${e}]`:t,mi=(t,e,r,n,a)=>{let i=typeof r=="number",s=i?r:r.length,o=[...new Array(s).keys()],u=s<2?"u32":s<=4?`vec${s}`:`array`,l=fi(e,a),p=typeof l=="string"?l:l[1],f=typeof l=="string"?l:l[0],m={indices:u,value:p,storage:f,tensor:e},c=N=>typeof N=="string"?N:`${N}u`,y={offsetToIndices:!1,indicesToOffset:!1,broadcastedIndicesToOffset:!1,set:!1,setByIndices:!1,get:!1,getByIndices:!1},w=i?"uniforms.":"",v=`${w}${t}_shape`,k=`${w}${t}_strides`,$="";for(let N=0;N ${m.indices} { - var indices: ${m.indices}; - var current = offset; - ${$} - return indices; - }`,T=N=>(y.offsetToIndices=!0,s<2?N:`o2i_${t}(${N})`),A=[];if(s>=2)for(let N=s-1;N>=0;N--)A.push(`${Se(k,N,s)} * (indices[${N}])`);let B=s<2?"":` - fn i2o_${t}(indices: ${m.indices}) -> u32 { - return ${A.join("+")}; - }`,R=N=>(y.indicesToOffset=!0,s<2?N:`i2o_${t}(${N})`),D=(...N)=>s===0?"0u":`${m.indices}(${N.map(c).join(",")})`,K=(N,ae)=>s<2?`${N}`:`${Se(N,ae,s)}`,j=(N,ae,fe)=>s<2?`${N}=${fe};`:`${Se(N,ae,s)}=${fe};`,ie={},te=(N,ae)=>{y.broadcastedIndicesToOffset=!0;let fe=`${ae.name}broadcastedIndicesTo${t}Offset`;if(fe in ie)return`${fe}(${N})`;let Ce=[];for(let Be=s-1;Be>=0;Be--){let Ke=ae.indicesGet("outputIndices",Be+ae.rank-s);Ce.push(`${K(k,Be)} * (${Ke} % ${K(v,Be)})`)}return ie[fe]=`fn ${fe}(outputIndices: ${ae.type.indices}) -> u32 { - return ${Ce.length>0?Ce.join("+"):"0u"}; - }`,`${fe}(${N})`},oe=(N,ae)=>(()=>{if(m.storage===m.value)return`${t}[${N}]=${ae};`;if(m.storage==="vec2"&&m.value==="i32")return`${t}[${N}]=vec2(u32(${ae}), select(0u, 0xFFFFFFFFu, ${ae} < 0));`;if(m.storage==="vec2"&&m.value==="u32")return`${t}[${N}]=vec2(u32(${ae}), 0u);`;if(m.storage==="u32"&&m.value==="vec4")return`${t}[${N}]=dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(${ae}));`;throw new Error(`not supported combination of storage type ${m.storage} and value type ${m.value} yet`)})(),re=N=>(()=>{if(m.storage===m.value)return`${t}[${N}]`;if(m.storage==="vec2"&&m.value==="i32")return`i32(${t}[${N}].x)`;if(m.storage==="vec2"&&m.value==="u32")return`u32(${t}[${N}].x)`;if(m.storage==="u32"&&m.value==="vec4")return`vec4(bool(${t}[${N}] & 0xFFu), bool(${t}[${N}] & 0xFF00u), bool(${t}[${N}] & 0xFF0000u), bool(${t}[${N}] & 0xFF000000u))`;throw new Error(`not supported combination of storage type ${m.storage} and value type ${m.value} yet`)})(),M=s<2?"":` - fn get_${t}ByIndices(indices: ${m.indices}) -> ${p} { - return ${re(`i2o_${t}(indices)`)}; - }`,P=s<2?"":(()=>{let N=o.map(fe=>`d${fe}: u32`).join(", "),ae=o.map(fe=>`d${fe}`).join(", ");return` - fn get_${t}(${N}) -> ${p} { - return get_${t}ByIndices(${D(ae)}); - }`})(),H=(...N)=>{if(N.length!==s)throw new Error(`indices length must be ${s}`);let ae=N.map(c).join(",");return s===0?re("0u"):s===1?re(ae[0]):(y.get=!0,y.getByIndices=!0,y.indicesToOffset=!0,`get_${t}(${ae})`)},le=N=>s<2?re(N):(y.getByIndices=!0,y.indicesToOffset=!0,`get_${t}ByIndices(${N})`),G=s<2?"":` - fn set_${t}ByIndices(indices: ${m.indices}, value: ${p}) { - ${oe(`i2o_${t}(indices)`,"value")} - }`,ne=s<2?"":(()=>{let N=o.map(fe=>`d${fe}: u32`).join(", "),ae=o.map(fe=>`d${fe}`).join(", ");return` - fn set_${t}(${N}, value: ${p}) { - set_${t}ByIndices(${D(ae)}, value); - }`})();return{impl:()=>{let N=[],ae=!1;return y.offsetToIndices&&(N.push(C),ae=!0),y.indicesToOffset&&(N.push(B),ae=!0),y.broadcastedIndicesToOffset&&(Object.values(ie).forEach(fe=>N.push(fe)),ae=!0),y.set&&(N.push(ne),ae=!0),y.setByIndices&&(N.push(G),ae=!0),y.get&&(N.push(P),ae=!0),y.getByIndices&&(N.push(M),ae=!0),!i&&ae&&N.unshift(`const ${v} = ${m.indices}(${r.join(",")});`,`const ${k} = ${m.indices}(${Y.computeStrides(r).join(",")});`),N.join(` -`)},type:m,offsetToIndices:T,indicesToOffset:R,broadcastedIndicesToOffset:te,indices:D,indicesGet:K,indicesSet:j,set:(...N)=>{if(N.length!==s+1)throw new Error(`indices length must be ${s}`);let ae=N[s];if(typeof ae!="string")throw new Error("value must be string");let fe=N.slice(0,s).map(c).join(",");return s===0?oe("0u",ae):s===1?oe(fe[0],ae):(y.set=!0,y.setByIndices=!0,y.indicesToOffset=!0,`set_${t}(${fe}, ${ae})`)},setByOffset:oe,setByIndices:(N,ae)=>s<2?oe(N,ae):(y.setByIndices=!0,y.indicesToOffset=!0,`set_${t}ByIndices(${N}, ${ae});`),get:H,getByOffset:re,getByIndices:le,usage:n,name:t,strides:k,shape:v,rank:s}},Q=(t,e,r,n=1)=>mi(t,e,r,"input",n),ge=(t,e,r,n=1)=>mi(t,e,r,"output",n),Ko=(t,e,r,n=1)=>mi(t,e,r,"internal",n),ml=class{constructor(t,e){this.normalizedDispatchGroup=t,this.limits=e,this.internalVariables=[],this.variables=[],this.uniforms=[],this.variableIndex=0}guardAgainstOutOfBoundsWorkgroupSizes(t){return`if (global_idx >= ${typeof t=="number"?`${t}u`:t}) { return; }`}mainStart(t=Cn){let e=typeof t=="number"?t:t[0],r=typeof t=="number"?1:t[1],n=typeof t=="number"?1:t[2];if(e>this.limits.maxComputeWorkgroupSizeX||r>this.limits.maxComputeWorkgroupSizeY||n>this.limits.maxComputeWorkgroupSizeZ)throw new Error(`workgroup size [${e}, ${r}, ${n}] exceeds the maximum workgroup size [${this.limits.maxComputeWorkgroupSizeX}, ${this.limits.maxComputeWorkgroupSizeY}, ${this.limits.maxComputeWorkgroupSizeZ}].`);if(e*r*n>this.limits.maxComputeInvocationsPerWorkgroup)throw new Error(`workgroup size [${e}, ${r}, ${n}] exceeds the maximum workgroup invocations ${this.limits.maxComputeInvocationsPerWorkgroup}.`);let a=this.normalizedDispatchGroup[1]===1&&this.normalizedDispatchGroup[2]===1,i=a?`@builtin(global_invocation_id) global_id : vec3, - @builtin(workgroup_id) workgroup_id : vec3, - @builtin(local_invocation_id) local_id : vec3`:`@builtin(global_invocation_id) global_id : vec3, - @builtin(local_invocation_id) local_id : vec3, - @builtin(local_invocation_index) local_idx : u32, - @builtin(workgroup_id) workgroup_id : vec3, - @builtin(num_workgroups) num_workgroups : vec3`,s=a?"let global_idx = global_id.x; let local_idx = local_id.x;":`let global_idx = (workgroup_id.z * num_workgroups[0] * num_workgroups[1] + - workgroup_id.y * num_workgroups[0] + workgroup_id.x) * ${e*r*n}u + local_idx;`;return`@compute @workgroup_size(${e}, ${r}, ${n}) - fn main(${i}) { - ${s} - `}appendVariableUniforms(t){t.rank!==0&&(t.shape.startsWith("uniforms.")&&this.uniforms.push({name:t.shape.replace("uniforms.",""),type:"u32",length:t.rank}),t.strides.startsWith("uniforms.")&&this.uniforms.push({name:t.strides.replace("uniforms.",""),type:"u32",length:t.rank}))}declareVariable(t,e){if(t.usage==="internal")throw new Error("cannot use internal variable with declareVariable(). use registerInternalVariables() instead.");this.variables.push(t),this.appendVariableUniforms(t);let r=t.usage==="input"?"read":"read_write",n=t.type.storage;return`@group(0) @binding(${e}) var ${t.name}: array<${n}>;`}declareVariables(...t){return t.map(e=>this.declareVariable(e,this.variableIndex++)).join(` -`)}registerInternalVariable(t){if(t.usage!=="internal")throw new Error("cannot use input or output variable with registerInternalVariable(). use declareVariables() instead.");this.internalVariables.push(t),this.appendVariableUniforms(t)}registerInternalVariables(...t){return t.forEach(e=>this.registerInternalVariable(e)),this}registerUniform(t,e,r=1){return this.uniforms.push({name:t,type:e,length:r}),this}registerUniforms(t){return this.uniforms=this.uniforms.concat(t),this}uniformDeclaration(){if(this.uniforms.length===0)return"";let t=[];for(let{name:e,type:r,length:n}of this.uniforms)if(n&&n>4)r==="f16"?t.push(`@align(16) ${e}:array, ${Math.ceil(n/8)}>`):t.push(`${e}:array, ${Math.ceil(n/4)}>`);else{let a=n==null||n===1?r:`vec${n}<${r}>`;t.push(`${e}:${a}`)}return` - struct Uniforms { ${t.join(", ")} }; - @group(0) @binding(${this.variableIndex}) var uniforms: Uniforms;`}get additionalImplementations(){return this.uniformDeclaration()+this.variables.map(t=>t.impl()).join(` -`)+this.internalVariables.map(t=>t.impl()).join(` -`)}get variablesInfo(){if(this.uniforms.length===0)return;let t=e=>[12,10,1,6][["u32","f16","f32","i32"].indexOf(e)];return this.uniforms.map(e=>[t(e.type),e.length??1])}},fh=(t,e)=>new ml(t,e),_a=(t,e)=>{let r=t.length,n=[];for(let a=0;a1&&s===1&&n.unshift(i)}return n}}),gl,Os,_l,yl,vr,mh,gh,Sa=Z(()=>{$e(),Ae(),lt(),Te(),gl=t=>{if(!t||t.length!==1)throw new Error("Transpose requires 1 input.")},Os=(t,e)=>e&&e.length!==t?[...new Array(t).keys()].reverse():e,_l=(t,e)=>Y.sortBasedOnPerm(t,Os(t.length,e)),yl=(t,e,r,n)=>{let a=[];a.push(`fn perm(i: ${n.type.indices}) -> ${r.type.indices} { - var a: ${r.type.indices};`);for(let i=0;i{let r=t.dataType,n=t.dims.length,a=Os(n,e),i=_l(t.dims,a),s=ge("output",r,i.length),o=Q("a",r,n),u=l=>` - ${l.registerUniform("output_size","u32").declareVariables(o,s)} - - ${yl(a,n,o,s)} - - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - - let indices = ${s.offsetToIndices("global_idx")}; - let aIndices = perm(indices); - - ${s.setByOffset("global_idx",o.getByIndices("aIndices"))} - }`;return{name:"Transpose",shaderCache:{hint:`${e}`,inputDependencies:["rank"]},getRunData:l=>{let p=Y.size(i);return{outputs:[{dims:i,dataType:l[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:[{type:12,data:p},...ye(l[0].dims,i)]}},getShaderSource:u}},mh=(t,e)=>{gl(t.inputs),t.compute(vr(t.inputs[0],e.perm))},gh=t=>qe({perm:t.perm})}),wl,bl,vl,$l,xl,Sl,kl,El,Cl,Tl,Kt,_h,yh,wh,bh,vh,$h,xh,Sh,kh,Eh,Z_=Z(()=>{$e(),Ae(),Te(),Yo(),Sa(),wl={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate * candidate",logSumExp:"bestValue + exp(candidate)",l1:"bestValue + abs(candidate)",l2:"bestValue + candidate * candidate",logSum:"bestValue + candidate"},bl={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate",logSumExp:"bestValue + candidate",l1:"bestValue + candidate",l2:"bestValue + candidate",logSum:"bestValue + candidate"},vl={max:"_A[offset]",min:"_A[offset]",mean:"0",sum:"0",prod:"1",sumSquare:"0",logSumExp:"0",l1:"0",l2:"0",logSum:"0"},$l={max:"bestValue",min:"bestValue",sum:"bestValue",prod:"bestValue",sumSquare:"bestValue",logSumExp:"log(bestValue)",l1:"bestValue",l2:"sqrt(bestValue)",logSum:"log(bestValue)"},xl=(t,e)=>{let r=[];for(let n=e-t;n{let r=[],n=t.length;for(let i=0;it[i]);return[r,a]},kl=(t,e)=>{let r=t.length+e.length,n=[],a=0;for(let i=0;i{for(let r=0;r{let r=[];if(!El(t,e)){for(let n=0;nr.push(n))}return r},Tl=(t,e,r,n,a,i,s)=>{let o=r[0].dims,u=Y.size(i),l=Y.size(s),p=Q("_A",r[0].dataType,o),f=ge("output",a,i),m=32,c=` - var aBestValues : array; - `;return{name:t,shaderCache:e,getShaderSource:y=>` - ${y.registerUniform("reduceSize","u32").declareVariables(p,f)} - ${c} - fn DIV_CEIL(a : u32, b : u32) -> u32 { - return ((a - 1u) / b + 1u); - } - ${y.mainStart(m)} - - let outputIndex = global_idx / ${m}; - let offset = outputIndex * uniforms.reduceSize; - - var bestValue = f32(${vl[n]}); - let Length = uniforms.reduceSize; - for (var k = local_idx; k < Length; k = k + ${m}) { - let candidate = f32(${p.getByOffset("offset + k")}); - bestValue = ${wl[n]}; - } - aBestValues[local_idx] = bestValue; - workgroupBarrier(); - - var reduceSize = min(Length, ${m}u); - for (var currentSize = reduceSize / 2u; reduceSize > 1u; - currentSize = reduceSize / 2u) { - let interval = DIV_CEIL(reduceSize, 2u); - if (local_idx < currentSize) { - let candidate = aBestValues[local_idx + interval]; - bestValue = ${bl[n]}; - aBestValues[local_idx] = bestValue; - } - reduceSize = interval; - workgroupBarrier(); - } - - if (local_idx == 0u) { - ${f.setByOffset("outputIndex",`${n==="mean"?`${f.type.storage}(bestValue / f32(uniforms.reduceSize))`:`${f.type.storage}(${$l[n]})`}`)}; - } - }`,getRunData:()=>({outputs:[{dims:i,dataType:a}],dispatchGroup:{x:u},programUniforms:[{type:12,data:l}]})}},Kt=(t,e,r,n)=>{let a=t.inputs.length===1?r:_o(t.inputs,r),i=a.axes;i.length===0&&!a.noopWithEmptyAxes&&(i=t.inputs[0].dims.map((c,y)=>y));let s=Y.normalizeAxes(i,t.inputs[0].dims.length),o=s,u=t.inputs[0],l=Cl(o,t.inputs[0].dims.length);l.length>0&&(u=t.compute(vr(t.inputs[0],l),{inputs:[0],outputs:[-1]})[0],o=xl(o.length,u.dims.length));let[p,f]=Sl(u.dims,o),m=p;a.keepDims&&(m=kl(p,s)),t.compute(Tl(e,{hint:a.cacheKey,inputDependencies:["type"]},[u],n,t.inputs[0].dataType,m,f),{inputs:[u]})},_h=(t,e)=>{Kt(t,"ReduceMeanShared",e,"mean")},yh=(t,e)=>{Kt(t,"ReduceL1Shared",e,"l1")},wh=(t,e)=>{Kt(t,"ReduceL2Shared",e,"l2")},bh=(t,e)=>{Kt(t,"ReduceLogSumExpShared",e,"logSumExp")},vh=(t,e)=>{Kt(t,"ReduceMaxShared",e,"max")},$h=(t,e)=>{Kt(t,"ReduceMinShared",e,"min")},xh=(t,e)=>{Kt(t,"ReduceProdShared",e,"prod")},Sh=(t,e)=>{Kt(t,"ReduceSumShared",e,"sum")},kh=(t,e)=>{Kt(t,"ReduceSumSquareShared",e,"sumSquare")},Eh=(t,e)=>{Kt(t,"ReduceLogSumShared",e,"logSum")}}),Yt,Il,Li,_o,Xt,Al,Ml,Ol,zl,Pl,Rl,Bl,Dl,Nl,Fl,Qt,Ch,Th,Ih,Ah,Mh,Oh,zh,Ph,Rh,Bh,Yo=Z(()=>{$e(),Ae(),lt(),Te(),Z_(),Yt=t=>{if(!t||t.length===0||t.length>2)throw new Error("Reduce op requires 1 or 2 inputs.");if(t.length===2&&t[1].dims.length!==1)throw new Error("Invalid axes input dims.")},Il=t=>["","",`var value = ${t.getByIndices("input_indices")};`,""],Li=(t,e,r,n,a,i,s=!1,o=!1)=>{let u=[],l=r[0].dims,p=l.length,f=Y.normalizeAxes(a,p),m=!o&&f.length===0;l.forEach((w,v)=>{m||f.indexOf(v)>=0?s&&u.push(1):u.push(w)});let c=u.length,y=Y.size(u);return{name:t,shaderCache:e,getShaderSource:w=>{let v=[],k=Q("_A",r[0].dataType,p),$=ge("output",i,c),C=n(k,$,f),T=C[2];for(let A=0,B=0;A=0?(s&&B++,T=`for(var j${A}: u32 = 0; j${A} < ${l[A]}; j${A}++) { - ${C[2].includes("last_index")?`let last_index = j${A};`:""} - ${k.indicesSet("input_indices",A,`j${A}`)} - ${T} - }`):(v.push(`${k.indicesSet("input_indices",A,$.indicesGet("output_indices",B))};`),B++);return` - - ${w.registerUniform("output_size","u32").declareVariables(k,$)} - - ${w.mainStart()} - ${w.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - var input_indices: ${k.type.indices}; - let output_indices = ${$.offsetToIndices("global_idx")}; - - ${v.join(` -`)} - ${C[0]} // init ops for reduce max/min - ${C[1]} - ${T} - ${C[3]} - ${C.length===4?$.setByOffset("global_idx","value"):C.slice(4).join(` -`)} - }`},getRunData:()=>({outputs:[{dims:u,dataType:i}],dispatchGroup:{x:Math.ceil(y/64)},programUniforms:[{type:12,data:y},...ye(l,u)]})}},_o=(t,e)=>{let r=[];return t[1].dims[0]>0&&t[1].getBigInt64Array().forEach(n=>r.push(Number(n))),qe({axes:r,keepDims:e.keepDims,noopWithEmptyAxes:e.noopWithEmptyAxes})},Xt=(t,e,r,n)=>{let a=t.inputs,i=a.length===1?r:_o(a,r);t.compute(Li(e,{hint:i.cacheKey,inputDependencies:["rank"]},[a[0]],i.noopWithEmptyAxes&&i.axes.length===0?Il:n,i.axes,a[0].dataType,i.keepDims,i.noopWithEmptyAxes),{inputs:[0]})},Al=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceLogSum",e,(r,n)=>[`var value = ${n.type.storage}(0);`,"",`value += ${r.getByIndices("input_indices")};`,"value = log(value);"])},Ml=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceL1",e,(r,n)=>[`var value = ${n.type.storage}(0);`,"",`value += abs(${r.getByIndices("input_indices")});`,""])},Ol=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceL2",e,(r,n)=>[`var t = ${n.type.value}(0); var value = ${n.type.value}(0);`,"",`t = ${r.getByIndices("input_indices")}; value += (t * t);`,"value = sqrt(value);"])},zl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceLogSumExp",e,(r,n)=>[`var value = ${n.type.storage}(0);`,"",`value += exp(${r.getByIndices("input_indices")});`,"value = log(value);"])},Pl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceMax",e,(r,n,a)=>{let i=[];for(let s=0;s=0||a.length===0)&&i.push(r.indicesSet("input_indices",s,0));return[`${i.join(` -`)}`,`var value = ${r.getByIndices("input_indices")};`,`value = max(value, ${r.getByIndices("input_indices")});`,""]})},Rl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceMean",e,(r,n,a)=>{let i=1;for(let s=0;s=0||a.length===0)&&(i*=t.inputs[0].dims[s]);return["var sum = f32(0);","",`sum += f32(${r.getByIndices("input_indices")});`,`let value = ${n.type.value}(sum / ${i});`]})},Bl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceMin",e,(r,n,a)=>{let i=[];for(let s=0;s=0||a.length===0)&&i.push(`input_indices[${s}] = 0;`);return[`${i.join(` -`)}`,`var value = ${r.getByIndices("input_indices")};`,`value = min(value, ${r.getByIndices("input_indices")});`,""]})},Dl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceProd",e,(r,n)=>[`var value = ${n.type.storage}(1);`,"",`value *= ${r.getByIndices("input_indices")};`,""])},Nl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceSum",e,(r,n)=>[`var value = ${n.type.storage}(0);`,"",`value += ${r.getByIndices("input_indices")};`,""])},Fl=(t,e)=>{Yt(t.inputs),Xt(t,"ReduceSumSquare",e,(r,n)=>[`var t = ${n.type.value}(0); var value = ${n.type.value}(0);`,"",`t = ${r.getByIndices("input_indices")}; value += t * t;`,""])},Qt=(t,e,r)=>{if(e.length===0)return r;let n=1,a=1;for(let i=0;i1024},Ch=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Rl(t,e):_h(t,e)},Th=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Ml(t,e):yh(t,e)},Ih=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Ol(t,e):wh(t,e)},Ah=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?zl(t,e):bh(t,e)},Mh=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Pl(t,e):vh(t,e)},Oh=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Bl(t,e):$h(t,e)},zh=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Dl(t,e):xh(t,e)},Ph=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Nl(t,e):Sh(t,e)},Rh=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Fl(t,e):kh(t,e)},Bh=(t,e)=>{Qt(t.inputs[0].dims,e.axes,e.noopWithEmptyAxes)?Al(t,e):Eh(t,e)}}),zs,Dh,Nh,yo,ey=Z(()=>{$e(),lt(),Yo(),zs=t=>{if(!t||t.length===0||t.length>2)throw new Error("ArgMinMaxOp op requires 1 or 2 inputs.");if(t[0].dataType!==1)throw new Error("Invalid input type.")},Dh=(t,e)=>{zs(t.inputs);let r=(n,a,i)=>{let s=[];for(let o=0;o=0||i.length===0)&&s.push(`input_indices[${o}] = 0;`);return[`${s.join(` -`)}`,`var value = ${n.getByIndices("input_indices")}; -var best_index : i32 = 0;`,`if (${n.getByIndices("input_indices")} ${e.selectLastIndex>0?"<=":"<"} value) { - value = ${n.getByIndices("input_indices")}; - best_index = i32(last_index); - }`,"",a.setByOffset("global_idx","best_index")]};t.compute(Li("ArgMin",{hint:e.cacheKey,inputDependencies:["rank"]},[t.inputs[0]],r,[e.axis],7,e.keepDims),{inputs:[0]})},Nh=(t,e)=>{zs(t.inputs);let r=(n,a,i)=>{let s=[];for(let o=0;o=0||i.length===0)&&s.push(`input_indices[${o}] = 0;`);return[`${s.join(` -`)}`,`var value = ${n.getByIndices("input_indices")}; -var best_index : i32 = 0;`,`if (${n.getByIndices("input_indices")} ${e.selectLastIndex>0?">=":">"} value) { - value = ${n.getByIndices("input_indices")}; - best_index = i32(last_index); - }`,"",a.setByOffset("global_idx","best_index")]};t.compute(Li("argMax",{hint:e.cacheKey,inputDependencies:["rank"]},[t.inputs[0]],r,[e.axis],7,e.keepDims),{inputs:[0]})},yo=t=>qe(t)}),Ll,Ul,Wl,Ui,Fh,Lh,Uh=Z(()=>{$e(),Ae(),lt(),Te(),Ll=(t,e)=>{if(!t||t.length<1)throw new Error("too few inputs");let r=0,n=t[r],a=n.dataType,i=n.dims.length;t.forEach((s,o)=>{if(o!==r){if(s.dataType!==a)throw new Error("input tensors should be one type");if(s.dims.length!==i)throw new Error("input tensors should have the same shape");s.dims.forEach((u,l)=>{if(l!==e&&u!==n.dims[l])throw new Error("non concat dimensions must match")})}})},Ul=(t,e)=>` - fn calculateInputIndex(index: u32) -> u32 { - let sizeInConcatAxis = array(${e}); - for (var i: u32 = 0u; i < ${t}; i += 1u ) { - if (index < sizeInConcatAxis[i]) { - return i; - } - } - return ${t}u; - }`,Wl=(t,e)=>{let r=t.length,n=[];for(let a=0;a{let a=Y.size(r),i=new Array(t.length),s=new Array(t.length),o=0,u=[],l=[],p=[{type:12,data:a}];for(let w=0;w`uniforms.sizeInConcatAxis${w}`).join(","),y=w=>` - - ${(()=>{w.registerUniform("outputSize","u32");for(let v=0;v(${c}); - ${m} -= sizeInConcatAxis[inputIndex - 1u]; - } - - ${Wl(s,f)} - }`;return{name:"Concat",shaderCache:{hint:`${e}`,inputDependencies:u},getRunData:()=>({outputs:[{dims:r,dataType:n}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:p}),getShaderSource:y}},Fh=(t,e)=>{let r=t.inputs,n=r[0].dims,a=Y.normalizeAxis(e.axis,n.length);Ll(r,a);let i=n.slice();i[a]=r.reduce((o,u)=>o+(u.dims.length>a?u.dims[a]:0),0);let s=r.filter(o=>Y.size(o.dims)>0);t.compute(Ui(s,a,i,r[0].dataType),{inputs:s})},Lh=t=>qe({axis:t.axis})}),Vl,Gl,Hl,jl,Wi,ql,Wh,Vh=Z(()=>{$e(),Ho(),Te(),Uh(),Vl=(t,e)=>{let r=t[0],n=t[1],a=t[2],i=t[3],s=t[4],o=t[5];if(s&&o)throw new Error("Attention cannot have both past and relative_position_bias");if(r.dims.length!==3)throw new Error('Input "input" must have 3 dimensions');let u=r.dims[0],l=r.dims[1],p=r.dims[2];if(a.dims.length!==1)throw new Error('Input "bias" is expected to have 1 dimensions');if(n.dims.length!==2)throw new Error('Input "weights" is expected to have 2 dimensions');if(n.dims[0]!==p)throw new Error("Input 1 dimension 0 should have same length as dimension 2 of input 0");if(a.dims[0]!==n.dims[1])throw new Error('Input "bias" dimension 0 should have same length as dimension 1 of input "weights"');let f=a.dims[0]/3,m=f,c=m;if(e.qkvHiddenSizes.length>0){if(e.qkvHiddenSizes.length!==3)throw new Error("qkv_hidden_sizes attribute should have 3 elements");for(let C of e.qkvHiddenSizes)if(C%e.numHeads!==0)throw new Error("qkv_hidden_sizes should be divisible by num_heads");f=e.qkvHiddenSizes[0],m=e.qkvHiddenSizes[1],c=e.qkvHiddenSizes[2]}let y=l;if(f!==m)throw new Error("qkv_hidden_sizes first element should be same as the second");if(a.dims[0]!==f+m+c)throw new Error('Input "bias" dimension 0 should have same length as sum of Q/K/V hidden sizes');let w=0;if(s){if(m!==c)throw new Error('Input "past" expect k_hidden_size == v_hidden_size');if(s.dims.length!==5)throw new Error('Input "past" must have 5 dimensions');if(s.dims[0]!==2)throw new Error('Input "past" first dimension must be 2');if(s.dims[1]!==u)throw new Error('Input "past" second dimension must be batch_size');if(s.dims[2]!==e.numHeads)throw new Error('Input "past" third dimension must be num_heads');if(s.dims[4]!==m/e.numHeads)throw new Error('Input "past" fifth dimension must be k_hidden_size / num_heads');e.pastPresentShareBuffer||(w=s.dims[3])}let v=y+w,k=-1,$=0;if(i)throw new Error("Mask not supported");if(s)throw new Error("past is not supported");return{batchSize:u,sequenceLength:l,pastSequenceLength:w,kvSequenceLength:y,totalSequenceLength:v,maxSequenceLength:k,inputHiddenSize:p,hiddenSize:f,vHiddenSize:c,headSize:Math.floor(f/e.numHeads),vHeadSize:Math.floor(c/e.numHeads),numHeads:e.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:e.maskFilterValue,maskType:$,scale:e.scale,broadcastResPosBias:!1,passPastInKv:!1,qkvFormat:1}},Gl=(t,e,r,n)=>{let a=it(n),i=64,s=n/a;s{let c=ge("x",e.dataType,e.dims,a),y=[{name:"d_inv",type:Tt(e.dataType)},{name:"d_comp",type:"u32"},{name:"elements_per_thread",type:"u32"}];return` - var thread_max: array; - var thread_sum: array; - ${m.registerUniforms(y).declareVariables(c)} - ${m.mainStart([i,1,1])} - let local_offset = local_idx * uniforms.elements_per_thread; - let offset = workgroup_id.x * uniforms.d_comp + local_offset; - - var thread_max_vector = ${p}(-3.402823e+38f); - for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) { - thread_max_vector = max(${p}(x[offset + i]), thread_max_vector); - } - thread_max[local_idx] = ${(()=>{switch(a){case 1:return"thread_max_vector";case 2:return"max(thread_max_vector.x, thread_max_vector.y)";case 4:return"max(max(thread_max_vector.x, thread_max_vector.y), max(thread_max_vector.z, thread_max_vector.w))";default:throw new Error(`Unsupported components: ${a}`)}})()}; - workgroupBarrier(); - - var max_value = f32(-3.402823e+38f); - for (var i = 0u; i < ${i}; i++) { - max_value = max(thread_max[i], max_value); - } - - var sum_vector = ${p}(0); - for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) { - sum_vector += exp(${p}(x[offset + i]) - max_value); - } - thread_sum[local_idx] = ${(()=>{switch(a){case 1:return"sum_vector";case 2:return"sum_vector.x + sum_vector.y";case 4:return"sum_vector.x + sum_vector.y + sum_vector.z + sum_vector.w";default:throw new Error(`Unsupported components: ${a}`)}})()}; - workgroupBarrier(); - - var sum: f32 = 0; - for (var i = 0u; i < ${i}; i++) { - sum += thread_sum[i]; - } - - if (sum == 0) { - for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) { - x[offset + i] = ${c.type.value}(uniforms.d_inv); - } - } else { - for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) { - var f32input = ${p}(x[offset + i]); - x[offset + i] = ${c.type.value}(exp(f32input - max_value) / sum); - } - } - }`};return{name:"AttentionProbsSoftmax",shaderCache:{hint:`${i};${l};${a}`},getShaderSource:f,getRunData:()=>({outputs:[],dispatchGroup:{x:r},programUniforms:u})}},Hl=(t,e,r,n,a,i,s)=>{let o=s+a.kvSequenceLength,u=[a.batchSize,a.numHeads,a.sequenceLength,o],l=i.scale===0?1/Math.sqrt(a.headSize):i.scale,p=it(a.headSize),f=a.headSize/p,m=12,c={x:Math.ceil(o/m),y:Math.ceil(a.sequenceLength/m),z:a.batchSize*a.numHeads},y=[{type:12,data:a.sequenceLength},{type:12,data:f},{type:12,data:o},{type:12,data:a.numHeads},{type:1,data:l}],w=n?["type","type","type"]:["type","type"],v=k=>{let $=Q("q",e.dataType,e.dims,p),C=Q("key",r.dataType,r.dims,p),T=[$,C];n&&T.push(Q("relative_position_bias",n.dataType,n.dims));let A=ge("output",e.dataType,u),B=Tt(1,p),R=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"alpha",type:"f32"}];return` - const TILE_SIZE = ${m}u; - - var tileQ: array<${$.type.storage}, ${m*m}>; - var tileK: array<${$.type.storage}, ${m*m}>; - ${k.registerUniforms(R).declareVariables(...T,A)} - ${k.mainStart([m,m,1])} - // x holds the N and y holds the M - let headIdx = workgroup_id.z; - let m = workgroup_id.y * TILE_SIZE; - let n = workgroup_id.x * TILE_SIZE; - let qOffset = uniforms.M * uniforms.K * headIdx + m * uniforms.K; - let kOffset = uniforms.N * uniforms.K * headIdx + n * uniforms.K; - - var value = ${B}(0); - for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { - if (global_id.y < uniforms.M && w + local_id.x < uniforms.K) { - tileQ[TILE_SIZE * local_id.y + local_id.x] = q[qOffset + local_id.y * uniforms.K + w + local_id.x]; - } - if (n + local_id.y < uniforms.N && w + local_id.x < uniforms.K) { - tileK[TILE_SIZE * local_id.y + local_id.x] = key[kOffset + local_id.y * uniforms.K + w + local_id.x]; - } - workgroupBarrier(); - - for (var k: u32 = 0u; k < TILE_SIZE && w+k < uniforms.K; k++) { - value += ${B}(tileQ[TILE_SIZE * local_id.y + k] * tileK[TILE_SIZE * local_id.x + k]); - } - - workgroupBarrier(); - } - - let headOffset = headIdx * uniforms.M * uniforms.N; - if (global_id.y < uniforms.M && global_id.x < uniforms.N) { - let outputIdx = headOffset + global_id.y * uniforms.N + global_id.x; - var sum: f32 = ${(()=>{switch(p){case 1:return"value";case 2:return"value.x + value.y";case 4:return"value.x + value.y + value.z + value.w";default:throw new Error(`Unsupported components: ${p}`)}})()}; - output[outputIdx] = ${A.type.value} (sum * uniforms.alpha) + ${n?"relative_position_bias[outputIdx]":"0.0"}; - } - }`};return{name:"AttentionProbs",shaderCache:{hint:`${p}`,inputDependencies:w},getRunData:()=>({outputs:[{dims:u,dataType:e.dataType,gpuDataType:0}],dispatchGroup:c,programUniforms:y}),getShaderSource:v}},jl=(t,e,r,n,a)=>{let i=a+n.kvSequenceLength,s=[n.batchSize,n.sequenceLength,n.vHiddenSize],o=12,u={x:Math.ceil(n.vHeadSize/o),y:Math.ceil(n.sequenceLength/o),z:n.batchSize*n.numHeads},l=[{type:12,data:n.sequenceLength},{type:12,data:i},{type:12,data:n.vHeadSize},{type:12,data:n.numHeads},{type:12,data:n.vHiddenSize}];return{name:"AttentionScore",shaderCache:{inputDependencies:["type","type"]},getRunData:()=>({outputs:[{dims:s,dataType:e.dataType,gpuDataType:0}],dispatchGroup:u,programUniforms:l}),getShaderSource:p=>{let f=Q("probs",e.dataType,e.dims),m=Q("v",r.dataType,r.dims),c=ge("output",e.dataType,s),y=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"v_hidden_size",type:"u32"}];return` - const TILE_SIZE = ${o}u; - var tileQ: array<${f.type.value}, ${o*o}>; - var tileK: array<${f.type.value}, ${o*o}>; - ${p.registerUniforms(y).declareVariables(f,m,c)} - ${p.mainStart([o,o,1])} - let headIdx = workgroup_id.z; - let m = global_id.y; - let n = global_id.x; - - let offsetA = headIdx * (uniforms.M * uniforms.K) + m * uniforms.K; - let offsetB = headIdx * (uniforms.N * uniforms.K) + n; - - var value = ${f.type.storage}(0); - for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { - if (m < uniforms.M && w + local_id.x < uniforms.K) { - tileQ[TILE_SIZE * local_id.y + local_id.x] = probs[offsetA + w + local_id.x]; - } - if (n < uniforms.N && w + local_id.y < uniforms.K) { - tileK[TILE_SIZE * local_id.y + local_id.x] = v[offsetB + (w + local_id.y) * uniforms.N]; - } - workgroupBarrier(); - for (var k: u32 = 0u; k < TILE_SIZE && w+k < uniforms.K; k++) { - value += tileQ[TILE_SIZE * local_id.y + k] * tileK[TILE_SIZE * k + local_id.x]; - } - workgroupBarrier(); - } - - // we need to transpose output from BNSH_v to BSND_v - let batchIdx = workgroup_id.z / uniforms.num_heads; - let currentBatchHeadNumber = workgroup_id.z % uniforms.num_heads; - if (m < uniforms.M && n < uniforms.N) { - let outputIdx = batchIdx * uniforms.M * uniforms.v_hidden_size + m * uniforms.v_hidden_size - + currentBatchHeadNumber * uniforms.N + n; - output[outputIdx] = value; - } - }`}}},Wi=(t,e,r,n,a,i,s,o,u,l,p)=>{let f=t.outputCount>1,m=t.outputCount>2,c=f&&m?l.pastSequenceLength:0,y=c+l.kvSequenceLength,w=[l.batchSize,l.numHeads,y,l.headSize],v=s?[s,r]:[r],k=f?t.compute(Ui(v,2,w,r.dataType),{inputs:v,outputs:[1]})[0]:r,$=[l.batchSize,l.numHeads,y,l.headSize],C=o?[o,n]:[n],T=m?t.compute(Ui(C,2,$,n.dataType),{inputs:C,outputs:[2]})[0]:n,A=[e,k];u&&A.push(u);let B=t.compute(Hl(t,e,k,u,l,p,c),{inputs:A,outputs:[-1]})[0];t.compute(Gl(t,B,l.batchSize*l.numHeads*l.sequenceLength,y),{inputs:[B],outputs:[]});let R=[B,T];t.compute(jl(t,B,T,l,c),{inputs:R,outputs:[0]})},ql=(t,e)=>{let r=[e.batchSize,e.numHeads,e.sequenceLength,e.headSize],n=e.sequenceLength,a=e.inputHiddenSize,i=e.headSize,s=12,o={x:Math.ceil(e.headSize/s),y:Math.ceil(e.sequenceLength/s),z:e.batchSize*e.numHeads},u=[t.inputs[0],t.inputs[1],t.inputs[2]],l=[{type:12,data:n},{type:12,data:a},{type:12,data:i},{type:12,data:e.numHeads},{type:12,data:e.headSize},{type:12,data:e.hiddenSize},{type:12,data:e.hiddenSize+e.hiddenSize+e.vHiddenSize}],p=f=>{let m=ge("output_q",u[0].dataType,r),c=ge("output_k",u[0].dataType,r),y=ge("output_v",u[0].dataType,r),w=Q("input",u[0].dataType,u[0].dims),v=Q("weight",u[1].dataType,u[1].dims),k=Q("bias",u[2].dataType,u[2].dims),$=w.type.storage,C=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"head_size",type:"u32"},{name:"hidden_size",type:"u32"},{name:"ldb",type:"u32"}];return` - const TILE_SIZE = ${s}u; - var tileInput: array<${$}, ${s*s}>; - var tileWeightQ: array<${$}, ${s*s}>; - var tileWeightK: array<${$}, ${s*s}>; - var tileWeightV: array<${$}, ${s*s}>; - ${f.registerUniforms(C).declareVariables(w,v,k,m,c,y)} - ${f.mainStart([s,s,1])} - let batchIndex = workgroup_id.z / uniforms.num_heads; - let headNumber = workgroup_id.z % uniforms.num_heads; - let m = global_id.y; - let n = global_id.x; - - let inputOffset = batchIndex * (uniforms.M * uniforms.K) + m * uniforms.K; - let biasOffsetQ = headNumber * uniforms.head_size; - let biasOffsetK = uniforms.hidden_size + biasOffsetQ; - let biasOffsetV = uniforms.hidden_size + biasOffsetK; - - var valueQ = ${$}(0); - var valueK = ${$}(0); - var valueV = ${$}(0); - for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) { - if (m < uniforms.M && w + local_id.x < uniforms.K) { - tileInput[TILE_SIZE * local_id.y + local_id.x] = input[inputOffset + w + local_id.x]; - } - if (n < uniforms.N && w + local_id.y < uniforms.K) { - let offset = n + (w + local_id.y) * uniforms.ldb; - tileWeightQ[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetQ + offset]; - tileWeightK[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetK + offset]; - tileWeightV[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetV + offset]; - } - workgroupBarrier(); - for (var k: u32 = 0u; k({outputs:[{dims:r,dataType:t.inputs[0].dataType,gpuDataType:0},{dims:r,dataType:t.inputs[0].dataType,gpuDataType:0},{dims:r,dataType:t.inputs[0].dataType,gpuDataType:0}],dispatchGroup:o,programUniforms:l}),getShaderSource:p},{inputs:u,outputs:[-1,-1,-1]})},Wh=(t,e)=>{let r=Vl(t.inputs,e),[n,a,i]=ql(t,r);return Wi(t,n,a,i,t.inputs[4],void 0,void 0,void 0,t.inputs[5],r,e)}}),Kl,Yl,Xl,Gh,ty=Z(()=>{ar(),$e(),Ae(),lt(),Te(),Kl=(t,e)=>{if(!t||t.length!==5)throw new Error("BatchNormalization requires 5 inputs");let r=(n,a,i)=>{let s=a.length;if(s!==n.length)throw new Error(`${i}: num dimensions != ${s}`);a.forEach((o,u)=>{if(o!==n[u])throw new Error(`${i}: dim[${u}] do not match`)})};if(t[0].dims.length>1){let n=e.format==="NHWC"?e.spatial?t[0].dims.slice(-1):t[0].dims.slice(-1).concat(t[0].dims.slice(1,t[0].dims.length-1)):t[0].dims.slice(1,e.spatial?2:void 0);r(t[1].dims,n,"Invalid input scale"),r(t[2].dims,n,"Invalid input B"),r(t[3].dims,n,"Invalid input mean"),r(t[4].dims,n,"Invalid input var")}else r(t[1].dims,[1],"Invalid input scale"),r(t[2].dims,[1],"Invalid input B"),r(t[3].dims,[1],"Invalid input mean"),r(t[4].dims,[1],"Invalid input var")},Yl=(t,e)=>{let{epsilon:r,spatial:n,format:a}=e,i=t[0].dims,s=n?it(i[i.length-1]):1,o=a==="NHWC"&&i.length>1?s:1,u=Y.size(i)/s,l=n,p=l?i.length:i,f=Q("x",t[0].dataType,t[0].dims,s),m=Q("scale",t[1].dataType,t[1].dims,o),c=Q("bias",t[2].dataType,t[2].dims,o),y=Q("inputMean",t[3].dataType,t[3].dims,o),w=Q("inputVar",t[4].dataType,t[4].dims,o),v=ge("y",t[0].dataType,p,s),k=()=>{let C="";if(n)C=`let cOffset = ${i.length===1?"0u":a==="NHWC"?`outputIndices[${i.length-1}] / ${s}`:"outputIndices[1]"};`;else if(a==="NCHW")C=` - ${v.indicesSet("outputIndices","0","0")} - let cOffset = ${v.indicesToOffset("outputIndices")};`;else{C=`var cIndices = ${m.type.indices}(0); - cIndices[0] = outputIndices[${i.length-1}];`;for(let T=1;T` - const epsilon = ${r}; - ${C.registerUniform("outputSize","u32").declareVariables(f,m,c,y,w,v)} - ${C.mainStart()} - ${C.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - var outputIndices = ${v.offsetToIndices(`global_idx * ${s}`)}; - ${k()} - let scale = ${m.getByOffset("cOffset")}; - let bias = ${c.getByOffset("cOffset")}; - let inputMean = ${y.getByOffset("cOffset")}; - let inputVar = ${w.getByOffset("cOffset")}; - let x = ${f.getByOffset("global_idx")}; - let value = (x - inputMean) * inverseSqrt(inputVar + epsilon) * scale + bias; - ${v.setByOffset("global_idx","value")} - }`;return{name:"BatchNormalization",shaderCache:{hint:`${e.epsilon}_${e.format}_${n}_${s}`,inputDependencies:l?["rank","type","type","type","type"]:void 0},getShaderSource:$,getRunData:()=>({outputs:[{dims:t[0].dims,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(u/64)},programUniforms:l?[{type:12,data:u},...ye(i)]:[{type:12,data:u}]})}},Xl=t=>qe(t),Gh=(t,e)=>{let{inputs:r,outputCount:n}=t,a=Xl({...e,outputCount:n});if(Ue.webgpu.validateInputContent&&Kl(r,a),e.trainingMode)throw new Error("BatchNormalization trainingMode is not supported yet.");t.compute(Yl(r,a))}}),Ql,Jl,Hh,ry=Z(()=>{Ae(),Te(),Ql=t=>{if(t[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![320,640,1280].includes(t[0].dims[2]))throw new Error("number of channels should be 320, 640 or 1280");if(t[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(t[0].dims[2]!==t[1].dims[0])throw new Error("last dimension of input and bias are not the same")},Jl=t=>{let e=t[0].dims,r=t[0].dims[2],n=Y.size(e)/4,a=t[0].dataType,i=Q("input",a,e,4),s=Q("bias",a,[r],4),o=Q("residual",a,e,4),u=ge("output",a,e,4);return{name:"BiasAdd",getRunData:()=>({outputs:[{dims:e,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(n/64)}}),getShaderSource:l=>` - const channels = ${r}u / 4; - ${l.declareVariables(i,s,o,u)} - - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes(n)} - let value = ${i.getByOffset("global_idx")} - + ${s.getByOffset("global_idx % channels")} + ${o.getByOffset("global_idx")}; - ${u.setByOffset("global_idx","value")} - }`}},Hh=t=>{Ql(t.inputs),t.compute(Jl(t.inputs))}}),Zl,Re,jh,qh,Kh,Yh,Xh,Qh,Jh,Zh,ef,ed,tf,rf,nf,af,Ci,sf,Ti,of,uf,lf,df,cf,pf,hf,ff,mf,gf,_f,yf,wf,bf,vf,$f,Ps,xf,wo,bo,Sf,kf,Ef,Xo=Z(()=>{$e(),Ae(),lt(),Te(),Zl=(t,e,r,n,a,i)=>{let s=Math.ceil(e/4),o="";typeof a=="string"?o=`${a}(a)`:o=a("a");let u=Q("inputData",r,[s],4),l=ge("outputData",n,[s],4);return` - ${t.registerUniform("vec_size","u32").declareVariables(u,l)} - - ${i??""} - - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} - - let a = ${u.getByOffset("global_idx")}; - ${l.setByOffset("global_idx",o)} - }`},Re=(t,e,r,n,a,i=t.dataType)=>({name:e,shaderCache:{hint:a,inputDependencies:["type"]},getShaderSource:s=>Zl(s,Y.size(t.dims),t.dataType,i,r,n),getRunData:s=>({outputs:[{dims:t.dims,dataType:i}],dispatchGroup:{x:Math.ceil(Y.size(s[0].dims)/64/4)},programUniforms:[{type:12,data:Math.ceil(Y.size(t.dims)/4)}]})}),jh=t=>{t.compute(Re(t.inputs[0],"Abs","abs"))},qh=t=>{t.compute(Re(t.inputs[0],"Acos","acos"))},Kh=t=>{t.compute(Re(t.inputs[0],"Acosh","acosh"))},Yh=t=>{t.compute(Re(t.inputs[0],"Asin","asin"))},Xh=t=>{t.compute(Re(t.inputs[0],"Asinh","asinh"))},Qh=t=>{t.compute(Re(t.inputs[0],"Atan","atan"))},Jh=t=>{t.compute(Re(t.inputs[0],"Atanh","atanh"))},Zh=t=>qe(t),ef=(t,e)=>{let r;switch(e.to){case 10:r="vec4";break;case 1:r="vec4";break;case 12:r="vec4";break;case 6:r="vec4";break;case 9:r="vec4";break;default:throw new RangeError(`not supported type (specified in attribute 'to' from 'Cast' operator): ${e.to}`)}t.compute(Re(t.inputs[0],"Cast",r,void 0,e.cacheKey,e.to))},ed=t=>{let e=t.length>=2&&t[1].data!==0?t[1].getFloat32Array()[0]:jo,r=t.length>=3&&t[2].data!==0?t[2].getFloat32Array()[0]:qo;return qe({min:e,max:r})},tf=(t,e)=>{let r=t.inputs.length===1?e:ed(t.inputs),n=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"Clip",a=>`clamp(${a}, clip_min_, clip_max_)`,` - const clip_min_: vec4<${n}> = vec4(${n}(${r.min})); - const clip_max_: vec4<${n}> = vec4(${n}(${r.max})); -`,r.cacheKey),{inputs:[0]})},rf=t=>{t.compute(Re(t.inputs[0],"Ceil","ceil"))},nf=t=>{t.compute(Re(t.inputs[0],"Cos","cos"))},af=t=>{t.compute(Re(t.inputs[0],"Cosh","cosh"))},Ci=t=>qe(t),sf=(t,e)=>{let r=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"Elu",n=>`elu_vf32(${n})`,` - const elu_alpha_ = ${r}(${e.alpha}); - - fn elu_f32(a: ${r}) -> ${r} { - return select((exp(a) - 1.0) * elu_alpha_, a, a >= 0.0); - } - - fn elu_vf32(v: vec4<${r}>) -> vec4<${r}> { - return vec4(elu_f32(v.x), elu_f32(v.y), elu_f32(v.z), elu_f32(v.w)); - }`,e.cacheKey))},Ti=(t="f32")=>` -const r0: ${t} = 0.3275911; -const r1: ${t} = 0.254829592; -const r2: ${t} = -0.284496736; -const r3: ${t} = 1.421413741; -const r4: ${t} = -1.453152027; -const r5: ${t} = 1.061405429; - -fn erf_vf32(v: vec4<${t}>) -> vec4<${t}> { - let absv = abs(v); - let x = 1.0 / (1.0 + r0 * absv); - return sign(v) * (1.0 - ((((r5 * x + r4) * x + r3) * x + r2) * x + r1) * x * exp(-absv * absv)); -}`,of=t=>{let e=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"Erf",r=>`erf_vf32(${r})`,Ti(e)))},uf=t=>{t.compute(Re(t.inputs[0],"Exp","exp"))},lf=t=>{t.compute(Re(t.inputs[0],"Floor","floor"))},df=t=>{let e=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"Gelu",r=>`0.5 * ${r} * (1.0 + erf_vf32(${r} * 0.7071067811865475))`,Ti(e)))},cf=(t,e)=>{let r=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"LeakyRelu",n=>`select(leaky_relu_alpha_ * ${n}, ${n}, ${n} >= vec4<${r}>(0.0))`,`const leaky_relu_alpha_ = ${r}(${e.alpha});`,e.cacheKey))},pf=t=>{t.compute(Re(t.inputs[0],"Not",e=>`!${e}`))},hf=t=>{t.compute(Re(t.inputs[0],"Neg",e=>`-${e}`))},ff=t=>{t.compute(Re(t.inputs[0],"Reciprocal",e=>`1.0/${e}`))},mf=t=>{let e=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"Relu",r=>`select(vec4<${e}>(0.0), ${r}, ${r} > vec4<${e}>(0.0))`))},gf=t=>{t.compute(Re(t.inputs[0],"Sigmoid",e=>`(1.0 / (1.0 + exp(-${e})))`))},_f=t=>qe(t),yf=(t,e)=>{let r=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"HardSigmoid",n=>`max(vec4<${r}>(0.0), min(vec4<${r}>(1.0), ${e.alpha} * ${n} + vec4<${r}>(${e.beta})))`,void 0,e.cacheKey))},wf=t=>{t.compute(Re(t.inputs[0],"Sin","sin"))},bf=t=>{t.compute(Re(t.inputs[0],"Sinh","sinh"))},vf=t=>{t.compute(Re(t.inputs[0],"Sqrt","sqrt"))},$f=t=>{t.compute(Re(t.inputs[0],"Tan","tan"))},Ps=t=>`sign(${t}) * (1 - exp(-2 * abs(${t}))) / (1 + exp(-2 * abs(${t})))`,xf=t=>{t.compute(Re(t.inputs[0],"Tanh",Ps))},wo=(t="f32")=>` -const fast_gelu_a: ${t} = 0.5; -const fast_gelu_b: ${t} = 0.7978845608028654; -const fast_gelu_c: ${t} = 0.035677408136300125; - -fn tanh_v(v: vec4<${t}>) -> vec4<${t}> { - return ${Ps("v")}; -} -`,bo=t=>`(fast_gelu_a + fast_gelu_a * tanh_v(${t} * (fast_gelu_c * ${t} * ${t} + fast_gelu_b))) * ${t}`,Sf=t=>{let e=Tt(t.inputs[0].dataType);t.compute(Re(t.inputs[0],"FastGelu",bo,wo(e),void 0,t.inputs[0].dataType))},kf=(t,e)=>{let r=Tt(t.inputs[0].dataType);return t.compute(Re(t.inputs[0],"ThresholdedRelu",n=>`select(vec4<${r}>(0.0), ${n}, ${n} > thresholded_relu_alpha_)`,`const thresholded_relu_alpha_ = vec4<${r}>(${e.alpha});`,e.cacheKey)),0},Ef=t=>{t.compute(Re(t.inputs[0],"Log","log"))}}),td,rd,Cf,ny=Z(()=>{Ae(),Te(),Xo(),td=t=>{if(t[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![2560,5120,10240].includes(t[0].dims[2]))throw new Error("hidden state should be 2560, 5120 or 10240");if(t[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(t[0].dims[2]!==t[1].dims[0])throw new Error("last dimension of input and bias are not the same")},rd=t=>{let e=t[0].dims.slice();e[2]=e[2]/2;let r=Q("input",t[0].dataType,t[0].dims,4),n=Q("bias",t[0].dataType,[t[0].dims[2]],4),a=ge("output",t[0].dataType,e,4),i=Y.size(e)/4,s=pt(t[0].dataType);return{name:"BiasSplitGelu",getRunData:()=>({outputs:[{dims:e,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(i/64)}}),getShaderSource:o=>` - const M_SQRT2 = sqrt(2.0); - const halfChannels = ${t[0].dims[2]/4/2}u; - - ${o.declareVariables(r,n,a)} - - ${Ti(s)} - - ${o.mainStart()} - ${o.guardAgainstOutOfBoundsWorkgroupSizes(i)} - let biasIdx = global_idx % halfChannels; - let batchIndex = global_idx / halfChannels; - let inputOffset = biasIdx + batchIndex * halfChannels * 2; - let valueLeft = input[inputOffset] + bias[biasIdx]; - let valueRight = input[inputOffset + halfChannels] + bias[biasIdx + halfChannels]; - let geluRight = valueRight * 0.5 * (erf_vf32(valueRight / M_SQRT2) + 1); - - ${a.setByOffset("global_idx","valueLeft * geluRight")} - }`}},Cf=t=>{td(t.inputs),t.compute(rd(t.inputs))}}),nd,ad,Jt,Tf,If,Af,Mf,Of,zf,Pf,Rf,Bf,Df,ay=Z(()=>{$e(),Ae(),Te(),nd=(t,e,r,n,a,i,s,o,u,l,p,f)=>{let m,c;typeof o=="string"?m=c=($,C)=>`${o}((${$}),(${C}))`:typeof o=="function"?m=c=o:(m=o.scalar,c=o.vector);let y=ge("outputData",p,n.length,4),w=Q("aData",u,e.length,4),v=Q("bData",l,r.length,4),k;if(a)if(i){let $=Y.size(e)===1,C=Y.size(r)===1,T=e.length>0&&e[e.length-1]%4===0,A=r.length>0&&r[r.length-1]%4===0;$||C?k=y.setByOffset("global_idx",c($?`${w.type.value}(${w.getByOffset("0")}.x)`:w.getByOffset("global_idx"),C?`${v.type.value}(${v.getByOffset("0")}.x)`:v.getByOffset("global_idx"))):k=` - let outputIndices = ${y.offsetToIndices("global_idx * 4u")}; - let offsetA = ${w.broadcastedIndicesToOffset("outputIndices",y)}; - let offsetB = ${v.broadcastedIndicesToOffset("outputIndices",y)}; - ${y.setByOffset("global_idx",c(s||T?w.getByOffset("offsetA / 4u"):`${w.type.value}(${w.getByOffset("offsetA / 4u")}[offsetA % 4u])`,s||A?v.getByOffset("offsetB / 4u"):`${v.type.value}(${v.getByOffset("offsetB / 4u")}[offsetB % 4u])`))} - `}else k=y.setByOffset("global_idx",c(w.getByOffset("global_idx"),v.getByOffset("global_idx")));else{if(!i)throw new Error("no necessary to use scalar implementation for element-wise binary op implementation.");let $=(C,T,A="")=>{let B=`aData[indexA${T}][componentA${T}]`,R=`bData[indexB${T}][componentB${T}]`;return` - let outputIndices${T} = ${y.offsetToIndices(`global_idx * 4u + ${T}u`)}; - let offsetA${T} = ${w.broadcastedIndicesToOffset(`outputIndices${T}`,y)}; - let offsetB${T} = ${v.broadcastedIndicesToOffset(`outputIndices${T}`,y)}; - let indexA${T} = offsetA${T} / 4u; - let indexB${T} = offsetB${T} / 4u; - let componentA${T} = offsetA${T} % 4u; - let componentB${T} = offsetB${T} % 4u; - ${C}[${T}] = ${A}(${m(B,R)}); - `};p===9?k=` - var data = vec4(0); - ${$("data",0,"u32")} - ${$("data",1,"u32")} - ${$("data",2,"u32")} - ${$("data",3,"u32")} - outputData[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:k=` - ${$("outputData[global_idx]",0)} - ${$("outputData[global_idx]",1)} - ${$("outputData[global_idx]",2)} - ${$("outputData[global_idx]",3)} - `}return` - ${t.registerUniform("vec_size","u32").declareVariables(w,v,y)} - - ${f??""} - - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} - ${k} - }`},ad=(t,e,r,n,a,i,s=r.dataType)=>{let o=!Y.areEqual(r.dims,n.dims),u=r.dims,l=Y.size(r.dims),p=!1,f=!1,m=[o];if(o){let c=En.calcShape(r.dims,n.dims,!1);if(!c)throw new Error("Can't perform binary op on the given tensors");u=c,l=Y.size(u);let y=Y.size(r.dims)===1,w=Y.size(n.dims)===1,v=r.dims.length>0&&r.dims[r.dims.length-1]%4===0,k=n.dims.length>0&&n.dims[n.dims.length-1]%4===0;m.push(y),m.push(w),m.push(v),m.push(k);let $=1;for(let C=1;Cc.toString()).join("_"),inputDependencies:["rank","rank"]},getShaderSource:c=>nd(c,r.dims,n.dims,u,p,o,f,a,r.dataType,n.dataType,s,i),getRunData:()=>({outputs:[{dims:u,dataType:s}],dispatchGroup:{x:Math.ceil(l/64/4)},programUniforms:[{type:12,data:Math.ceil(Y.size(u)/4)},...ye(r.dims,n.dims,u)]})}},Jt=(t,e,r,n,a,i)=>{t.compute(ad(e,a??"",t.inputs[0],t.inputs[1],r,n,i))},Tf=t=>{Jt(t,"Add",(e,r)=>`${e}+${r}`)},If=t=>{Jt(t,"Div",(e,r)=>`${e}/${r}`)},Af=t=>{Jt(t,"Equal",{scalar:(e,r)=>`u32(${e}==${r})`,vector:(e,r)=>`vec4(${e}==${r})`},void 0,void 0,9)},Mf=t=>{Jt(t,"Mul",(e,r)=>`${e}*${r}`)},Of=t=>{let e=Q("input",t.inputs[0].dataType,t.inputs[0].dims).type.value;Jt(t,"Pow",{scalar:(r,n)=>`pow_custom(${r},${n})`,vector:(r,n)=>`pow_vector_custom(${r},${n})`},` - fn pow_custom(a : ${e}, b : ${e}) -> ${e} { - if (b == ${e}(0.0)) { - return ${e}(1.0); - } else if (a < ${e}(0.0) && f32(b) != floor(f32(b))) { - return ${e}(pow(f32(a), f32(b))); // NaN - } - return select(sign(a), ${e}(1.0), round(f32(abs(b) % ${e}(2.0))) != 1.0) * ${e}(${e==="i32"?"round":""}(pow(f32(abs(a)), f32(b)))); - } - fn pow_vector_custom(a : vec4<${e}>, b : vec4<${e}>) -> vec4<${e}> { - // TODO: implement vectorized pow - return vec4<${e}>(pow_custom(a.x, b.x), pow_custom(a.y, b.y), pow_custom(a.z, b.z), pow_custom(a.w, b.w)); - } - `)},zf=t=>{Jt(t,"Sub",(e,r)=>`${e}-${r}`)},Pf=t=>{Jt(t,"Greater",{scalar:(e,r)=>`u32(${e}>${r})`,vector:(e,r)=>`vec4(${e}>${r})`},void 0,void 0,9)},Rf=t=>{Jt(t,"Less",{scalar:(e,r)=>`u32(${e}<${r})`,vector:(e,r)=>`vec4(${e}<${r})`},void 0,void 0,9)},Bf=t=>{Jt(t,"GreaterOrEqual",{scalar:(e,r)=>`u32(${e}>=${r})`,vector:(e,r)=>`vec4(${e}>=${r})`},void 0,void 0,9)},Df=t=>{Jt(t,"LessOrEqual",{scalar:(e,r)=>`u32(${e}<=${r})`,vector:(e,r)=>`vec4(${e}<=${r})`},void 0,void 0,9)}}),en,tn,rn,Qo,an=Z(()=>{$e(),Ae(),en=(t,e,r="f32")=>{switch(t.activation){case"Relu":return`value = max(value, ${e}(0.0));`;case"Sigmoid":return`value = (${e}(1.0) / (${e}(1.0) + exp(-value)));`;case"Clip":return`value = clamp(value, ${e}(${r}(uniforms.clip_min)), ${e}(${r}(uniforms.clip_max)));`;case"HardSigmoid":return`value = max(${e}(0.0), min(${e}(1.0), ${r}(uniforms.alpha) * value + ${r}(uniforms.beta)));`;case"LeakyRelu":return`value = select(${r}(uniforms.alpha) * value, value, value >= ${e}(0.0));`;case"":return"";default:throw new Error(`Unsupported activation ${t.activation}`)}},tn=(t,e)=>{t.activation==="Clip"?e.push({type:1,data:t.clipMax},{type:1,data:t.clipMin}):t.activation==="HardSigmoid"?e.push({type:1,data:t.alpha},{type:1,data:t.beta}):t.activation==="LeakyRelu"&&e.push({type:1,data:t.alpha})},rn=(t,e)=>{t.activation==="Clip"?e.push({name:"clip_max",type:"f32"},{name:"clip_min",type:"f32"}):t.activation==="HardSigmoid"?e.push({name:"alpha",type:"f32"},{name:"beta",type:"f32"}):t.activation==="LeakyRelu"&&e.push({name:"alpha",type:"f32"})},Qo=t=>{let e=t?.activation||"";if(e==="HardSigmoid"){let[r,n]=t?.activation_params||[.2,.5];return{activation:e,alpha:r,beta:n}}else if(e==="Clip"){let[r,n]=t?.activation_params||[jo,qo];return{activation:e,clipMax:n,clipMin:r}}else if(e==="LeakyRelu"){let[r]=t?.activation_params||[.01];return{activation:e,alpha:r}}return{activation:e}}}),wt,Jo,Zo=Z(()=>{wt=(t,e)=>{switch(t){case 1:return e;case 2:return`vec2<${e}>`;case 3:return`vec3<${e}>`;case 4:return`vec4<${e}>`;default:throw new Error(`${t}-component is not supported.`)}},Jo=t=>` - ${t?"value = value + getBiasByOutputCoords(coords);":""} - `}),eu,Nf=Z(()=>{eu=t=>` -fn getIndexFromCoords4D(coords : vec4, shape : vec4) -> i32 { - return dot(coords, vec4( - shape.y * shape.z * shape.w, shape.z * shape.w, shape.w, 1)); -} -fn getOutputIndexFromCoords(coords : vec4) -> i32 { - return dot(coords, vec4( - i32(${t}.x), i32(${t}.y), i32(${t}.z), 1)); -} -`}),id,sd,Vi,Rs,od,Gi,ud,tu,Xi=Z(()=>{$e(),Ae(),Te(),an(),Zo(),id=(t,e)=>t?` - mm_Asub[inputRow][inputCol] = mm_readA(batch, - kStart + inputRow, - globalRowStart / innerElementSize + inputCol${e?", batchIndices":""}); - `:` - mm_Asub[inputRow][inputCol] = mm_readA(batch, - globalRow + innerRow, - kStart / innerElementSize + inputCol${e?", batchIndices":""}); - `,sd=(t,e)=>t?` - let ACached0 = mm_Asub[k * innerElementSize][localRow]; - let ACached1 = mm_Asub[k * innerElementSize + 1][localRow]; - let ACached2 = mm_Asub[k * innerElementSize + 2][localRow]; - ${e===3?"":"let ACached3 = mm_Asub[k * innerElementSize + 3][localRow];"} - for (var i = 0; i < rowPerThread; i = i + 1) { - acc[i] = BCached0 * ACached0[i] + acc[i]; - acc[i] = BCached1 * ACached1[i] + acc[i]; - acc[i] = BCached2 * ACached2[i] + acc[i]; - ${e===3?"":"acc[i] = BCached3 * ACached3[i] + acc[i];"} - }`:` - for (var i = 0; i < rowPerThread; i = i + 1) { - let ACached = mm_Asub[tileRow + i][k]; - acc[i] = BCached0 * ACached.x + acc[i]; - acc[i] = BCached1 * ACached.y + acc[i]; - acc[i] = BCached2 * ACached.z + acc[i]; - ${e===3?"":"acc[i] = BCached3 * ACached.w + acc[i];"} - }`,Vi=(t,e,r="f32",n,a=!1,i=32,s=!1,o=32)=>{let u=e[1]*t[1],l=e[0]*t[0],p=a?u:i,f=a?i:u,m=p/e[0],c=i/e[1];if(!((a&&m===4&&t[1]===4||!a&&(m===3||m===4))&&p%e[0]===0&&i%e[1]===0&&t[0]===4))throw new Error(`If transposeA ${a} is true, innerElementSize ${m} and workPerThread[1] ${t[1]} must be 4. - Otherwise, innerElementSize ${m} must be 3 or 4. - tileAWidth ${p} must be divisible by workgroupSize[0]${e[0]}. tileInner ${i} must be divisible by workgroupSize[1] ${e[1]}. colPerThread ${t[0]} must be 4.`);return` -var mm_Asub: array, ${p/m}>, ${f}>; -var mm_Bsub: array, ${l/t[0]}>, ${i}>; - -const rowPerThread = ${t[1]}; -const colPerThread = ${t[0]}; -const innerElementSize = ${m}; -const tileInner = ${i}; - -@compute @workgroup_size(${e[0]}, ${e[1]}, ${e[2]}) -fn main(@builtin(local_invocation_id) localId : vec3, - @builtin(global_invocation_id) globalId : vec3, - @builtin(workgroup_id) workgroupId : vec3) { - let localRow = i32(localId.y); - let tileRow = localRow * rowPerThread; - let tileCol = i32(localId.x); - - let globalRow =i32(globalId.y) * rowPerThread; - let globalCol = i32(globalId.x); - let batch = ${s?"0":"i32(globalId.z)"}; - ${n?`let batchIndices = ${n.offsetToIndices("u32(batch)")};`:""} - let globalRowStart = i32(workgroupId.y) * ${u}; - - let num_tiles = ${s?`${Math.ceil(o/i)}`:"(uniforms.dim_inner - 1) / tileInner + 1"}; - var kStart = ${s?`i32(globalId.z) * ${o}`:"0"}; - - var acc: array, rowPerThread>; - - // Loop over shared dimension. - let tileRowB = localRow * ${c}; - for (var t = 0; t < num_tiles; t = t + 1) { - // Load one tile of A into local memory. - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - let inputRow = tileRow + innerRow; - let inputCol = tileCol; - ${id(a,n)} - } - - // Load one tile of B into local memory. - for (var innerRow = 0; innerRow < ${c}; innerRow = innerRow + 1) { - let inputRow = tileRowB + innerRow; - let inputCol = tileCol; - mm_Bsub[inputRow][inputCol] = mm_readB(batch, kStart + inputRow, globalCol${n?", batchIndices":""}); - } - kStart = kStart + tileInner; - workgroupBarrier(); - - // Compute acc values for a single thread. - for (var k = 0; k < tileInner / innerElementSize; k = k + 1) { - let BCached0 = mm_Bsub[k * innerElementSize][tileCol]; - let BCached1 = mm_Bsub[k * innerElementSize + 1][tileCol]; - let BCached2 = mm_Bsub[k * innerElementSize + 2][tileCol]; - ${m===3?"":"let BCached3 = mm_Bsub[k * innerElementSize + 3][tileCol];"} - - ${sd(a,m)} - } - - workgroupBarrier(); - } - - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - mm_write(batch, globalRow + innerRow, globalCol, acc[innerRow]); - } -}`},Rs=(t,e)=>t?` - mm_Asub[inputRow][inputCol] = mm_readA(batch, - kStart + inputRow, - globalRowStart + inputCol${e?", batchIndices":""}); - `:` - mm_Asub[inputRow][inputCol] = mm_readA(batch, - globalRowStart + inputRow, - kStart + inputCol${e?", batchIndices":""}); - `,od=t=>t?"let ACached = mm_Asub[k][tileRow + innerRow];":"let ACached = mm_Asub[tileRow + innerRow][k];",Gi=(t,e,r="f32",n,a=!1,i=32,s=!1,o=32,u=!1)=>{let l=t[1]*e[1],p=t[0]*e[0],f=a?l:i,m=a?i:l;if(!(m%e[1]===0&&f%e[0]===0&&i%e[1]===0))throw new Error(`tileAHight ${m} must be divisible by workgroupSize[1]${e[1]}, tileAWidth ${f} must be divisible by workgroupSize[0]${e[0]}, tileInner ${i} must be divisible by workgroupSize[1]${e[1]}`);let c=m/e[1],y=f/e[0],w=i/e[1],v=u?` - let localRow = i32(localId.y); - let localCol = i32(localId.x); - let globalRowStart = i32(workgroupId.y) * ${l}; - let globalColStart = i32(workgroupId.x) * ${p}; - - // Loop over shared dimension. - for (var t = 0; t < num_tiles; t = t + 1) { - // Load one tile of A into local memory. - for (var inputRow = localRow; inputRow < ${m}; inputRow = inputRow + ${e[1]}) { - for (var inputCol = localCol; inputCol < ${f}; inputCol = inputCol + ${e[0]}) { - ${Rs(a,n)} - } - } - // Load one tile of B into local memory. - for (var inputRow = localRow; inputRow < ${i}; inputRow = inputRow + ${e[1]}) { - for (var inputCol = localCol; inputCol < ${p}; inputCol = inputCol + ${e[0]}) { - mm_Bsub[inputRow][inputCol] = mm_readB(batch, - kStart + inputRow, - globalColStart + inputCol${n?", batchIndices":""}); - } - } - kStart = kStart + tileInner; - workgroupBarrier(); - - // Compute acc values for a single thread. - var BCached : array<${r}, colPerThread>; - for (var k = 0; k < tileInner; k = k + 1) { - for (var inner = 0; inner < colPerThread; inner = inner + 1) { - BCached[inner] = mm_Bsub[k][localCol + inner * ${e[0]}]; - } - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - let ACached = ${a?`mm_Asub[k][localRow + innerRow * ${e[1]}];`:`mm_Asub[localRow + innerRow * ${e[1]}][k];`} - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - acc[innerRow][innerCol] = acc[innerRow][innerCol] + - ACached * BCached[innerCol]; - } - } - } - workgroupBarrier(); - } - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - let gRow = globalRowStart + localRow + innerRow * ${e[1]}; - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - let gCol = globalColStart + localCol + innerCol * ${e[0]}; - mm_write(batch, gRow, gCol, acc[innerRow][innerCol]); - } - } - `:` -let tileRow = i32(localId.y) * rowPerThread; -let tileCol = i32(localId.x) * colPerThread; - -let globalRow = i32(globalId.y) * rowPerThread; -let globalCol = i32(globalId.x) * colPerThread; -let globalRowStart = i32(workgroupId.y) * ${l}; - -let tileRowA = i32(localId.y) * ${c}; -let tileColA = i32(localId.x) * ${y}; -let tileRowB = i32(localId.y) * ${w}; -// Loop over shared dimension. -for (var t = 0; t < num_tiles; t = t + 1) { - // Load one tile of A into local memory. - for (var innerRow = 0; innerRow < ${c}; innerRow = innerRow + 1) { - for (var innerCol = 0; innerCol < ${y}; innerCol = innerCol + 1) { - let inputRow = tileRowA + innerRow; - let inputCol = tileColA + innerCol; - ${Rs(a,n)} - } - } - - // Load one tile of B into local memory. - for (var innerRow = 0; innerRow < ${w}; innerRow = innerRow + 1) { - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - let inputRow = tileRowB + innerRow; - let inputCol = tileCol + innerCol; - mm_Bsub[inputRow][inputCol] = mm_readB(batch, - kStart + inputRow, - globalCol + innerCol${n?", batchIndices":""}); - } - } - kStart = kStart + tileInner; - workgroupBarrier(); - - // Compute acc values for a single thread. - var BCached : array<${r}, colPerThread>; - for (var k = 0; k < tileInner; k = k + 1) { - for (var inner = 0; inner < colPerThread; inner = inner + 1) { - BCached[inner] = mm_Bsub[k][tileCol + inner]; - } - - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - ${od(a)} - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - acc[innerRow][innerCol] = acc[innerRow][innerCol] + ACached * BCached[innerCol]; - } - } - } - - workgroupBarrier(); -} - -for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - mm_write(batch, globalRow + innerRow, globalCol + innerCol, - acc[innerRow][innerCol]); - } -} -`;return` - var mm_Asub : array, ${m}>; - var mm_Bsub : array, ${i}>; - const rowPerThread = ${t[1]}; - const colPerThread = ${t[0]}; - const tileInner = ${i}; - -@compute @workgroup_size(${e[0]}, ${e[1]}, ${e[2]}) -fn main(@builtin(local_invocation_id) localId : vec3, - @builtin(global_invocation_id) globalId : vec3, - @builtin(workgroup_id) workgroupId : vec3) { - let batch = ${s?"0":"i32(globalId.z)"}; - ${n?`let batchIndices = ${n.offsetToIndices("u32(batch)")};`:""} - let num_tiles = ${s?`${Math.ceil(o/i)}`:"(uniforms.dim_inner - 1) / tileInner + 1"}; - var kStart = ${s?`i32(globalId.z) * ${o}`:"0"}; - - var acc : array, rowPerThread>; - - // Without this initialization strange values show up in acc. - for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) { - for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) { - acc[innerRow][innerCol] = 0.0; - } - } - ${v} - } -`},ud=(t,e,r,n,a,i=!1)=>{let[s,o,u]=a,[l,p,f,m]=n,c=_a(s,u),y=_a(o,u),w=pt(n[0].type.tensor),v=()=>{let $=p.rank,C=l.rank,T=`var aIndices: ${p.type.indices};`;for(let A=$-2-1,B=C-1;A>=0;A--,B--)T+=` -aIndices[${A}] = ${C>1?`batchIndices[${B}]`:"batchIndices"};`;return c.forEach(A=>{T+=` -aIndices[${A}] = 0;`}),T+=` -aIndices[${$-2}] = u32(row); - aIndices[${$-1}] = u32(colIn);`,T},k=()=>{let $=f.rank,C=l.rank,T=`var bIndices: ${f.type.indices};`;for(let A=$-2-1,B=C-1;A>=0;A--,B--)T+=` -bIndices[${A}] = ${C>1?`batchIndices[${B}]`:"batchIndices"};`;return y.forEach(A=>{T+=` -bIndices[${A}] = 0;`}),T+=` -bIndices[${$-2}] = u32(row); - bIndices[${$-1}] = u32(colIn);`,T};return` - fn mm_readA(batch: i32, row: i32, colIn: i32, batchIndices: ${l.type.indices}) -> ${wt(t,w)} { - var value = ${wt(t,w)}(0.0); - let col = colIn * ${t}; - if(row < uniforms.dim_a_outer && col < uniforms.dim_inner) - { - ${v()} - value = ${p.getByIndices("aIndices")}; - } - return value; - } - - fn mm_readB(batch: i32, row: i32, colIn: i32, batchIndices: ${l.type.indices}) -> ${wt(t,w)} { - var value = ${wt(t,w)}(0.0); - let col = colIn * ${t}; - if(row < uniforms.dim_inner && col < uniforms.dim_b_outer) - { - ${k()} - value = ${f.getByIndices("bIndices")}; - } - return value; - } - - fn mm_write(batch: i32, row: i32, colIn: i32, valueIn: ${wt(t,w)}) { - let col = colIn * ${t}; - if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) { - var value = valueIn; - let coords = vec3(batch, row, colIn); - ${e?`value = value + ${i?"bias[colIn]":`${wt(t,w)}(bias[row])`};`:""} - ${r} - ${m.setByIndices("vec3(coords)","value")} - } - } - `},tu=(t,e,r,n,a=!1)=>{let i=t[0].dims,s=t[1].dims,o=i.slice(0,-2),u=s.slice(0,-2),l=n?n.slice(0,-2):r.slice(0,-2),p=Y.size(l),f=i[i.length-2],m=i[i.length-1],c=s[s.length-1],y=m%4===0&&c%4===0,w=f<=8?[4,1,1]:[4,4,1],v=[8,8,1],k=[Math.ceil(c/v[0]/w[0]),Math.ceil(f/v[1]/w[1]),Math.ceil(p/v[2]/w[2])],$=y?4:1,C=[...o,f,m/$],T=C.length,A=[...u,m,c/$],B=A.length,R=[p,f,c/$],D=[{type:6,data:f},{type:6,data:c},{type:6,data:m}];tn(e,D),D.push(...ye(l,C,A));let K=["rank","rank"],j=t.length>2;j&&(D.push(...ye(t[2].dims)),K.push("rank")),D.push(...ye(R));let ie=te=>{let oe=l.length,re=Ko("batchDims",t[0].dataType,oe,1),M=pt(t[0].dataType),P=Q("a",t[0].dataType,T,$),H=Q("b",t[1].dataType,B,$),le=ge("result",t[0].dataType,R.length,$),G=[P,H];if(j){let Ce=a?$:1;G.push(Q("bias",t[2].dataType,t[2].dims.length,Ce))}let ne=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"}];rn(e,ne);let N=pt(le.type.tensor),ae=en(e,le.type.value,N),fe=ud($,j,ae,[re,P,H,le],[o,u,l],a);return` - ${te.registerUniforms(ne).registerInternalVariables(re).declareVariables(...G,le)} - ${fe} - ${y?Vi(w,v,M,re):Gi(w,v,M,re)} - `};return{name:"MatMul",shaderCache:{hint:`${w};${e.activation};${y};${a}`,inputDependencies:K},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:k[0],y:k[1],z:k[2]},programUniforms:D}),getShaderSource:ie}}}),ld,Ff,iy=Z(()=>{$e(),nn(),Te(),an(),Zo(),Nf(),Xi(),ld=(t,e,r,n,a=!1,i,s=4,o=4,u=4,l="f32")=>{let p=K=>{switch(K){case 1:return"resData = x[xIndex];";case 3:return`resData = vec3<${l}>(x[xIndex], x[xIndex + 1], x[xIndex + 2]);`;case 4:return"resData = x[xIndex / 4];";default:throw new Error(`innerElementSize ${K} is not supported.`)}},f=K=>{switch(K){case 1:return"return w[row * i32(uniforms.w_shape[3]) + colIn];";case 4:return"return w[row * i32(uniforms.w_shape[3]) / 4 + colIn];";default:throw new Error(`innerElementSize ${K} is not supported.`)}},m=t?` - let coord = vec4(batch, xRow, xCol, xCh); - `:` - let coord = vec4(batch, xCh, xRow, xCol); - `,c=t?` - let coords = vec4( - batch, - row / outWidth, - row % outWidth, - col); - `:` - let coords = vec4( - batch, - row, - col / outWidth, - col % outWidth); - `,y=t?"i32(uniforms.x_shape[1])":"i32(uniforms.x_shape[2])",w=t?"i32(uniforms.x_shape[2])":"i32(uniforms.x_shape[3])",v=t?"row":"col",k=t?"col":"row",$=` - let inChannels = i32(uniforms.w_shape[2]); - let outWidth = ${t?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; - let outRow = ${v} / outWidth; - let outCol = ${v} % outWidth; - - let WRow = ${k} / (i32(uniforms.w_shape[1]) * inChannels); - let WCol = ${k} / inChannels % i32(uniforms.w_shape[1]); - let xRow = outRow * uniforms.stride[0] + uniforms.dilation[0] * WRow - uniforms.pad[0]; - let xCol = outCol * uniforms.stride[1] + uniforms.dilation[1] * WCol - uniforms.pad[1]; - let xCh = ${k} % inChannels; - var resData = ${wt(s,l)}(0.0); - // The bounds checking is always needed since we use it to pad zero for - // the 'same' padding type. - if (xRow >= 0 && xRow < ${y} && xCol >= 0 && xCol < ${w}) { - ${m} - let xIndex = getIndexFromCoords4D(coord, vec4(uniforms.x_shape)); - ${p(s)} - } - return resData;`,C=t?e&&n?` - let col = colIn * ${s}; - ${$}`:` - let col = colIn * ${s}; - if (row < uniforms.dim_a_outer && col < uniforms.dim_inner) { - ${$} - } - return ${wt(s,l)}(0.0);`:n&&r?` - let col = colIn * ${s}; - ${$}`:` - let col = colIn * ${s}; - if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) { - ${$} - } - return ${wt(s,l)}(0.0);`,T=`${f(o)}`,A=wt(u,l),B=wt(t?s:o,l),R=wt(t?o:s,l),D=en(i,A,l);return` - fn mm_readA(batch: i32, row : i32, colIn : i32) -> ${B} { - ${t?C:T} - } - - fn mm_readB(batch: i32, row : i32, colIn : i32) -> ${R} { - ${t?T:C} - } - - fn mm_write(batch: i32, row : i32, colIn : i32, valueIn : ${A}) { - let col = colIn * ${u}; - if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) - { - var value = valueIn; - let outWidth = ${t?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; - ${c} - ${Jo(a)} - ${D} - setOutputAtCoords(coords[0], coords[1], coords[2], coords[3], value); - } - }`},Ff=(t,e,r,n,a,i,s,o)=>{let u=e.format==="NHWC",l=u?t[0].dims[3]:t[0].dims[1],p=r[0],f=u?r[2]:r[3],m=u?r[1]:r[2],c=u?r[3]:r[1],y=u&&(l%4===0||l%3===0)&&c%4===0,w=u?c:f*m,v=u?f*m:c,k=[8,8,1],$=n<=8?[4,1,1]:[4,4,1],C=[Math.ceil(w/k[0]/$[0]),Math.ceil(v/k[1]/$[1]),Math.ceil(p/k[2]/$[2])];rt("verbose",()=>`[conv2d_mm_webgpu] dispatch = ${C}`);let T=y?u&&l%4!==0?3:4:1,A=k[1]*$[1],B=k[0]*$[0],R=Math.max(k[0]*T,k[1]),D=n%A===0,K=a%B===0,j=i%R===0,ie=y?[T,4,4]:[1,1,1],te=[{type:6,data:n},{type:6,data:a},{type:6,data:i},{type:6,data:[e.pads[0],e.pads[1]]},{type:6,data:e.strides},{type:6,data:e.dilations}];tn(e,te),te.push(...ye(t[0].dims,t[1].dims));let oe=["rank","rank"];s&&(te.push(...ye(t[2].dims)),oe.push("rank")),te.push(...ye(r));let re=M=>{let P=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"},{name:"pad",type:"i32",length:2},{name:"stride",type:"i32",length:2},{name:"dilation",type:"i32",length:2}];rn(e,P);let H=y?4:1,le=pt(t[0].dataType),G=` - fn setOutputAtIndex(flatIndex : i32, value : ${y?`vec4<${le}>`:le}) { - result[flatIndex] = ${y?`vec4<${le}>`:le}(value); - } - fn setOutputAtCoords(d0 : i32, d1 : i32, d2 : i32, d3 : i32, value : ${y?`vec4<${le}>`:le}) { - let flatIndex = getOutputIndexFromCoords(vec4(d0, d1, d2, d3)); - setOutputAtIndex(flatIndex ${y?"/ 4":""}, value); - }`,ne=Q("x",t[0].dataType,t[0].dims.length,T===3?1:T),N=Q("w",t[1].dataType,t[1].dims.length,H),ae=[ne,N],fe=ge("result",t[0].dataType,r.length,H);if(s){let Ce=Q("bias",t[2].dataType,t[2].dims.length,H);ae.push(Ce),G+=` - fn getBiasByOutputCoords(coords : vec4) -> ${y?`vec4<${le}>`:le} { - return bias[coords.${u?"w":"y"}${y?"/ 4":""}]; - }`}return` - ${eu("uniforms.result_strides")} - //struct Uniforms { xShape : vec4, wShape : vec4, outShape : vec4, - // outShapeStrides: vec3, filterDims : vec2, pad : vec2, stride : vec2, - // dilation : vec2, dimAOuter : i32, dimBOuter : i32, dimInner : i32 }; - ${M.registerUniforms(P).declareVariables(...ae,fe)} - ${G} - ${ld(u,D,K,j,s,e,ie[0],ie[1],ie[2],le)} - ${y?Vi($,k,le,void 0,!u,R):Gi($,k,le,void 0,!u,R,!1,void 0,o)}`};return{name:"Conv2DMatMul",shaderCache:{hint:`${e.cacheKey};${T};${y};${D};${K};${j};${A};${B};${R}`,inputDependencies:oe},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:C[0],y:C[1],z:C[2]},programUniforms:te}),getShaderSource:re}}}),vo,Lf,sy=Z(()=>{$e(),Ae(),Te(),Vf(),an(),vo=(t,e,r)=>{let n=t.length>2,a=n?"value += b[output_channel];":"",i=t[0].dims,s=t[1].dims,o=s[0]/e.group,u=e.format==="NHWC",l=Ii(i,s,e.dilations,e.pads,e.strides,u),p=Y.size(l),f=[{type:12,data:p},{type:12,data:e.dilations},{type:12,data:[e.strides[0],e.strides[1]]},{type:12,data:[e.pads[0],e.pads[1]]},{type:12,data:o}];tn(e,f),f.push(...ye(i,s));let m=["rank","rank"];n&&(f.push(...ye(t[2].dims)),m.push("rank")),f.push(...ye(l));let c=y=>{let w=ge("output",t[0].dataType,l.length),v=pt(w.type.tensor),k=en(e,w.type.value,v),$=Q("x",t[0].dataType,i.length),C=Q("w",t[1].dataType,s.length),T=[$,C];n&&T.push(Q("b",t[2].dataType,t[2].dims.length));let A=[{name:"output_size",type:"u32"},{name:"dilations",type:"u32",length:e.dilations.length},{name:"strides",type:"u32",length:2},{name:"pads",type:"u32",length:2},{name:"output_channels_per_group",type:"u32"}];return rn(e,A),` - ${y.registerUniforms(A).declareVariables(...T,w)} - - ${y.mainStart()} - ${y.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - - let outputIndices = ${w.offsetToIndices("global_idx")}; - let batch: u32 = outputIndices[0]; - let output_channel: u32 = outputIndices[${u?3:1}]; - let xRCCorner: vec2 = vec2(outputIndices[${u?1:2}], outputIndices[${u?2:3}]) * uniforms.strides - uniforms.pads; - let group_id: u32 = output_channel / uniforms.output_channels_per_group; - - var value: ${w.type.value} = ${w.type.value}(0); - for (var wInChannel: u32 = 0u; wInChannel < uniforms.w_shape[1]; wInChannel++) { - let input_channel = group_id * uniforms.w_shape[1] + wInChannel; - for (var wHeight: u32 = 0u; wHeight < uniforms.w_shape[2]; wHeight++) { - let xHeight = xRCCorner.x + wHeight * uniforms.dilations[0]; - - if (xHeight < 0u || xHeight >= uniforms.x_shape[${u?1:2}]) { - continue; - } - - for (var wWidth: u32 = 0u; wWidth < uniforms.w_shape[3]; wWidth++) { - let xWidth = xRCCorner.y + wWidth * uniforms.dilations[1]; - if (xWidth < 0u || xWidth >= uniforms.x_shape[${u?2:3}]) { - continue; - } - - let xVal = ${u?$.get("batch","xHeight","xWidth","input_channel"):$.get("batch","input_channel","xHeight","xWidth")}; - let wVal = ${C.get("output_channel","wInChannel","wHeight","wWidth")}; - value += xVal*wVal; - } - } - } - ${a} - ${k} - ${w.setByOffset("global_idx","value")} - }`};return{name:"GroupedConv",shaderCache:{hint:e.cacheKey,inputDependencies:m},getRunData:()=>({outputs:[{dims:r?r(l):l,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:f}),getShaderSource:c}},Lf=(t,e,r)=>{let n=t.length>2,a=it(r[3]),i=it(r[2]),s=Y.size(r)/a/i,o=[t[0].dims[0],t[0].dims[1],t[0].dims[2],t[0].dims[3]/a],u=[t[1].dims[0],t[1].dims[1],t[1].dims[2],t[1].dims[3]/a],l=[r[0],r[1],r[2],r[3]/a],p=[{type:12,data:s},{type:6,data:[e.strides[0],e.strides[1]]},{type:6,data:[e.pads[0],e.pads[1]]}];tn(e,p),p.push(...ye(o,u,l));let f=(i-1)*e.strides[1]+u[1],m=c=>{let y=ge("output",t[0].dataType,l.length,a),w=pt(y.type.tensor),v=en(e,y.type.value,w),k=Q("x",t[0].dataType,o.length,a),$=Q("w",t[1].dataType,u.length,a),C=[k,$];n&&C.push(Q("b",t[2].dataType,t[2].dims,a));let T=n?"value += b[output_channel];":"",A=[{name:"output_size",type:"u32"},{name:"strides",type:"i32",length:2},{name:"pads",type:"i32",length:2}];return rn(e,A),` - ${c.registerUniforms(A).declareVariables(...C,y)} - ${c.mainStart()} - ${c.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - let width0 = uniforms.output_shape[3]; - let output_channel = global_idx % width0; - var index1 = global_idx / width0; - let width1 = uniforms.output_shape[2] / ${i}u; - let col = (index1 % width1) * ${i}u; - index1 = index1 / width1; - let row = index1 % uniforms.output_shape[1]; - let batch = index1 / uniforms.output_shape[1]; - - let x_corner = vec2(i32(row), i32(col)) * uniforms.strides - uniforms.pads; - - var x_vals: array<${k.type.value}, ${f}>; - var values: array<${y.type.value}, ${i}>; - let input_channel = output_channel; - // Use constant instead of uniform can give better performance for w's height/width. - for (var w_height: u32 = 0u; w_height < ${u[0]}; w_height++) { - let x_height = x_corner.x + i32(w_height); - if (x_height >= 0 && u32(x_height) < uniforms.x_shape[1]) { - for (var i = 0; i < ${f}; i++) { - let x_width = x_corner.y + i; - if (x_width >= 0 && u32(x_width) < uniforms.x_shape[2]) { - x_vals[i] = ${k.get("batch","u32(x_height)","u32(x_width)","input_channel")}; - } else { - x_vals[i] = ${k.type.value}(0); - } - } - for (var w_width: u32 = 0u; w_width < ${u[1]}; w_width++) { - let w_val = ${$.get("w_height","w_width","0","output_channel")}; - for (var i = 0u; i < ${i}u; i++) { - values[i] = fma(x_vals[i * u32(uniforms.strides[1]) + w_width], w_val, values[i]); - } - } - } - } - - for (var i = 0u; i < ${i}u; i++) { - var value = values[i]; - ${T} - ${v} - ${y.set("batch","row","col + i","output_channel","value")}; - } - }`};return{name:"GroupedConv-Vectorize",shaderCache:{hint:`${e.cacheKey};${a};${i};${f};${u[0]};${u[1]}`,inputDependencies:n?["rank","rank","type"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(s/64)},programUniforms:p}),getShaderSource:m}}}),$o,dd,Uf,Wf=Z(()=>{$e(),Ae(),Xi(),Te(),an(),$o=(t,e,r,n,a=!1)=>{let i=t[0].dims,s=t[1].dims,o=i[i.length-2],u=s[s.length-1],l=i[i.length-1],p=it(u),f=it(l),m=it(o),c=Y.size(r)/p/m,y=t.length>2,w=n?n.slice(0,-2):r.slice(0,-2),v=[Y.size(w),o,u],k=[{type:12,data:c},{type:12,data:o},{type:12,data:u},{type:12,data:l}];tn(e,k),k.push(...ye(w,i,s)),y&&k.push(...ye(t[2].dims)),k.push(...ye(v));let $=C=>{let T=Ko("batch_dims",t[0].dataType,w.length),A=Q("a",t[0].dataType,i.length,f),B=Q("b",t[1].dataType,s.length,p),R=ge("output",t[0].dataType,v.length,p),D=pt(R.type.tensor),K=en(e,R.type.value,D),j=[A,B],ie="";if(y){let G=a?p:1;j.push(Q("bias",t[2].dataType,t[2].dims.length,G)),ie=`${a?`value += bias[col / ${G}];`:`value += ${R.type.value}(bias[row + i]);`}`}let te=i.slice(0,-2),oe=s.slice(0,-2),re=_a(te,w),M=_a(oe,w),P=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"}];rn(e,P);let H=(G,ne)=>{let N=G.rank,ae=G.name;if(N===2)return`var ${ae}_indices = ${G.type.indices}(0u, 0u);`;let fe=T.rank,Ce=`var ${ae}_indices: ${G.type.indices};`;for(let Be=N-2-1,Ke=fe-1;Be>=0;Be--,Ke--)Ce+=` -${ae}_indices[${Be}] = ${fe>1?`batch_indices[${Ke}]`:"batch_indices"};`;return ne.forEach(Be=>{Ce+=` -${ae}_indices[${Be}] = 0;`}),Ce+=`${ae}_indices[${N-2}] = 0u; - ${ae}_indices[${N-1}] = 0u;`,Ce},le=()=>{let G=`var a_data: ${A.type.value};`;for(let ne=0;ne; - for (var k: u32 = 0u; k < uniforms.K; k = k + ${f}) { - ${le()} - } - for (var i = 0u; i < ${m}u; i++) { - var value = values[i]; - ${ie} - ${K} - let cur_indices = ${R.type.indices}(batch, row + i, col); - let offset = ${R.indicesToOffset("cur_indices")}; - ${R.setByOffset(`offset / ${p}`,"value")}; - } - } - `};return{name:"MatMulNaive",shaderCache:{hint:`${e.activation};${p};${f};${m};${a}`,inputDependencies:y?["rank","rank","rank"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(c/64)},programUniforms:k}),getShaderSource:$}},dd=t=>{if(!t||t.length!==2)throw new Error("MatMul requires 2 inputs.");if(t[0].dims[t[0].dims.length-1]!==t[1].dims[t[1].dims.length-2])throw new Error("shared dimension does not match.")},Uf=t=>{dd(t.inputs);let e=En.calcShape(t.inputs[0].dims,t.inputs[1].dims,!0);if(!e)throw new Error("Can't use matmul on the given tensors");let r=e[e.length-1],n=t.inputs[0].dims[t.inputs[0].dims.length-1];r<8&&n<8?t.compute($o(t.inputs,{activation:""},e)):t.compute(tu(t.inputs,{activation:""},e))}}),Ii,gi,cd,Bs,xo,pd,hd,So,Vf=Z(()=>{Ae(),iy(),Xi(),sy(),an(),Wf(),Sa(),Ii=(t,e,r,n,a,i)=>{let s=t[0],o=t.slice(i?1:2,i?3:4),u=o.length,l=e[0],p=e.slice(2).map((m,c)=>m+(m-1)*(r[c]-1)),f=o.map((m,c)=>m+n[c]+n[c+u]).map((m,c)=>Math.floor((m-p[c]+a[c])/a[c]));return f.splice(0,0,s),f.splice(i?3:1,0,l),f},gi=[2,3,1,0],cd=(t,e)=>{if(!t||t.length!==2&&t.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(t[0].dims.length!==4&&t[0].dims.length!==3)throw new Error("currently only support conv 1D and 2D");if(t[0].dims.length!==t[1].dims.length)throw new Error("filter does not have same dimension as input");let r=t[0].dims[e.format==="NHWC"?t[0].dims.length-1:1],n=t[1].dims[1]*e.group;if(r!==n)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");if(t.length===3&&(t[2].dims.length!==1||t[1].dims[0]!==t[2].dims[0]))throw new Error("invalid bias");let a=t[0].dims.length-2;if(e.dilations.length!==a)throw new Error(`dilations should be ${a}D`);if(e.strides.length!==a)throw new Error(`strides should be ${a}D`);if(e.pads.length!==a*2)throw new Error(`pads should be ${a*2}D`);if(e.kernelShape.length!==0&&e.kernelShape.length!==t[1].dims.length-2)throw new Error("invalid kernel shape")},Bs=(t,e)=>{let r=t.kernelShape.slice();for(let i=2;i{let e=Qo(t),r=t.format,n=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][t.auto_pad],a=t.dilations,i=t.group,s=t.kernel_shape,o=t.pads,u=t.strides,l=t.w_is_const();return{autoPad:n,format:r,dilations:a,group:i,kernelShape:s,pads:o,strides:u,wIsConst:l,...e,cacheKey:`${t.format};${e.activation};`}},pd=(t,e,r)=>{let n=Bs(r,e),a=r.format==="NHWC";if(r.group!==1){if(!t.adapterInfo.isArchitecture("ampere")&&a&&e[1].dims[0]===r.group&&e[1].dims[1]===1&&r.dilations[0]===1&&r.dilations[1]===1){let B=Ii(e[0].dims,e[1].dims,r.dilations,n.pads,r.strides,a),R=t.kernelCustomData.wT??t.compute(vr(e[1],gi),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!t.kernelCustomData.wT&&(t.kernelCustomData.wT=R);let D=[e[0],R];e.length===3&&D.push(e[2]),t.compute(Lf(D,n,B),{inputs:D})}else t.compute(vo(e,n));return}let i=e.length===3,s=e[0].dims[a?1:2],o=e[0].dims[a?2:3],u=e[0].dims[a?3:1],l=e[1].dims[2],p=e[1].dims[3],f=Ii(e[0].dims,e[1].dims,r.dilations,n.pads,r.strides,a),m=f[a?1:2],c=f[a?2:3],y=f[a?3:1],w=a&&l===s&&p===o&&r.pads[0]===0&&r.pads[1]===0;if(w||l===1&&p===1&&r.dilations[0]===1&&r.dilations[1]===1&&r.strides[0]===1&&r.strides[1]===1&&r.pads[0]===0&&r.pads[1]===0){let B=f[0],R,D,K,j=[];if(a){let oe=t.kernelCustomData.wT??t.compute(vr(e[1],gi),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];if(r.wIsConst&&!t.kernelCustomData.wT&&(t.kernelCustomData.wT=oe),w){let re=s*o*u;R=e[0].reshape([1,B,re]),D=oe.reshape([1,re,y]),K=[1,B,y]}else R=e[0].reshape([B,s*o,u]),D=oe.reshape([1,u,y]),K=[B,m*c,y];j.push(R),j.push(D)}else R=e[0].reshape([B,u,s*o]),D=e[1].reshape([1,y,u]),K=[B,y,m*c],j.push(D),j.push(R);i&&j.push(e[2]);let ie=K[2],te=j[0].dims[j[0].dims.length-1];ie<8&&te<8?t.compute($o(j,n,f,K,a),{inputs:j}):t.compute(tu(j,n,f,K,a),{inputs:j});return}let v=!0,k=t.kernelCustomData.wT??t.compute(vr(e[1],gi),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!t.kernelCustomData.wT&&(t.kernelCustomData.wT=k);let $=[e[0],k];i&&$.push(e[2]);let C=a?m*c:y,T=a?y:m*c,A=l*p*u;t.compute(Ff($,n,f,C,T,A,i,v),{inputs:$})},hd=(t,e)=>{let r=e.format==="NHWC",n=[t.inputs[0].reshape(r?[t.inputs[0].dims[0],1,t.inputs[0].dims[1],t.inputs[0].dims[2]]:[t.inputs[0].dims[0],t.inputs[0].dims[1],1,t.inputs[0].dims[2]]),t.inputs[1].reshape([t.inputs[1].dims[0],t.inputs[1].dims[1],1,t.inputs[1].dims[2]])];t.inputs.length===3&&n.push(t.inputs[2]);let a=[0,e.pads[0],0,e.pads[1]],i=[1].concat(e.strides),s=[1].concat(e.dilations),o=[1].concat(e.kernelShape),u=Bs({...e,pads:a,strides:i,dilations:s,kernelShape:o},n);t.compute(vo(n,u,l=>r?[l[0],l[2],l[3]]:[]))},So=(t,e)=>{cd(t.inputs,e),t.inputs[0].dims.length===3?hd(t,e):pd(t,t.inputs,e)}}),fd,Gf,oy=Z(()=>{$e(),nn(),Te(),an(),Zo(),Nf(),Xi(),fd=(t,e=!1,r,n,a=4)=>{let i=v=>{switch(v){case 1:return"return w[getIndexFromCoords4D(coord, vec4(uniforms.w_shape))];";case 4:return` - let coord1 = vec4(coordX, coordY, col + 1, rowInner); - let coord2 = vec4(coordX, coordY, col + 2, rowInner); - let coord3 = vec4(coordX, coordY, col + 3, rowInner); - let v0 = w[getIndexFromCoords4D(coord, vec4(uniforms.w_shape))]; - let v1 = w[getIndexFromCoords4D(coord1, vec4(uniforms.w_shape))]; - let v2 = w[getIndexFromCoords4D(coord2, vec4(uniforms.w_shape))]; - let v3 = w[getIndexFromCoords4D(coord3, vec4(uniforms.w_shape))]; - return ${n}(v0, v1, v2, v3); - `;default:throw new Error(`innerElementSize ${v} is not supported.`)}},s=t?` - let coord = vec4(batch, iXR, iXC, xCh); - `:` - let coord = vec4(batch, xCh, iXR, iXC); - `,o=t?` - let coords = vec4( - batch, - row / outWidth, - row % outWidth, - col); - `:` - let coords = vec4( - batch, - row, - col / outWidth, - col % outWidth); - `,u=t?"i32(uniforms.x_shape[1])":"i32(uniforms.x_shape[2])",l=t?"i32(uniforms.x_shape[2])":"i32(uniforms.x_shape[3])",p=t?"row":"col",f=t?"col":"row",m=` - let inChannels = ${t?"i32(uniforms.x_shape[3])":"i32(uniforms.x_shape[1])"}; - let outWidth = ${t?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; - let outRow = ${p} / outWidth; - let outCol = ${p} % outWidth; - - let WRow = ${f} / (uniforms.filter_dims[1] * inChannels); - let WCol = ${f} / inChannels % uniforms.filter_dims[1]; - let xR = f32(outRow - uniforms.pads[0] + uniforms.dilations[0] * WRow) / f32(uniforms.strides[0]); - let xC = f32(outCol - uniforms.pads[1] + uniforms.dilations[1] * WCol) / f32(uniforms.strides[1]); - if (xR < 0.0 || xR >= f32(${u}) || fract(xR) > 0.0) { - return ${n}(0.0); - } - if (xC < 0.0 || xC >= f32(${l}) || fract(xC) > 0.0) { - return ${n}(0.0); - } - let iXR = i32(xR); - let iXC = i32(xC); - let xCh = ${f} % inChannels; - ${s} - return x[getIndexFromCoords4D(coord, vec4(uniforms.x_shape))/${a}];`,c=t?` - let col = colIn * ${a}; - if (row < uniforms.dim_a_outer && col < uniforms.dim_inner) { - ${m} - } - return ${n}(0.0);`:` - let col = colIn * ${a}; - if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) { - ${m} - } - return ${n}(0.0);`,y=` - let col = colIn * ${a}; - let inChannels = ${t?"i32(uniforms.x_shape[3])":"i32(uniforms.x_shape[1])"}; - let coordX = uniforms.filter_dims[0] - 1 - row / (uniforms.filter_dims[1] * inChannels); - let coordY = uniforms.filter_dims[1] - 1 - (row / inChannels) % uniforms.filter_dims[1]; - if (${t?"row < uniforms.dim_inner && col < uniforms.dim_b_outer":"row < uniforms.dim_inner && col < uniforms.dim_a_outer"} && coordX >= 0 && coordY >= 0) { - let rowInner = row % inChannels; - let coord = vec4(coordX, coordY, col, rowInner); - ${i(a)} - } - return ${n}(0.0); - `,w=en(r,n);return` - fn mm_readA(batch: i32, row : i32, colIn : i32) -> ${n} { - ${t?c:y} - } - - fn mm_readB(batch: i32, row : i32, colIn : i32) -> ${n} { - ${t?y:c} - } - - fn mm_write(batch: i32, row : i32, colIn : i32, valueInput : ${n}) { - let col = colIn * ${a}; - if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) { - var value = valueInput; - let outWidth = ${t?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"}; - ${o} - ${Jo(e)} - ${w} - result[getIndexFromCoords4D(coords, vec4(uniforms.result_shape))/${a}] = value; - } - }`},Gf=(t,e,r,n,a,i,s,o)=>{let u=e.format==="NHWC",l=u?t[0].dims[3]:t[0].dims[1],p=r[0],f=u?r[2]:r[3],m=u?r[1]:r[2],c=u?r[3]:r[1],y=u&&l%4===0&&l%3&&c%4===0,w=u?c:f*m,v=u?f*m:c,k=[8,8,1],$=n<=8?[4,1,1]:[4,4,1],C=[Math.ceil(w/k[0]/$[0]),Math.ceil(v/k[1]/$[1]),Math.ceil(p/k[2]/$[2])];rt("verbose",()=>`[conv_backprop_mm_webgpu] dispatch = ${C}`);let T=y?4:1,A=Math.max(k[0]*T,k[1]),B=y?4:1,R=[e.kernelShape[u?1:2],e.kernelShape[u?2:3]],D=[R[0]+(e.dilations[0]<=1?0:(R[0]-1)*(e.dilations[0]-1)),R[1]+(e.dilations[1]<=1?0:(R[1]-1)*(e.dilations[1]-1))],K=[D[0]-1-Math.floor((e.pads[0]+e.pads[2])/2),D[1]-1-Math.floor((e.pads[1]+e.pads[3])/2)],j=[{type:6,data:n},{type:6,data:a},{type:6,data:i},{type:6,data:e.strides},{type:6,data:e.dilations},{type:6,data:R},{type:6,data:K}];tn(e,j),j.push(...ye(t[0].dims,t[1].dims));let ie=["rank","rank"];s&&(j.push(...ye(t[2].dims)),ie.push("rank")),j.push(...ye(r));let te=oe=>{let re=Q("x",t[0].dataType,t[0].dims.length,B),M=Q("w",t[1].dataType,t[1].dims.length,1),P=ge("result",t[0].dataType,r.length,B),H=[re,M],le="";if(s){let N=Q("bias",t[2].dataType,t[2].dims.length,B);H.push(N),le+=` - fn getBiasByOutputCoords(coords : vec4) -> ${N.type.value} { - return bias[coords.${u?"w":"y"}${y?"/ 4":""}]; - }`}let G=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"},{name:"strides",type:"i32",length:2},{name:"dilations",type:"i32",length:2},{name:"filter_dims",type:"i32",length:R.length},{name:"pads",type:"i32",length:K.length}];rn(e,G);let ne=pt(t[0].dataType,1);if(ne!=="f16"&&ne!=="f32")throw new Error(`elemType ${ne} is not supported.`);return` - ${eu("uniforms.result_strides")} - ${oe.registerUniforms(G).declareVariables(...H,P)}; - ${le} - ${fd(u,s,e,re.type.value,T)} - ${y?Vi($,k,ne,void 0,!u,A):Gi($,k,ne,void 0,!u,A,!1,void 0,o)}`};return{name:"Conv2DTransposeMatMul",shaderCache:{hint:`${e.cacheKey};${$};${k};${y}`,inputDependencies:ie},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:C[0],y:C[1],z:C[2]},programUniforms:j}),getShaderSource:te}}}),md,ko,uy=Z(()=>{$e(),nn(),Ae(),Te(),md=(t,e,r,n,a,i=!1,s,o,u=!1)=>{let l=u?1:2,p=u?2:3,f=u?3:1,m=i?2:1,c=` - fn setOutputAtIndex(flatIndex : u32, value : ${i?`vec4<${s}>`:s}) { - result[flatIndex] = ${i?`vec4<${s}>`:s}(value); - }`;n&&(c+=` - fn getBiasByOutputCoords(coords : vec4) -> ${i?`vec4<${s}>`:s} { - return bias[coords.${u?"w":"y"}${i?"/ 4":""}]; - }`);let y=i?4:1,w=Q("W",e[1].dataType,e[1].dims.length,y),v=Q("Dy",e[0].dataType,e[0].dims.length,y),k=[v,w];n&&k.push(Q("bias",e[2].dataType,[r[f]].length,y));let $=ge("result",e[0].dataType,r.length,y),C=`{ - let batch: u32 = ${a?"global_id.z":"workgroup_id.z"} / uniforms.result_shape[1]; - let r = ${a?"global_id.z":"workgroup_id.z"} % uniforms.result_shape[1]; - let c = ${a?"global_id.y":"workgroup_id.y"} * ${m}; - let d1: u32 = ${a?"global_id.x":"workgroup_id.x"} * 4; - - let dyCorner = vec2(i32(r), i32(c)) - vec2(uniforms.pads); - - // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1). - // ? = to be determined. : = across all values in that axis. - var dotProd: array, ${m}>; - for (var i = 0; i < ${m}; i++) { - dotProd[i] = vec4<${s}>(0.0); - } - for (var wR: u32 = 0; wR < uniforms.filter_dims[0]; wR = wR + 1) { - var dyR = (${s}(dyCorner.x) + ${s}(wR)) / ${s}(uniforms.strides.x); - let wRPerm = uniforms.filter_dims[0] - 1 - wR; - if (dyR < 0.0 || dyR >= ${s}(uniforms.Dy_shape[1]) || - fract(dyR) > 0.0 || wRPerm < 0) { - continue; - } - let idyR: u32 = u32(dyR); - - for (var wC: u32 = 0; wC < uniforms.filter_dims[1]; wC = wC + 1) { - let dyC = (${s}(dyCorner.y) + ${s}(wC)) / ${s}(uniforms.strides.y); - let dyC2 = (${s}(dyCorner.y) + 1.0 + ${s}(wC)) / ${s}(uniforms.strides.y); - let wCPerm = uniforms.filter_dims[1] - 1 - wC; - if (wCPerm < 0) { - continue; - } - var bDyCVal = true; - var bDyCVal2 = true; - if (dyC < 0.0 || dyC >= ${s}(uniforms.Dy_shape[2]) || - fract(dyC) > 0.0) { - bDyCVal = false; - } - if (dyC2 < 0.0 || dyC2 >= ${s}(uniforms.Dy_shape[2]) || - fract(dyC2) > 0.0) { - bDyCVal2 = false; - } - - let idyC: u32 = u32(dyC); - let idyC2: u32 = u32(dyC2); - if (bDyCVal && bDyCVal2) { - let d2Length = uniforms.Dy_shape[3]; - for (var d2 :u32 = 0; d2 < d2Length; d2 = d2 + 4) { - let wValue0 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1","d2")}; - let wValue1 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")}; - let wValue2 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")}; - let wValue3 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")}; - - var xValue = ${v.get("batch","idyR","idyC","d2")}; - let tmpval = vec4<${s}>(dot(xValue, wValue0), - dot(xValue, wValue1), - dot(xValue, wValue2), - dot(xValue, wValue3)); - dotProd[0] = dotProd[0] + tmpval; - - xValue = ${v.get("batch","idyR","idyC2","d2")}; - - dotProd[1] = dotProd[1] + vec4<${s}>(dot(xValue, wValue0), - dot(xValue, wValue1), - dot(xValue, wValue2), - dot(xValue, wValue3)); - } - } else if (bDyCVal) { - let d2Length = uniforms.Dy_shape[${f}]; - for (var d2: u32 = 0; d2 < d2Length; d2 = d2 + 4) { - let wValue0 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1","d2")}; - let wValue1 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")}; - let wValue2 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")}; - let wValue3 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")}; - - var xValue = ${v.get("batch","idyR","idyC","d2")}; - let tmpval = vec4<${s}>(dot(xValue, wValue0), - dot(xValue, wValue1), - dot(xValue, wValue2), - dot(xValue, wValue3)); - dotProd[0] = dotProd[0] + tmpval; - } - } else if (bDyCVal2) { - let d2Length = uniforms.Dy_shape[3]; - for (var d2: u32 = 0; d2 < d2Length; d2 = d2 + 4) { - let wValue0 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1","d2")}; - let wValue1 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")}; - let wValue2 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")}; - let wValue3 = ${w.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")}; - - var xValue = ${v.get("batch","idyR","idyC2","d2")}; - let tmpval = vec4<${s}>(dot(xValue, wValue0), - dot(xValue, wValue1), - dot(xValue, wValue2), - dot(xValue, wValue3)); - dotProd[1] = dotProd[1] + tmpval; - } - } - } - } - - for (var i: u32 = 0; i < ${m}; i = i + 1) { - let value = dotProd[i] + ${n?"bias[c+i]":`vec4<${s}>(0.0)`}; - ${$.set("batch","r","c + i","d1","value")}; - } - }`,T=` - let outputIndices = ${$.offsetToIndices("global_idx")}; - let batch = ${$.indicesGet("outputIndices",0)}; - let d1 = ${$.indicesGet("outputIndices",f)}; - let r = ${$.indicesGet("outputIndices",l)}; - let c = ${$.indicesGet("outputIndices",p)}; - let dyCorner = vec2(i32(r), i32(c)) - uniforms.pads; - let dyRCorner = dyCorner.x; - let dyCCorner = dyCorner.y; - let groupId = d1 / uniforms.output_channels_per_group; - let wOutChannel = d1 - groupId * uniforms.output_channels_per_group; - // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1). - // ? = to be determined. : = across all values in that axis. - var dotProd = ${s}(0.0); - for (var wR: u32 = 0; wR < uniforms.effective_filter_dims.x; wR = wR + 1) { - if (wR % uniforms.dilations.x != 0) { - continue; - } - let dyR = (${s}(dyRCorner) + ${s}(wR)) / ${s}(uniforms.strides[0]); - let wRPerm = uniforms.filter_dims.x - 1 - wR / uniforms.dilations.x; - if (dyR < 0.0 || dyR >= ${s}(uniforms.Dy_shape[${l}]) || fract(dyR) > 0.0 || - wRPerm < 0) { - continue; - } - let idyR: u32 = u32(dyR); - - for (var wC: u32 = 0; wC < uniforms.effective_filter_dims.y; wC = wC + 1) { - if (wC % uniforms.dilations.y != 0) { - continue; - } - let dyC = (${s}(dyCCorner) + ${s}(wC)) / ${s}(uniforms.strides.y); - let wCPerm = uniforms.filter_dims.y - 1 - wC / uniforms.dilations.y; - if (dyC < 0.0 || dyC >= ${s}(uniforms.Dy_shape[${p}]) || - fract(dyC) > 0.0 || wCPerm < 0) { - continue; - } - let idyC: u32 = u32(dyC); - var inputChannel = groupId * uniforms.input_channels_per_group; - for (var d2: u32 = 0; d2 < uniforms.input_channels_per_group; d2 = d2 + 1) { - let xValue = ${u?v.get("batch","idyR","idyC","inputChannel"):v.get("batch","inputChannel","idyR","idyC")}; - let wValue = ${w.get("inputChannel","wOutChannel","u32(wRPerm)","u32(wCPerm)")}; - dotProd = dotProd + xValue * wValue; - inputChannel = inputChannel + 1; - } - } - } - let value = dotProd + ${n?"bias[d1]":`${s}(0.0)`}; - ${$.setByOffset("global_idx","value")}; - `;return` - ${t.registerUniforms(o).declareVariables(...k,$)} - ${c} - - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}; - ${i?C:T}}`},ko=(t,e,r)=>{let n=t.length>2,a=e.outputShape,i=Y.size(a),s=[Math.ceil(i/64),1,1];rt("verbose",()=>`[conv2d_backprop_webgpu] dispatch = ${s}`);let o=e.format==="NHWC",u=["rank","rank"],l=[e.strides[0],e.strides[1]],p=[e.kernelShape[o?1:2],e.kernelShape[o?2:3]],f=[e.dilations[0],e.dilations[1]],m=[p[0]+(e.dilations[0]<=1?0:(e.kernelShape[o?1:2]-1)*(e.dilations[0]-1)),p[1]+(e.dilations[1]<=1?0:(e.kernelShape[o?2:3]-1)*(e.dilations[1]-1))],c=[m[0]-1-Math.floor((e.pads[0]+e.pads[2])/2),m[1]-1-Math.floor(e.pads[1]+e.pads[3])/2],y=!1,w=e.group,v=t[1].dims,k=v[0]/w,$=v[1],C=[{type:12,data:i},{type:12,data:l},{type:12,data:p},{type:12,data:f},{type:12,data:m},{type:6,data:c},{type:12,data:k},{type:12,data:$},...ye(t[0].dims,t[1].dims)];n&&(C.push(...ye(t[2].dims)),u.push("rank")),C.push(...ye(a));let T=s[1]===1&&s[2]===1,A=B=>{let R=[{name:"output_size",type:"u32"},{name:"strides",type:"u32",length:l.length},{name:"filter_dims",type:"u32",length:p.length},{name:"dilations",type:"u32",length:p.length},{name:"effective_filter_dims",type:"u32",length:m.length},{name:"pads",type:"i32",length:c.length},{name:"input_channels_per_group",type:"u32"},{name:"output_channels_per_group",type:"u32"}],D=pt(t[0].dataType);return`${md(B,t,a,n,T,y,D,R,o)}`};return{name:"ConvTranspose2D",shaderCache:{hint:`${e.cacheKey};`,inputDependencies:u},getRunData:()=>({dispatchGroup:{x:s[0],y:s[1],z:s[2]},outputs:[{dims:r?r(a):a,dataType:t[0].dataType}],programUniforms:C}),getShaderSource:A}}}),gd,_d,yd,Ds,Hf,wd,bd,vd,$d,jf,ly=Z(()=>{oy(),uy(),an(),Sa(),gd=(t,e,r,n,a,i)=>(t-1)*e+r+(n-1)*a+1-i,_d=(t,e,r,n,a)=>{let i=Math.floor(t/2);e==="SAME_UPPER"?(r[n]=i,r[a]=t-i):e==="SAME_LOWER"&&(r[n]=t-i,r[a]=i)},yd=(t,e,r,n,a,i,s,o,u,l)=>{let p=t.length-2,f=l.length===0;if(u.length===0)for(let y=0;y{let r=t.kernelShape.slice();if(t.kernelShape.length===0||t.kernelShape.reduce((f,m)=>f*m,1)===0){r.length=0;for(let f=2;ff+m,0)===0){let f=e[0].dims.length-2;u=new Array(f).fill(1)}let l=t.strides.slice();if(l.reduce((f,m)=>f+m,0)===0){let f=e[0].dims.length-2;l=new Array(f).fill(1)}yd(o,r,u,t.autoPad,t.group,a,l,n,s,i);let p=Object.assign({},t);return Object.assign(p,{kernelShape:r,pads:a,outputPadding:s,outputShape:i,dilations:u,strides:l}),p},Hf=t=>{let e=Qo(t),r=t.format,n=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][typeof t.autoPad>"u"?0:t.autoPad],a=t.dilations,i=t.group,s=t.kernelShape,o=t.pads,u=t.strides,l=t.wIsConst(),p=t.outputPadding,f=t.outputShape;return{autoPad:n,format:r,dilations:a,group:i,kernelShape:s,outputPadding:p,outputShape:f,pads:o,strides:u,wIsConst:l,...e,cacheKey:`${t.format};${e.activation};`}},wd=(t,e)=>{if(!t||t.length!==2&&t.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(t[0].dims.length!==4&&t[0].dims.length!==3)throw new Error("currently only support 2-dimensional conv");if(t[0].dims.length!==t[1].dims.length)throw new Error("filter does not have same dimension as input");let r=t[0].dims[e.format==="NHWC"?t[0].dims.length-1:1],n=t[1].dims[0];if(r!==n)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");let a=t[1].dims[1]*e.group;if(t.length===3&&(t[2].dims.length!==1||t[2].dims[0]!==a))throw new Error("invalid bias");let i=t[0].dims.length-2;if(e.dilations.reduce((s,o)=>s+o,0)>0&&e.dilations.length!==i)throw new Error(`dilations should be ${i}D`);if(e.strides.reduce((s,o)=>s+o,0)>0&&e.strides.length!==i)throw new Error(`strides should be ${i}D`);if(e.pads.reduce((s,o)=>s+o,0)>0&&e.pads.length!==i*2)throw new Error(`pads should be ${i*2}D`);if(e.outputPadding.length!==i&&e.outputPadding.length!==0)throw new Error(`output_padding should be ${i}D`);if(e.kernelShape.reduce((s,o)=>s+o,0)>0&&e.kernelShape.length!==0&&e.kernelShape.length!==t[1].dims.length-2)throw new Error("invalid kernel shape");if(e.outputShape.length!==0&&e.outputShape.length!==t[0].dims.length-2)throw new Error("invalid output shape")},bd=[2,3,1,0],vd=(t,e,r)=>{let n=Ds(r,e),a=r.format==="NHWC",i=n.outputShape,s=i[a?3:1],o=e[0].dims[a?3:1];if(n.group!==1||s===1&&o===1){t.compute(ko(e,n));return}let u=i[a?1:2],l=i[a?2:3],p=e[1].dims[2],f=e[1].dims[3],m=a?u*l:s,c=a?s:u*l,y=p*f*o,w=!0,v=t.kernelCustomData.wT??t.compute(vr(e[1],bd),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!t.kernelCustomData.wT&&(t.kernelCustomData.wT=v);let k=[e[0],v],$=e.length===3;$&&(!a&&e[2].dims.length===1?k.push(e[2].reshape([e[2].dims[0],1,1])):k.push(e[2])),t.compute(Gf(k,n,i,m,c,y,$,w),{inputs:k})},$d=(t,e)=>{let r=e.format==="NHWC",n=[t.inputs[0].reshape(r?[t.inputs[0].dims[0],1,t.inputs[0].dims[1],t.inputs[0].dims[2]]:[t.inputs[0].dims[0],t.inputs[0].dims[1],1,t.inputs[0].dims[2]]),t.inputs[1].reshape([t.inputs[1].dims[0],t.inputs[1].dims[1],1,t.inputs[1].dims[2]])];t.inputs.length===3&&n.push(t.inputs[2]);let a=e.kernelShape;(a.length===0||a[0]===0)&&(a=[t.inputs[1].dims[2]]);let i=e.dilations;(i.length===0||i[0]===0)&&(i=[1]);let s=e.strides;(s.length===0||s[0]===0)&&(s=[1]);let o=e.pads;o.length===0&&(o=[0,0]),o=[0,o[0],0,o[1]],s=[1].concat(s),i=[1].concat(i),a=[1].concat(a);let u=Ds({...e,pads:o,strides:s,dilations:i,kernelShape:a},n);t.compute(ko(n,u,l=>r?[l[0],l[2],l[3]]:[l[0],l[1],l[3]]))},jf=(t,e)=>{wd(t.inputs,e),t.inputs[0].dims.length===3?$d(t,e):vd(t,t.inputs,e)}}),xd,qf,Kf,dy=Z(()=>{$e(),Ae(),lt(),Te(),xd=(t,e,r,n)=>{let a=Y.size(e),i=e.length,s=Q("input",t,i),o=ge("output",t,i),u=r.dataType===6?r.getInt32Array()[0]:Number(r.getBigInt64Array()[0]),l=Y.normalizeAxis(u,i),p=f=>{let m=` i32(${s.indicesGet("inputIndices","uniforms.axis")}) `,c=Se("uniforms.input_shape","uniforms.axis",i),y=n.reverse?m+(n.exclusive?" + 1":""):"0",w=n.reverse?c:m+(n.exclusive?"":" + 1");return` - ${f.registerUniform("outputSize","u32").registerUniform("axis","u32").declareVariables(s,o)} - ${f.mainStart()} - ${f.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - var inputIndices = ${o.offsetToIndices("global_idx")}; - var sum = ${o.type.value}(0); - let first : i32 = ${y}; - let last : i32 = ${w}; - for (var i : i32 = first; i < last; i++) { - ${s.indicesSet("inputIndices","uniforms.axis","u32(i)")}; - sum = sum + ${s.getByIndices("inputIndices")}; - } - ${o.setByOffset("global_idx","sum")}; - }`};return{name:"CumSum",shaderCache:{hint:n.cacheKey,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:e,dataType:t}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:[{type:12,data:a},{type:12,data:l},...ye(e,e)]}),getShaderSource:p}},qf=(t,e)=>{let r=t.inputs[0].dims,n=t.inputs[0].dataType,a=t.inputs[1];t.compute(xd(n,r,a,e),{inputs:[0]})},Kf=t=>{let e=t.exclusive===1,r=t.reverse===1;return qe({exclusive:e,reverse:r})}}),Sd,kd,Ed,Yf,Xf,cy=Z(()=>{$e(),Ae(),lt(),Te(),Sd=t=>{if(!t||t.length!==1)throw new Error("DepthToSpace requires 1 input.");if(t[0].dims.length!==4)throw new Error("DepthToSpace requires 4D input.")},kd=(t,e,r,n)=>{let a=[];a.push(`fn perm(i: ${n.type.indices}) -> ${r.type.indices} { - var a: ${r.type.indices};`);for(let i=0;i{let r,n,a,i,s,o,u=e.format==="NHWC",l=e.blocksize,p=e.mode==="DCR";u?([r,n,a,i]=t.dims,s=p?[r,n,a,l,l,i/l**2]:[r,n,a,i/l**2,l,l],o=p?[0,1,3,2,4,5]:[0,1,4,2,5,3]):([r,n,a,i]=[t.dims[0],t.dims[2],t.dims[3],t.dims[1]],s=p?[r,l,l,i/l**2,n,a]:[r,i/l**2,l,l,n,a],o=p?[0,3,4,1,5,2]:[0,1,4,2,5,3]);let f=t.reshape(s),m=f.dims.length,c=t.dataType,y=Q("a",c,m),w=ge("output",c,m),v=k=>` - ${k.registerUniform("output_size","u32").declareVariables(y,w)} - - ${kd(o,m,y,w)} - - ${k.mainStart()} - ${k.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - - let indices = ${w.offsetToIndices("global_idx")}; - let aIndices = perm(indices); - - ${w.setByOffset("global_idx",y.getByIndices("aIndices"))} - }`;return{name:"DepthToSpace",shaderCache:{hint:`${t.dims};${e.blocksize};${e.mode}`,inputDependencies:["rank"]},getRunData:k=>{let $=u?[r,n*l,a*l,i/l**2]:[r,i/l**2,n*l,a*l],C=Y.size($),T=f.dims,A=Y.sortBasedOnPerm(T,o);return{outputs:[{dims:$,dataType:k[0].dataType}],dispatchGroup:{x:Math.ceil(C/64)},programUniforms:[{type:12,data:C},...ye(T,A)]}},getShaderSource:v}},Yf=(t,e)=>{Sd(t.inputs),t.compute(Ed(t.inputs[0],e))},Xf=t=>qe({blocksize:t.blocksize,mode:t.mode,format:t.format})}),_i,ta,Ns,Cd,Td,Id,Ad,Fs,Md,Qf,Jf,py=Z(()=>{$e(),Ae(),lt(),Te(),_i="[a-zA-Z]|\\.\\.\\.",ta="("+_i+")+",Ns="^"+ta+"$",Cd="("+ta+",)*"+ta,Td="^"+Cd+"$",Id=class{constructor(t=-1){this.symbolToIndices=new Map,this.inputIndex=t}addSymbol(t,e){let r=this.symbolToIndices.get(t);r===void 0?r=[e]:r.push(e),this.symbolToIndices.set(t,r)}},Ad=class{constructor(t,e){this.equation=e,this.hasEllipsis=!1,this.symbolToInfo=new Map,this.lhs=new Array,this.outputDims=[];let[r,n]=e.includes("->")?e.split("->",2):[e,""];if(!r.match(RegExp(Td)))throw new Error("Invalid LHS term");if(r.split(",").forEach((a,i)=>{let s=t[i].dims.slice();if(!a.match(RegExp(Ns)))throw new Error("Invalid LHS term");let o=this.processTerm(a,!0,s,i);this.lhs.push(o)}),n==="")n+=[...this.symbolToInfo.entries()].filter(([a,i])=>i.count===1||a==="...").map(([a])=>a).join("");else if(!n.match(RegExp(ta)))throw new Error("Invalid RHS");n.match(RegExp(_i,"g"))?.forEach(a=>{if(a==="...")this.outputDims=this.outputDims.concat(this.ellipsisDims);else{let i=this.symbolToInfo.get(a);if(i===void 0)throw new Error("Invalid RHS symbol");this.outputDims.push(i.dimValue)}}),this.rhs=this.processTerm(n,!1,this.outputDims)}addSymbol(t,e,r){let n=this.symbolToInfo.get(t);if(n!==void 0){if(n.dimValue!==e&&n.count!==1)throw new Error("Dimension mismatch");n.count++,n.inputIndices.push(r)}else n={count:1,dimValue:e,inputIndices:[r]};this.symbolToInfo.set(t,n)}processTerm(t,e,r,n=-1){let a=r.length,i=!1,s=[],o=0;if(!t.match(RegExp(Ns))&&!e&&t!=="")throw new Error("Invalid LHS term");let u=t.match(RegExp(_i,"g")),l=new Id(n);return u?.forEach((p,f)=>{if(p==="..."){if(i)throw new Error("Only one ellipsis is allowed per input term");i=!0;let m=a-u.length+1;if(m<0)throw new Error("Ellipsis out of bounds");if(s=r.slice(o,o+m),this.hasEllipsis){if(this.ellipsisDims.length!==s.length||this.ellipsisDims.toString()!==s.toString())throw new Error("Ellipsis dimensions mismatch")}else if(e)this.hasEllipsis=!0,this.ellipsisDims=s;else throw new Error("Ellipsis must be specified in the LHS");for(let c=0;ct+"_max",Md=(t,e,r,n)=>{let a=t.map(l=>l.length).map((l,p)=>Q(`input${p}`,e,l)),i=Y.size(n),s=ge("output",e,n.length),o=[...r.symbolToInfo.keys()].filter(l=>!r.rhs.symbolToIndices.has(l)),u=l=>{let p=[],f="var prod = 1.0;",m="var sum = 0.0;",c="sum += prod;",y=[],w=[],v=[],k=[],$=r.symbolToInfo.size===r.rhs.symbolToIndices.size;r.symbolToInfo.forEach((T,A)=>{if(r.rhs.symbolToIndices.has(A)){let B=r.rhs.symbolToIndices.get(A)?.[0];B!==void 0&&r.lhs.forEach((R,D)=>{if(T.inputIndices.includes(D)){let K=R.symbolToIndices.get(A);if(K===void 0)throw new Error("Invalid symbol error");K.forEach(j=>{p.push(`${a[D].indicesSet(`input${D}Indices`,j,s.indicesGet("outputIndices",B))}`)})}})}else r.lhs.forEach((B,R)=>{if(T.inputIndices.includes(R)){let D=B.symbolToIndices.get(A);if(D===void 0)throw new Error("Invalid symbol error");D.forEach(K=>{y.push(`${a[R].indicesSet(`input${R}Indices`,K,`${A}`)}`)}),k.push(`prod *= ${a[R].getByIndices(`input${R}Indices`)};`)}}),w.push(`for(var ${A}: u32 = 0; ${A} < uniforms.${Fs(A)}; ${A}++) {`),v.push("}")});let C=$?[...p,`let sum = ${a.map((T,A)=>T.getByIndices(`input${A}Indices`)).join(" * ")};`]:[...p,m,...w,...y,f,...k,c,...v];return` - ${l.registerUniforms(o.map(T=>({name:`${Fs(T)}`,type:"u32"}))).registerUniform("outputSize","u32").declareVariables(...a,s)} - - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - var outputIndices = ${s.offsetToIndices("global_idx")}; - ${a.map((T,A)=>`var input${A}Indices: ${a[A].type.indices};`).join(` -`)} - ${C.join(` -`)}; - ${s.setByOffset("global_idx","sum")}; - }`};return{name:"Einsum",shaderCache:{hint:r.equation,inputDependencies:t.map(()=>"rank")},getRunData:()=>{let l=o.filter(f=>r.symbolToInfo.has(f)).map(f=>({type:12,data:r.symbolToInfo.get(f)?.dimValue||0}));l.push({type:12,data:i});let p=t.map((f,m)=>[...ye(f)]).reduce((f,m)=>f.concat(m),l);return p.push(...ye(n)),{outputs:[{dims:n,dataType:e}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:p}},getShaderSource:u}},Qf=(t,e)=>{let r=new Ad(t.inputs,e.equation),n=r.outputDims,a=t.inputs.map((i,s)=>i.dims);t.compute(Md(a,t.inputs[0].dataType,r,n))},Jf=t=>{let e=t.equation.replace(/\s+/g,"");return qe({equation:e})}}),Od,Ls,zd,Pd,Zf,hy=Z(()=>{$e(),Ae(),Te(),Od=t=>{if(!t||t.length!==2)throw new Error("Expand requires 2 input.");let e=t[0].dims,r=Array.from(t[1].getBigInt64Array(),Number),n=r.length{let r=t.length-e.length,n=[];for(let a=0;at.length>e.length?Ls(t,e):Ls(e,t),Pd=t=>{let e=t[0].dims,r=Array.from(t[1].getBigInt64Array(),Number),n=zd(e,r),a=t[0].dataType,i=a===9?4:1,s=Math.ceil(Y.size(n)/i),o=l=>{let p=Q("input",a,e.length,i),f=ge("output",a,n.length,i),m;if(a===9){let c=(y,w,v="")=>` - let outputIndices${w} = ${f.offsetToIndices(`outputOffset + ${w}u`)}; - let offset${w} = ${p.broadcastedIndicesToOffset(`outputIndices${w}`,f)}; - let index${w} = offset${w} / 4u; - let component${w} = offset${w} % 4u; - ${y}[${w}] = ${v}(${p.getByOffset(`index${w}`)}[component${w}]); - `;m=` - let outputOffset = global_idx * ${i}; - var data = vec4(0); - ${c("data",0,"u32")} - ${c("data",1,"u32")} - ${c("data",2,"u32")} - ${c("data",3,"u32")} - ${f.setByOffset("global_idx","data")} - }`}else m=` - let outputIndices = ${f.offsetToIndices("global_idx")}; - let inputOffset = ${p.broadcastedIndicesToOffset("outputIndices",f)}; - ${f.setByOffset("global_idx",p.getByOffset("inputOffset"))} - }`;return` - ${l.registerUniform("vec_size","u32").declareVariables(p,f)} - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} - ${m}`},u=[{type:12,data:s},...ye(e,n)];return{name:"Expand",shaderCache:{hint:`${n.length}`,inputDependencies:["rank"]},getShaderSource:o,getRunData:()=>({outputs:[{dims:n,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(s/64)},programUniforms:u})}},Zf=t=>{Od(t.inputs),t.compute(Pd(t.inputs),{inputs:[0]})}}),Rd,em,fy=Z(()=>{$e(),Ae(),Te(),Xo(),Rd=t=>{let e=t[0].dataType,r=Y.size(t[0].dims),n=Y.size(t[1].dims),a=n%4===0,i=s=>{let o=Q("x",e,[1],4),u=Q("bias",e,[1],4),l=ge("y",e,[1],4),p=[{name:"output_vec_size",type:"u32"},{name:"bias_size",type:"u32"}],f=c=>` - let bias${c}_offset: u32 = (global_idx * 4 + ${c}) % uniforms.bias_size; - let bias${c} = ${u.getByOffset(`bias${c}_offset / 4`)}[bias${c}_offset % 4];`,m=a?` - let bias = ${u.getByOffset("global_idx % (uniforms.bias_size / 4)")};`:`${f(0)}${f(1)}${f(2)}${f(3)} - let bias = ${o.type.value}(bias0, bias1, bias2, bias3);`;return`${s.registerUniforms(p).declareVariables(o,u,l)} - - ${wo(Tt(e))} - - ${s.mainStart(Cn)} - ${s.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_vec_size")} - - let x = ${o.getByOffset("global_idx")}; - ${m} - let x_in = x + bias; - ${l.setByOffset("global_idx",bo("x_in"))} - }`};return{name:"FastGeluWithBias",shaderCache:{hint:`${a}`,inputDependencies:["type","type"]},getShaderSource:i,getRunData:s=>({outputs:[{dims:s[0].dims,dataType:s[0].dataType}],programUniforms:[{type:12,data:Math.ceil(r/4)},{type:12,data:n}],dispatchGroup:{x:Math.ceil(r/Cn/4)}})}},em=t=>{t.inputs.length<2||Y.size(t.inputs[1].dims)===0?Sf(t):t.compute(Rd(t.inputs))}}),Bd,Dd,tm,rm,my=Z(()=>{$e(),Ae(),lt(),Te(),Bd=t=>{if(!t||t.length!==2)throw new Error("Gather requires 2 inputs.")},Dd=(t,e)=>{let r=t[0].dims,n=t[1].dims,a=r.length,i=Y.normalizeAxis(e.axis,a),s=r.slice(0);s.splice(i,1,...n);let o=r[i],u=t[0].dataType===9?4:1,l=Math.ceil(Y.size(s)/u),p=[{type:12,data:l},{type:6,data:o},{type:12,data:i},...ye(t[0].dims,t[1].dims,s)],f=m=>{let c=Q("data",t[0].dataType,t[0].dims.length,u),y=Q("inputIndices",t[1].dataType,t[1].dims.length),w=ge("output",t[0].dataType,s.length,u),v=$=>{let C=n.length,T=`var indicesIndices${$} = ${y.type.indices}(0);`;for(let A=0;A1?`indicesIndices${$}[${A}]`:`indicesIndices${$}`} = ${s.length>1?`outputIndices${$}[uniforms.axis + ${A}]`:`outputIndices${$}`};`;T+=` - var idx${$} = ${y.getByIndices(`indicesIndices${$}`)}; - if (idx${$} < 0) { - idx${$} = idx${$} + uniforms.axisDimLimit; - } - var dataIndices${$} : ${c.type.indices}; - `;for(let A=0,B=0;A1?`dataIndices${$}[${A}]`:`dataIndices${$}`} = u32(idx${$});`,B+=C):(T+=`${a>1?`dataIndices${$}[${A}]`:`dataIndices${$}`} = ${s.length>1?`outputIndices${$}[${B}]`:`outputIndices${$}`};`,B++);return T},k;if(t[0].dataType===9){let $=(C,T,A="")=>` - let outputIndices${T} = ${w.offsetToIndices(`outputOffset + ${T}u`)}; - ${v(T)}; - let offset${T} = ${c.indicesToOffset(`dataIndices${T}`)}; - let index${T} = offset${T} / 4u; - let component${T} = offset${T} % 4u; - ${C}[${T}] = ${A}(${c.getByOffset(`index${T}`)}[component${T}]); - `;k=` - let outputOffset = global_idx * ${u}; - var value = vec4(0); - ${$("value",0,"u32")} - ${$("value",1,"u32")} - ${$("value",2,"u32")} - ${$("value",3,"u32")} - ${w.setByOffset("global_idx","value")} - `}else k=` - let outputIndices = ${w.offsetToIndices("global_idx")}; - ${v("")}; - let value = ${c.getByIndices("dataIndices")}; - ${w.setByOffset("global_idx","value")}; - `;return` - ${m.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(c,y,w)} - ${m.mainStart()} - ${m.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - ${k} - }`};return{name:"Gather",shaderCache:{hint:e.cacheKey,inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:s,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(l/64)},programUniforms:p}),getShaderSource:f}},tm=t=>qe({axis:t.axis}),rm=(t,e)=>{let r=t.inputs;Bd(r),t.compute(Dd(t.inputs,e))}}),Nd,Fd,nm,am,gy=Z(()=>{$e(),Ae(),lt(),Te(),Nd=t=>{if(!t||t.length!==2)throw new Error("GatherElements requires 2 inputs.");if(t[0].dims.length<1)throw new Error("GatherElements requires that the data input be rank >= 1.");if(t[0].dims.length!==t[1].dims.length)throw new Error(`GatherElements requires that the data input and - indices input tensors be of same rank.`)},Fd=(t,e)=>{let r=t[0].dims,n=t[0].dataType,a=r.length,i=t[1].dims,s=t[1].dataType,o=Y.normalizeAxis(e.axis,a),u=r[o],l=i.slice(0),p=Y.size(l),f=Q("input",n,a),m=Q("indicesInput",s,i.length),c=ge("output",n,l.length),y=[{type:12,data:p},{type:6,data:u},{type:12,data:o}];return y.push(...ye(r,i,l)),{name:"GatherElements",shaderCache:{inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:l,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:y}),getShaderSource:w=>` - ${w.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(f,m,c)} - ${w.mainStart()} - ${w.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - - let outputIndices = ${c.offsetToIndices("global_idx")}; - - var idx = ${m.getByOffset("global_idx")}; - if (idx < 0) { - idx = idx + uniforms.axisDimLimit; - } - var inputIndices = ${f.type.indices}(outputIndices); - ${f.indicesSet("inputIndices","uniforms.axis","u32(idx)")}; - let value = ${f.getByIndices("inputIndices")}; - - ${c.setByOffset("global_idx","value")}; - }`}},nm=t=>qe({axis:t.axis}),am=(t,e)=>{let r=t.inputs;Nd(r),t.compute(Fd(t.inputs,e))}}),Ld,Ud,im,sm,_y=Z(()=>{$e(),Ae(),Te(),Ld=t=>{if(!t)throw new Error("Input is missing");if(t.length<2||t.length>3)throw new Error("Invaid input number.");if(t.length===3&&t[2].dims.length>2)throw new Error("Invalid input shape of C");if(t[0].dataType!==t[1].dataType||t.length===3&&t[0].dataType!==t[2].dataType)throw new Error("Input types are mismatched")},Ud=(t,e)=>{let r=t[0].dims.slice(),n=t[1].dims.slice(),[a,i,s]=hh.getShapeOfGemmResult(r,e.transA,n,e.transB,t.length===3?t[2].dims:void 0),o=[a,i];if(!o)throw new Error("Can't use gemm on the given tensors");let u=Y.size(o),l=[{type:12,data:u},{type:12,data:a},{type:12,data:i},{type:12,data:s},{type:1,data:e.alpha},{type:1,data:e.beta}],p=["type","type"];t.length===3&&(l.push(...ye(t[2].dims)),p.push("rank")),l.push(...ye(o));let f=m=>{let c="";e.transA&&e.transB?c="value += a[k * uniforms.M + m] * b[n * uniforms.K + k];":e.transA&&!e.transB?c="value += a[k * uniforms.M + m] * b[k * uniforms.N + n];":!e.transA&&e.transB?c="value += a[m * uniforms.K + k] * b[n * uniforms.K + k];":!e.transA&&!e.transB&&(c="value += a[m * uniforms.K + k] * b[k * uniforms.N + n];");let y=e.alpha===1?"":"value *= uniforms.alpha;",w=Q("a",t[0].dataType,t[0].dims),v=Q("b",t[1].dataType,t[1].dims),k=w.type.value,$=null,C=[w,v];t.length===3&&($=Q("c",t[2].dataType,t[2].dims.length),C.push($));let T=ge("output",t[0].dataType,o.length);C.push(T);let A=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"},{name:"alpha",type:"f32"},{name:"beta",type:"f32"}];return` - ${m.registerUniforms(A).declareVariables(...C)} - - ${m.mainStart()} - ${m.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - - let m = global_idx / uniforms.N; - let n = global_idx % uniforms.N; - - var value = ${k}(0); - for (var k: u32 = 0u; k < uniforms.K; k++) { - ${c} - } - - ${y} - ${$!=null?`let cOffset = ${$.broadcastedIndicesToOffset("vec2(m, n)",T)}; value += ${k}(uniforms.beta) * ${$.getByOffset("cOffset")};`:""} - output[global_idx] = value; - }`};return{name:"Gemm",shaderCache:{hint:`${e.cacheKey}`,inputDependencies:p},getRunData:()=>({outputs:[{dims:o,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(u/64)},programUniforms:l}),getShaderSource:f}},im=t=>{let e=t.transA,r=t.transB,n=t.alpha,a=t.beta;return{transA:e,transB:r,alpha:n,beta:a,cacheKey:`${t.transA};${t.transB};${t.alpha===1}`}},sm=(t,e)=>{Ld(t.inputs),t.compute(Ud(t.inputs,e))}}),Wd,Vd,Gd,om,yy=Z(()=>{$e(),Ae(),Te(),Wd=(t,e)=>{let r=t[0].dims,n=r,a=2,i=Y.sizeToDimension(r,a),s=Y.sizeFromDimension(r,a),o=it(s),u=s/o,l=[r[0],r[1],u],p=["rank","type","type"],f=[{type:12,data:s},{type:12,data:u}];f.push(...ye(l,l));let m=c=>{let y=Q("x",t[0].dataType,l.length,o),w=Q("scale",t[1].dataType,t[1].dims),v=Q("bias",t[2].dataType,t[2].dims),k=ge("output",t[0].dataType,l.length,o),$=[y,w,v,k],C=y.type.value,T=o===1?"f32":`vec${o}`,A=64,B=[{name:"normSize",type:"u32"},{name:"normPackedSize",type:"u32"}];return` - var meanShared : f32; - var squaredNormShared : f32; - var workgroupShared : array<${T}, ${A}>; - const workgroupSize = ${A}u; - ${c.registerUniforms(B).declareVariables(...$)} - ${c.mainStart(A)} - let norm = global_idx / workgroupSize; - let batch = norm / uniforms.x_shape[1]; - let channel = norm % uniforms.x_shape[1]; - let localIndex = local_id.x; - - // initialize workgroup memory - var initial = ${T}(0); - for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) { - initial = initial + ${T}(${y.get("batch","channel","h")}); - } - workgroupShared[localIndex] = initial; - workgroupBarrier(); - - // Calculate the mean of current channel data. - for (var currSize = workgroupSize >> 1; currSize > 0; currSize = currSize >> 1) { - if (localIndex < currSize) { - workgroupShared[localIndex] = workgroupShared[localIndex] + workgroupShared[localIndex + currSize]; - } - workgroupBarrier(); - } - if (localIndex == 0) { - meanShared = ${Or("workgroupShared[0]",o)} / f32(uniforms.normSize); - } - workgroupBarrier(); - - // reinitialize workgroup memory. - initial = ${T}(0); - for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) { - let deviation = ${T}(${y.get("batch","channel","h")}) - ${T}(meanShared); - initial = initial + deviation * deviation; - } - workgroupShared[localIndex] = initial; - workgroupBarrier(); - - // Calculate the sum of square of deviation of current channel data. - for (var currSize = workgroupSize >> 1; currSize > 0; currSize = currSize >> 1) { - if (localIndex < currSize) { - workgroupShared[localIndex] = workgroupShared[localIndex] + workgroupShared[localIndex + currSize]; - } - workgroupBarrier(); - } - if (localIndex == 0) { - squaredNormShared = ${Or("workgroupShared[0]",o)}; - } - workgroupBarrier(); - - let invStdDev = inverseSqrt(squaredNormShared / f32(uniforms.normSize) + f32(${e.epsilon})); - let channelScale = invStdDev * f32(${w.getByOffset("channel")}); - let channelShift = f32(${v.getByOffset("channel")}) - meanShared * channelScale; - for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) { - let value = ${y.get("batch","channel","h")} * ${C}(${T}(channelScale)) + ${C}(${T}(channelShift)); - ${k.set("batch","channel","h","value")}; - } - }`};return{name:"InstanceNormalization",shaderCache:{hint:`${e.epsilon};${o}`,inputDependencies:p},getRunData:()=>({outputs:[{dims:n,dataType:t[0].dataType}],dispatchGroup:{x:i},programUniforms:f}),getShaderSource:m}},Vd=(t,e,r,n,a,i,s,o)=>{let u=it(s),l=64,p=u===1?"vec2f":`mat2x${u}f`,f=u===1?"f32":`vec${u}f`,m=(B,R)=>`${p}(${B}, ${R})`,c=a*s/u,y=Math.ceil(i/l),w=["type"],v=[{type:12,data:y},{type:12,data:i},{type:12,data:Math.floor(s/u)},{type:12,data:Math.floor(i*s/u)}],k=B=>{let R=Q("input",e.dataType,e.dims,u);return` - ${B.declareVariables(R)} - @group(0) @binding(1) var output : array<${p}>; - struct Uniforms {wg_size:u32, H:u32, C:u32, image_size:u32}; - @group(0) @binding(2) var uniforms: Uniforms; - - ${B.mainStart(l)} - let currentImageNumber = global_idx / ${l} / uniforms.C; - let currentChannelNumber = (global_idx / ${l}) % uniforms.C; - let wgOffset = local_id.x * uniforms.wg_size; - if (wgOffset >= uniforms.H) { - return; - } - let wgMax = min(wgOffset + uniforms.wg_size, uniforms.H); - - let offset = currentImageNumber * uniforms.image_size + currentChannelNumber; - var sum = ${wr("f32",u)}; - var squaredSum = ${wr("f32",u)}; - for (var i: u32 = wgOffset; i < wgMax; i++) { - let value = ${f}(input[offset + i * uniforms.C]); - sum += value; - squaredSum += value * value; - } - output[global_idx] = ${m("sum","squaredSum")}; - }`},$=t.compute({name:"InstanceNormComputeMean",shaderCache:{hint:`${u}`,inputDependencies:w},getRunData:()=>({outputs:[{dims:[a,s,l,2],dataType:1}],dispatchGroup:{x:a*s/u},programUniforms:v}),getShaderSource:k},{inputs:[e],outputs:[-1]})[0],C=[{type:12,data:c},{type:12,data:i},{type:12,data:Math.floor(s/u)},{type:12,data:Math.floor(l*s/u)}],T=["type","type","type"],A=B=>{let R=Q("scale",r.dataType,r.dims,u),D=Q("bias",n.dataType,n.dims,u);return` - @group(0) @binding(0) var input : array<${p}>; - @group(0) @binding(1) var scale : array<${R.type.storage}>; - @group(0) @binding(2) var bias : array<${D.type.storage}>; - @group(0) @binding(3) var output : array<${p}>; - struct Uniforms {units_of_work : u32, H: u32, C : u32, image_size : u32}; - @group(0) @binding(4) var uniforms: Uniforms; - - ${B.mainStart()} - ${B.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.units_of_work")} - let currentImageNumber = global_idx / uniforms.C; - let currentChannelNumber = global_idx % uniforms.C; - - let offset = currentImageNumber * uniforms.image_size; - var sum = ${wr("f32",u)}; - var squaredSum = ${wr("f32",u)}; - for (var i: u32 = 0; i < min(${l}, uniforms.H); i++) { - let value = input[offset + i + currentChannelNumber * ${l}]; - sum += value[0]; - squaredSum += value[1]; - } - sum = sum / f32(uniforms.H); - squaredSum = squaredSum / f32(uniforms.H); - let invStdDev = inverseSqrt(squaredSum - sum * sum + f32(${o})); - let channelScale = invStdDev * ${f}(scale[currentChannelNumber]); - let channelShift = ${f}(bias[currentChannelNumber]) - sum * channelScale; - - output[global_idx] = ${m("channelScale","channelShift")}; - }`};return t.compute({name:"InstanceNormComputeChannelScaleShift",shaderCache:{hint:`${u};${o}`,inputDependencies:T},getRunData:()=>({outputs:[{dims:[a,s,2],dataType:1}],dispatchGroup:{x:Math.ceil(c/64)},programUniforms:C}),getShaderSource:A},{inputs:[$,r,n],outputs:[-1]})[0]},Gd=(t,e,r)=>{let n=e[0].dims,a=n,i=n[0],s=n[n.length-1],o=Y.sizeFromDimension(n,1)/s,u=it(s),l=Y.size(a)/u,p=[{type:12,data:o},{type:12,data:Math.floor(s/u)}],f=["type","type"],m=Vd(t,e[0],e[1],e[2],i,o,s,r.epsilon),c=y=>{let w=pt(e[0].dataType),v=u===1?"vec2f":`mat2x${u}f`,k=u===1?w:`vec${u}<${w}>`,$=Q("input",e[0].dataType,e[0].dims,u),C=ge("output",e[0].dataType,a,u);return` - @group(0) @binding(0) var input : array<${$.type.storage}>; - @group(0) @binding(1) var scaleInput : array<${v}>; - @group(0) @binding(2) var output : array<${C.type.storage}>; - struct Uniforms {H: u32, C : u32}; - @group(0) @binding(3) var uniforms: Uniforms; - - ${y.mainStart()} - let currentImageNumber = global_idx / (uniforms.C * uniforms.H); - let currentChannelNumber = global_idx % uniforms.C; - - let scaleOffset = currentImageNumber * uniforms.C + currentChannelNumber; - let scale = scaleInput[scaleOffset]; - output[global_idx] = fma(input[global_idx], ${k}(scale[0]), ${k}(scale[1])); - }`};t.compute({name:"InstanceNormalizationNHWC",shaderCache:{hint:`${u}`,inputDependencies:f},getRunData:()=>({outputs:[{dims:a,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(l/64)},programUniforms:p}),getShaderSource:c},{inputs:[e[0],m]})},om=(t,e)=>{e.format==="NHWC"?Gd(t,t.inputs,e):t.compute(Wd(t.inputs,e))}}),Hd,jd,um,wy=Z(()=>{$e(),Ae(),Te(),Hd=t=>{if(!t||t.length<2)throw new Error("layerNorm requires at least 2 inputs.")},jd=(t,e,r)=>{let n=e.simplified,a=t[0].dims,i=t[1],s=!n&&t[2],o=a,u=Y.normalizeAxis(e.axis,a.length),l=Y.sizeToDimension(a,u),p=Y.sizeFromDimension(a,u),f=Y.size(i.dims),m=s?Y.size(s.dims):0;if(f!==p||s&&m!==p)throw new Error(`Size of X.shape()[axis:] == ${p}. - Size of scale and bias (if provided) must match this. - Got scale size of ${f} and bias size of ${m}`);let c=[];for(let A=0;A1,$=r>2,C=A=>{let B=pt(t[0].dataType),R=[Q("x",t[0].dataType,t[0].dims,y),Q("scale",i.dataType,i.dims,y)];s&&R.push(Q("bias",s.dataType,s.dims,y)),R.push(ge("output",t[0].dataType,o,y)),k&&R.push(ge("mean_data_output",1,c)),$&&R.push(ge("inv_std_output",1,c));let D=[{name:"norm_count",type:"u32"},{name:"norm_size",type:"f32"},{name:"norm_size_vectorized",type:"u32"},{name:"epsilon",type:"f32"}];return` - ${A.registerUniforms(D).declareVariables(...R)} - ${A.mainStart()} - ${A.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.norm_count")} - let offset = global_idx * uniforms.norm_size_vectorized; - var mean_vector = ${wr("f32",y)}; - var mean_square_vector = ${wr("f32",y)}; - - for (var h: u32 = 0u; h < uniforms.norm_size_vectorized; h++) { - let value = ${Sn(B,y,"x[h + offset]")}; - mean_vector += value; - mean_square_vector += value * value; - } - let mean = ${Or("mean_vector",y)} / uniforms.norm_size; - let inv_std_dev = inverseSqrt(${Or("mean_square_vector",y)} / uniforms.norm_size ${n?"":"- mean * mean"} + uniforms.epsilon); - - for (var j: u32 = 0; j < uniforms.norm_size_vectorized; j++) { - let f32input = ${Sn(B,y,"x[j + offset]")}; - let f32scale = ${Sn(B,y,"scale[j]")}; - output[j + offset] = ${R[0].type.value}((f32input ${n?"":"- mean"}) * inv_std_dev * f32scale - ${s?`+ ${Sn(B,y,"bias[j]")}`:""} - ); - } - - ${k?"mean_data_output[global_idx] = mean":""}; - ${$?"inv_std_output[global_idx] = inv_std_dev":""}; - }`},T=[{dims:o,dataType:t[0].dataType}];return k&&T.push({dims:c,dataType:1}),$&&T.push({dims:c,dataType:1}),{name:"LayerNormalization",shaderCache:{hint:`${y};${r};${n}`,inputDependencies:w},getRunData:()=>({outputs:T,dispatchGroup:{x:Math.ceil(l/64)},programUniforms:v}),getShaderSource:C}},um=(t,e)=>{Hd(t.inputs),t.compute(jd(t.inputs,e,t.outputCount))}}),qd,Kd,lm,dm,by=Z(()=>{$e(),Ae(),lt(),Te(),qd=(t,e)=>{if(t.length<3||t.length>4)throw new Error("MatMulNBits requires 3 or 4 inputs");let r=t[0],n=r.dims.length;if(r.dims[n-1]!==e.k)throw new Error("The last dim of input shape does not match the k value");let a=Math.floor((e.k+e.blockSize-1)/e.blockSize),i=e.blockSize/8*e.bits,s=t[1];if(!Y.areEqual(s.dims,[e.n,a,i]))throw new Error("The second inputs must be 3D tensor with shape N X nBlocksPerCol X blobSize");let o=t[2].dims;if(Y.size(o)!==e.n*a)throw new Error("scales input size error.");if(t.length===4){let u=t[3].dims,l=e.bits>4?e.n*a:e.n*Math.floor((a+1)/2);if(Y.size(u)!==l)throw new Error("zeroPoints input size error.")}},Kd=(t,e,r,n)=>{let a=t[0].dims,i=a.length,s=Math.floor((e.k+e.blockSize-1)/e.blockSize),o=a[i-2],u=e.k,l=e.n,p=a.slice(0,i-2),f=Y.size(p),m=e.blockSize/8*e.bits/4,c=t[0].dataType,y=it(o),w=it(e.k),v=it(m),k=ga(c),$=o*s*k,C=Math.floor(n/$),T=s<=r[0]&&C>0,A=!T||C>=4?it(l):C>=2&&it(l)>=2?2:1,B=p.concat([o,l]),R=Y.size(B)/A/y,D=T?[]:[{type:12,data:R},{type:12,data:e.blockSize}],K=[f,o,u/w],j=Y.convertShape(t[1].dims).slice();j.splice(-1,1,m/v),D.push(...ye(K)),D.push(...ye(j)),D.push(...ye(t[2].dims)),t.length===4&&D.push(...ye(Y.convertShape(t[3].dims)));let ie=[f,o,l/A];D.push(...ye(ie));let te=oe=>{let re=K.length,M=Q("a",t[0].dataType,re,w),P=Q("b",12,j.length,v),H=Q("scales",t[2].dataType,t[2].dims.length),le=[M,P,H],G=t.length===4?Q("zero_points",12,t[3].dims.length):void 0;G&&le.push(G);let ne=ie.length,N=ge("output",t[0].dataType,ne,A),ae=[{name:"output_size",type:"u32"},{name:"block_size",type:"u32"}],fe=pt(t[0].dataType),Ce=(()=>{switch(w){case 1:return`array<${fe}, 8>`;case 2:return`mat4x2<${fe}>`;case 4:return`mat2x4<${fe}>`;default:throw new Error(`${w}-component is not supported.`)}})(),Be=` - for (var word: u32 = 0; word < ${m}; word += ${v}) { - ${P.indicesSet("b_indices","2","word")}; - let b_data = ${P.getByIndices("b_indices")}; - for (var i: u32 = 0; i < ${v}; i++) { - let b_value: u32 = ${v===1?"b_data":"b_data[word + i]"}; - let b_mask: u32 = 0x0F0F0F0Fu; - let b_value_lower: vec4 = unpack4xU8(b_value & b_mask); - let b_value_upper: vec4 = unpack4xU8((b_value >> 4) & b_mask); - let b_quantized_values = ${Ce}(${Array.from({length:4},(Qe,We)=>`${fe}(b_value_lower[${We}]), ${fe}(b_value_upper[${We}])`).join(", ")}); - let b_dequantized_values = ${w===1?`${Ce}(${Array.from({length:8},(Qe,We)=>`(b_quantized_values[${We}] - zero_point) * scale`).join(", ")});`:`(b_quantized_values - ${Ce}(${Array(8).fill("zero_point").join(",")})) * scale;`}; - // Number of B elements per 32-bit word is 32/bits = 32/4 = 8 - for (var m: u32 = 0; m < ${T?o:y}u; m++) { - ${M.indicesSet("a_indices",re-2,T?"m":`row * ${y} + m`)}; - ${M.indicesSet("a_indices",re-1,"word_offset")}; - var input_offset = ${M.indicesToOffset("a_indices")}; - var a_data: ${Ce}; - for (var j: u32 = 0; j < ${8/w}; j++) { - a_data[j] = ${M.getByOffset("input_offset")}; - input_offset++; - } - ${T?"workgroup_shared[workgroup_shared_offset + m]":"output_values[m]"}${A>1?"[c]":""} += ${Array.from({length:8/w},(Qe,We)=>`${w===1?`a_data[${We}] * b_dequantized_values[${We}]`:`dot(a_data[${We}], b_dequantized_values[${We}])`}`).join(" + ")}; - } - word_offset += ${8/w}; - } - }`,Ke=G?` - zero_point_offset += 4; - if (zero_point_offset == 32) { - zero_point_offset = 0; - zero_point_index++; - zero_point_word = ${G.getByOffset("zero_point_index")}; - }`:"";return T?` - var workgroup_shared: array<${N.type.value}, ${o*s}>; - ${oe.declareVariables(...le,N)} - ${oe.mainStart([s,1,1])} - var a_indices: ${M.type.indices}; - var block = local_id.x; - var col = workgroup_id.y; - var batch = workgroup_id.z; - ${M.indicesSet("a_indices","0","batch")}; - // Two zero points are packed into one byte when uniforms.bits is 4. - for (var c: u32 = 0; c < ${A}; c++) { - let col_times_components_plus_c = col * ${A} + c; - ${G?` - var zero_point_bytes_per_col: u32 = (${s} + 1) / 2; - var zero_point_byte_count: u32 = col_times_components_plus_c * zero_point_bytes_per_col + (block >> 0x1u); - var zero_point_word_index: u32 = zero_point_byte_count >> 0x2u; - var zero_point_byte_offset: u32 = zero_point_byte_count & 0x3u; - var zero_point_nibble_offset: u32 = block & 0x1u; - var zero_point_bits_offset: u32 = (zero_point_byte_offset << 3) + (zero_point_nibble_offset << 2); - var zero_point_word: u32 = ${G.getByOffset("zero_point_word_index")} >> zero_point_bits_offset;`:""} - var b_indices: ${P.type.indices}; - ${P.indicesSet("b_indices","0","col_times_components_plus_c")}; - // The scale and zero points are computed per block. - var scales_index = col_times_components_plus_c * ${s} + block; - let scale = ${H.getByOffset("scales_index")}; - // The default zero point is 8 for unsigned 4-bit quantization. - let zero_point = ${fe}(${G?"(zero_point_word) & 0xFu":8}); - ${P.indicesSet("b_indices","1","block")}; - var word_offset: u32 = block * ${e.blockSize/w}; - var workgroup_shared_offset: u32 = block * ${o}; - ${Be} - } - workgroupBarrier(); - if (local_id.x == 0u) { - var output_indices: ${N.type.indices}; - ${N.indicesSet("output_indices","0","batch")}; - ${N.indicesSet("output_indices",ne-1,"col")}; - ${N.indicesSet("output_indices",ne-2,"0")}; - var output_offset = ${N.indicesToOffset("output_indices")}; - for (var m: u32 = 0u; m < ${o}u; m++) { - var output_value: ${N.type.value} = ${N.type.value}(0); - var workgroup_shared_offset: u32 = m; - for (var b: u32 = 0u; b < ${s}u; b++) { - output_value += workgroup_shared[workgroup_shared_offset]; - workgroup_shared_offset += ${o}; - } - ${N.setByOffset("output_offset","output_value")}; - output_offset += ${l/A}; - } - } - }`:` - ${oe.registerUniforms(ae).declareVariables(...le,N)} - ${oe.mainStart()} - ${oe.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - var output_values: array<${N.type.value}, ${y}>; - var output_indices = ${N.offsetToIndices("global_idx")}; - var col = ${N.indicesGet("output_indices",ne-1)}; - var row = ${N.indicesGet("output_indices",ne-2)}; - var a_indices: ${M.type.indices} = output_indices; - // Two zero points are packed into one byte because uniforms.bits <= 4. - // zero_point_offset is either 0 or 4. It is bit offset within one byte. - // TODO support zero_point_offset for bits > 4 - ${G?` - var zero_point_abs_offset = col * ${A} * ((${s} + 1) / 2); - var zero_point_index: u32 = zero_point_abs_offset / 4; - var zero_point_word: u32 = ${G.getByOffset("zero_point_index")}; - var zero_point_offset: u32 = (zero_point_abs_offset % 4) * 8;`:""} - var scale_index = col * ${s*A}; - var b_indices: ${P.type.indices}; - for (var c: u32 = 0; c < ${A}; c++) { - ${P.indicesSet("b_indices","0",`col * ${A} + c`)}; - var block_offset: u32 = 0; - for (var block: u32 = 0; block < ${s}; block++) { - // The scale and zero points are computed per block. - let scale = ${H.getByOffset("scale_index")}; - // The default zero point is 8 for unsigned 4-bit quantization. - let zero_point = ${fe}(${G?"extractBits(zero_point_word, zero_point_offset, 4)":8}); - ${P.indicesSet("b_indices","1","block")}; - var word_offset: u32 = block_offset; - ${Be} - scale_index++; - ${Ke} - block_offset += uniforms.block_size / ${w}; - } - // Drop the trailing 4 bits if the zero_poit_offset is not a byte boundary to align with the next byte. - ${G?`if (zero_point_offset % 8 > 0) { - ${Ke} - }`:""} - } - for (var k: u32 = 0u; k < ${y}u; k++) { - ${N.indicesSet("output_indices",ne-2,`${y} * row + k`)}; - ${N.setByIndices("output_indices","output_values[k]")} - } - }`};return{name:T?"BlockwiseMatMulNBits":"MatMulNBits",shaderCache:{hint:`${e.cacheKey};${o};${c};${t.length}`,inputDependencies:Array(t.length).fill("rank")},getRunData:()=>({outputs:[{dims:B,dataType:c}],name:T?"BlockwiseMatMulNBits":"MatMulNBits",dispatchGroup:T?{x:1,y:Math.ceil(l/A),z:f}:{x:Math.ceil(R/64)},programUniforms:D}),getShaderSource:te}},lm=(t,e)=>{qd(t.inputs,e);let r=t.getMaxComputeWorkgroupSizes(),n=t.getMaxComputeWorkgroupStoragesize();t.compute(Kd(t.inputs,e,r,n))},dm=t=>qe(t)}),yt,Yd,cm,Us,Xd,yi,pm,vy=Z(()=>{$e(),Ae(),lt(),Ho(),Vh(),Te(),Sa(),yt=(t,e)=>t.length>e&&t[e].dims.length>0&&Y.size(t[e].dims)>0?t[e]:void 0,Yd=(t,e)=>{let r=t[0],n=yt(t,1),a=yt(t,2),i=yt(t,3),s=yt(t,4),o=yt(t,5),u=yt(t,6),l=yt(t,7);if(r.dims.length!==3&&r.dims.length!==5)throw new Error("Input query is expected to have 3 or 5 dimensions");let p=!1,f=r.dims[0],m=r.dims[1],c=r.dims.length===3?p?r.dims[2]/3:r.dims[2]:e.numHeads*r.dims[4],y=m,w=0,v=0,k=Math.floor(c/e.numHeads);if(u&&l){if(u.dims.length!==4)throw new Error('Input "past_key" is expected to have 4 dimensions');if(u.dims[0]!==f||u.dims[1]!==e.numHeads||u.dims[3]!==k)throw new Error('Input "past_key" shape (batch_size, num_heads, past_sequence_length, head_size)');if(l.dims[0]!==f||l.dims[1]!==e.numHeads||l.dims[3]!==k)throw new Error('Input "past_value" shape (batch_size, num_heads, past_sequence_length, head_size)');if(u.dims[2]!==l.dims[2])throw new Error('Input "past_key" and "past_value" shall have same dim 2 (past_sequence_length)');if(l.dims.length!==4)throw new Error('Input "past_value" is expected to have 4 dimensions');w=u.dims[2],v=u.dims[2]}else if(u||l)throw new Error('Input "past_key" and "past_value" shall be both present or both absent');let $;if(n){if(r.dims.length!==3)throw new Error('Input "query" is expected to have 3 dimensions when key is given');if(n.dims.length<3||n.dims.length>5)throw new Error('Input "key" is expected to have 3, 4, or 5 dimensions');if(r.dims[0]!==n.dims[0])throw new Error('Input "query" and "key" shall have same dim 0 (batch size)');if(n.dims.length===3){if(n.dims[2]!==r.dims[2])throw new Error('Input "query" and "key" shall have same dim 2 (hidden_size)');$=2,y=n.dims[1]}else if(n.dims.length===5){if(n.dims[2]!==e.numHeads||n.dims[3]!==2||n.dims[4]!==k)throw new Error('Expect "key" shape (batch_size, kv_sequence_length, num_heads, 2, head_size) for packed kv');if(a)throw new Error('Expect "value" be none when "key" has packed kv format.');$=5,y=n.dims[1]}else{if(n.dims[1]!==e.numHeads||n.dims[3]!==k)throw new Error('Expect "key" shape (batch_size, num_heads, kv_sequence_length, head_size) for past_key');$=0,y=n.dims[2]}}else{if(r.dims.length!==3&&r.dims.length!==5)throw new Error('Input "query" is expected to have 3 or 5 dimensions when key is empty');if(r.dims.length===5&&(r.dims[2]!==e.numHeads||r.dims[3]!==3))throw new Error('Expect "query" shape (batch_size, kv_sequence_length, num_heads, 3, head_size) for packed kv');$=3}if(i){if(i.dims.length!==1)throw new Error('Input "bias" is expected to have 1 dimension');if(a&&r.dims.length===5&&r.dims[3]===2)throw new Error("bias is not allowed for packed kv.")}let C=0;if(s){C=8;let D=s.dims;throw D.length===1?D[0]===f?C=1:D[0]===3*f+2&&(C=3):D.length===2&&D[0]===f&&D[1]===y&&(C=5),C===8?new Error('Input "key_padding_mask" shape shall be (batch_size) or (batch_size, kv_sequence_length)'):new Error("Mask not supported")}let T=!1,A=c;if(a){if(a.dims.length!==3&&a.dims.length!==4)throw new Error('Input "value" is expected to have 3 or 4 dimensions');if(r.dims[0]!==a.dims[0])throw new Error('Input "query" and "value" shall have same dim 0 (batch_size)');if(a.dims.length===3){if(y!==a.dims[1])throw new Error('Input "key" and "value" shall have the same dim 1 (kv_sequence_length)');A=a.dims[2]}else{if(y!==a.dims[2])throw new Error('Input "past_key" and "past_value" shall have the same dim 2 (kv_sequence_length)');A=a.dims[1]*a.dims[3],T=!0}}let B=w+y,R=!1;if(s)throw new Error("Key padding mask is not supported");if(o){if(o.dims.length!==4)throw new Error('Input "relative_position_bias" is expected to have 4 dimensions');if(o.dims[0]!==f&&o.dims[0]!==1||o.dims[1]!==e.numHeads||o.dims[2]!==m||o.dims[3]!==B)throw new Error('Input "relative_position_bias" shape (batch_size, 1, sequence_length, kv_sequence_length)')}return{batchSize:f,sequenceLength:m,pastSequenceLength:w,kvSequenceLength:y,totalSequenceLength:B,maxSequenceLength:v,inputHiddenSize:0,hiddenSize:c,vHiddenSize:A,headSize:k,vHeadSize:Math.floor(A/e.numHeads),numHeads:e.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:e.maskFilterValue,maskType:C,scale:e.scale,broadcastResPosBias:R,passPastInKv:T,qkvFormat:$}},cm=t=>qe({...t}),Us=qe({perm:[0,2,1,3]}),Xd=(t,e,r,n,a,i,s)=>{let o=[n,a,i],u=Y.size(o),l=[{type:12,data:u},{type:12,data:s},{type:12,data:i}],p=f=>{let m=ge("qkv_with_bias",e.dataType,o),c=Q("qkv",e.dataType,o),y=Q("bias",r.dataType,o),w=[{name:"output_size",type:"u32"},{name:"bias_offset",type:"u32"},{name:"hidden_size",type:"u32"}];return` - ${f.registerUniforms(w).declareVariables(c,y,m)} - ${f.mainStart()} - ${f.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - let bias_offset_idx = (global_idx % uniforms.hidden_size) + uniforms.bias_offset; - - qkv_with_bias[global_idx] = qkv[global_idx] + bias[bias_offset_idx]; - }`};return t.compute({name:"MultiHeadAttentionAddBias",shaderCache:{inputDependencies:["type","type"]},getRunData:()=>({outputs:[{dims:o,dataType:e.dataType,gpuDataType:0}],dispatchGroup:{x:Math.ceil(u/64)},programUniforms:l}),getShaderSource:p},{inputs:[e,r],outputs:[-1]})[0]},yi=(t,e,r,n,a,i,s,o)=>{let u=i;if(s){if(n===1)throw new Error("AddBiasReshape is not implemented. Please export your model with packed QKV or KV");return u=Xd(t,i,s,e,n,r*a,o),u=u.reshape([e,n,r,a]),t.compute(vr(u,Us.perm),{inputs:[u],outputs:[-1]})[0]}else return i.dims.length===3&&(u=i.reshape([e,n,r,a])),t.compute(vr(u,Us.perm),{inputs:[u],outputs:[-1]})[0]},pm=(t,e)=>{let r=Yd(t.inputs,e),n=t.inputs[0],a=yt(t.inputs,1),i=yt(t.inputs,2),s=yt(t.inputs,3),o=yt(t.inputs,4),u=yt(t.inputs,5),l=yt(t.inputs,6),p=yt(t.inputs,7);if(n.dims.length===5)throw new Error("Packed QKV is not implemented");if(a?.dims.length===5)throw new Error("Packed KV is not implemented");let f=a&&i&&a.dims.length===4&&i.dims.length===4,m=yi(t,r.batchSize,r.numHeads,r.sequenceLength,r.headSize,n,s,0);if(f)return Wi(t,m,a,i,o,void 0,l,p,u,r,e);if(!a||!i)throw new Error("key and value must be provided");let c=yi(t,r.batchSize,r.numHeads,r.kvSequenceLength,r.headSize,a,s,r.hiddenSize),y=yi(t,r.batchSize,r.numHeads,r.kvSequenceLength,r.vHeadSize,i,s,2*r.hiddenSize);Wi(t,m,c,y,o,void 0,l,p,u,r,e)}}),Qd,Jd,Zd,ec,tc,rc,nc,ac,hm,$y=Z(()=>{$e(),Ae(),Te(),Qd=t=>{if(!t||t.length<1)throw new Error("Too few inputs");if(t[0].dataType!==1&&t[0].dataType!==10)throw new Error("Input type must be float or float16.");if(t.length>=2){let e=t[0].dims.length*2===t[1].dims[0];if(t.length===4&&(e=t[3].dims[0]*2===t[1].dims[0]),!e)throw new Error("The pads should be a 1D tensor of shape [2 * input_rank] or [2 * num_axes].")}},Jd=(t,e,r)=>{let n="";for(let a=e-1;a>=0;--a)n+=` - k = i32(${t.indicesGet("indices",a)}) - ${Se("uniforms.pads",a,r)}; - if (k < 0) { - break; - } - if (k >= i32(${Se("uniforms.x_shape",a,e)})) { - break; - } - offset += k * i32(${Se("uniforms.x_strides",a,e)}); - `;return` - value = ${t.type.value}(uniforms.constant_value); - for (var i = 0; i < 1; i++) { - var offset = 0; - var k = 0; - ${n} - value = x[offset]; - } - `},Zd=(t,e,r)=>{let n="";for(let a=e-1;a>=0;--a)n+=` - k = i32(${t.indicesGet("indices",a)}) - ${Se("uniforms.pads",a,r)}; - if (k < 0) { - k = -k; - } - { - let _2n_1 = 2 * (i32(${Se("uniforms.x_shape",a,e)}) - 1); - k = k % _2n_1; - if(k >= i32(${Se("uniforms.x_shape",a,e)})) { - k = _2n_1 - k; - } - } - offset += k * i32(${Se("uniforms.x_strides",a,e)}); - `;return` - var offset = 0; - var k = 0; - ${n} - value = x[offset]; - `},ec=(t,e,r)=>{let n="";for(let a=e-1;a>=0;--a)n+=` - k = i32(${t.indicesGet("indices",a)}) - ${Se("uniforms.pads",a,r)}; - if (k < 0) { - k = 0; - } - if (k >= i32(${Se("uniforms.x_shape",a,e)})) { - k = i32(${Se("uniforms.x_shape",a,e)}) - 1; - } - offset += k * i32(${Se("uniforms.x_strides",a,e)}); - `;return` - var offset = 0; - var k = 0; - ${n} - value = x[offset]; - `},tc=(t,e,r)=>{let n="";for(let a=e-1;a>=0;--a)n+=` - k = i32(${t.indicesGet("indices",a)}) - ${Se("uniforms.pads",a,r)}; - if (k < 0) { - k += i32(${Se("uniforms.x_shape",a,e)}]); - } - if (k >= i32(${Se("uniforms.x_shape",a,e)})) { - k -= i32(${Se("uniforms.x_shape",a,e)}); - } - offset += k * i32(${Se("uniforms.x_strides",a,e)}); - `;return` - var offset = 0; - var k = 0; - ${n} - value = x[offset]; - `},rc=(t,e,r)=>{switch(r.mode){case 0:return Jd(t,e,r.pads.length);case 1:return Zd(t,e,r.pads.length);case 2:return ec(t,e,r.pads.length);case 3:return tc(t,e,r.pads.length);default:throw new Error("Invalid mode")}},nc=(t,e)=>{let r=Y.padShape(t[0].dims.slice(),e.pads),n=t[0].dims,a=Y.size(r),i=[{type:12,data:a},{type:6,data:e.pads}];e.mode===0&&i.push({type:t[0].dataType,data:e.value}),i.push(...ye(t[0].dims,r));let s=["rank"],o=u=>{let l=ge("output",t[0].dataType,r.length),p=Q("x",t[0].dataType,n.length),f=p.type.value,m=rc(l,n.length,e),c=[{name:"output_size",type:"u32"},{name:"pads",type:"i32",length:e.pads.length}];return e.mode===0&&c.push({name:"constant_value",type:f}),` - ${u.registerUniforms(c).declareVariables(p,l)} - ${u.mainStart()} - ${u.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - - let indices = ${l.offsetToIndices("global_idx")}; - - var value = ${f}(0); - ${m} - output[global_idx] = value; - }`};return{name:"Pad",shaderCache:{hint:`${e.mode}`,inputDependencies:s},getRunData:()=>({outputs:[{dims:r,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(Y.size(r)/64)},programUniforms:i}),getShaderSource:o}},ac=(t,e)=>{if(t.length>1){let r=t[1].getBigInt64Array(),n=t.length>=3&&t[2].data?t[2].getFloat32Array()[0]:0,a=t[0].dims.length,i=new Int32Array(2*a).fill(0);if(t.length>=4){let o=t[3].getBigInt64Array();for(let u=0;ui[Number(u)]=Number(o));let s=[];return i.forEach(o=>s.push(o)),{mode:e.mode,value:n,pads:s}}else return e},hm=(t,e)=>{Qd(t.inputs);let r=ac(t.inputs,e);t.compute(nc(t.inputs,r),{inputs:[0]})}}),ra,Ws,Vs,Gs,Hs,ic,sc,js,qs,fm,mm,Ks,gm,_m,Ys,ym,wm,bm,vm,xy=Z(()=>{ar(),$e(),Ae(),Te(),ra=t=>{if(Ue.webgpu.validateInputContent&&(!t||t.length!==1))throw new Error("Pool ops requires 1 input.")},Ws=(t,e,r)=>{let n=e.format==="NHWC",a=t.dims.slice();n&&a.splice(1,0,a.pop());let i=Object.hasOwnProperty.call(e,"dilations"),s=e.kernelShape.slice(),o=e.strides.slice(),u=i?e.dilations.slice():[],l=e.pads.slice();Fi.adjustPoolAttributes(r,a,s,o,u,l);let p=Fi.computePoolOutputShape(r,a,o,u,s,l,e.autoPad),f=Object.assign({},e);i?Object.assign(f,{kernelShape:s,strides:o,pads:l,dilations:u,cacheKey:e.cacheKey}):Object.assign(f,{kernelShape:s,strides:o,pads:l,cacheKey:e.cacheKey});let m=p.slice();return m.push(m.splice(1,1)[0]),[f,n?m:p]},Vs=(t,e)=>{let r=e.format==="NHWC",n=Y.size(t),a=Y.size(e.kernelShape),i=[{type:12,data:n},{type:12,data:a}],s=[{name:"outputSize",type:"u32"},{name:"kernelSize",type:"u32"}];if(e.kernelShape.length<=2){let o=e.kernelShape[e.kernelShape.length-1],u=e.strides[e.strides.length-1],l=e.pads[e.pads.length/2-1],p=e.pads[e.pads.length-1],f=!!(l+p);i.push({type:12,data:o},{type:12,data:u},{type:12,data:l},{type:12,data:p}),s.push({name:"kw",type:"u32"},{name:"sw",type:"u32"},{name:"pwStart",type:"u32"},{name:"pwEnd",type:"u32"});let m=!1;if(e.kernelShape.length===2){let c=e.kernelShape[e.kernelShape.length-2],y=e.strides[e.strides.length-2],w=e.pads[e.pads.length/2-2],v=e.pads[e.pads.length-2];m=!!(w+v),i.push({type:12,data:c},{type:12,data:y},{type:12,data:w},{type:12,data:v}),s.push({name:"kh",type:"u32"},{name:"sh",type:"u32"},{name:"phStart",type:"u32"},{name:"phEnd",type:"u32"})}return[i,s,!0,f,m]}else{if(r)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let o=Y.computeStrides(e.kernelShape);i.push({type:12,data:o},{type:12,data:e.pads},{type:12,data:e.strides}),s.push({name:"kernelStrides",type:"u32",length:o.length},{name:"pads",type:"u32",length:e.pads.length},{name:"strides",type:"u32",length:e.strides.length});let u=e.pads.reduce((l,p)=>l+p);return[i,s,!!u,!1,!1]}},Gs=(t,e,r,n,a,i,s,o,u,l,p,f)=>{let m=a.format==="NHWC",c=e.type.value,y=ge("output",e.type.tensor,n);if(a.kernelShape.length<=2){let w="",v="",k="",$=r-(m?2:1);if(p?w=` - for (var i: u32 = 0u; i < uniforms.kw; i++) { - xIndices[${$}] = indices[${$}] * uniforms.sw - uniforms.pwStart + i; - if (xIndices[${$}] < 0 || xIndices[${$}] - >= uniforms.x_shape[${$}]) { - pad++; - continue; - } - let x_val = x[${e.indicesToOffset("xIndices")}]; - ${i} - }`:w=` - for (var i: u32 = 0u; i < uniforms.kw; i++) { - xIndices[${$}] = indices[${$}] * uniforms.sw - uniforms.pwStart + i; - let x_val = x[${e.indicesToOffset("xIndices")}]; - ${i} - }`,a.kernelShape.length===2){let C=r-(m?3:2);f?v=` - for (var j: u32 = 0u; j < uniforms.kh; j++) { - xIndices[${C}] = indices[${C}] * uniforms.sh - uniforms.phStart + j; - if (xIndices[${C}] < 0 || xIndices[${C}] >= uniforms.x_shape[${C}]) { - pad += i32(uniforms.kw); - continue; - } - `:v=` - for (var j: u32 = 0u; j < uniforms.kh; j++) { - xIndices[${C}] = indices[${C}] * uniforms.sh - uniforms.phStart + j; - `,k=` - } - `}return` - ${t.registerUniforms(u).declareVariables(e,y)} - - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - - let indices = ${y.offsetToIndices("global_idx")}; - var xIndices = ${y.offsetToIndices("global_idx")}; - - var value = ${c}(${o}); - var pad = 0; - ${v} - ${w} - ${k} - ${s} - - output[global_idx] = value; - }`}else{if(m)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let w=a.kernelShape.length,v=a.pads.length,k="";return l?k=` - if (xIndices[j] >= uniforms.x_shape[j]) { - pad++; - isPad = true; - break; - } - } - if (!isPad) { - let x_val = x[${e.indicesToOffset("xIndices")}]; - ${i} - }`:k=` - } - let x_val = x[${e.indicesToOffset("xIndices")}]; - ${i} - `,` - ${t.registerUniforms(u).declareVariables(e,y)} - - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - let indices = ${y.offsetToIndices("global_idx")}; - var xIndices = ${y.offsetToIndices("global_idx")}; - - var offsets: array; - - var value = ${c}(${o}); - var pad = 0; - var isPad = false; - - for (var i: u32 = 0u; i < uniforms.kernelSize; i++) { - var offset = i; - for (var j = 0u; j < ${w-1}u; j++) { - offsets[j] = offset / ${Se("uniforms.kernelStrides","j",w)}; - offset -= offsets[j] * ${Se("uniforms.kernelStrides","j",w)}; - } - offsets[${w-1}] = offset; - - isPad = false; - for (var j = ${r-w}u; j < ${r}u; j++) { - xIndices[j] = indices[j] * ${Se("uniforms.strides",`j - ${r-w}u`,w)} - + offsets[j - ${r-w}u] - ${Se("uniforms.pads","j - 2u",v)}; - ${k} - } - ${s} - - output[global_idx] = value; - }`}},Hs=t=>`${t.format};${t.ceilMode};${t.autoPad};${t.kernelShape.length}`,ic=t=>`${Hs(t)};${t.countIncludePad}`,sc=t=>`${Hs(t)};${t.storageOrder};${t.dilations}`,js=t=>({format:t.format,autoPad:["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][t.auto_pad],ceilMode:t.ceil_mode,kernelShape:t.kernel_shape,strides:t.strides,pads:t.pads}),qs=(t,e,r,n)=>{let[a,i]=Ws(e,n,r),s=Q("x",e.dataType,e.dims.length),o=s.type.value,u="value += x_val;",l="";a.countIncludePad?l+=`value /= ${o}(uniforms.kernelSize);`:l+=`value /= ${o}(i32(uniforms.kernelSize) - pad);`;let[p,f,m,c,y]=Vs(i,a);p.push(...ye(e.dims,i));let w=["rank"];return{name:t,shaderCache:{hint:`${n.cacheKey};${m};${c};${y}`,inputDependencies:w},getRunData:()=>({outputs:[{dims:i,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(Y.size(i)/64)},programUniforms:p}),getShaderSource:v=>Gs(v,s,e.dims.length,i.length,a,u,l,0,f,m,c,y)}},fm=t=>{let e=t.count_include_pad!==0,r=js(t);if(r.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for AveragePool");let n={countIncludePad:e,...r,cacheKey:""};return{...n,cacheKey:ic(n)}},mm=(t,e)=>{ra(t.inputs),t.compute(qs("AveragePool",t.inputs[0],!1,e))},Ks={autoPad:"",ceilMode:0,countIncludePad:!1,kernelShape:[],strides:[],pads:[],storageOrder:0,dilations:[]},gm=t=>{let e=t.format;return{format:e,...Ks,cacheKey:e}},_m=(t,e)=>{ra(t.inputs),t.compute(qs("GlobalAveragePool",t.inputs[0],!0,e))},Ys=(t,e,r,n)=>{let[a,i]=Ws(e,n,r),s=` - value = max(x_val, value); - `,o="",u=Q("x",e.dataType,e.dims.length),l=["rank"],[p,f,m,c,y]=Vs(i,a);return p.push(...ye(e.dims,i)),{name:t,shaderCache:{hint:`${n.cacheKey};${m};${c};${y}`,inputDependencies:l},getRunData:()=>({outputs:[{dims:i,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(Y.size(i)/64)},programUniforms:p}),getShaderSource:w=>Gs(w,u,e.dims.length,i.length,a,s,o,e.dataType===10?-65504:-1e5,f,m,c,y)}},ym=(t,e)=>{ra(t.inputs),t.compute(Ys("MaxPool",t.inputs[0],!1,e))},wm=t=>{let e=t.storage_order,r=t.dilations,n=js(t);if(e!==0)throw new Error("column major storage order is not yet supported for MaxPool");if(n.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for MaxPool");let a={storageOrder:e,dilations:r,...n,cacheKey:""};return{...a,cacheKey:sc(a)}},bm=t=>{let e=t.format;return{format:e,...Ks,cacheKey:e}},vm=(t,e)=>{ra(t.inputs),t.compute(Ys("GlobalMaxPool",t.inputs[0],!0,e))}}),oc,uc,$m,Sy=Z(()=>{ar(),$e(),Te(),oc=(t,e,r)=>{let n=t===e,a=te&&r>0;if(n||a||i)throw new Error("Range these inputs' contents are invalid.")},uc=(t,e,r,n)=>{let a=Math.abs(Math.ceil((e-t)/r)),i=[a],s=a,o=[{type:12,data:s},{type:n,data:t},{type:n,data:r},...ye(i)],u=l=>{let p=ge("output",n,i.length),f=p.type.value,m=[{name:"outputSize",type:"u32"},{name:"start",type:f},{name:"delta",type:f}];return` - ${l.registerUniforms(m).declareVariables(p)} - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - output[global_idx] = uniforms.start + ${f}(global_idx) * uniforms.delta; - }`};return{name:"Range",shaderCache:{hint:`${n}`},getShaderSource:u,getRunData:()=>({outputs:[{dims:i,dataType:n}],dispatchGroup:{x:Math.ceil(s/64)},programUniforms:o})}},$m=t=>{let e=0,r=0,n=0;t.inputs[0].dataType===6?(e=t.inputs[0].getInt32Array()[0],r=t.inputs[1].getInt32Array()[0],n=t.inputs[2].getInt32Array()[0]):t.inputs[0].dataType===1&&(e=t.inputs[0].getFloat32Array()[0],r=t.inputs[1].getFloat32Array()[0],n=t.inputs[2].getFloat32Array()[0]),Ue.webgpu.validateInputContent&&oc(e,r,n),t.compute(uc(e,r,n,t.inputs[0].dataType),{inputs:[]})}}),lc,dc,cc,pc,hc,fc,mc,gc,_c,yc,wc,Xs,bc,vc,$c,xc,Sc,xm,Sm,ky=Z(()=>{$e(),Ae(),lt(),Te(),lc=(t,e)=>{if(t.every(r=>r>0||(()=>{throw new Error("Resize requires scales input values to be positive")})),t.length>0){if(e.mode==="linear"){if(!(t.length===2||t.length===3||t.length===4&&t[0]===1&&t[1]===1||t.length===4&&t[0]===1&&t[3]===1||t.length===5&&t[0]===1&&t[1]===1))throw new Error(`For linear mode, Resize requires scales to be 2D, 3D, 4D with either two outermost or one innermost and - one outermost scale values equal to 1, or 5D with two outermost scale values equal to 1`)}else if(e.mode==="cubic"&&!(t.length===2||t.length===4&&t[0]===1&&t[1]===1||t.length===4&&t[0]===1&&t[3]===1))throw new Error("Resize requires scales input size to be 2 or 4 for cubic mode")}},dc=(t,e,r)=>{e.every(a=>a>=0&&a{throw new Error("Resize requires axes input values to be positive and less than rank")}));let n=new Array(r).fill(1);return e.forEach((a,i)=>n[a]=t[i]),n},cc=(t,e,r,n,a,i)=>{let[s,o,u]=r>10?[1,2,3]:[-1,t.length>1?1:-1,-1],l=t[0].dims.length;if(s>0&&t.length>s&&t[s].dims.length>0)t[s].getFloat32Array().forEach(p=>i.push(p));else if(e.coordinateTransformMode==="tf_crop_and_resize")throw new Error("Resize requires RoI input to be specified when coordinateTransformMode is tfCropAndResize");if(o>0&&t.length>o&&t[o].dims.length>0){if(t[o].getFloat32Array().forEach(p=>n.push(p)),n.length!==0&&n.length!==l&&r>=18&&n.length!==e.axes.length)throw new Error("Resize requires scales input size to be same as input rank or axes size for opset 18 and up");lc(n,e),e.axes.length>0&&dc(n,e.axes,l).forEach((p,f)=>n[f]=p)}if(u>0&&t.length>u&&(t[u].getBigInt64Array().forEach(p=>a.push(Number(p))),a.length!==l||r>=18&&a.length===e.axes.length))throw new Error("Resize requires sizes input size to be same as input rank or axes size for opset 18 and up");if(e.axes.length>0){if(n.length!==e.axes.length)throw new Error('Resize requires "scales" input size to be of axes rank when axes attributes is specified');if(a.length!==e.axes.length)throw new Error('Resize requires "sizes" input size to be of rank axes rank when axes attributes is specified')}if(typeof n<"u"&&typeof a<"u"&&n.length>0&&a.length>l)throw new Error("Resize requires only of scales or sizes to be specified")},pc=(t,e)=>`fn getOriginalCoordinateFromResizedCoordinate(xResized: u32, xScale: f32, lengthResized: u32, - lengthOriginal: u32, roiStart: f32, roiEnd: f32) -> ${e} { `+(()=>{switch(t){case"asymmetric":return`return ${e}(xResized) / ${e}(xScale);`;case"pytorch_half_pixel":return`if (lengthResized > 1) { - return (${e}(xResized) + 0.5) / ${e}(xScale) - 0.5; - } else { - return 0.0; - }`;case"tf_half_pixel_for_nn":return`return (${e}(xResized) + 0.5) / ${e}(xScale);`;case"align_corners":return`if (lengthResized == 1) { - return 0.0; - } else { - // The whole part and the fractional part are calculated separately due to inaccuracy of floating - // point division. As an example, f32(21) / f32(7) may evaluate to 2.99... instead of 3, causing an - // offset-by-one error later in floor(). - let whole = ${e}(xResized * (lengthOriginal - 1) / (lengthResized - 1)); - let fract = - ${e}(xResized * (lengthOriginal - 1) % (lengthResized - 1)) / ${e}(lengthResized - 1); - return whole + fract; - }`;case"tf_crop_and_resize":return`if (lengthResized > 1) { - return ${e}(roiStart) * ${e}(lengthOriginal - 1) + - (${e}(xResized) * ${e}(roiEnd - roiStart) * ${e}(lengthOriginal - 1)) / - ${e}(lengthResized - 1); - } else { - return 0.5 * ${e}(roiStart + roiEnd) * ${e}(lengthOriginal - 1); - }`;case"half_pixel_symmetric":return`const outputWidth = ${e}xScale * ${e}(lengthResized); - const adjustment = ${e}(lengthResized) / outputWidth; - const center = ${e}(lengthOriginal) / 2; - const offset = center * (1 - adjustment); - return offset + ((${e}(xResized) + 0.5) / ${e}(xScale)) - 0.5;`;case"half_pixel":return`return ((${e}(xResized) + 0.5) / ${e}(xScale)) - 0.5;`;default:throw new Error(`Coordinate transform mode ${t} is not supported`)}})()+"}",hc=(t,e,r)=>`fn getNearestPixelFromOriginal(xOriginal: ${r}, isDownSample: bool) -> ${r} {`+(()=>{switch(t){case"round_prefer_ceil":return"if (fract(xOriginal) == 0.5) { return ceil(xOriginal); } else { return round(xOriginal); }";case"floor":return"return floor(xOriginal);";case"ceil":return"return ceil(xOriginal);";case"round_prefer_floor":return"if (fract(xOriginal) == 0.5) { return floor(xOriginal); } else { return round(xOriginal); }";case"simple":default:if(e<11)return"if (isDownSample) { return ceil(xOriginal); } else { return xOriginal; }";throw new Error(`Nearest mode ${t} is not supported`)}})()+"}",fc=(t,e,r)=>{let n=new Array(r).fill(0).concat(new Array(r).fill(1)),a=t.length===0?n:t.slice();return e.length>0?(e.forEach((i,s)=>{n[i]=a[s],n[s+r]=a[e.length+s]}),n):a},mc=(t,e,r,n)=>{let a=[];if(r.length>0)if(n.length>0){if(t.forEach(i=>a.push(i)),Math.max(...n)>t.length)throw new Error("axes is out of bound");n.forEach((i,s)=>a[i]=r[s])}else r.forEach(i=>a.push(i));else{if(e.length===0)throw new Error("Resize requires either scales or sizes.");a=t.map((i,s)=>Math.round(i*e[s]))}return a},gc=(t,e,r)=>{let n=(()=>{switch(r.keepAspectRatioPolicy){case"not_larger":return r.axes.length>0?Math.min(...r.axes.map(i=>e[i]),Number.MAX_VALUE):Math.min(...e,Number.MAX_VALUE);case"not_smaller":return r.axes.length>0?Math.max(...r.axes.map(i=>e[i]),Number.MIN_VALUE):Math.max(...e,Number.MIN_VALUE);default:throw new Error(`Keep aspect ratio policy ${r.keepAspectRatioPolicy} is not supported`)}})();e.fill(1,0,e.length);let a=t.slice();return r.axes.length>0?(r.axes.forEach(i=>e[i]=n),r.axes.forEach(i=>a[i]=Math.round(t[i]*e[i]))):(e.fill(n,0,e.length),a.forEach((i,s)=>a[s]=Math.round(i*e[s]))),a},_c=(t,e,r,n,a)=>` - fn calculateOriginalIndicesFromOutputIndices(output_indices: ${t.type.indices}) -> array<${t.type.value}, ${r.length}> { - var original_indices: array<${t.type.value}, ${r.length}>; - for (var i:u32 = 0; i < ${r.length}; i++) { - var output_index = ${t.indicesGet("output_indices","i")}; - var scale = ${Se("uniforms.scales","i",n)}; - var roi_low = ${Se("uniforms.roi","i",a)}; - var roi_hi = ${Se("uniforms.roi",`i + ${e.length}`,a)}; - if (scale == 1.0) { - original_indices[i] = ${t.type.value}(output_index); - } else { - var input_shape_i = ${Se("uniforms.input_shape","i",e.length)}; - var output_shape_i = ${Se("uniforms.output_shape","i",r.length)}; - original_indices[i] = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i, - input_shape_i, roi_low, roi_hi); - } - } - return original_indices; - }`,yc=(t,e,r,n,a,i,s)=>` - fn calculateInputIndicesFromOutputIndices(output_indices: ${e.type.indices}) -> ${t.type.indices} { - var input_indices: ${t.type.indices}; - for (var i:u32 = 0; i < ${n.length}; i++) { - var output_index = ${e.indicesGet("output_indices","i")}; - var input_index: u32; - var scale = ${Se("uniforms.scales","i",a)}; - if (scale == 1.0) { - input_index = output_index; - } else { - var roi_low = ${Se("uniforms.roi","i",i)}; - var roi_hi = ${Se("uniforms.roi",`i + ${r.length}`,i)}; - var input_shape_i = ${Se("uniforms.input_shape","i",r.length)}; - var output_shape_i = ${Se("uniforms.output_shape","i",n.length)}; - var original_idx = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i, - input_shape_i, roi_low, roi_hi); - if (!${s} || (original_idx >= 0 && original_idx < ${e.type.value}(input_shape_i))) { - if (original_idx < 0) { - input_index = 0; - } else if (original_idx > ${e.type.value}(input_shape_i - 1)) { - input_index = input_shape_i - 1; - } else { - input_index = u32(getNearestPixelFromOriginal(original_idx, scale < 1)); - } - } else { - input_index = u32(original_idx); - } - } - ${t.indicesSet("input_indices","i"," input_index")} - } - return input_indices; - }`,wc=(t,e)=>` - fn checkInputIndices(input_indices: ${t.type.indices}) -> bool { - for (var i:u32 = 0; i < ${e.length}; i++) { - var input_index = ${t.indicesGet("input_indices","i")}; - if (input_index < 0 || input_index >= ${Se("uniforms.input_shape","i",e.length)}) { - return false; - } - } - return true; - }`,Xs=(t,e,r,n)=>t.rank>n?` - ${t.indicesSet("input_indices",e,"channel")}; - ${t.indicesSet("input_indices",r,"batch")}; -`:"",bc=(t,e,r,n,a)=>{let[i,s,o,u]=r.length===2?[-1,0,1,-1]:[0,2,3,1],l=t.type.value;return` - fn getInputValue(batch: u32, channel: u32, row: u32, col: u32) -> ${l} { - var input_indices: ${t.type.indices}; - ${t.indicesSet("input_indices",s,`max(0, min(row, ${r[s]} - 1))`)}; - ${t.indicesSet("input_indices",o,`max(0, min(col, ${r[o]} - 1))`)}; - ${Xs(t,u,i,2)} - return ${t.getByIndices("input_indices")}; - } - - fn bilinearInterpolation(output_indices: ${e.type.indices}) -> ${l} { - var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices); - var row:${l} = originalIndices[${s}]; - var col:${l} = originalIndices[${o}]; - ${n?`if (row < 0 || row > (${r[s]} - 1) || col < 0 || col > (${r[o]} - 1)) { - return ${a}; - }`:""}; - row = max(0, min(row, ${r[s]} - 1)); - col = max(0, min(col, ${r[o]} - 1)); - var row1: u32 = u32(row); - var col1: u32 = u32(col); - var row2: u32 = u32(row + 1); - var col2: u32 = u32(col + 1); - var channel: u32 = ${r.length>2?`u32(originalIndices[${u}])`:"0"}; - var batch: u32 = ${r.length>2?`u32(originalIndices[${i}])`:"0"}; - var x11: ${l} = getInputValue(batch, channel, row1, col1); - var x12: ${l} = getInputValue(batch, channel, row1, col2); - var x21: ${l} = getInputValue(batch, channel, row2, col1); - var x22: ${l} = getInputValue(batch, channel, row2, col2); - var dx1: ${l} = abs(row - ${l}(row1)); - var dx2: ${l} = abs(${l}(row2) - row); - var dy1: ${l} = abs(col - ${l}(col1)); - var dy2: ${l} = abs(${l}(col2) - col); - if (row1 == row2) { - dx1 = 0.5; - dx2 = 0.5; - } - if (col1 == col2) { - dy1 = 0.5; - dy2 = 0.5; - } - return (x11 * dx2 * dy2 + x12 * dx2 * dy1 + x21 * dx1 * dy2 + x22 * dx1 * dy1); - }`},vc=(t,e,r,n,a,i,s,o,u,l)=>{let p=r.length===2,[f,m]=p?[0,1]:[2,3],c=t.type.value,y=w=>{let v=w===f?"row":"col";return` - fn ${v}CubicInterpolation(input_indices: ${t.type.indices}, output_indices: ${e.type.indices}) -> ${c} { - var output_index = ${e.indicesGet("output_indices",w)}; - var originalIdx: ${c} = getOriginalCoordinateFromResizedCoordinate(output_index, ${a[w]}, - ${n[w]}, ${r[w]}, ${i[w]}, ${i[w]} + ${r.length}); - var fractOriginalIdx: ${c} = originalIdx - floor(originalIdx); - var coefs = getCubicInterpolationCoefs(fractOriginalIdx); - - if (${o} && (originalIdx < 0 || originalIdx > (${r[w]} - 1))) { - return ${u}; - } - var data: array<${c}, 4> = array<${c}, 4>(0.0, 0.0, 0.0, 0.0); - for (var i: i32 = -1; i < 3; i++) { - var ${v}: ${c} = originalIdx + ${c}(i); - if (${v} < 0 || ${v} >= ${r[w]}) { - ${l?`coefs[i + 1] = 0.0; - continue;`:o?`return ${u};`:`${v} = max(0, min(${v}, ${r[w]} - 1));`}; - } - var input_indices_copy: ${t.type.indices} = input_indices; - ${t.indicesSet("input_indices_copy",w,`u32(${v})`)}; - data[i + 1] = ${w===f?t.getByIndices("input_indices_copy"):"rowCubicInterpolation(input_indices_copy, output_indices)"}; - } - return cubicInterpolation1D(data, coefs); - }`};return` - ${y(f)}; - ${y(m)}; - fn getCubicInterpolationCoefs(s: ${c}) -> array<${c}, 4> { - var absS = abs(s); - var coeffs: array<${c}, 4> = array<${c}, 4>(0.0, 0.0, 0.0, 0.0); - var oneMinusAbsS: ${c} = 1.0 - absS; - var twoMinusAbsS: ${c} = 2.0 - absS; - var onePlusAbsS: ${c} = 1.0 + absS; - coeffs[0] = ((${s} * onePlusAbsS - 5 * ${s}) * onePlusAbsS + 8 * ${s}) * onePlusAbsS - 4 * ${s}; - coeffs[1] = ((${s} + 2) * absS - (${s} + 3)) * absS * absS + 1; - coeffs[2] = ((${s} + 2) * oneMinusAbsS - (${s} + 3)) * oneMinusAbsS * oneMinusAbsS + 1; - coeffs[3] = ((${s} * twoMinusAbsS - 5 * ${s}) * twoMinusAbsS + 8 * ${s}) * twoMinusAbsS - 4 * ${s}; - return coeffs; - } - - fn cubicInterpolation1D(x: array<${c}, 4>, coefs: array<${c}, 4>) -> ${c} { - var coefsSum: ${c} = coefs[0] + coefs[1] + coefs[2] + coefs[3]; - return (x[0] * coefs[0] + x[1] * coefs[1]+ x[2] * coefs[2]+ x[3] * coefs[3]) / coefsSum; - } - - fn bicubicInterpolation(output_indices: ${e.type.indices}) -> ${c} { - var input_indices: ${t.type.indices} = output_indices; - return colCubicInterpolation(input_indices, output_indices); - } - `},$c=(t,e,r,n,a)=>{let[i,s,o,u,l]=r.length===3?[-1,0,1,2,-1]:[0,2,3,4,1],p=t.type.value;return` - fn getInputValue(batch: u32, channel: u32, depth:u32, height: u32, width: u32) -> ${p} { - var input_indices: ${t.type.indices}; - ${t.indicesSet("input_indices",s,`max(0, min(depth, ${r[s]} - 1))`)}; - ${t.indicesSet("input_indices",o,`max(0, min(height, ${r[o]} - 1))`)}; - ${t.indicesSet("input_indices",u,`max(0, min(width, ${r[u]} - 1))`)}; - ${Xs(t,l,i,3)} - return ${t.getByIndices("input_indices")}; - } - - fn trilinearInterpolation(output_indices: ${e.type.indices}) -> ${p} { - var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices); - var depth:${p} = originalIndices[${s}]; - var height:${p} = originalIndices[${o}]; - var width:${p} = originalIndices[${u}]; - ${n?`if (depth < 0 || depth > (${r[s]} - 1) || height < 0 || height > (${r[o]} - 1) || width < 0 || (width > ${r[u]} - 1)) { - return ${a}; - }`:""}; - - depth = max(0, min(depth, ${r[s]} - 1)); - height = max(0, min(height, ${r[o]} - 1)); - width = max(0, min(width, ${r[u]} - 1)); - var depth1: u32 = u32(depth); - var height1: u32 = u32(height); - var width1: u32 = u32(width); - var depth2: u32 = u32(depth + 1); - var height2: u32 = u32(height + 1); - var width2: u32 = u32(width + 1); - var channel: u32 = ${r.length>3?`u32(originalIndices[${l}])`:"0"}; - var batch: u32 = ${r.length>3?`u32(originalIndices[${i}])`:"0"}; - - var x111: ${p} = getInputValue(batch, channel, depth1, height1, width1); - var x112: ${p} = getInputValue(batch, channel, depth1, height1, width2); - var x121: ${p} = getInputValue(batch, channel, depth1, height2, width1); - var x122: ${p} = getInputValue(batch, channel, depth1, height2, width2); - var x211: ${p} = getInputValue(batch, channel, depth2, height1, width1); - var x212: ${p} = getInputValue(batch, channel, depth2, height1, width2); - var x221: ${p} = getInputValue(batch, channel, depth2, height2, width1); - var x222: ${p} = getInputValue(batch, channel, depth2, height2, width2); - var dx1: ${p} = abs(depth - ${p}(depth1)); - var dx2: ${p} = abs(${p}(depth2) - depth); - var dy1: ${p} = abs(height - ${p}(height1)); - var dy2: ${p} = abs(${p}(height2) - height); - var dz1: ${p} = abs(width - ${p}(width1)); - var dz2: ${p} = abs(${p}(width2) - width); - if (depth1 == depth2) { - dx1 = 0.5; - dx2 = 0.5; - } - if (height1 == height2) { - dy1 = 0.5; - dy2 = 0.5; - } - if (width1 == width2) { - dz1 = 0.5; - dz2 = 0.5; - } - return (x111 * dx2 * dy2 * dz2 + x112 * dx2 * dy2 * dz1 + x121 * dx2 * dy1 *dz2 + x122 * dx2 * dy1 * dz1 + - x211 * dx1 * dy2 * dz2 + x212 * dx1 * dy2 * dz1 + x221 * dx1 * dy1 *dz2 + x222 * dx1 * dy1 * dz1); - }`},xc=(t,e,r,n,a,i)=>{let s=t.dims,o=fc(i,e.axes,s.length),u=mc(s,n,a,e.axes),l=n.slice();n.length===0&&(l=s.map(($,C)=>$===0?1:u[C]/$),e.keepAspectRatioPolicy!=="stretch"&&(u=gc(s,l,e)));let p=ge("output",t.dataType,u.length),f=Q("input",t.dataType,s.length),m=Y.size(u),c=s.length===u.length&&s.every(($,C)=>$===u[C]),y=e.coordinateTransformMode==="tf_crop_and_resize",w=e.extrapolationValue,v=f.type.value,k=$=>` - ${c?"":` - ${pc(e.coordinateTransformMode,v)}; - ${(()=>{switch(e.mode){case"nearest":return` - ${wc(f,s)}; - ${hc(e.nearestMode,r,v)}; - ${yc(f,p,s,u,l.length,o.length,y)}; - `;case"linear":return` - ${_c(p,s,u,l.length,o.length)}; - ${(()=>{if(s.length===2||s.length===4)return`${bc(f,p,s,y,w)}`;if(s.length===3||s.length===5)return`${$c(f,p,s,y,w)}`;throw Error("Linear mode only supports input dims 2, 3, 4 and 5 are supported in linear mode.")})()}; - `;case"cubic":return` - ${(()=>{if(s.length===2||s.length===4)return`${vc(f,p,s,u,l,o,e.cubicCoeffA,y,e.extrapolationValue,e.excludeOutside)}`;throw Error("Cubic mode only supports input dims 2 and 4 are supported in linear mode.")})()}; - `;default:throw Error("Invalid resize mode")}})()}; - `} - ${$.registerUniform("output_size","u32").registerUniform("scales","f32",l.length).registerUniform("roi","f32",o.length).declareVariables(f,p)} - ${$.mainStart()} - ${$.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - ${c?"output[global_idx] = input[global_idx];":` - let output_indices = ${p.offsetToIndices("global_idx")}; - var input_indices: ${f.type.indices}; - ${(()=>{switch(e.mode){case"nearest":return`input_indices = calculateInputIndicesFromOutputIndices(output_indices); - if (checkInputIndices(input_indices)) { - output[global_idx] = ${f.getByIndices("input_indices")}; - } else { - output[global_idx] = ${e.extrapolationValue}; - }`;case"linear":return`output[global_idx] = ${s.length===2||s.length===4?"bilinearInterpolation":"trilinearInterpolation"}(output_indices);`;case"cubic":return"output[global_idx] = bicubicInterpolation(output_indices);";default:throw Error(`Unsupported resize mode: ${e.mode}`)}})()}; -`} - }`;return{name:"Resize",shaderCache:{hint:`${e.cacheKey}|${r}|${l.length>0?l:""}|${a.length>0?a:""}|${o.length>0?o:""}|${c}|${s}`,inputDependencies:["rank"]},getShaderSource:k,getRunData:()=>({outputs:[{dims:u,dataType:t.dataType}],dispatchGroup:{x:Math.ceil(m/64)},programUniforms:[{type:12,data:m},{type:1,data:l},{type:1,data:o},...ye(s,u)]})}},Sc=t=>{let e=t.customDataBuffer;return new Uint32Array(e,e.byteOffset,1)[0]},xm=(t,e)=>{let r=[],n=[],a=[],i=Sc(t);if(e.antialias!==0)throw Error("Only default value (0) for Antialias attribute is supported");cc(t.inputs,e,i,r,n,a),t.compute(xc(t.inputs[0],e,i,r,n,a),{inputs:[0]})},Sm=t=>{let e=t.antialias,r=t.axes,n=t.coordinateTransformMode,a=t.cubicCoeffA,i=t.excludeOutside!==0,s=t.extrapolationValue,o=t.keepAspectRatioPolicy,u=t.mode,l=t.nearestMode===""?"simple":t.nearestMode;return qe({antialias:e,axes:r,coordinateTransformMode:n,cubicCoeffA:a,excludeOutside:i,extrapolationValue:s,keepAspectRatioPolicy:o,mode:u,nearestMode:l})}}),kc,Ec,km,Ey=Z(()=>{$e(),Ae(),lt(),Te(),kc=(t,e)=>{let[r,n,a,i]=t,{numHeads:s,rotaryEmbeddingDim:o}=e;if(r.dims.length!==3&&r.dims.length!==4)throw new Error(`Input 'x' is expected to have 3 or 4 dimensions, got ${r.dims.length}`);if(!Y.areEqual(n.dims,[])&&!Y.areEqual(n.dims,[1])&&n.dims.length!==2)throw new Error(`Input 'position_ids' is expected to have 0, 1, or 2 dimensions, got ${n.dims.length}`);if(a.dims.length!==2)throw new Error(`Input 'cos_cache' is expected to have 2 dimensions, got ${a.dims.length}`);if(i.dims.length!==2)throw new Error(`Input 'sin_cache' is expected to have 2 dimensions, got ${i.dims.length}`);if(!Y.areEqual(a.dims,i.dims))throw new Error("Inputs 'cos_cache' and 'sin_cache' are expected to have the same shape");if(o>0&&s===0)throw new Error("num_heads must be provided if rotary_embedding_dim is specified");let u=r.dims[0],l=r.dims[r.dims.length-2],p=a.dims[0],f=Y.sizeFromDimension(r.dims,1)/l,m=o===0?a.dims[1]*2:f/s;if(o>m)throw new Error("rotary_embedding_dim must be less than or equal to head_size");if(n.dims.length===2){if(u!==n.dims[0])throw new Error(`Input 'position_ids' dimension 0 should be of size batch_size, got ${n.dims[0]}`);if(l!==n.dims[1])throw new Error(`Input 'position_ids' dimension 1 should be of size sequence_length, got ${n.dims[1]}`)}if(m/2!==a.dims[1]&&o/2!==a.dims[1])throw new Error(`Input 'cos_cache' dimension 1 should be same as head_size / 2 or rotary_embedding_dim / 2, got ${a.dims[1]}`);if(l>p)throw new Error("Updating cos_cache and sin_cache in RotaryEmbedding is not currently supported")},Ec=(t,e)=>{let{interleaved:r,numHeads:n,rotaryEmbeddingDim:a,scale:i}=e,s=t[0].dims[0],o=Y.sizeFromDimension(t[0].dims,1),u=t[0].dims[t[0].dims.length-2],l=o/u,p=t[2].dims[1],f=a===0?p*2:l/n,m=new Array(s,u,l/f,f-p),c=Y.computeStrides(m),y=[{type:1,data:i},{type:12,data:m},{type:12,data:c},...t[0].dims.length===3?new Array({type:12,data:[o,l,f,1]}):[],...t[0].dims.length===4?new Array({type:12,data:[o,f,u*f,1]}):[],...ye(t[0].dims,t[1].dims,t[2].dims,t[3].dims,t[0].dims)],w=v=>{let k=Q("input",t[0].dataType,t[0].dims.length),$=Q("position_ids",t[1].dataType,t[1].dims.length),C=Q("cos_cache",t[2].dataType,t[2].dims.length),T=Q("sin_cache",t[3].dataType,t[3].dims.length),A=ge("output",t[0].dataType,t[0].dims.length);return v.registerUniforms([{name:"scale",type:"f32"},{name:"global_shape",type:"u32",length:m.length},{name:"global_strides",type:"u32",length:c.length},{name:"input_output_strides",type:"u32",length:c.length}]),` - ${v.declareVariables(k,$,C,T,A)} - - ${v.mainStart(Cn)} - let half_rotary_emb_dim = uniforms.${C.name}_shape[1]; - let bsnh = global_idx / uniforms.global_strides % uniforms.global_shape; - let size = uniforms.global_shape[0] * uniforms.global_strides[0]; - ${v.guardAgainstOutOfBoundsWorkgroupSizes("size")} - - if (bsnh[3] < half_rotary_emb_dim) { - let position_ids_idx = - ${$.broadcastedIndicesToOffset("bsnh.xy",ge("",$.type.tensor,2))}; - let position_id = - u32(${$.getByOffset("position_ids_idx")}) + select(0, bsnh[1], position_ids_idx == 0); - let i = dot(bsnh, uniforms.input_output_strides) + select(0, bsnh[3], ${r}); - let j = i + select(half_rotary_emb_dim, 1, ${r}); - let re = ${k.getByOffset("i")} * ${C.get("position_id","bsnh[3]")} - - ${k.getByOffset("j")} * ${T.get("position_id","bsnh[3]")}; - ${A.setByOffset("i","re")} - let im = ${k.getByOffset("i")} * ${T.get("position_id","bsnh[3]")} + - ${k.getByOffset("j")} * ${C.get("position_id","bsnh[3]")}; - ${A.setByOffset("j","im")} - } else { - let k = dot(bsnh, uniforms.input_output_strides) + half_rotary_emb_dim; - ${A.setByOffset("k",k.getByOffset("k"))} - } - }`};return{name:"RotaryEmbedding",shaderCache:{hint:qe({interleaved:r}).cacheKey,inputDependencies:["rank","rank","rank","rank"]},getShaderSource:w,getRunData:()=>({outputs:[{dims:t[0].dims,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(Y.size(m)/Cn)},programUniforms:y})}},km=(t,e)=>{kc(t.inputs,e),t.compute(Ec(t.inputs,e))}}),Cc,Tc,Em,Cy=Z(()=>{$e(),Ae(),Te(),Cc=t=>{if(!t||t.length<3)throw new Error("layerNorm requires at least 3 inputs.");let e=t[0],r=t[1],n=t[2];if(e.dataType!==r.dataType||e.dataType!==n.dataType)throw new Error("All inputs must have the same data type");if(e.dims.length!==3&&e.dims.length!==2)throw new Error("Input must be 2D or 3D");if(r.dims.length!==3&&r.dims.length!==2)throw new Error("Skip must be 2D or 3D");let a=e.dims[e.dims.length-1],i=e.dims[e.dims.length-2];if(r.dims[r.dims.length-1]!==a)throw new Error("Skip must have the same hidden size as input");if(r.dims[r.dims.length-2]!==i)throw new Error("Skip must have the same sequence length as input");if(n.dims.length!==1)throw new Error("Gamma must be 1D");if(n.dims[n.dims.length-1]!==a)throw new Error("Gamma must have the same hidden size as input");if(t.length>3){let s=t[3];if(s.dims.length!==1)throw new Error("Beta must be 1D");if(s.dims[s.dims.length-1]!==a)throw new Error("Beta must have the same hidden size as input")}if(t.length>4){let s=t[4];if(s.dims.length!==1)throw new Error("Bias must be 1D");if(s.dims[s.dims.length-1]!==a)throw new Error("Bias must have the same hidden size as input")}},Tc=(t,e,r,n)=>{let a=e.simplified,i=t[0].dims,s=Y.size(i),o=i,u=s,l=i.slice(-1)[0],p=n?i.slice(0,-1).concat(1):[],f=!a&&t.length>3,m=t.length>4,c=n&&r>1,y=n&&r>2,w=r>3,v=it(l),k=[{type:12,data:u},{type:12,data:v},{type:12,data:l},{type:1,data:e.epsilon}],$=T=>{let A=[{name:"output_size",type:"u32"},{name:"components",type:"u32"},{name:"hidden_size",type:"u32"},{name:"epsilon",type:"f32"}],B=[Q("x",t[0].dataType,t[0].dims,v),Q("skip",t[1].dataType,t[1].dims,v),Q("gamma",t[2].dataType,t[2].dims,v)];f&&B.push(Q("beta",t[3].dataType,t[3].dims,v)),m&&B.push(Q("bias",t[4].dataType,t[4].dims,v)),B.push(ge("output",t[0].dataType,o,v)),c&&B.push(ge("mean_output",1,p)),y&&B.push(ge("inv_std_output",1,p)),w&&B.push(ge("input_skip_bias_sum",t[0].dataType,o,v));let R=pt(t[0].dataType);return` - - ${T.registerUniforms(A).declareVariables(...B)} - - ${T.mainStart()} - ${T.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size / uniforms.hidden_size")} - let hidden_size_vectorized: u32 = uniforms.hidden_size / uniforms.components; - let offset = global_idx * hidden_size_vectorized; - var sum = ${wr("f32",v)}; - var squareSum = ${wr("f32",v)}; - for (var i: u32 = 0; i < hidden_size_vectorized; i++) { - let skip_value = skip[offset + i]; - let bias_value = ${m?"bias[i]":R+"(0.0)"}; - let input_value = x[offset + i]; - let value = input_value + skip_value + bias_value; - ${w?"input_skip_bias_sum[offset + i] = value;":""} - output[offset + i] = value; - let f32_value = ${Sn(R,v,"value")}; - sum += f32_value; - squareSum += f32_value * f32_value; - } - let mean = ${Or("sum",v)} / f32(uniforms.hidden_size); - let inv_std_dev = inverseSqrt(${Or("squareSum",v)} / f32(uniforms.hidden_size) ${a?"":"- mean * mean"} + uniforms.epsilon); - ${c?"mean_output[global_idx] = mean;":""} - ${y?"inv_std_output[global_idx] = inv_std_dev;":""} - for (var i: u32 = 0; i < hidden_size_vectorized; i++) { - output[offset + i] = (output[offset + i] ${a?"":`- ${R}(mean)`}) * ${R}(inv_std_dev) * gamma[i] ${f?"+ beta[i]":""}; - } - }`},C=[{dims:o,dataType:t[0].dataType}];return r>1&&C.push({dims:p,dataType:1}),r>2&&C.push({dims:p,dataType:1}),r>3&&C.push({dims:i,dataType:t[0].dataType}),{name:"SkipLayerNormalization",shaderCache:{hint:`${v};${c};${y};${w}`,inputDependencies:t.map((T,A)=>"type")},getShaderSource:$,getRunData:()=>({outputs:C,dispatchGroup:{x:Math.ceil(u/l/64)},programUniforms:k})}},Em=(t,e)=>{Cc(t.inputs);let r=[0];t.outputCount>1&&r.push(-3),t.outputCount>2&&r.push(-3),t.outputCount>3&&r.push(3),t.compute(Tc(t.inputs,e,t.outputCount,!1),{outputs:r})}}),Ic,na,Ac,Qs,Mc,Oc,Cm,Tm,Ty=Z(()=>{$e(),Ae(),lt(),Te(),Ic=(t,e)=>{if(!t||t.length<1)throw new Error("too few inputs");if(e.axes.length!==0){if(e.axes.length!==e.starts.length||e.axes.length!==e.ends.length)throw new Error("axes, starts and ends must have the same length")}else if(e.starts.length!==e.ends.length)throw new Error("starts and ends must have the same length");t.slice(1).forEach((r,n)=>{if(t[n+1].dataType!==6&&t[n+1].dataType!==7)throw new Error(`Input ${n} must be an array of int32 or int64`)})},na=(t,e)=>{let r=[];if(t.length>e)if(t[e].dataType===7)t[e].getBigInt64Array().forEach(n=>r.push(Number(n)));else if(t[e].dataType===6)t[e].getInt32Array().forEach(n=>r.push(Number(n)));else throw new Error(`Input ${e} must be an array of int32 or int64`);return r},Ac=(t,e)=>{if(t.length>1){let r=na(t,1),n=na(t,2),a=na(t,3);return a.length===0&&(a=[...Array(t[0].dims.length).keys()]),qe({starts:r,ends:n,axes:a})}else return e},Qs=(t,e,r,n,a)=>{let i=t;return t<0&&(i+=r[n[e]]),a[e]<0?Math.max(0,Math.min(i,r[n[e]]-1)):Math.max(0,Math.min(i,r[n[e]]))},Mc=(t,e,r)=>`fn calculateInputIndices(output_indices: ${e.type.indices}) -> ${t.type.indices} { - var input_indices: ${t.type.indices}; - var carry = 0u; - for (var i = ${r.length}; i >= 0; i--) { - let input_shape_i = ${Se("uniforms.input_shape","i",r.length)}; - let steps_i = ${Se("uniforms.steps","i",r.length)}; - let signs_i = ${Se("uniforms.signs","i",r.length)}; - let starts_i = ${Se("uniforms.starts","i",r.length)}; - var output_index = ${e.indicesGet("output_indices","i")}; - var input_index = output_index * steps_i + starts_i + carry; - carry = input_index / input_shape_i; - input_index = input_index % input_shape_i; - if (signs_i < 0) { - input_index = input_shape_i - input_index - 1u + starts_i; - } - ${t.indicesSet("input_indices","i","input_index")}; - } - return input_indices; - }`,Oc=(t,e)=>{let r=t[0].dims,n=Y.size(r),a=e.axes.length>0?Y.normalizeAxes(e.axes,r.length):[...Array(r.length).keys()],i=na(t,4);i.forEach(k=>k!==0||(()=>{throw new Error("step cannot be 0")})),i.length===0&&(i=Array(a.length).fill(1));let s=e.starts.map((k,$)=>Qs(k,$,r,a,i)),o=e.ends.map((k,$)=>Qs(k,$,r,a,i));if(a.length!==s.length||a.length!==o.length)throw new Error("start, ends and axes should have the same number of elements");if(a.length!==r.length)for(let k=0;kMath.sign(k));i.forEach((k,$,C)=>{if(k<0){let T=(o[$]-s[$])/k,A=s[$],B=A+T*i[$];s[$]=B,o[$]=A,C[$]=-k}});let l=r.slice(0);a.forEach((k,$)=>{l[k]=Math.ceil((o[k]-s[k])/i[k])});let p={dims:l,dataType:t[0].dataType},f=ge("output",t[0].dataType,l.length),m=Q("input",t[0].dataType,t[0].dims.length),c=Y.size(l),y=[{name:"outputSize",type:"u32"},{name:"starts",type:"u32",length:s.length},{name:"signs",type:"i32",length:u.length},{name:"steps",type:"u32",length:i.length}],w=[{type:12,data:c},{type:12,data:s},{type:6,data:u},{type:12,data:i},...ye(t[0].dims,l)],v=k=>` - ${k.registerUniforms(y).declareVariables(m,f)} - ${Mc(m,f,r)} - ${k.mainStart()} - ${k.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")} - let output_indices = ${f.offsetToIndices("global_idx")}; - let input_indices = calculateInputIndices(output_indices); - ${f.setByOffset("global_idx",m.getByIndices("input_indices"))} - }`;return{name:"Slice",shaderCache:{hint:`${u.length}_${s.length}_${i.length}`,inputDependencies:["rank"]},getShaderSource:v,getRunData:()=>({outputs:[p],dispatchGroup:{x:Math.ceil(n/64)},programUniforms:w})}},Cm=(t,e)=>{Ic(t.inputs,e);let r=Ac(t.inputs,e);t.compute(Oc(t.inputs,r),{inputs:[0]})},Tm=t=>{let e=t.starts,r=t.ends,n=t.axes;return qe({starts:e,ends:r,axes:n})}}),zc,Pc,Im,Am,Iy=Z(()=>{$e(),Ae(),lt(),Te(),zc=t=>{if(!t||t.length!==1)throw new Error("Softmax op requires 1 input.")},Pc=(t,e)=>{let r=t.dims,n=Y.size(r),a=64,i=e.axis;if(i<0&&(i=r.length+i),ik===4?`max(max(${v}.x, ${v}.y), max(${v}.z, ${v}.w))`:k===2?`max(${v}.x, ${v}.y)`:k===3?`max(max(${v}.x, ${v}.y), ${v}.z)`:v,f=Q("x",t.dataType,t.dims,u),m=ge("result",t.dataType,t.dims,u),c=f.type.value,y=pt(t.dataType)==="f32"?`var threadMax = ${c}(-3.402823e+38f);`:`var threadMax = ${c}(-65504.0h);`,w=v=>` - var rowMaxShared : ${c}; - var rowSumShared : ${c}; - var threadShared : array<${c}, ${a}>; - - fn getValue(row: i32, col: i32, row_stride: i32) -> ${c} { - let index = row * row_stride + col; - return x[index]; - } - - fn setValue(row: i32, col: i32, row_stride: i32, value: ${c}) { - let index = row * row_stride + col; - result[index] = value; - } - ${v.registerUniform("packedCols","i32").declareVariables(f,m)} - ${v.mainStart()} - let gindex = i32(global_idx); - let lindex = i32(local_idx); - const wg = ${a}; - let row = gindex / wg; - let cols = uniforms.packedCols; - let row_stride : i32 = uniforms.packedCols; - - // find the rows max - ${y} - for (var col = lindex; col < cols; col += wg) { - let value = getValue(row, col, row_stride); - threadMax = max(threadMax, value); - } - if (lindex < cols) { - threadShared[lindex] = threadMax; - } - workgroupBarrier(); - - var reduceSize = min(cols, wg); - for (var currSize = reduceSize >> 1; currSize > 0; currSize = reduceSize >> 1) { - reduceSize = currSize + (reduceSize & 1); - if (lindex < currSize) { - threadShared[lindex] = max(threadShared[lindex], threadShared[lindex + reduceSize]); - } - workgroupBarrier(); - } - if (lindex == 0) { - rowMaxShared = ${c}(${p("threadShared[0]",u)}); - } - workgroupBarrier(); - - // find the rows sum - var threadSum = ${c}(0.0); - for (var col = lindex; col < cols; col += wg) { - let subExp = exp(getValue(row, col, row_stride) - rowMaxShared); - threadSum += subExp; - } - threadShared[lindex] = threadSum; - workgroupBarrier(); - - for (var currSize = wg >> 1; currSize > 0; currSize = currSize >> 1) { - if (lindex < currSize) { - threadShared[lindex] = threadShared[lindex] + threadShared[lindex + currSize]; - } - workgroupBarrier(); - } - if (lindex == 0) { - rowSumShared = ${c}(${Or("threadShared[0]",u)}); - } - workgroupBarrier(); - - // calculate final value for each element in the row - for (var col = lindex; col < cols; col += wg) { - let value = exp(getValue(row, col, row_stride) - rowMaxShared) / rowSumShared; - setValue(row, col, row_stride, value); - } - }`;return{name:"Softmax",shaderCache:{hint:`${u}`,inputDependencies:["type"]},getRunData:()=>({outputs:[{dims:r,dataType:t.dataType}],dispatchGroup:{x:o},programUniforms:[{type:6,data:l}]}),getShaderSource:w}},Im=(t,e)=>{zc(t.inputs),t.compute(Pc(t.inputs[0],e))},Am=t=>qe({axis:t.axis})}),Rc,Bc,Dc,Nc,Fc,Mm,Om,Ay=Z(()=>{$e(),Ae(),lt(),Te(),Rc=t=>{if(!t||t.length<1)throw new Error("too few inputs")},Bc=(t,e)=>{let r=[],n=e.numOutputs;return t[1].dims[0]>0&&(t[1].getBigInt64Array().forEach(a=>r.push(Number(a))),n=r.length),qe({numOutputs:n,axis:e.axis,splitSizes:r})},Dc=t=>` -fn calculateOutputIndex(index: u32) -> u32 { - for (var i: u32 = 0u; i < ${t}u; i += 1u ) { - if (index < ${Se("uniforms.size_in_split_axis","i",t)}) { - return i; - } - } - return ${t}u; -}`,Nc=t=>{let e=t.length,r=[];for(let n=0;n{let r=t[0].dims,n=Y.size(r),a=t[0].dataType,i=Y.normalizeAxis(e.axis,r.length),s=new Array(e.numOutputs),o=Q("input",a,r.length),u=new Array(e.numOutputs),l=[],p=[],f=0,m=[{type:12,data:n}];for(let y=0;y` - ${y.registerUniform("input_size","u32").registerUniform("size_in_split_axis","u32",u.length).declareVariables(o,...s)} - ${Dc(u.length)} - ${Nc(s)} - - ${y.mainStart()} - ${y.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.input_size")} - - var indices = ${o.offsetToIndices("global_idx")}; - var index = ${o.indicesGet("indices",i)}; - let output_number = calculateOutputIndex(index); - if (output_number != 0) { - index -= ${Se("uniforms.size_in_split_axis","output_number - 1u",u.length)}; - ${o.indicesSet("indices",i,"index")}; - } - writeBufferData(output_number, indices, global_idx); - }`;return{name:"Split",shaderCache:{hint:e.cacheKey,inputDependencies:["rank"]},getShaderSource:c,getRunData:()=>({outputs:l,dispatchGroup:{x:Math.ceil(n/64)},programUniforms:m})}},Mm=(t,e)=>{Rc(t.inputs);let r=t.inputs.length===1?e:Bc(t.inputs,e);t.compute(Fc(t.inputs,r),{inputs:[0]})},Om=t=>{let e=t.axis,r=t.splitSizes,n=t.numOutputs<0?r.length:t.numOutputs;if(n!==r.length)throw new Error("numOutputs and splitSizes lengh must be equal");return qe({axis:e,numOutputs:n,splitSizes:r})}}),Js,Lc,Uc,Wc,zm,My=Z(()=>{$e(),Ae(),Te(),Js=t=>Array.from(t.getBigInt64Array(),Number),Lc=t=>{if(!t||t.length!==2)throw new Error("Tile requires 2 inputs.");if(t[0].dataType!==1&&t[0].dataType!==6&&t[0].dataType!==12)throw new Error("Tile only support float, int32, and uint32 data types");if(t[1].dataType!==7)throw new Error("Tile `repeats` input should be of int64 data type");if(t[1].dims.length!==1)throw new Error("Tile `repeats` input should be 1-D");if(Js(t[1]).length!==t[0].dims.length)throw new Error("Tile `repeats` input should have same number of elements as rank of input data tensor")},Uc=(t,e)=>{let r=[];for(let n=0;n{let e=t[0].dims,r=Js(t[1]),n=Uc(e,r),a=Y.size(n),i=t[0].dataType,s=Q("input",i,e.length),o=ge("output",i,n.length),u=l=>` - const inputShape = ${s.indices(...e)}; - ${l.registerUniform("output_size","u32").declareVariables(s,o)} - ${l.mainStart()} - ${l.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")} - let output_indices = ${o.offsetToIndices("global_idx")}; - var input_indices: ${s.type.indices}; - for (var i = 0; i < ${e.length}; i++) { - let input_dim_i = ${s.indicesGet("uniforms.input_shape","i")}; - let input_dim_value = ${o.indicesGet("output_indices","i")} % input_dim_i; - - ${s.indicesSet("input_indices","i","input_dim_value")} - } - ${o.setByOffset("global_idx",s.getByIndices("input_indices"))} - }`;return{name:"Tile",shaderCache:{hint:`${r}`,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:n,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:[{type:12,data:a},...ye(t[0].dims,n)]}),getShaderSource:u}},zm=t=>{Lc(t.inputs),t.compute(Wc(t.inputs),{inputs:[0]})}}),Vc,Gc,Pm,Oy=Z(()=>{$e(),Ae(),Te(),Vc=(t,e,r,n,a)=>{let i=ge("output_data",a,r.length,4),s=Q("a_data",e[1].dataType,e[1].dims.length,4),o=Q("b_data",e[2].dataType,e[2].dims.length,4),u=Q("c_data",e[0].dataType,e[0].dims.length,4),l,p=(f,m,c)=>`select(${m}, ${f}, ${c})`;if(!n)l=i.setByOffset("global_idx",p(s.getByOffset("global_idx"),o.getByOffset("global_idx"),u.getByOffset("global_idx")));else{let f=(m,c,y="")=>{let w=`a_data[index_a${c}][component_a${c}]`,v=`b_data[index_b${c}][component_b${c}]`,k=`bool(c_data[index_c${c}] & (0xffu << (component_c${c} * 8)))`;return` - let output_indices${c} = ${i.offsetToIndices(`global_idx * 4u + ${c}u`)}; - let offset_a${c} = ${s.broadcastedIndicesToOffset(`output_indices${c}`,i)}; - let offset_b${c} = ${o.broadcastedIndicesToOffset(`output_indices${c}`,i)}; - let offset_c${c} = ${u.broadcastedIndicesToOffset(`output_indices${c}`,i)}; - let index_a${c} = offset_a${c} / 4u; - let index_b${c} = offset_b${c} / 4u; - let index_c${c} = offset_c${c} / 4u; - let component_a${c} = offset_a${c} % 4u; - let component_b${c} = offset_b${c} % 4u; - let component_c${c} = offset_c${c} % 4u; - ${m}[${c}] = ${y}(${p(w,v,k)}); - `};a===9?l=` - var data = vec4(0); - ${f("data",0,"u32")} - ${f("data",1,"u32")} - ${f("data",2,"u32")} - ${f("data",3,"u32")} - output_data[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:l=` - ${f("output_data[global_idx]",0)} - ${f("output_data[global_idx]",1)} - ${f("output_data[global_idx]",2)} - ${f("output_data[global_idx]",3)} - `}return` - ${t.registerUniform("vec_size","u32").declareVariables(u,s,o,i)} - ${t.mainStart()} - ${t.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")} - ${l} - }`},Gc=t=>{let e=t[1].dims,r=t[2].dims,n=t[0].dims,a=t[1].dataType,i=!(Y.areEqual(e,r)&&Y.areEqual(r,n)),s=e,o=Y.size(e);if(i){let l=En.calcShape(En.calcShape(e,r,!1),n,!1);if(!l)throw new Error("Can't perform where op on the given tensors");s=l,o=Y.size(s)}let u=Math.ceil(o/4);return{name:"Where",shaderCache:{inputDependencies:["rank","rank","rank"]},getShaderSource:l=>Vc(l,t,s,i,a),getRunData:()=>({outputs:[{dims:s,dataType:a}],dispatchGroup:{x:Math.ceil(o/64/4)},programUniforms:[{type:12,data:u},...ye(n,e,r,s)]})}},Pm=t=>{t.compute(Gc(t.inputs))}}),Rm,zy=Z(()=>{ey(),Vh(),ty(),ry(),ny(),ay(),Uh(),Vf(),ly(),dy(),cy(),py(),hy(),fy(),my(),gy(),_y(),yy(),wy(),Wf(),by(),vy(),$y(),xy(),Sy(),Yo(),ky(),Ey(),Cy(),Ty(),Iy(),Ay(),My(),Sa(),Xo(),Oy(),Rm=new Map([["Abs",[jh]],["Acos",[qh]],["Acosh",[Kh]],["Add",[Tf]],["ArgMax",[Nh,yo]],["ArgMin",[Dh,yo]],["Asin",[Yh]],["Asinh",[Xh]],["Atan",[Qh]],["Atanh",[Jh]],["Attention",[Wh]],["AveragePool",[mm,fm]],["BatchNormalization",[Gh]],["BiasAdd",[Hh]],["BiasSplitGelu",[Cf]],["Cast",[ef,Zh]],["Ceil",[rf]],["Clip",[tf]],["Concat",[Fh,Lh]],["Conv",[So,xo]],["ConvTranspose",[jf,Hf]],["Cos",[nf]],["Cosh",[af]],["CumSum",[qf,Kf]],["DepthToSpace",[Yf,Xf]],["Div",[If]],["Einsum",[Qf,Jf]],["Elu",[sf,Ci]],["Equal",[Af]],["Erf",[of]],["Exp",[uf]],["Expand",[Zf]],["FastGelu",[em]],["Floor",[lf]],["FusedConv",[So,xo]],["Gather",[rm,tm]],["GatherElements",[am,nm]],["Gelu",[df]],["Gemm",[sm,im]],["GlobalAveragePool",[_m,gm]],["GlobalMaxPool",[vm,bm]],["Greater",[Pf]],["GreaterOrEqual",[Bf]],["HardSigmoid",[yf,_f]],["InstanceNormalization",[om]],["LayerNormalization",[um]],["LeakyRelu",[cf,Ci]],["Less",[Rf]],["LessOrEqual",[Df]],["Log",[Ef]],["MatMul",[Uf]],["MatMulNBits",[lm,dm]],["MaxPool",[ym,wm]],["Mul",[Mf]],["MultiHeadAttention",[pm,cm]],["Neg",[hf]],["Not",[pf]],["Pad",[hm]],["Pow",[Of]],["Range",[$m]],["Reciprocal",[ff]],["ReduceMin",[Oh]],["ReduceMean",[Ch]],["ReduceMax",[Mh]],["ReduceSum",[Ph]],["ReduceProd",[zh]],["ReduceL1",[Th]],["ReduceL2",[Ih]],["ReduceLogSum",[Bh]],["ReduceLogSumExp",[Ah]],["ReduceSumSquare",[Rh]],["Relu",[mf]],["Resize",[xm,Sm]],["RotaryEmbedding",[km]],["Sigmoid",[gf]],["Sin",[wf]],["Sinh",[bf]],["Slice",[Cm,Tm]],["SkipLayerNormalization",[Em]],["Split",[Mm,Om]],["Sqrt",[vf]],["Softmax",[Im,Am]],["Sub",[zf]],["Tan",[$f]],["Tanh",[xf]],["ThresholdedRelu",[kf,Ci]],["Tile",[zm]],["Transpose",[mh,gh]],["Where",[Pm]]])}),Bm,Py=Z(()=>{ar(),nn(),Te(),Bm=class{constructor(t){this.backend=t,this.repo=new Map,this.attributesBound=!1}getArtifact(t){return this.repo.get(t)}setArtifact(t,e){this.repo.set(t,e)}run(t,e,r,n,a){nr(t.programInfo.name);let i=this.backend.device,s=this.backend.getComputePassEncoder();this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2);let o=[];for(let l of e)o.push({binding:o.length,resource:{buffer:l.buffer}});for(let l of r)o.push({binding:o.length,resource:{buffer:l.buffer}});a&&o.push({binding:o.length,resource:a});let u=i.createBindGroup({layout:t.computePipeline.getBindGroupLayout(0),entries:o,label:t.programInfo.name});if(this.backend.sessionStatus==="capturing"){let l={kernelId:this.backend.currentKernelId,computePipeline:t.computePipeline,bindGroup:u,dispatchGroup:n};this.backend.capturedCommandList.get(this.backend.currentSessionId).push(l)}s.setPipeline(t.computePipeline),s.setBindGroup(0,u),s.dispatchWorkgroups(...n),this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2+1),this.backend.pendingDispatchNumber++,(this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber||this.backend.queryType==="at-passes")&&this.backend.endComputePass(),this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber&&this.backend.flush(),Lt(t.programInfo.name)}dispose(){}build(t,e){nr(t.name);let r=this.backend.device,n=[];r.features.has("shader-f16")&&n.push("enable f16;");let a=fh(e,this.backend.device.limits),i=t.getShaderSource(a),s=`${n.join(` -`)} -${a.additionalImplementations} -${i}`,o=r.createShaderModule({code:s,label:t.name});rt("verbose",()=>`[WebGPU] ${t.name} shader code: ${s}`);let u=r.createComputePipeline({compute:{module:o,entryPoint:"main"},layout:"auto",label:t.name});return Lt(t.name),{programInfo:t,computePipeline:u,uniformVariablesInfo:a.variablesInfo}}normalizeDispatchGroupSize(t){let e=typeof t=="number"?t:t.x,r=typeof t=="number"?1:t.y||1,n=typeof t=="number"?1:t.z||1,a=this.backend.device.limits.maxComputeWorkgroupsPerDimension;if(e<=a&&r<=a&&n<=a)return[e,r,n];let i=e*r*n,s=Math.ceil(Math.sqrt(i));if(s>a){if(s=Math.ceil(Math.cbrt(i)),s>a)throw new Error("Total dispatch size exceeds WebGPU maximum.");return[s,s,s]}else return[s,s,1]}}}),Hc,jc,qc,Dm,Ry=Z(()=>{ar(),$e(),nn(),Q_(),J_(),zy(),Py(),Hc=(t,e)=>{if(e.length!==t.length)throw new Error(`inputDependencies length ${e.length} is not equal to inputTensors length ${t.length}.`);let r=[];for(let n=0;n{let n=t.name;return t.shaderCache?.hint&&(n+="["+t.shaderCache.hint+"]"),n+=":"+r+`:${Hc(e,t.shaderCache?.inputDependencies??new Array(e.length).fill("dims"))}`,n},qc=class{constructor(t){t&&(this.architecture=t.architecture,this.vendor=t.vendor)}isArchitecture(t){return this.architecture===t}isVendor(t){return this.vendor===t}},Dm=class{constructor(){this.currentSessionId=null,this.currentKernelId=null,this.commandEncoder=null,this.computePassEncoder=null,this.maxDispatchNumber=16,this.pendingDispatchNumber=0,this.pendingKernels=[],this.pendingQueries=new Map,this.sessionStatus="default",this.capturedCommandList=new Map,this.capturedPendingKernels=new Map,this.sessionExternalDataMapping=new Map}get currentKernelCustomData(){if(this.currentKernelId===null)throw new Error("currentKernelCustomData(): currentKernelId is null. (should not happen)");let t=this.kernelCustomData.get(this.currentKernelId);return t||(t={},this.kernelCustomData.set(this.currentKernelId,t)),t}async initialize(t,e){this.env=t;let r=[],n={requiredLimits:{maxComputeWorkgroupStorageSize:e.limits.maxComputeWorkgroupStorageSize,maxComputeWorkgroupsPerDimension:e.limits.maxComputeWorkgroupsPerDimension,maxStorageBufferBindingSize:e.limits.maxStorageBufferBindingSize,maxBufferSize:e.limits.maxBufferSize,maxComputeInvocationsPerWorkgroup:e.limits.maxComputeInvocationsPerWorkgroup,maxComputeWorkgroupSizeX:e.limits.maxComputeWorkgroupSizeX,maxComputeWorkgroupSizeY:e.limits.maxComputeWorkgroupSizeY,maxComputeWorkgroupSizeZ:e.limits.maxComputeWorkgroupSizeZ},requiredFeatures:r};e.features.has("chromium-experimental-timestamp-query-inside-passes")?r.push("chromium-experimental-timestamp-query-inside-passes"):e.features.has("timestamp-query")&&r.push("timestamp-query"),e.features.has("shader-f16")&&r.push("shader-f16"),this.device=await e.requestDevice(n),this.adapterInfo=new qc(await e.requestAdapterInfo()),this.gpuDataManager=ph(this),this.programManager=new Bm(this),this.kernels=new Map,this.kernelPersistentData=new Map,this.kernelCustomData=new Map,dh(t.logLevel,!!t.debug),this.device.onuncapturederror=a=>{a.error instanceof GPUValidationError&&console.error(`An uncaught WebGPU validation error was raised: ${a.error.message}`)},Object.defineProperty(this.env.webgpu,"device",{value:this.device,writable:!1,enumerable:!0,configurable:!1}),Object.defineProperty(this.env.webgpu,"adapter",{value:e,writable:!1,enumerable:!0,configurable:!1}),this.setQueryType()}dispose(){typeof this.querySet<"u"&&this.querySet.destroy(),this.gpuDataManager.dispose()}getCommandEncoder(){return this.commandEncoder||(this.commandEncoder=this.device.createCommandEncoder()),this.commandEncoder}getComputePassEncoder(){if(!this.computePassEncoder){let t=this.getCommandEncoder(),e={};this.queryType==="at-passes"&&(e.timestampWrites={querySet:this.querySet,beginningOfPassWriteIndex:this.pendingDispatchNumber*2,endOfPassWriteIndex:this.pendingDispatchNumber*2+1}),this.computePassEncoder=t.beginComputePass(e)}return this.computePassEncoder}endComputePass(){this.computePassEncoder&&(this.computePassEncoder.end(),this.computePassEncoder=null)}flush(){if(!this.commandEncoder)return;nr(),this.endComputePass();let t;this.queryType!=="none"&&(this.commandEncoder.resolveQuerySet(this.querySet,0,this.pendingDispatchNumber*2,this.queryResolveBuffer,0),t=this.device.createBuffer({size:this.pendingDispatchNumber*2*8,usage:GPUBufferUsage.MAP_READ|GPUBufferUsage.COPY_DST}),this.pendingQueries.set(t,this.pendingKernels),this.pendingKernels=[],this.commandEncoder.copyBufferToBuffer(this.queryResolveBuffer,0,t,0,this.pendingDispatchNumber*2*8)),this.device.queue.submit([this.commandEncoder.finish()]),this.gpuDataManager.refreshPendingBuffers(),this.commandEncoder=null,this.pendingDispatchNumber=0,this.queryType!=="none"&&t.mapAsync(GPUMapMode.READ).then(()=>{let e=new BigUint64Array(t.getMappedRange()),r=this.pendingQueries.get(t);for(let n=0;n"u"&&(this.queryTimeBase=m);let y=Number(m-this.queryTimeBase),w=Number(c-this.queryTimeBase);if(!Number.isSafeInteger(y)||!Number.isSafeInteger(w))throw new RangeError("incorrect timestamp range");if(this.env.webgpu.profiling?.ondata)this.env.webgpu.profiling.ondata({version:1,inputsMetadata:p.map(v=>({dims:v.dims,dataType:Kr(v.dataType)})),outputsMetadata:f.map(v=>({dims:v.dims,dataType:Kr(v.dataType)})),kernelId:i,kernelType:o,kernelName:u,programName:l,startTime:y,endTime:w});else{let v="";p.forEach(($,C)=>{v+=`input[${C}]: [${$.dims}] | ${Kr($.dataType)}, `});let k="";f.forEach(($,C)=>{k+=`output[${C}]: [${$.dims}] | ${Kr($.dataType)}, `}),console.log(`[profiling] kernel "${i}|${o}|${u}|${l}" ${v}${k}execution time: ${w-y} ns`)}ma("GPU",`${l}::${m}::${c}`)}t.unmap(),this.pendingQueries.delete(t)}),Lt()}run(t,e,r,n,a,i){nr(t.name);let s=[];for(let $=0;$C):r;if(p.length!==o.length)throw new Error(`Output size ${p.length} must be equal to ${o.length}.`);let f=[],m=[];for(let $=0;$=i)throw new Error(`Invalid output index: ${p[$]}`);if(p[$]===-3)continue;let C=p[$]===-1,T=p[$]===-2,A=C||T?a(o[$].dataType,o[$].dims):n(p[$],o[$].dataType,o[$].dims);if(f.push(A),A.data===0)continue;let B=this.gpuDataManager.get(A.data);if(!B)throw new Error(`no GPU data for output: ${A.data}`);if(C&&this.temporaryData.push(B),T){let R=this.kernelPersistentData.get(this.currentKernelId);R||(R=[],this.kernelPersistentData.set(this.currentKernelId,R)),R.push(B)}m.push(B)}if(s.length!==e.length||m.length!==f.length){if(m.length===0)return Lt(t.name),f;throw new Error(`Program ${t.name} has zero-sized tensor(s) in inputs or outputs. This is not supported now.`)}let c;if(l){let $=0,C=[];l.forEach(R=>{let D=typeof R.data=="number"?[R.data]:R.data;if(D.length===0)return;let K=R.type===10?2:4,j,ie;R.type===10?(ie=D.length>4?16:D.length>2?8:D.length*K,j=D.length>4?16:K*D.length):(ie=D.length<=2?D.length*K:16,j=16),$=Math.ceil($/ie)*ie,C.push($);let te=R.type===10?8:4;$+=D.length>4?Math.ceil(D.length/te)*j:D.length*K});let T=16;$=Math.ceil($/T)*T;let A=new ArrayBuffer($);l.forEach((R,D)=>{let K=C[D],j=typeof R.data=="number"?[R.data]:R.data;if(R.type===6)new Int32Array(A,K,j.length).set(j);else if(R.type===12)new Uint32Array(A,K,j.length).set(j);else if(R.type===10)new Uint16Array(A,K,j.length).set(j);else if(R.type===1)new Float32Array(A,K,j.length).set(j);else throw new Error(`Unsupported uniform type: ${Kr(R.type)}`)});let B=this.gpuDataManager.create($,GPUBufferUsage.COPY_DST|GPUBufferUsage.UNIFORM);this.device.queue.writeBuffer(B.buffer,0,A,0,$),this.gpuDataManager.release(B.id),c={offset:0,size:$,buffer:B.buffer}}let y=this.programManager.normalizeDispatchGroupSize(u),w=y[1]===1&&y[2]===1,v=jc(t,e,w),k=this.programManager.getArtifact(v);if(k||(k=this.programManager.build(t,y),this.programManager.setArtifact(v,k),rt("info",()=>`[artifact] key: ${v}, programName: ${t.name}`)),l&&k.uniformVariablesInfo){if(l.length!==k.uniformVariablesInfo.length)throw new Error(`Uniform variables count mismatch: expect ${k.uniformVariablesInfo.length}, got ${l.length} in program "${k.programInfo.name}".`);for(let $=0;$`[ProgramManager] run "${t.name}" (key=${v}) with ${y[0]}x${y[1]}x${y[2]}`),this.queryType!=="none"||this.sessionStatus==="capturing"){let $={kernelId:this.currentKernelId,programName:k.programInfo.name,inputTensorViews:e,outputTensorViews:f};this.pendingKernels.push($),this.sessionStatus==="capturing"&&this.capturedPendingKernels.get(this.currentSessionId).push($)}return this.programManager.run(k,s,m,y,c),Lt(t.name),f}upload(t,e){this.gpuDataManager.upload(t,e)}memcpy(t,e){this.gpuDataManager.memcpy(t,e)}async download(t,e){await this.gpuDataManager.download(t,e)}alloc(t){return this.gpuDataManager.create(t).id}free(t){return this.gpuDataManager.release(t)}createKernel(t,e,r,n){let a=Rm.get(t);if(!a)throw new Error(`kernel not implemented: ${t}`);let i={kernelType:t,kernelName:n,kernelEntry:a[0],attributes:[a[1],r]};this.kernels.set(e,i)}releaseKernel(t){let e=this.kernelPersistentData.get(t);if(e){for(let r of e)this.gpuDataManager.release(r.id);this.kernelPersistentData.delete(t)}this.kernelCustomData.delete(t),this.kernels.delete(t)}computeKernel(t,e,r){let n=this.kernels.get(t);if(!n)throw new Error(`kernel not created: ${t}`);let a=n.kernelType,i=n.kernelName,s=n.kernelEntry,o=n.attributes;if(this.currentKernelId!==null)throw new Error(`kernel "[${a}] ${i}" is not allowed to be called recursively`);this.currentKernelId=t,o[0]&&(o[1]=o[0](o[1]),o[0]=void 0),rt("info",()=>`[WebGPU] Start to run kernel "[${a}] ${i}"...`);let u=this.env.debug;this.temporaryData=[];try{return u&&this.device.pushErrorScope("validation"),s(e,o[1]),0}catch(l){return r.push(Promise.resolve(`[WebGPU] Kernel "[${a}] ${i}" failed. ${l}`)),1}finally{u&&r.push(this.device.popErrorScope().then(l=>l?`GPU validation error for kernel "[${a}] ${i}": ${l.message}`:null));for(let l of this.temporaryData)this.gpuDataManager.release(l.id);this.temporaryData=[],this.currentKernelId=null}}registerBuffer(t,e,r,n){let a=this.sessionExternalDataMapping.get(t);a||(a=new Map,this.sessionExternalDataMapping.set(t,a));let i=a.get(e),s=this.gpuDataManager.registerExternalBuffer(r,n,i?.[1]);return a.set(e,[s,r]),s}unregisterBuffers(t){let e=this.sessionExternalDataMapping.get(t);e&&(e.forEach(r=>this.gpuDataManager.unregisterExternalBuffer(r[1])),this.sessionExternalDataMapping.delete(t))}getBuffer(t){let e=this.gpuDataManager.get(t);if(!e)throw new Error(`no GPU data for buffer: ${t}`);return e.buffer}createDownloader(t,e,r){return async()=>{let n=await go(this,t,e);return ch(n.buffer,r)}}writeTimestamp(t){this.queryType==="inside-passes"&&this.computePassEncoder.writeTimestamp(this.querySet,t)}setQueryType(){this.queryType="none",(this.env.webgpu.profiling?.mode==="default"||(typeof this.env.trace>"u"?this.env.wasm.trace:this.env.trace))&&(this.device.features.has("chromium-experimental-timestamp-query-inside-passes")?this.queryType="inside-passes":this.device.features.has("timestamp-query")&&(this.queryType="at-passes"),this.queryType!=="none"&&typeof this.querySet>"u"&&(this.querySet=this.device.createQuerySet({type:"timestamp",count:this.maxDispatchNumber*2}),this.queryResolveBuffer=this.device.createBuffer({size:this.maxDispatchNumber*2*8,usage:GPUBufferUsage.COPY_SRC|GPUBufferUsage.QUERY_RESOLVE})))}captureBegin(){rt("info","captureBegin"),this.capturedCommandList.get(this.currentSessionId)||this.capturedCommandList.set(this.currentSessionId,[]),this.capturedPendingKernels.get(this.currentSessionId)||this.capturedPendingKernels.set(this.currentSessionId,[]),this.flush(),this.sessionStatus="capturing"}captureEnd(){rt("info","captureEnd"),this.flush(),this.sessionStatus="default"}replay(){rt("info","replay"),this.sessionStatus="replaying";let t=this.capturedCommandList.get(this.currentSessionId),e=this.capturedPendingKernels.get(this.currentSessionId),r=t.length;this.pendingKernels=[];for(let n=0;n=this.maxDispatchNumber||this.queryType==="at-passes")&&this.endComputePass(),this.pendingDispatchNumber>=this.maxDispatchNumber&&this.flush()}this.flush(),this.sessionStatus="default"}onReleaseSession(t){this.unregisterBuffers(t),this.capturedCommandList.has(t)&&this.capturedCommandList.delete(t),this.capturedPendingKernels.has(t)&&this.capturedPendingKernels.delete(t),this.gpuDataManager.onReleaseSession(t)}onRunStart(t){this.currentSessionId=t,this.setQueryType()}}}),Nm={};Mn(Nm,{init:()=>Fm});var wi,Kc,Fm,By=Z(()=>{$e(),Ry(),nn(),Ae(),wi=class Lm{constructor(e,r,n,a){this.module=e,this.dataType=r,this.data=n,this.dims=a}getFloat32Array(){if(this.dataType!==1)throw new Error("Invalid data type");let e=Y.size(this.dims);return e===0?new Float32Array:new Float32Array(this.module.HEAP8.buffer,this.data,e)}getBigInt64Array(){if(this.dataType!==7)throw new Error("Invalid data type");let e=Y.size(this.dims);return e===0?new BigInt64Array:new BigInt64Array(this.module.HEAP8.buffer,this.data,e)}getInt32Array(){if(this.dataType!==6)throw new Error("Invalid data type");let e=Y.size(this.dims);return e===0?new Int32Array:new Int32Array(this.module.HEAP8.buffer,this.data,e)}reshape(e){if(Y.size(e)!==Y.size(this.dims))throw new Error("Invalid new shape");return new Lm(this.module,this.dataType,this.data,e)}},Kc=class{constructor(t,e,r){this.module=t,this.backend=e,this.customDataOffset=0,this.customDataSize=0,this.adapterInfo=e.adapterInfo;let n=t.HEAPU32,a=r>>>2;this.opKernelContext=n[a++];let i=n[a++];this.outputCount=n[a++],this.customDataOffset=n[a++],this.customDataSize=n[a++];let s=[];for(let o=0;otypeof s=="number"?this.inputs[s]:s)??this.inputs,n=e?.outputs??[],a=(s,o,u)=>new wi(this.module,o,this.output(s,u),u),i=(s,o)=>{let u=ga(s);if(!u)throw new Error(`Unsupported data type: ${s}`);let l=u*Y.size(o),p=l>0?this.backend.gpuDataManager.create(l).id:0;return new wi(this.module,s,p,o)};return this.backend.run(t,r,n,a,i,this.outputCount)}output(t,e){let r=this.module.stackSave();try{let n=this.module.stackAlloc((1+e.length)*4),a=n>>2;this.module.HEAPU32[a++]=e.length;for(let i=0;i{let a=e.jsepInit;if(!a)throw new Error("Failed to initialize JSEP. The WebAssembly module is not built with JSEP support.");if(t==="webgpu"){let i=new Dm;await i.initialize(r,n),a("webgpu",[i,s=>i.alloc(s),s=>i.free(s),(s,o,u,l=!1)=>{if(l)rt("verbose",()=>`[WebGPU] jsepCopyGpuToGpu: src=${s}, dst=${o}, size=${u}`),i.memcpy(s,o);else{rt("verbose",()=>`[WebGPU] jsepCopyCpuToGpu: dataOffset=${s}, gpuDataId=${o}, size=${u}`);let p=e.HEAPU8.subarray(s>>>0,(s>>>0)+u);i.upload(o,p)}},async(s,o,u)=>{rt("verbose",()=>`[WebGPU] jsepCopyGpuToCpu: gpuDataId=${s}, dataOffset=${o}, size=${u}`),await i.download(s,()=>e.HEAPU8.subarray(o>>>0,(o>>>0)+u))},(s,o,u)=>i.createKernel(s,o,u,e.UTF8ToString(e._JsepGetNodeName(o))),s=>i.releaseKernel(s),(s,o,u,l)=>{rt("verbose",()=>`[WebGPU] jsepRun: sessionHandle=${u}, kernel=${s}, contextDataOffset=${o}`);let p=new Kc(e,i,o);return i.computeKernel(s,p,l)},()=>i.captureBegin(),()=>i.captureEnd(),()=>i.replay()])}else a("webnn")}}),Yc,Um,Wm,Tr,Xc,Eo,Vm,Gm,Zs,Hm,jm,qm,Dy=Z(()=>{Y_(),X_(),$e(),xa(),Wo(),lh(),Yc=(t,e)=>{at()._OrtInit(t,e)!==0&&je("Can't initialize onnxruntime.")},Um=async t=>{Yc(t.wasm.numThreads,Di(t.logLevel))},Wm=async(t,e)=>{{let r=(By(),Jr(Nm)).init;if(e==="webgpu"){if(typeof navigator>"u"||!navigator.gpu)throw new Error("WebGPU is not supported in current environment");let n=t.webgpu.adapter;if(n){if(typeof n.limits!="object"||typeof n.features!="object"||typeof n.requestDevice!="function")throw new Error("Invalid GPU adapter set in `env.webgpu.adapter`. It must be a GPUAdapter object.")}else{let a=t.webgpu.powerPreference;if(a!==void 0&&a!=="low-power"&&a!=="high-performance")throw new Error(`Invalid powerPreference setting: "${a}"`);let i=t.webgpu.forceFallbackAdapter;if(i!==void 0&&typeof i!="boolean")throw new Error(`Invalid forceFallbackAdapter setting: "${i}"`);if(n=await navigator.gpu.requestAdapter({powerPreference:a,forceFallbackAdapter:i}),!n)throw new Error('Failed to get GPU adapter. You may need to enable flag "--enable-unsafe-webgpu" if you are using Chrome.')}if(!t.wasm.simd)throw new Error("Not supported for WebGPU=ON and SIMD=OFF. Please set `env.wasm.simd` to true when using `webgpu` EP");await r("webgpu",at(),t,n)}if(e==="webnn"){if(typeof navigator>"u"||!navigator.ml)throw new Error("WebNN is not supported in current environment");await r("webnn",at(),t)}}},Tr=new Map,Xc=t=>{let e=at(),r=e.stackSave();try{let n=e.stackAlloc(8);return e._OrtGetInputOutputCount(t,n,n+4)!==0&&je("Can't get session input/output count."),[e.HEAP32[n/4],e.HEAP32[n/4+1]]}finally{e.stackRestore(r)}},Eo=t=>{let e=at(),r=e._malloc(t.byteLength);if(r===0)throw new Error(`Can't create a session. failed to allocate a buffer of size ${t.byteLength}.`);return e.HEAPU8.set(t,r),[r,t.byteLength]},Vm=async(t,e)=>{let r,n,a=at();Array.isArray(t)?[r,n]=t:t.buffer===a.HEAPU8.buffer?[r,n]=[t.byteOffset,t.byteLength]:[r,n]=Eo(t);let i=0,s=0,o=0,u=[],l=[],p=[];try{if([s,u]=uh(e),e?.externalData&&a.mountExternalData){let $=[];for(let C of e.externalData){let T=typeof C=="string"?C:C.path;$.push(Ni(typeof C=="string"?C:C.data).then(A=>{a.mountExternalData(T,A)}))}await Promise.all($)}i=await a._OrtCreateSession(r,n,s),i===0&&je("Can't create a session.");let[f,m]=Xc(i),c=!!e?.enableGraphCapture,y=[],w=[],v=[];for(let $=0;$$==="gpu-buffer")&&(o=a._OrtCreateBinding(i),o===0&&je("Can't create IO binding."),k={handle:o,outputPreferredLocations:v,outputPreferredLocationsEncoded:v.map($=>mo($))}),Tr.set(i,[i,l,p,k,c,!1]),[i,y,w]}catch(f){throw l.forEach(m=>a._OrtFree(m)),p.forEach(m=>a._OrtFree(m)),o!==0&&a._OrtReleaseBinding(o),i!==0&&a._OrtReleaseSession(i),f}finally{a._free(r),s!==0&&a._OrtReleaseSessionOptions(s),u.forEach(f=>a._free(f)),a.unmountExternalData?.()}},Gm=t=>{let e=at(),r=Tr.get(t);if(!r)throw new Error(`cannot release session. invalid session id: ${t}`);let[n,a,i,s,o]=r;s&&(o&&e._OrtClearBoundOutputs(s.handle),e._OrtReleaseBinding(s.handle)),e.jsepOnReleaseSession?.(t),a.forEach(u=>e._OrtFree(u)),i.forEach(u=>e._OrtFree(u)),e._OrtReleaseSession(n),Tr.delete(t)},Zs=(t,e,r,n,a,i=!1)=>{if(!t){e.push(0);return}let s=at(),o=t[0],u=t[1],l=t[3],p,f;if(o==="string"&&l==="gpu-buffer")throw new Error("String tensor is not supported on GPU.");if(i&&l!=="gpu-buffer")throw new Error(`External buffer must be provided for input/output index ${a} when enableGraphCapture is true.`);if(l==="gpu-buffer"){let y=t[2].gpuBuffer,w=ga(fo(o));f=u.reduce((k,$)=>k*$,1)*w;let v=s.jsepRegisterBuffer;if(!v)throw new Error('Tensor location "gpu-buffer" is not supported without using WebGPU.');p=v(n,a,y,f)}else{let y=t[2];if(Array.isArray(y)){f=4*y.length,p=s._malloc(f),r.push(p);let w=p/4;for(let v=0;vs.HEAP32[y++]=v);let w=s._OrtCreateTensor(fo(o),p,f,c,u.length,mo(l));w===0&&je(`Can't create tensor for input/output. session=${n}, index=${a}.`),e.push(w)}finally{s.stackRestore(m)}},Hm=async(t,e,r,n,a,i)=>{let s=at(),o=Tr.get(t);if(!o)throw new Error(`cannot run inference. invalid session id: ${t}`);let u=o[0],l=o[1],p=o[2],f=o[3],m=o[4],c=o[5],y=e.length,w=n.length,v=0,k=[],$=[],C=[],T=[],A=s.stackSave(),B=s.stackAlloc(y*4),R=s.stackAlloc(y*4),D=s.stackAlloc(w*4),K=s.stackAlloc(w*4);try{[v,k]=oh(i);for(let P=0;PVe*Ne,1);N=Kr(Ce);let dt=f?.outputPreferredLocations[n[P]];if(N==="string"){if(dt==="gpu-buffer")throw new Error("String tensor is not supported on GPU.");let Ve=[],Ne=ae/4;for(let ht=0;ht0){let Ve=s.jsepGetBuffer;if(!Ve)throw new Error('preferredLocation "gpu-buffer" is not supported without using WebGPU.');let Ne=Ve(ae),ht=ga(Ce);if(ht===void 0||!Go(N))throw new Error(`Unsupported data type: ${N}`);ne=!0,M.push([N,Qe,{gpuBuffer:Ne,download:s.jsepCreateDownloader(Ne,We*ht,N),dispose:()=>{s._OrtReleaseTensor(H)}},"gpu-buffer"])}else{let Ve=Vo(N),Ne=new Ve(We);new Uint8Array(Ne.buffer,Ne.byteOffset,Ne.byteLength).set(s.HEAPU8.subarray(ae,ae+Ne.byteLength)),M.push([N,Qe,Ne,"cpu"])}}finally{s.stackRestore(le),N==="string"&&ae&&s._free(ae),ne||s._OrtReleaseTensor(H)}}return f&&!m&&(s._OrtClearBoundOutputs(f.handle),Tr.set(t,[u,l,p,f,m,!1])),M}finally{s.stackRestore(A),$.forEach(j=>s._OrtReleaseTensor(j)),C.forEach(j=>s._OrtReleaseTensor(j)),T.forEach(j=>s._free(j)),v!==0&&s._OrtReleaseRunOptions(v),k.forEach(j=>s._free(j))}},jm=t=>{let e=at(),r=Tr.get(t);if(!r)throw new Error("invalid session id");let n=r[0],a=e._OrtEndProfiling(n);a===0&&je("Can't get an profile file name."),e._OrtFree(a)},qm=t=>{let e=[];for(let r of t){let n=r[2];!Array.isArray(n)&&"buffer"in n&&e.push(n.buffer)}return e}}),Ny=An((t,e)=>{e.exports='/*!\n * ONNX Runtime Web v1.18.0\n * Copyright (c) Microsoft Corporation. All rights reserved.\n * Licensed under the MIT License.\n */\n"use strict";(()=>{var ao=Object.defineProperty;var nl=Object.getOwnPropertyDescriptor;var ol=Object.getOwnPropertyNames;var il=Object.prototype.hasOwnProperty;var Y=(e,t)=>()=>(e&&(t=e(e=0)),t);var Wr=(e,t)=>()=>(t||e((t={exports:{}}).exports,t),t.exports),gn=(e,t)=>{for(var r in t)ao(e,r,{get:t[r],enumerable:!0})},al=(e,t,r,o)=>{if(t&&typeof t=="object"||typeof t=="function")for(let i of ol(t))!il.call(e,i)&&i!==r&&ao(e,i,{get:()=>t[i],enumerable:!(o=nl(t,i))||o.enumerable});return e};var wr=e=>al(ao({},"__esModule",{value:!0}),e);var so={};gn(so,{createReadStream:()=>Ai,readFile:()=>sl,readFileSync:()=>ul});var sl,ul,Ai,uo=Y(()=>{sl=void 0,ul=void 0,Ai=void 0});var lo={};gn(lo,{join:()=>dl});var dl,co=Y(()=>{dl=void 0});var Ei=Wr((Ti,po)=>{"use strict";var Ii=(()=>{var e=typeof document<"u"?document.currentScript?.src:void 0;return typeof __filename<"u"&&(e||=__filename),function(t={}){var r=t,o,i,u=new Promise((s,m)=>{o=s,i=m});r.mountExternalData=(s,m)=>{(r.eb||(r.eb=new Map)).set(s,m)},r.unmountExternalData=()=>{delete r.eb};let a=()=>{let s=(g,$,T)=>(...B)=>{let H=dt,q=$?.();B=g(...B);let te=$?.();return q!==te&&(g=te,T(q),$=T=null),dt!=H?tn():B},m=g=>async(...$)=>{try{if(r.cb)throw Error("Session already started");let T=r.cb={xb:$[0],errors:[]},B=await g(...$);if(r.cb!==T)throw Error("Session mismatch");r.kb?.flush();let H=T.errors;if(0te),0r._OrtCreateSession,g=>r._OrtCreateSession=g),r._OrtRun=m(s(r._OrtRun,()=>r._OrtRun,g=>r._OrtRun=g)),r._OrtRunWithBinding=m(s(r._OrtRunWithBinding,()=>r._OrtRunWithBinding,g=>r._OrtRunWithBinding=g)),r._OrtBindInput=s(r._OrtBindInput,()=>r._OrtBindInput,g=>r._OrtBindInput=g),a=void 0};r.jsepInit=(s,m)=>{if(a?.(),s==="webgpu"){[r.kb,r.pb,r.tb,r.lb,r.sb,r.Ra,r.ub,r.wb,r.qb,r.rb,r.vb]=m;let g=r.kb;r.jsepRegisterBuffer=($,T,B,H)=>g.registerBuffer($,T,B,H),r.jsepGetBuffer=$=>g.getBuffer($),r.jsepCreateDownloader=($,T,B)=>g.createDownloader($,T,B),r.jsepOnReleaseSession=$=>{g.onReleaseSession($)},r.jsepOnRunStart=$=>g.onRunStart($)}};var c=Object.assign({},r),p="./this.program",h=(s,m)=>{throw m},d=typeof window=="object",y=typeof importScripts=="function",w=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string",_="",v,S,A;if(w){var I=(uo(),wr(so)),x=(co(),wr(lo));_=y?x.dirname(_)+"/":__dirname+"/",v=(s,m)=>(s=Ke(s)?new URL(s):x.normalize(s),I.readFileSync(s,m?void 0:"utf8")),A=s=>(s=v(s,!0),s.buffer||(s=new Uint8Array(s)),s),S=(s,m,g,$=!0)=>{s=Ke(s)?new URL(s):x.normalize(s),I.readFile(s,$?void 0:"utf8",(T,B)=>{T?g(T):m($?B.buffer:B)})},!r.thisProgram&&1{throw process.exitCode=s,m}}else(d||y)&&(y?_=self.location.href:typeof document<"u"&&document.currentScript&&(_=document.currentScript.src),e&&(_=e),_.startsWith("blob:")?_="":_=_.substr(0,_.replace(/[?#].*/,"").lastIndexOf("/")+1),v=s=>{var m=new XMLHttpRequest;return m.open("GET",s,!1),m.send(null),m.responseText},y&&(A=s=>{var m=new XMLHttpRequest;return m.open("GET",s,!1),m.responseType="arraybuffer",m.send(null),new Uint8Array(m.response)}),S=(s,m,g)=>{var $=new XMLHttpRequest;$.open("GET",s,!0),$.responseType="arraybuffer",$.onload=()=>{$.status==200||$.status==0&&$.response?m($.response):g()},$.onerror=g,$.send(null)});var E=console.log.bind(console),P=console.error.bind(console);Object.assign(r,c),c=null;var O,R=!1,L,N,K,Q,he,W,se,Ce,We,ee,ae;function Ae(){var s=O.buffer;r.HEAP8=N=new Int8Array(s),r.HEAP16=Q=new Int16Array(s),r.HEAPU8=K=new Uint8Array(s),r.HEAPU16=he=new Uint16Array(s),r.HEAP32=W=new Int32Array(s),r.HEAPU32=se=new Uint32Array(s),r.HEAPF32=Ce=new Float32Array(s),r.HEAPF64=ae=new Float64Array(s),r.HEAP64=We=new BigInt64Array(s),r.HEAPU64=ee=new BigUint64Array(s)}var me=[],ie=[],ue=[],le=0,qe=null,G=null;function ne(s){throw s="Aborted("+s+")",P(s),R=!0,L=1,s=new WebAssembly.RuntimeError(s+". Build with -sASSERTIONS for more info."),i(s),s}var xe=s=>s.startsWith("data:application/octet-stream;base64,"),Ke=s=>s.startsWith("file://"),Be;if(Be="ort-wasm-simd.wasm",!xe(Be)){var Ge=Be;Be=r.locateFile?r.locateFile(Ge,_):_+Ge}function Ut(s){if(A)return A(s);throw"both async and sync fetching of the wasm failed"}function Ne(s){if(d||y){if(typeof fetch=="function"&&!Ke(s))return fetch(s,{credentials:"same-origin"}).then(m=>{if(!m.ok)throw`failed to load wasm binary file at \'${s}\'`;return m.arrayBuffer()}).catch(()=>Ut(s));if(S)return new Promise((m,g)=>{S(s,$=>m(new Uint8Array($)),g)})}return Promise.resolve().then(()=>Ut(s))}function Ye(s,m,g){return Ne(s).then($=>WebAssembly.instantiate($,m)).then(g,$=>{P(`failed to asynchronously prepare wasm: ${$}`),ne($)})}function mt(s,m){var g=Be;return typeof WebAssembly.instantiateStreaming!="function"||xe(g)||Ke(g)||w||typeof fetch!="function"?Ye(g,s,m):fetch(g,{credentials:"same-origin"}).then($=>WebAssembly.instantiateStreaming($,s).then(m,function(T){return P(`wasm streaming compile failed: ${T}`),P("falling back to ArrayBuffer instantiation"),Ye(g,s,m)}))}var Rt={824920:(s,m,g,$)=>{if(typeof r>"u"||!r.eb)return 1;if(s=je(s>>>0),s.startsWith("./")&&(s=s.substring(2)),s=r.eb.get(s),!s)return 2;if(m>>>=0,g>>>=0,m+g>s.byteLength)return 3;try{return K.set(s.subarray(m,m+g),$>>>0>>>0),0}catch{return 4}},825421:()=>{r.qb()},825452:()=>{r.rb()},825481:()=>{r.vb()},825506:s=>r.pb(s),825539:s=>r.tb(s),825571:(s,m,g)=>{r.lb(s,m,g,!0)},825610:(s,m,g)=>{r.lb(s,m,g)},825643:s=>{r.Ra("Abs",s,void 0)},825694:s=>{r.Ra("Neg",s,void 0)},825745:s=>{r.Ra("Floor",s,void 0)},825798:s=>{r.Ra("Ceil",s,void 0)},825850:s=>{r.Ra("Reciprocal",s,void 0)},825908:s=>{r.Ra("Sqrt",s,void 0)},825960:s=>{r.Ra("Exp",s,void 0)},826011:s=>{r.Ra("Erf",s,void 0)},826062:s=>{r.Ra("Sigmoid",s,void 0)},826117:(s,m,g)=>{r.Ra("HardSigmoid",s,{alpha:m,beta:g})},826196:s=>{r.Ra("Log",s,void 0)},826247:s=>{r.Ra("Sin",s,void 0)},826298:s=>{r.Ra("Cos",s,void 0)},826349:s=>{r.Ra("Tan",s,void 0)},826400:s=>{r.Ra("Asin",s,void 0)},826452:s=>{r.Ra("Acos",s,void 0)},826504:s=>{r.Ra("Atan",s,void 0)},826556:s=>{r.Ra("Sinh",s,void 0)},826608:s=>{r.Ra("Cosh",s,void 0)},826660:s=>{r.Ra("Asinh",s,void 0)},826713:s=>{r.Ra("Acosh",s,void 0)},826766:s=>{r.Ra("Atanh",s,void 0)},826819:s=>{r.Ra("Tanh",s,void 0)},826871:s=>{r.Ra("Not",s,void 0)},826922:(s,m,g)=>{r.Ra("Clip",s,{min:m,max:g})},826991:s=>{r.Ra("Clip",s,void 0)},827043:(s,m)=>{r.Ra("Elu",s,{alpha:m})},827101:s=>{r.Ra("Relu",s,void 0)},827153:(s,m)=>{r.Ra("LeakyRelu",s,{alpha:m})},827217:(s,m)=>{r.Ra("ThresholdedRelu",s,{alpha:m})},827287:(s,m)=>{r.Ra("Cast",s,{to:m})},827345:s=>{r.Ra("Add",s,void 0)},827396:s=>{r.Ra("Sub",s,void 0)},827447:s=>{r.Ra("Mul",s,void 0)},827498:s=>{r.Ra("Div",s,void 0)},827549:s=>{r.Ra("Pow",s,void 0)},827600:s=>{r.Ra("Equal",s,void 0)},827653:s=>{r.Ra("Greater",s,void 0)},827708:s=>{r.Ra("GreaterOrEqual",s,void 0)},827770:s=>{r.Ra("Less",s,void 0)},827822:s=>{r.Ra("LessOrEqual",s,void 0)},827881:(s,m,g,$,T)=>{r.Ra("ReduceMean",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828040:(s,m,g,$,T)=>{r.Ra("ReduceMax",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828198:(s,m,g,$,T)=>{r.Ra("ReduceMin",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828356:(s,m,g,$,T)=>{r.Ra("ReduceProd",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828515:(s,m,g,$,T)=>{r.Ra("ReduceSum",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828673:(s,m,g,$,T)=>{r.Ra("ReduceL1",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828830:(s,m,g,$,T)=>{r.Ra("ReduceL2",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},828987:(s,m,g,$,T)=>{r.Ra("ReduceLogSum",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},829148:(s,m,g,$,T)=>{r.Ra("ReduceSumSquare",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},829312:(s,m,g,$,T)=>{r.Ra("ReduceLogSumExp",s,{keepDims:!!m,noopWithEmptyAxes:!!g,axes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},829476:s=>{r.Ra("Where",s,void 0)},829529:(s,m,g)=>{r.Ra("Transpose",s,{perm:m?Array.from(W.subarray(m>>>0,g>>>0)):[]})},829637:(s,m,g,$)=>{r.Ra("DepthToSpace",s,{blocksize:m,mode:je(g),format:$?"NHWC":"NCHW"})},829770:(s,m,g,$)=>{r.Ra("DepthToSpace",s,{blocksize:m,mode:je(g),format:$?"NHWC":"NCHW"})},829903:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be)=>{r.Ra("ConvTranspose",s,{format:te?"NHWC":"NCHW",autoPad:m,dilations:[g],group:$,kernelShape:[T],pads:[B,H],strides:[q],wIsConst:()=>!!N[X>>>0],outputPadding:de?Array.from(W.subarray(de>>>0,Ee>>>0)):[],outputShape:Oe?Array.from(W.subarray(Oe>>>0,D>>>0)):[],activation:je(be)})},830304:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D)=>{r.Ra("ConvTranspose",s,{format:q?"NHWC":"NCHW",autoPad:m,dilations:Array.from(W.subarray(g>>>0,(g>>>0)+2>>>0)),group:$,kernelShape:Array.from(W.subarray(T>>>0,(T>>>0)+2>>>0)),pads:Array.from(W.subarray(B>>>0,(B>>>0)+4>>>0)),strides:Array.from(W.subarray(H>>>0,(H>>>0)+2>>>0)),wIsConst:()=>!!N[te>>>0],outputPadding:X?Array.from(W.subarray(X>>>0,de>>>0)):[],outputShape:Ee?Array.from(W.subarray(Ee>>>0,Oe>>>0)):[],activation:je(D)})},830869:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be)=>{r.Ra("ConvTranspose",s,{format:te?"NHWC":"NCHW",autoPad:m,dilations:[g],group:$,kernelShape:[T],pads:[B,H],strides:[q],wIsConst:()=>!!N[X>>>0],outputPadding:de?Array.from(W.subarray(de>>>0,Ee>>>0)):[],outputShape:Oe?Array.from(W.subarray(Oe>>>0,D>>>0)):[],activation:je(be)})},831270:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D)=>{r.Ra("ConvTranspose",s,{format:q?"NHWC":"NCHW",autoPad:m,dilations:Array.from(W.subarray(g>>>0,(g>>>0)+2>>>0)),group:$,kernelShape:Array.from(W.subarray(T>>>0,(T>>>0)+2>>>0)),pads:Array.from(W.subarray(B>>>0,(B>>>0)+4>>>0)),strides:Array.from(W.subarray(H>>>0,(H>>>0)+2>>>0)),wIsConst:()=>!!N[te>>>0],outputPadding:X?Array.from(W.subarray(X>>>0,de>>>0)):[],outputShape:Ee?Array.from(W.subarray(Ee>>>0,Oe>>>0)):[],activation:je(D)})},831835:(s,m)=>{r.Ra("GlobalAveragePool",s,{format:m?"NHWC":"NCHW"})},831926:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be,Ie)=>{r.Ra("AveragePool",s,{format:Ie?"NHWC":"NCHW",auto_pad:m,ceil_mode:g,count_include_pad:$,storage_order:T,dilations:[B,H],kernel_shape:[q,te],pads:[X,de,Ee,Oe],strides:[D,be]})},832210:(s,m)=>{r.Ra("GlobalAveragePool",s,{format:m?"NHWC":"NCHW"})},832301:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be,Ie)=>{r.Ra("AveragePool",s,{format:Ie?"NHWC":"NCHW",auto_pad:m,ceil_mode:g,count_include_pad:$,storage_order:T,dilations:[B,H],kernel_shape:[q,te],pads:[X,de,Ee,Oe],strides:[D,be]})},832585:(s,m)=>{r.Ra("GlobalMaxPool",s,{format:m?"NHWC":"NCHW"})},832672:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be,Ie)=>{r.Ra("MaxPool",s,{format:Ie?"NHWC":"NCHW",auto_pad:m,ceil_mode:g,count_include_pad:$,storage_order:T,dilations:[B,H],kernel_shape:[q,te],pads:[X,de,Ee,Oe],strides:[D,be]})},832952:(s,m)=>{r.Ra("GlobalMaxPool",s,{format:m?"NHWC":"NCHW"})},833039:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be,Ie)=>{r.Ra("MaxPool",s,{format:Ie?"NHWC":"NCHW",auto_pad:m,ceil_mode:g,count_include_pad:$,storage_order:T,dilations:[B,H],kernel_shape:[q,te],pads:[X,de,Ee,Oe],strides:[D,be]})},833319:(s,m,g,$,T)=>{r.Ra("Gemm",s,{alpha:m,beta:g,transA:$,transB:T})},833423:s=>{r.Ra("MatMul",s,void 0)},833477:(s,m,g,$)=>{r.Ra("ArgMax",s,{keepDims:!!m,selectLastIndex:!!g,axis:$})},833585:(s,m,g,$)=>{r.Ra("ArgMin",s,{keepDims:!!m,selectLastIndex:!!g,axis:$})},833693:(s,m)=>{r.Ra("Softmax",s,{axis:m})},833756:(s,m)=>{r.Ra("Concat",s,{axis:m})},833816:(s,m,g,$,T)=>{r.Ra("Split",s,{axis:m,numOutputs:g,splitSizes:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},833956:s=>{r.Ra("Expand",s,void 0)},834010:(s,m)=>{r.Ra("Gather",s,{axis:Number(m)})},834081:(s,m)=>{r.Ra("GatherElements",s,{axis:Number(m)})},834160:(s,m,g,$,T,B,H,q,te,X,de)=>{r.Ra("Resize",s,{antialias:m,axes:g?Array.from(W.subarray(g>>>0,$>>>0)):[],coordinateTransformMode:je(T),cubicCoeffA:B,excludeOutside:H,extrapolationValue:q,keepAspectRatioPolicy:je(te),mode:je(X),nearestMode:je(de)})},834506:(s,m,g,$,T,B,H)=>{r.Ra("Slice",s,{starts:m?Array.from(W.subarray(m>>>0,g>>>0)):[],ends:$?Array.from(W.subarray($>>>0,T>>>0)):[],axes:B?Array.from(W.subarray(B>>>0,H>>>0)):[]})},834722:s=>{r.Ra("Tile",s,void 0)},834774:(s,m,g,$)=>{r.Ra("LayerNormalization",s,{axis:m,epsilon:g,simplified:!!$})},834885:(s,m,g)=>{r.Ra("InstanceNormalization",s,{epsilon:m,format:g?"NHWC":"NCHW"})},834999:(s,m,g)=>{r.Ra("InstanceNormalization",s,{epsilon:m,format:g?"NHWC":"NCHW"})},835113:s=>{r.Ra("Range",s,void 0)},835166:(s,m)=>{r.Ra("Einsum",s,{equation:je(m)})},835247:(s,m,g,$,T)=>{r.Ra("Pad",s,{mode:m,value:g,pads:$?Array.from(W.subarray($>>>0,T>>>0)):[]})},835374:(s,m,g,$,T,B)=>{r.Ra("BatchNormalization",s,{epsilon:m,momentum:g,spatial:!!T,trainingMode:!!$,format:B?"NHWC":"NCHW"})},835543:(s,m,g,$,T,B)=>{r.Ra("BatchNormalization",s,{epsilon:m,momentum:g,spatial:!!T,trainingMode:!!$,format:B?"NHWC":"NCHW"})},835712:(s,m,g)=>{r.Ra("CumSum",s,{exclusive:Number(m),reverse:Number(g)})},835809:(s,m,g,$,T,B,H,q,te)=>{r.Ra("Attention",s,{numHeads:m,isUnidirectional:g,maskFilterValue:$,scale:T,doRotary:B,qkvHiddenSizes:H?Array.from(W.subarray(Number(q)>>>0,Number(q)+H>>>0)):[],pastPresentShareBuffer:!!te})},836081:s=>{r.Ra("BiasAdd",s,void 0)},836136:s=>{r.Ra("BiasSplitGelu",s,void 0)},836197:s=>{r.Ra("FastGelu",s,void 0)},836253:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe)=>{r.Ra("Conv",s,{format:te?"NHWC":"NCHW",auto_pad:m,dilations:[g],group:$,kernel_shape:[T],pads:B?Array.from(W.subarray(B>>>0,H>>>0)):[],strides:[q],w_is_const:()=>!!N[X>>>0],activation:je(de),activation_params:Ee?Array.from(Ce.subarray(Ee>>>0,Oe>>>0)):[]})},836623:(s,m,g,$,T,B,H,q,te,X,de,Ee,Oe,D,be,Ie)=>{r.Ra("Conv",s,{format:Ee?"NHWC":"NCHW",auto_pad:m,dilations:[g,$],group:T,kernel_shape:[B,H],pads:q?Array.from(W.subarray(q>>>0,te>>>0)):[],strides:[X,de],w_is_const:()=>!!N[Oe>>>0],activation:je(D),activation_params:be?Array.from(Ce.subarray(be>>>0,Ie>>>0)):[]})},837014:s=>{r.Ra("Gelu",s,void 0)},837066:(s,m,g,$,T,B)=>{r.Ra("MatMulNBits",s,{k:m,n:g,accuracyLevel:$,bits:T,blockSize:B})},837193:(s,m,g,$,T,B)=>{r.Ra("MultiHeadAttention",s,{numHeads:m,isUnidirectional:g,maskFilterValue:$,scale:T,doRotary:B})},837352:(s,m,g,$,T)=>{r.Ra("RotaryEmbedding",s,{interleaved:!!m,numHeads:g,rotaryEmbeddingDim:$,scale:T})},837491:(s,m,g)=>{r.Ra("SkipLayerNormalization",s,{epsilon:m,simplified:!!g})},837593:(s,m,g)=>{r.Ra("SkipLayerNormalization",s,{epsilon:m,simplified:!!g})},837695:(s,m,g,$)=>{r.Ra("LayerNormalization",s,{axis:m,epsilon:g,simplified:!!$})},837806:s=>{r.ub(s)},837840:(s,m)=>r.wb(s,m,r.cb.xb,r.cb.errors)};function qt(s){this.name="ExitStatus",this.message=`Program terminated with exit(${s})`,this.status=s}class Vt{constructor(m){this.hb=m-24}}var sr=0,jt=0,xr=typeof TextDecoder<"u"?new TextDecoder("utf8"):void 0,Kt=(s,m,g)=>{m>>>=0;var $=m+g;for(g=m;s[g]&&!(g>=$);)++g;if(16T?$+=String.fromCharCode(T):(T-=65536,$+=String.fromCharCode(55296|T>>10,56320|T&1023))}}else $+=String.fromCharCode(T)}return $},je=(s,m)=>(s>>>=0)?Kt(K,s,m):"",Wt=s=>{for(var m=0,g=0;g=$?m++:2047>=$?m+=2:55296<=$&&57343>=$?(m+=4,++g):m+=3}return m},at=(s,m,g,$)=>{if(g>>>=0,!(0<$))return 0;var T=g;$=g+$-1;for(var B=0;B=H){var q=s.charCodeAt(++B);H=65536+((H&1023)<<10)|q&1023}if(127>=H){if(g>=$)break;m[g++>>>0]=H}else{if(2047>=H){if(g+1>=$)break;m[g++>>>0]=192|H>>6}else{if(65535>=H){if(g+2>=$)break;m[g++>>>0]=224|H>>12}else{if(g+3>=$)break;m[g++>>>0]=240|H>>18,m[g++>>>0]=128|H>>12&63}m[g++>>>0]=128|H>>6&63}m[g++>>>0]=128|H&63}}return m[g>>>0]=0,g-T},Cr,ft=s=>{for(var m="";K[s>>>0];)m+=Cr[K[s++>>>0]];return m},ur={},Ar={},Ir={},st;function Tr(s,m,g={}){var $=m.name;if(!s)throw new st(`type "${$}" must have a positive integer typeid pointer`);if(Ar.hasOwnProperty(s)){if(g.nb)return;throw new st(`Cannot register type \'${$}\' twice`)}Ar[s]=m,delete Ir[s],ur.hasOwnProperty(s)&&(m=ur[s],delete ur[s],m.forEach(T=>T()))}function ht(s,m,g={}){if(!("argPackAdvance"in m))throw new TypeError("registerType registeredInstance requires argPackAdvance");return Tr(s,m,g)}var bt=(s,m,g)=>{switch(m){case 1:return g?$=>N[$>>>0]:$=>K[$>>>0];case 2:return g?$=>Q[$>>>1>>>0]:$=>he[$>>>1>>>0];case 4:return g?$=>W[$>>>2>>>0]:$=>se[$>>>2>>>0];case 8:return g?$=>We[$>>>3]:$=>ee[$>>>3];default:throw new TypeError(`invalid integer width (${m}): ${s}`)}},Er=[],Te=[];function dr(s){s>>>=0,9{if(!s)throw new st("Cannot use deleted val. handle = "+s);return Te[s]},ut=s=>{switch(s){case void 0:return 2;case null:return 4;case!0:return 6;case!1:return 8;default:let m=Er.pop()||Te.length;return Te[m]=s,Te[m+1]=1,m}};function lr(s){return this.fromWireType(se[s>>>2>>>0])}var Fn={name:"emscripten::val",fromWireType:s=>{var m=Xe(s);return dr(s),m},toWireType:(s,m)=>ut(m),argPackAdvance:8,readValueFromPointer:lr,bb:null},ge=(s,m)=>{switch(m){case 4:return function(g){return this.fromWireType(Ce[g>>>2>>>0])};case 8:return function(g){return this.fromWireType(ae[g>>>3>>>0])};default:throw new TypeError(`invalid float width (${m}): ${s}`)}},Yt=typeof TextDecoder<"u"?new TextDecoder("utf-16le"):void 0,jr=(s,m)=>{for(var g=s>>1,$=g+m/2;!(g>=$)&&he[g>>>0];)++g;if(g<<=1,32>>0,g>>>0));for(g="",$=0;!($>=m/2);++$){var T=Q[s+2*$>>>1>>>0];if(T==0)break;g+=String.fromCharCode(T)}return g},qn=(s,m,g)=>{if(g??=2147483647,2>g)return 0;g-=2;var $=m;g=g<2*s.length?g/2:s.length;for(var T=0;T>>1>>>0]=s.charCodeAt(T),m+=2;return Q[m>>>1>>>0]=0,m-$},Kr=s=>2*s.length,jn=(s,m)=>{for(var g=0,$="";!(g>=m/4);){var T=W[s+4*g>>>2>>>0];if(T==0)break;++g,65536<=T?(T-=65536,$+=String.fromCharCode(55296|T>>10,56320|T&1023)):$+=String.fromCharCode(T)}return $},Yr=(s,m,g)=>{if(m>>>=0,g??=2147483647,4>g)return 0;var $=m;g=$+g-4;for(var T=0;T=B){var H=s.charCodeAt(++T);B=65536+((B&1023)<<10)|H&1023}if(W[m>>>2>>>0]=B,m+=4,m+4>g)break}return W[m>>>2>>>0]=0,m-$},Zr=s=>{for(var m=0,g=0;g=$&&++g,m+=4}return m},cr=(s,m)=>{var g=Ar[s];if(g===void 0)throw s=Mr(s),g=ft(s),rt(s),new st(`${m} has unknown type ${g}`);return g},Pr=(s,m,g)=>{var $=[];return s=s.toWireType($,g),$.length&&(se[m>>>2>>>0]=ut($)),s},He=s=>{try{s()}catch(m){ne(m)}},Xr=s=>{if(!R)try{s();try{L=L=s=L,r.onExit?.(s),R=!0,h(s,new qt(s))}catch(m){m instanceof qt||m=="unwind"||h(1,m)}}catch(m){m instanceof qt||m=="unwind"||h(1,m)}};function Qr(){var s=pe,m={};for(let[g,$]of Object.entries(s))m[g]=typeof $=="function"?(...T)=>{Zt.push(g);try{return $(...T)}finally{R||(Zt.pop(),dt&>===1&&Zt.length===0&&(gt=0,He(dn),typeof Fibers<"u"&&Fibers.Db()))}}:$;return m}var gt=0,dt=null,Bt=0,Zt=[],kr={},Or={},Jr=0,pr=null,en=[];function tn(){return new Promise((s,m)=>{pr={resolve:s,reject:m}})}function rn(){var s=Nt(65548),m=s+12;se[s>>>2>>>0]=m,se[s+4>>>2>>>0]=m+65536,m=Zt[0];var g=kr[m];return g===void 0&&(g=Jr++,kr[m]=g,Or[g]=m),W[s+8>>>2>>>0]=g,s}function nn(s){if(!R){if(gt===0){var m=!1,g=!1;s(($=0)=>{if(!R&&(Bt=$,m=!0,g)){gt=2,He(()=>vt(dt)),typeof Browser<"u"&&Browser.ib.mb&&Browser.ib.resume(),$=!1;try{var T=(0,pe[Or[W[dt+8>>>2>>>0]]])()}catch(q){T=q,$=!0}var B=!1;if(!dt){var H=pr;H&&(pr=null,($?H.reject:H.resolve)(T),B=!0)}if($&&!B)throw T}}),g=!0,m||(gt=1,dt=rn(),typeof Browser<"u"&&Browser.ib.mb&&Browser.ib.pause(),He(()=>Jt(dt)))}else gt===2?(gt=0,He(ct),rt(dt),dt=null,en.forEach(Xr)):ne(`invalid state: ${gt}`);return Bt}}function Rr(s){return nn(m=>{s().then(m)})}var Xt=[],on={},nt=s=>{var m=on[s];return m===void 0?ft(s):m},mr=()=>typeof globalThis=="object"?globalThis:Function("return this")(),Br=s=>{var m=Xt.length;return Xt.push(s),m},Kn=(s,m)=>{for(var g=Array(s),$=0;$>>2>>>0],"parameter "+$);return g},wt=(s,m)=>Object.defineProperty(m,"name",{value:s});function Yn(s){var m=Function;if(!(m instanceof Function))throw new TypeError(`new_ called with constructor type ${typeof m} which is not a function`);var g=wt(m.name||"unknownFunctionName",function(){});return g.prototype=m.prototype,g=new g,s=m.apply(g,s),s instanceof Object?s:g}var Je=s=>s%4===0&&(s%100!==0||s%400===0),Dr=[0,31,60,91,121,152,182,213,244,274,305,335],fr=[0,31,59,90,120,151,181,212,243,273,304,334],lt=[],hr=(s,m)=>{lt.length=0;for(var g;g=K[s++>>>0];){var $=g!=105;$&=g!=112,m+=$&&m%8?4:0,lt.push(g==112?se[m>>>2>>>0]:g==106?We[m>>>3]:g==105?W[m>>>2>>>0]:ae[m>>>3>>>0]),m+=$?8:4}return lt},Qe={},ot=()=>{if(!Qt){var s={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(typeof navigator=="object"&&navigator.languages&&navigator.languages[0]||"C").replace("-","_")+".UTF-8",_:p||"./this.program"},m;for(m in Qe)Qe[m]===void 0?delete s[m]:s[m]=Qe[m];var g=[];for(m in s)g.push(`${m}=${s[m]}`);Qt=g}return Qt},Qt,Zn=[null,[],[]],an=[31,29,31,30,31,30,31,31,30,31,30,31],zr=[31,28,31,30,31,30,31,31,30,31,30,31];function Xn(s){var m=Array(Wt(s)+1);return at(s,m,0,m.length),m}function sn(s,m,g,$){function T(D,be,Ie){for(D=typeof D=="number"?D.toString():D||"";D.lengthMt?-1:0zt-D.getDate())be-=zt-D.getDate()+1,D.setDate(1),11>Ie?D.setMonth(Ie+1):(D.setMonth(0),D.setFullYear(D.getFullYear()+1));else{D.setDate(D.getDate()+be);break}}return Ie=new Date(D.getFullYear()+1,0,4),be=q(new Date(D.getFullYear(),0,4)),Ie=q(Ie),0>=H(be,D)?0>=H(Ie,D)?D.getFullYear()+1:D.getFullYear():D.getFullYear()-1}s>>>=0,m>>>=0,g>>>=0,$>>>=0;var X=se[$+40>>>2>>>0];$={Ab:W[$>>>2>>>0],zb:W[$+4>>>2>>>0],fb:W[$+8>>>2>>>0],jb:W[$+12>>>2>>>0],gb:W[$+16>>>2>>>0],ab:W[$+20>>>2>>>0],Va:W[$+24>>>2>>>0],$a:W[$+28>>>2>>>0],Cb:W[$+32>>>2>>>0],yb:W[$+36>>>2>>>0],Bb:X?je(X):""},g=je(g),X={"%c":"%a %b %d %H:%M:%S %Y","%D":"%m/%d/%y","%F":"%Y-%m-%d","%h":"%b","%r":"%I:%M:%S %p","%R":"%H:%M","%T":"%H:%M:%S","%x":"%m/%d/%y","%X":"%H:%M:%S","%Ec":"%c","%EC":"%C","%Ex":"%m/%d/%y","%EX":"%H:%M:%S","%Ey":"%y","%EY":"%Y","%Od":"%d","%Oe":"%e","%OH":"%H","%OI":"%I","%Om":"%m","%OM":"%M","%OS":"%S","%Ou":"%u","%OU":"%U","%OV":"%V","%Ow":"%w","%OW":"%W","%Oy":"%y"};for(var de in X)g=g.replace(new RegExp(de,"g"),X[de]);var Ee="Sunday Monday Tuesday Wednesday Thursday Friday Saturday".split(" "),Oe="January February March April May June July August September October November December".split(" ");X={"%a":D=>Ee[D.Va].substring(0,3),"%A":D=>Ee[D.Va],"%b":D=>Oe[D.gb].substring(0,3),"%B":D=>Oe[D.gb],"%C":D=>B((D.ab+1900)/100|0,2),"%d":D=>B(D.jb,2),"%e":D=>T(D.jb,2," "),"%g":D=>te(D).toString().substring(2),"%G":te,"%H":D=>B(D.fb,2),"%I":D=>(D=D.fb,D==0?D=12:12{for(var be=0,Ie=0;Ie<=D.gb-1;be+=(Je(D.ab+1900)?an:zr)[Ie++]);return B(D.jb+be,3)},"%m":D=>B(D.gb+1,2),"%M":D=>B(D.zb,2),"%n":()=>`\n`,"%p":D=>0<=D.fb&&12>D.fb?"AM":"PM","%S":D=>B(D.Ab,2),"%t":()=>" ","%u":D=>D.Va||7,"%U":D=>B(Math.floor((D.$a+7-D.Va)/7),2),"%V":D=>{var be=Math.floor((D.$a+7-(D.Va+6)%7)/7);if(2>=(D.Va+371-D.$a-2)%7&&be++,be)be==53&&(Ie=(D.Va+371-D.$a)%7,Ie==4||Ie==3&&Je(D.ab)||(be=1));else{be=52;var Ie=(D.Va+7-D.$a-1)%7;(Ie==4||Ie==5&&Je(D.ab%400-1))&&be++}return B(be,2)},"%w":D=>D.Va,"%W":D=>B(Math.floor((D.$a+7-(D.Va+6)%7)/7),2),"%y":D=>(D.ab+1900).toString().substring(2),"%Y":D=>D.ab+1900,"%z":D=>{D=D.yb;var be=0<=D;return D=Math.abs(D)/60,(be?"+":"-")+("0000"+(D/60*100+D%60)).slice(-4)},"%Z":D=>D.Bb,"%%":()=>"%"},g=g.replace(/%%/g,"\\0\\0");for(de in X)g.includes(de)&&(g=g.replace(new RegExp(de,"g"),X[de]($)));return g=g.replace(/\\0\\0/g,"%"),de=Xn(g),de.length>m?0:(N.set(de,s>>>0),de.length-1)}for(var un=Array(256),gr=0;256>gr;++gr)un[gr]=String.fromCharCode(gr);Cr=un,st=r.BindingError=class extends Error{constructor(s){super(s),this.name="BindingError"}},r.InternalError=class extends Error{constructor(s){super(s),this.name="InternalError"}},Te.push(0,1,void 0,1,null,1,!0,1,!1,1),r.count_emval_handles=()=>Te.length/2-5-Er.length;var Qn={ia:function(s,m,g){return Rr(async()=>{await r.sb(s,m,g)})},a:function(s,m,g){s>>>=0;var $=new Vt(s);throw se[$.hb+16>>>2>>>0]=0,se[$.hb+4>>>2>>>0]=m>>>0,se[$.hb+8>>>2>>>0]=g>>>0,sr=s,jt++,sr},y:function(){return 0},ea:function(){},R:function(){},T:function(){},ga:function(){return 0},ca:function(){},Z:function(){},ba:function(){},G:function(){},S:function(){},P:function(){},da:function(){},Q:function(){},C:function(s,m,g){m=ft(m>>>0),ht(s>>>0,{name:m,fromWireType:$=>$,toWireType:function($,T){if(typeof T!="bigint"&&typeof T!="number")throw T===null?T="null":($=typeof T,T=$==="object"||$==="array"||$==="function"?T.toString():""+T),new TypeError(`Cannot convert "${T}" to ${this.name}`);return typeof T=="number"&&(T=BigInt(T)),T},argPackAdvance:8,readValueFromPointer:bt(m,g>>>0,m.indexOf("u")==-1),bb:null})},K:function(s,m,g,$){m=ft(m>>>0),ht(s>>>0,{name:m,fromWireType:function(T){return!!T},toWireType:function(T,B){return B?g:$},argPackAdvance:8,readValueFromPointer:function(T){return this.fromWireType(K[T>>>0])},bb:null})},J:function(s){return ht(s>>>0,Fn)},B:function(s,m,g){m=ft(m>>>0),ht(s>>>0,{name:m,fromWireType:$=>$,toWireType:($,T)=>T,argPackAdvance:8,readValueFromPointer:ge(m,g>>>0),bb:null})},s:function(s,m,g,$,T){if(s>>>=0,g>>>=0,m=ft(m>>>0),T===-1&&(T=4294967295),T=q=>q,$===0){var B=32-8*g;T=q=>q<>>B}var H=m.includes("unsigned")?function(q,te){return te>>>0}:function(q,te){return te};ht(s,{name:m,fromWireType:T,toWireType:H,argPackAdvance:8,readValueFromPointer:bt(m,g,$!==0),bb:null})},o:function(s,m,g){function $(B){return new T(N.buffer,se[B+4>>>2>>>0],se[B>>>2>>>0])}var T=[Int8Array,Uint8Array,Int16Array,Uint16Array,Int32Array,Uint32Array,Float32Array,Float64Array,BigInt64Array,BigUint64Array][m];g=ft(g>>>0),ht(s>>>0,{name:g,fromWireType:$,argPackAdvance:8,readValueFromPointer:$},{nb:!0})},D:function(s,m){m=ft(m>>>0);var g=m==="std::string";ht(s>>>0,{name:m,fromWireType:function($){var T=se[$>>>2>>>0],B=$+4;if(g)for(var H=B,q=0;q<=T;++q){var te=B+q;if(q==T||K[te>>>0]==0){if(H=je(H,te-H),X===void 0)var X=H;else X+=String.fromCharCode(0),X+=H;H=te+1}}else{for(X=Array(T),q=0;q>>0]);X=X.join("")}return rt($),X},toWireType:function($,T){T instanceof ArrayBuffer&&(T=new Uint8Array(T));var B=typeof T=="string";if(!(B||T instanceof Uint8Array||T instanceof Uint8ClampedArray||T instanceof Int8Array))throw new st("Cannot pass non-string to std::string");var H=g&&B?Wt(T):T.length,q=Nt(4+H+1),te=q+4;if(se[q>>>2>>>0]=H,g&&B)at(T,K,te,H+1);else if(B)for(B=0;B>>0]=X}else for(B=0;B>>0]=T[B];return $!==null&&$.push(rt,q),q},argPackAdvance:8,readValueFromPointer:lr,bb($){rt($)}})},x:function(s,m,g){if(m>>>=0,g>>>=0,g=ft(g),m===2)var $=jr,T=qn,B=Kr,H=q=>he[q>>>1>>>0];else m===4&&($=jn,T=Yr,B=Zr,H=q=>se[q>>>2>>>0]);ht(s>>>0,{name:g,fromWireType:q=>{for(var te=se[q>>>2>>>0],X,de=q+4,Ee=0;Ee<=te;++Ee){var Oe=q+4+Ee*m;(Ee==te||H(Oe)==0)&&(de=$(de,Oe-de),X===void 0?X=de:(X+=String.fromCharCode(0),X+=de),de=Oe+m)}return rt(q),X},toWireType:(q,te)=>{if(typeof te!="string")throw new st(`Cannot pass non-string to C++ string type ${g}`);var X=B(te),de=Nt(4+X+m);return se[de>>>2>>>0]=X/m,T(te,de+4,X+m),q!==null&&q.push(rt,de),de},argPackAdvance:8,readValueFromPointer:lr,bb(q){rt(q)}})},L:function(s,m){m=ft(m>>>0),ht(s>>>0,{ob:!0,name:m,argPackAdvance:0,fromWireType:()=>{},toWireType:()=>{}})},ha:()=>1,u:function(s,m,g){return m>>>=0,g>>>=0,s=Xe(s>>>0),m=cr(m,"emval::as"),Pr(m,g,s)},w:function(s){return s>>>=0,Rr(()=>(s=Xe(s),s.then(ut)))},n:function(s,m,g,$){return g>>>=0,$>>>=0,s=Xt[s>>>0],m=Xe(m>>>0),s(null,m,g,$)},j:function(s,m,g,$,T){return g>>>=0,$>>>=0,T>>>=0,s=Xt[s>>>0],m=Xe(m>>>0),g=nt(g),s(m,m[g],$,T)},b:dr,A:function(s,m){return m>>>=0,s=Xe(s>>>0),m=Xe(m),s==m},m:function(s){return s>>>=0,s===0?ut(mr()):(s=nt(s),ut(mr()[s]))},i:function(s,m,g){m=Kn(s,m>>>0);var $=m.shift();s--;var T=`return function (obj, func, destructorsRef, args) {\n`,B=0,H=[];g===0&&H.push("obj");for(var q=["retType"],te=[$],X=0;Xde.name).join(", ")}) => ${$.name}>`,Br(wt(g,s))},r:function(s,m){return m>>>=0,s=Xe(s>>>0),m=Xe(m),ut(s[m])},e:function(s){s>>>=0,9>>0);for(var m=Array(s.length),g=0;g>>0))},k:function(){return ut({})},h:function(s){s>>>=0;for(var m=Xe(s);m.length;){var g=m.pop();m.pop()(g)}dr(s)},g:function(s,m,g){m>>>=0,g>>>=0,s=Xe(s>>>0),m=Xe(m),g=Xe(g),s[m]=g},c:function(s,m){return m>>>=0,s=cr(s>>>0,"_emval_take_value"),s=s.readValueFromPointer(m),ut(s)},W:function(s,m){s=-9007199254740992>s||9007199254740992>>=0,s=new Date(1e3*s),W[m>>>2>>>0]=s.getUTCSeconds(),W[m+4>>>2>>>0]=s.getUTCMinutes(),W[m+8>>>2>>>0]=s.getUTCHours(),W[m+12>>>2>>>0]=s.getUTCDate(),W[m+16>>>2>>>0]=s.getUTCMonth(),W[m+20>>>2>>>0]=s.getUTCFullYear()-1900,W[m+24>>>2>>>0]=s.getUTCDay(),W[m+28>>>2>>>0]=(s.getTime()-Date.UTC(s.getUTCFullYear(),0,1,0,0,0,0))/864e5|0},X:function(s,m){s=-9007199254740992>s||9007199254740992>>=0,s=new Date(1e3*s),W[m>>>2>>>0]=s.getSeconds(),W[m+4>>>2>>>0]=s.getMinutes(),W[m+8>>>2>>>0]=s.getHours(),W[m+12>>>2>>>0]=s.getDate(),W[m+16>>>2>>>0]=s.getMonth(),W[m+20>>>2>>>0]=s.getFullYear()-1900,W[m+24>>>2>>>0]=s.getDay(),W[m+28>>>2>>>0]=(Je(s.getFullYear())?Dr:fr)[s.getMonth()]+s.getDate()-1|0,W[m+36>>>2>>>0]=-(60*s.getTimezoneOffset());var g=new Date(s.getFullYear(),6,1).getTimezoneOffset(),$=new Date(s.getFullYear(),0,1).getTimezoneOffset();W[m+32>>>2>>>0]=(g!=$&&s.getTimezoneOffset()==Math.min($,g))|0},Y:function(s){s>>>=0;var m=new Date(W[s+20>>>2>>>0]+1900,W[s+16>>>2>>>0],W[s+12>>>2>>>0],W[s+8>>>2>>>0],W[s+4>>>2>>>0],W[s>>>2>>>0],0),g=W[s+32>>>2>>>0],$=m.getTimezoneOffset(),T=new Date(m.getFullYear(),6,1).getTimezoneOffset(),B=new Date(m.getFullYear(),0,1).getTimezoneOffset(),H=Math.min(B,T);return 0>g?W[s+32>>>2>>>0]=+(T!=B&&H==$):0>>2>>>0]=m.getDay(),W[s+28>>>2>>>0]=(Je(m.getFullYear())?Dr:fr)[m.getMonth()]+m.getDate()-1|0,W[s>>>2>>>0]=m.getSeconds(),W[s+4>>>2>>>0]=m.getMinutes(),W[s+8>>>2>>>0]=m.getHours(),W[s+12>>>2>>>0]=m.getDate(),W[s+16>>>2>>>0]=m.getMonth(),W[s+20>>>2>>>0]=m.getYear(),s=m.getTime(),BigInt(isNaN(s)?-1:s/1e3)},U:function(){return-52},V:function(){},N:function(s,m,g,$){g>>>=0,$>>>=0;var T=new Date().getFullYear(),B=new Date(T,0,1),H=new Date(T,6,1);T=B.getTimezoneOffset();var q=H.getTimezoneOffset();se[s>>>0>>>2>>>0]=60*Math.max(T,q),W[m>>>0>>>2>>>0]=+(T!=q),s=te=>te.toLocaleTimeString(void 0,{hour12:!1,timeZoneName:"short"}).split(" ")[1],B=s(B),H=s(H),q{ne("")},d:function(s,m,g){return s>>>=0,m=hr(m>>>0,g>>>0),Rt[s](...m)},I:function(s,m,g){return s>>>=0,m=hr(m>>>0,g>>>0),Rt[s](...m)},H:()=>Date.now(),O:function(){return 4294901760},q:()=>performance.now(),M:function(s){s>>>=0;var m=K.length;if(4294901760=g;g*=2){var $=m*(1+.2/g);$=Math.min($,s+100663296);var T=Math;$=Math.max(s,$);e:{T=(T.min.call(T,4294901760,$+(65536-$%65536)%65536)-O.buffer.byteLength+65535)/65536;try{O.grow(T),Ae();var B=1;break e}catch{}B=void 0}if(B)return!0}return!1},$:function(s,m){s>>>=0,m>>>=0;var g=0;return ot().forEach(($,T)=>{var B=m+g;for(T=se[s+4*T>>>2>>>0]=B,B=0;B<$.length;++B)N[T++>>>0]=$.charCodeAt(B);N[T>>>0]=0,g+=$.length+1}),0},aa:function(s,m){s>>>=0,m>>>=0;var g=ot();se[s>>>2>>>0]=g.length;var $=0;return g.forEach(T=>$+=T.length+1),se[m>>>2>>>0]=$,0},z:()=>52,F:function(){return 52},_:function(){return 70},E:function(s,m,g,$){m>>>=0,g>>>=0,$>>>=0;for(var T=0,B=0;B>>2>>>0],q=se[m+4>>>2>>>0];m+=8;for(var te=0;te>>0],de=Zn[s];X===0||X===10?((s===1?E:P)(Kt(de,0)),de.length=0):de.push(X)}T+=q}return se[$>>>2>>>0]=T,0},fa:sn,p:function(s,m,g,$){return sn(s>>>0,m>>>0,g>>>0,$>>>0)}},pe=function(){function s(g){return pe=g.exports,pe=Qr(),pe=ln(),O=pe.ja,Ae(),ie.unshift(pe.ka),le--,le==0&&(qe!==null&&(clearInterval(qe),qe=null),G&&(g=G,G=null,g())),pe}var m={a:Qn};if(le++,r.instantiateWasm)try{return r.instantiateWasm(m,s)}catch(g){P(`Module.instantiateWasm callback failed with error: ${g}`),i(g)}return mt(m,function(g){s(g.instance)}).catch(i),{}}(),Mr=s=>(Mr=pe.la)(s);r._OrtInit=(s,m)=>(r._OrtInit=pe.ma)(s,m),r._OrtGetLastError=(s,m)=>(r._OrtGetLastError=pe.na)(s,m),r._OrtCreateSessionOptions=(s,m,g,$,T,B,H,q,te,X)=>(r._OrtCreateSessionOptions=pe.oa)(s,m,g,$,T,B,H,q,te,X),r._OrtAppendExecutionProvider=(s,m)=>(r._OrtAppendExecutionProvider=pe.pa)(s,m),r._OrtAddFreeDimensionOverride=(s,m,g)=>(r._OrtAddFreeDimensionOverride=pe.qa)(s,m,g),r._OrtAddSessionConfigEntry=(s,m,g)=>(r._OrtAddSessionConfigEntry=pe.ra)(s,m,g),r._OrtReleaseSessionOptions=s=>(r._OrtReleaseSessionOptions=pe.sa)(s),r._OrtCreateSession=(s,m,g)=>(r._OrtCreateSession=pe.ta)(s,m,g),r._OrtReleaseSession=s=>(r._OrtReleaseSession=pe.ua)(s),r._OrtGetInputOutputCount=(s,m,g)=>(r._OrtGetInputOutputCount=pe.va)(s,m,g),r._OrtGetInputName=(s,m)=>(r._OrtGetInputName=pe.wa)(s,m),r._OrtGetOutputName=(s,m)=>(r._OrtGetOutputName=pe.xa)(s,m),r._OrtFree=s=>(r._OrtFree=pe.ya)(s),r._OrtCreateTensor=(s,m,g,$,T,B)=>(r._OrtCreateTensor=pe.za)(s,m,g,$,T,B),r._OrtGetTensorData=(s,m,g,$,T)=>(r._OrtGetTensorData=pe.Aa)(s,m,g,$,T),r._OrtReleaseTensor=s=>(r._OrtReleaseTensor=pe.Ba)(s),r._OrtCreateRunOptions=(s,m,g,$)=>(r._OrtCreateRunOptions=pe.Ca)(s,m,g,$),r._OrtAddRunConfigEntry=(s,m,g)=>(r._OrtAddRunConfigEntry=pe.Da)(s,m,g),r._OrtReleaseRunOptions=s=>(r._OrtReleaseRunOptions=pe.Ea)(s),r._OrtCreateBinding=s=>(r._OrtCreateBinding=pe.Fa)(s),r._OrtBindInput=(s,m,g)=>(r._OrtBindInput=pe.Ga)(s,m,g),r._OrtBindOutput=(s,m,g,$)=>(r._OrtBindOutput=pe.Ha)(s,m,g,$),r._OrtClearBoundOutputs=s=>(r._OrtClearBoundOutputs=pe.Ia)(s),r._OrtReleaseBinding=s=>(r._OrtReleaseBinding=pe.Ja)(s),r._OrtRunWithBinding=(s,m,g,$,T)=>(r._OrtRunWithBinding=pe.Ka)(s,m,g,$,T),r._OrtRun=(s,m,g,$,T,B,H,q)=>(r._OrtRun=pe.La)(s,m,g,$,T,B,H,q),r._OrtEndProfiling=s=>(r._OrtEndProfiling=pe.Ma)(s),r._JsepOutput=(s,m,g)=>(r._JsepOutput=pe.Na)(s,m,g),r._JsepGetNodeName=s=>(r._JsepGetNodeName=pe.Oa)(s);var Nt=r._malloc=s=>(Nt=r._malloc=pe.Pa)(s),rt=r._free=s=>(rt=r._free=pe.Qa)(s),yr=s=>(yr=pe.Sa)(s),br=s=>(br=pe.Ta)(s),Ur=()=>(Ur=pe.Ua)(),Jt=s=>(Jt=pe.Wa)(s),dn=()=>(dn=pe.Xa)(),vt=s=>(vt=pe.Ya)(s),ct=()=>(ct=pe.Za)();r.___start_em_js=837952,r.___stop_em_js=838113;function ln(){var s=pe;s=Object.assign({},s);var m=g=>$=>g($)>>>0;return s.la=m(s.la),s.Pa=m(s.Pa),s.Ta=m(s.Ta),s.Ua=(g=>()=>g()>>>0)(s.Ua),s}r.stackSave=()=>Ur(),r.stackRestore=s=>yr(s),r.stackAlloc=s=>br(s),r.UTF8ToString=je,r.stringToUTF8=(s,m,g)=>at(s,K,m,g),r.lengthBytesUTF8=Wt;var Dt;G=function s(){Dt||Vr(),Dt||(G=s)};function Vr(){if(!(0Ii)});var Pi=Wr(()=>{});var ki=Wr(()=>{});var Oi={};gn(Oi,{cpus:()=>ll});var ll,Ri=Y(()=>{ll=void 0});var zi=Wr((Di,mo)=>{"use strict";var Bi=(()=>{var e=typeof document<"u"?document.currentScript?.src:void 0;return typeof __filename<"u"&&(e||=__filename),function(t={}){function r(){return ae.buffer!=ue.buffer&&Ne(),ue}function o(){return ae.buffer!=ue.buffer&&Ne(),le}function i(){return ae.buffer!=ue.buffer&&Ne(),qe}function u(){return ae.buffer!=ue.buffer&&Ne(),G}function a(){return ae.buffer!=ue.buffer&&Ne(),ne}function c(){return ae.buffer!=ue.buffer&&Ne(),xe}function p(){return ae.buffer!=ue.buffer&&Ne(),Ke}function h(){return ae.buffer!=ue.buffer&&Ne(),Ut}var d=t,y,w,_=new Promise((n,l)=>{y=n,w=l});d.mountExternalData=(n,l)=>{(d.Db||(d.Db=new Map)).set(n,l)},d.unmountExternalData=()=>{delete d.Db};let v=()=>{let n=(f,b,C)=>(...k)=>{let V=ct,F=b?.();k=f(...k);let re=b?.();return F!==re&&(f=re,C(F),b=C=null),ct!=V?T():k},l=f=>async(...b)=>{try{if(d.Cb)throw Error("Session already started");let C=d.Cb={ec:b[0],errors:[]},k=await f(...b);if(d.Cb!==C)throw Error("Session mismatch");d.Kb?.flush();let V=C.errors;if(0re),0d._OrtCreateSession,f=>d._OrtCreateSession=f),d._OrtRun=l(n(d._OrtRun,()=>d._OrtRun,f=>d._OrtRun=f)),d._OrtRunWithBinding=l(n(d._OrtRunWithBinding,()=>d._OrtRunWithBinding,f=>d._OrtRunWithBinding=f)),d._OrtBindInput=n(d._OrtBindInput,()=>d._OrtBindInput,f=>d._OrtBindInput=f),v=void 0};d.jsepInit=(n,l)=>{if(v?.(),n==="webgpu"){[d.Kb,d.Wb,d.$b,d.Lb,d.Zb,d.ob,d.ac,d.cc,d.Xb,d.Yb,d.bc]=l;let f=d.Kb;d.jsepRegisterBuffer=(b,C,k,V)=>f.registerBuffer(b,C,k,V),d.jsepGetBuffer=b=>f.getBuffer(b),d.jsepCreateDownloader=(b,C,k)=>f.createDownloader(b,C,k),d.jsepOnReleaseSession=b=>{f.onReleaseSession(b)},d.jsepOnRunStart=b=>f.onRunStart(b)}};var S=Object.assign({},d),A="./this.program",I=(n,l)=>{throw l},x=typeof window=="object",E=typeof importScripts=="function",P=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string",O=d.ENVIRONMENT_IS_PTHREAD||!1,R="";function L(n){return d.locateFile?d.locateFile(n,R):R+n}var N,K,Q;if(P){var he=(uo(),wr(so)),W=(co(),wr(lo));R=E?W.dirname(R)+"/":__dirname+"/",N=(n,l)=>(n=Wt(n)?new URL(n):W.normalize(n),he.readFileSync(n,l?void 0:"utf8")),Q=n=>(n=N(n,!0),n.buffer||(n=new Uint8Array(n)),n),K=(n,l,f,b=!0)=>{n=Wt(n)?new URL(n):W.normalize(n),he.readFile(n,b?void 0:"utf8",(C,k)=>{C?f(C):l(b?k.buffer:k)})},!d.thisProgram&&1{throw process.exitCode=n,l},global.Worker=Pi().Worker}else(x||E)&&(E?R=self.location.href:typeof document<"u"&&document.currentScript&&(R=document.currentScript.src),typeof e<"u"&&e&&(R=e),R.startsWith("blob:")?R="":R=R.substr(0,R.replace(/[?#].*/,"").lastIndexOf("/")+1),P||(N=n=>{var l=new XMLHttpRequest;return l.open("GET",n,!1),l.send(null),l.responseText},E&&(Q=n=>{var l=new XMLHttpRequest;return l.open("GET",n,!1),l.responseType="arraybuffer",l.send(null),new Uint8Array(l.response)}),K=(n,l,f)=>{var b=new XMLHttpRequest;b.open("GET",n,!0),b.responseType="arraybuffer",b.onload=()=>{b.status==200||b.status==0&&b.response?l(b.response):f()},b.onerror=f,b.send(null)}));P&&typeof performance>"u"&&(global.performance=ki().performance);var se=console.log.bind(console),Ce=console.error.bind(console);P&&(se=(...n)=>he.writeSync(1,n.join(" ")+`\n`),Ce=(...n)=>he.writeSync(2,n.join(" ")+`\n`));var We=se,ee=Ce;Object.assign(d,S),S=null;var ae,Ae,me=!1,ie,ue,le,qe,G,ne,xe,Ke,Be,Ge,Ut;function Ne(){var n=ae.buffer;d.HEAP8=ue=new Int8Array(n),d.HEAP16=qe=new Int16Array(n),d.HEAPU8=le=new Uint8Array(n),d.HEAPU16=G=new Uint16Array(n),d.HEAP32=ne=new Int32Array(n),d.HEAPU32=xe=new Uint32Array(n),d.HEAPF32=Ke=new Float32Array(n),d.HEAPF64=Ut=new Float64Array(n),d.HEAP64=Be=new BigInt64Array(n),d.HEAPU64=Ge=new BigUint64Array(n)}var Ye=16777216;if(O)ae=d.wasmMemory;else if(d.wasmMemory)ae=d.wasmMemory;else if(ae=new WebAssembly.Memory({initial:Ye/65536,maximum:65536,shared:!0}),!(ae.buffer instanceof SharedArrayBuffer))throw ee("requested a shared WebAssembly.Memory but the returned buffer is not a SharedArrayBuffer, indicating that while the browser has SharedArrayBuffer it does not have WebAssembly threads support - you may need to set a flag"),P&&ee("(on node you may need: --experimental-wasm-threads --experimental-wasm-bulk-memory and/or recent version)"),Error("bad memory");Ne(),Ye=ae.buffer.byteLength;var mt=[],Rt=[],qt=[],Vt=0,sr=null,jt=null;function xr(){if(Vt--,Vt==0&&(sr!==null&&(clearInterval(sr),sr=null),jt)){var n=jt;jt=null,n()}}function Kt(n){throw n="Aborted("+n+")",ee(n),me=!0,ie=1,n=new WebAssembly.RuntimeError(n+". Build with -sASSERTIONS for more info."),w(n),n}var je=n=>n.startsWith("data:application/octet-stream;base64,"),Wt=n=>n.startsWith("file://"),at;at="ort-wasm-simd-threaded.wasm",je(at)||(at=L(at));function Cr(n){if(Q)return Q(n);throw"both async and sync fetching of the wasm failed"}function ft(n){if(x||E){if(typeof fetch=="function"&&!Wt(n))return fetch(n,{credentials:"same-origin"}).then(l=>{if(!l.ok)throw`failed to load wasm binary file at \'${n}\'`;return l.arrayBuffer()}).catch(()=>Cr(n));if(K)return new Promise((l,f)=>{K(n,b=>l(new Uint8Array(b)),f)})}return Promise.resolve().then(()=>Cr(n))}function ur(n,l,f){return ft(n).then(b=>WebAssembly.instantiate(b,l)).then(f,b=>{ee(`failed to asynchronously prepare wasm: ${b}`),Kt(b)})}function Ar(n,l){var f=at;return typeof WebAssembly.instantiateStreaming!="function"||je(f)||Wt(f)||P||typeof fetch!="function"?ur(f,n,l):fetch(f,{credentials:"same-origin"}).then(b=>WebAssembly.instantiateStreaming(b,n).then(l,function(C){return ee(`wasm streaming compile failed: ${C}`),ee("falling back to ArrayBuffer instantiation"),ur(f,n,l)}))}var Ir={826468:(n,l,f,b)=>{if(typeof d>"u"||!d.Db)return 1;if(n=He(n>>>0),n.startsWith("./")&&(n=n.substring(2)),n=d.Db.get(n),!n)return 2;if(l>>>=0,f>>>=0,b>>>=0,l+f>n.byteLength)return 3;try{return o().set(n.subarray(l,l+f),b>>>0),0}catch{return 4}},826969:()=>{d.Xb()},827e3:()=>{d.Yb()},827029:()=>{d.bc()},827054:n=>d.Wb(n),827087:n=>d.$b(n),827119:(n,l,f)=>{d.Lb(n,l,f,!0)},827158:(n,l,f)=>{d.Lb(n,l,f)},827191:n=>{d.ob("Abs",n,void 0)},827242:n=>{d.ob("Neg",n,void 0)},827293:n=>{d.ob("Floor",n,void 0)},827346:n=>{d.ob("Ceil",n,void 0)},827398:n=>{d.ob("Reciprocal",n,void 0)},827456:n=>{d.ob("Sqrt",n,void 0)},827508:n=>{d.ob("Exp",n,void 0)},827559:n=>{d.ob("Erf",n,void 0)},827610:n=>{d.ob("Sigmoid",n,void 0)},827665:(n,l,f)=>{d.ob("HardSigmoid",n,{alpha:l,beta:f})},827744:n=>{d.ob("Log",n,void 0)},827795:n=>{d.ob("Sin",n,void 0)},827846:n=>{d.ob("Cos",n,void 0)},827897:n=>{d.ob("Tan",n,void 0)},827948:n=>{d.ob("Asin",n,void 0)},828e3:n=>{d.ob("Acos",n,void 0)},828052:n=>{d.ob("Atan",n,void 0)},828104:n=>{d.ob("Sinh",n,void 0)},828156:n=>{d.ob("Cosh",n,void 0)},828208:n=>{d.ob("Asinh",n,void 0)},828261:n=>{d.ob("Acosh",n,void 0)},828314:n=>{d.ob("Atanh",n,void 0)},828367:n=>{d.ob("Tanh",n,void 0)},828419:n=>{d.ob("Not",n,void 0)},828470:(n,l,f)=>{d.ob("Clip",n,{min:l,max:f})},828539:n=>{d.ob("Clip",n,void 0)},828591:(n,l)=>{d.ob("Elu",n,{alpha:l})},828649:n=>{d.ob("Relu",n,void 0)},828701:(n,l)=>{d.ob("LeakyRelu",n,{alpha:l})},828765:(n,l)=>{d.ob("ThresholdedRelu",n,{alpha:l})},828835:(n,l)=>{d.ob("Cast",n,{to:l})},828893:n=>{d.ob("Add",n,void 0)},828944:n=>{d.ob("Sub",n,void 0)},828995:n=>{d.ob("Mul",n,void 0)},829046:n=>{d.ob("Div",n,void 0)},829097:n=>{d.ob("Pow",n,void 0)},829148:n=>{d.ob("Equal",n,void 0)},829201:n=>{d.ob("Greater",n,void 0)},829256:n=>{d.ob("GreaterOrEqual",n,void 0)},829318:n=>{d.ob("Less",n,void 0)},829370:n=>{d.ob("LessOrEqual",n,void 0)},829429:(n,l,f,b,C)=>{d.ob("ReduceMean",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},829588:(n,l,f,b,C)=>{d.ob("ReduceMax",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},829746:(n,l,f,b,C)=>{d.ob("ReduceMin",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},829904:(n,l,f,b,C)=>{d.ob("ReduceProd",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830063:(n,l,f,b,C)=>{d.ob("ReduceSum",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830221:(n,l,f,b,C)=>{d.ob("ReduceL1",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830378:(n,l,f,b,C)=>{d.ob("ReduceL2",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830535:(n,l,f,b,C)=>{d.ob("ReduceLogSum",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830696:(n,l,f,b,C)=>{d.ob("ReduceSumSquare",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},830860:(n,l,f,b,C)=>{d.ob("ReduceLogSumExp",n,{keepDims:!!l,noopWithEmptyAxes:!!f,axes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},831024:n=>{d.ob("Where",n,void 0)},831077:(n,l,f)=>{d.ob("Transpose",n,{perm:l?Array.from(a().subarray(l>>>0,f>>>0)):[]})},831185:(n,l,f,b)=>{d.ob("DepthToSpace",n,{blocksize:l,mode:He(f),format:b?"NHWC":"NCHW"})},831318:(n,l,f,b)=>{d.ob("DepthToSpace",n,{blocksize:l,mode:He(f),format:b?"NHWC":"NCHW"})},831451:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we)=>{d.ob("ConvTranspose",n,{format:re?"NHWC":"NCHW",autoPad:l,dilations:[f],group:b,kernelShape:[C],pads:[k,V],strides:[F],wIsConst:()=>!!r()[J>>>0],outputPadding:ce?Array.from(a().subarray(ce>>>0,Re>>>0)):[],outputShape:ze?Array.from(a().subarray(ze>>>0,z>>>0)):[],activation:He(we)})},831852:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z)=>{d.ob("ConvTranspose",n,{format:F?"NHWC":"NCHW",autoPad:l,dilations:Array.from(a().subarray(f>>>0,(f>>>0)+2>>>0)),group:b,kernelShape:Array.from(a().subarray(C>>>0,(C>>>0)+2>>>0)),pads:Array.from(a().subarray(k>>>0,(k>>>0)+4>>>0)),strides:Array.from(a().subarray(V>>>0,(V>>>0)+2>>>0)),wIsConst:()=>!!r()[re>>>0],outputPadding:J?Array.from(a().subarray(J>>>0,ce>>>0)):[],outputShape:Re?Array.from(a().subarray(Re>>>0,ze>>>0)):[],activation:He(z)})},832417:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we)=>{d.ob("ConvTranspose",n,{format:re?"NHWC":"NCHW",autoPad:l,dilations:[f],group:b,kernelShape:[C],pads:[k,V],strides:[F],wIsConst:()=>!!r()[J>>>0],outputPadding:ce?Array.from(a().subarray(ce>>>0,Re>>>0)):[],outputShape:ze?Array.from(a().subarray(ze>>>0,z>>>0)):[],activation:He(we)})},832818:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z)=>{d.ob("ConvTranspose",n,{format:F?"NHWC":"NCHW",autoPad:l,dilations:Array.from(a().subarray(f>>>0,(f>>>0)+2>>>0)),group:b,kernelShape:Array.from(a().subarray(C>>>0,(C>>>0)+2>>>0)),pads:Array.from(a().subarray(k>>>0,(k>>>0)+4>>>0)),strides:Array.from(a().subarray(V>>>0,(V>>>0)+2>>>0)),wIsConst:()=>!!r()[re>>>0],outputPadding:J?Array.from(a().subarray(J>>>0,ce>>>0)):[],outputShape:Re?Array.from(a().subarray(Re>>>0,ze>>>0)):[],activation:He(z)})},833383:(n,l)=>{d.ob("GlobalAveragePool",n,{format:l?"NHWC":"NCHW"})},833474:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we,Pe)=>{d.ob("AveragePool",n,{format:Pe?"NHWC":"NCHW",auto_pad:l,ceil_mode:f,count_include_pad:b,storage_order:C,dilations:[k,V],kernel_shape:[F,re],pads:[J,ce,Re,ze],strides:[z,we]})},833758:(n,l)=>{d.ob("GlobalAveragePool",n,{format:l?"NHWC":"NCHW"})},833849:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we,Pe)=>{d.ob("AveragePool",n,{format:Pe?"NHWC":"NCHW",auto_pad:l,ceil_mode:f,count_include_pad:b,storage_order:C,dilations:[k,V],kernel_shape:[F,re],pads:[J,ce,Re,ze],strides:[z,we]})},834133:(n,l)=>{d.ob("GlobalMaxPool",n,{format:l?"NHWC":"NCHW"})},834220:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we,Pe)=>{d.ob("MaxPool",n,{format:Pe?"NHWC":"NCHW",auto_pad:l,ceil_mode:f,count_include_pad:b,storage_order:C,dilations:[k,V],kernel_shape:[F,re],pads:[J,ce,Re,ze],strides:[z,we]})},834500:(n,l)=>{d.ob("GlobalMaxPool",n,{format:l?"NHWC":"NCHW"})},834587:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we,Pe)=>{d.ob("MaxPool",n,{format:Pe?"NHWC":"NCHW",auto_pad:l,ceil_mode:f,count_include_pad:b,storage_order:C,dilations:[k,V],kernel_shape:[F,re],pads:[J,ce,Re,ze],strides:[z,we]})},834867:(n,l,f,b,C)=>{d.ob("Gemm",n,{alpha:l,beta:f,transA:b,transB:C})},834971:n=>{d.ob("MatMul",n,void 0)},835025:(n,l,f,b)=>{d.ob("ArgMax",n,{keepDims:!!l,selectLastIndex:!!f,axis:b})},835133:(n,l,f,b)=>{d.ob("ArgMin",n,{keepDims:!!l,selectLastIndex:!!f,axis:b})},835241:(n,l)=>{d.ob("Softmax",n,{axis:l})},835304:(n,l)=>{d.ob("Concat",n,{axis:l})},835364:(n,l,f,b,C)=>{d.ob("Split",n,{axis:l,numOutputs:f,splitSizes:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},835504:n=>{d.ob("Expand",n,void 0)},835558:(n,l)=>{d.ob("Gather",n,{axis:Number(l)})},835629:(n,l)=>{d.ob("GatherElements",n,{axis:Number(l)})},835708:(n,l,f,b,C,k,V,F,re,J,ce)=>{d.ob("Resize",n,{antialias:l,axes:f?Array.from(a().subarray(f>>>0,b>>>0)):[],coordinateTransformMode:He(C),cubicCoeffA:k,excludeOutside:V,extrapolationValue:F,keepAspectRatioPolicy:He(re),mode:He(J),nearestMode:He(ce)})},836054:(n,l,f,b,C,k,V)=>{d.ob("Slice",n,{starts:l?Array.from(a().subarray(l>>>0,f>>>0)):[],ends:b?Array.from(a().subarray(b>>>0,C>>>0)):[],axes:k?Array.from(a().subarray(k>>>0,V>>>0)):[]})},836270:n=>{d.ob("Tile",n,void 0)},836322:(n,l,f,b)=>{d.ob("LayerNormalization",n,{axis:l,epsilon:f,simplified:!!b})},836433:(n,l,f)=>{d.ob("InstanceNormalization",n,{epsilon:l,format:f?"NHWC":"NCHW"})},836547:(n,l,f)=>{d.ob("InstanceNormalization",n,{epsilon:l,format:f?"NHWC":"NCHW"})},836661:n=>{d.ob("Range",n,void 0)},836714:(n,l)=>{d.ob("Einsum",n,{equation:He(l)})},836795:(n,l,f,b,C)=>{d.ob("Pad",n,{mode:l,value:f,pads:b?Array.from(a().subarray(b>>>0,C>>>0)):[]})},836922:(n,l,f,b,C,k)=>{d.ob("BatchNormalization",n,{epsilon:l,momentum:f,spatial:!!C,trainingMode:!!b,format:k?"NHWC":"NCHW"})},837091:(n,l,f,b,C,k)=>{d.ob("BatchNormalization",n,{epsilon:l,momentum:f,spatial:!!C,trainingMode:!!b,format:k?"NHWC":"NCHW"})},837260:(n,l,f)=>{d.ob("CumSum",n,{exclusive:Number(l),reverse:Number(f)})},837357:(n,l,f,b,C,k,V,F,re)=>{d.ob("Attention",n,{numHeads:l,isUnidirectional:f,maskFilterValue:b,scale:C,doRotary:k,qkvHiddenSizes:V?Array.from(a().subarray(Number(F)>>>0,Number(F)+V>>>0)):[],pastPresentShareBuffer:!!re})},837629:n=>{d.ob("BiasAdd",n,void 0)},837684:n=>{d.ob("BiasSplitGelu",n,void 0)},837745:n=>{d.ob("FastGelu",n,void 0)},837801:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze)=>{d.ob("Conv",n,{format:re?"NHWC":"NCHW",auto_pad:l,dilations:[f],group:b,kernel_shape:[C],pads:k?Array.from(a().subarray(k>>>0,V>>>0)):[],strides:[F],w_is_const:()=>!!r()[J>>>0],activation:He(ce),activation_params:Re?Array.from(p().subarray(Re>>>0,ze>>>0)):[]})},838171:(n,l,f,b,C,k,V,F,re,J,ce,Re,ze,z,we,Pe)=>{d.ob("Conv",n,{format:Re?"NHWC":"NCHW",auto_pad:l,dilations:[f,b],group:C,kernel_shape:[k,V],pads:F?Array.from(a().subarray(F>>>0,re>>>0)):[],strides:[J,ce],w_is_const:()=>!!r()[ze>>>0],activation:He(z),activation_params:we?Array.from(p().subarray(we>>>0,Pe>>>0)):[]})},838562:n=>{d.ob("Gelu",n,void 0)},838614:(n,l,f,b,C,k)=>{d.ob("MatMulNBits",n,{k:l,n:f,accuracyLevel:b,bits:C,blockSize:k})},838741:(n,l,f,b,C,k)=>{d.ob("MultiHeadAttention",n,{numHeads:l,isUnidirectional:f,maskFilterValue:b,scale:C,doRotary:k})},838900:(n,l,f,b,C)=>{d.ob("RotaryEmbedding",n,{interleaved:!!l,numHeads:f,rotaryEmbeddingDim:b,scale:C})},839039:(n,l,f)=>{d.ob("SkipLayerNormalization",n,{epsilon:l,simplified:!!f})},839141:(n,l,f)=>{d.ob("SkipLayerNormalization",n,{epsilon:l,simplified:!!f})},839243:(n,l,f,b)=>{d.ob("LayerNormalization",n,{axis:l,epsilon:f,simplified:!!b})},839354:n=>{d.ac(n)},839388:(n,l)=>d.cc(n,l,d.Cb.ec,d.Cb.errors)};function st(n){this.name="ExitStatus",this.message=`Program terminated with exit(${n})`,this.status=n}var Tr=n=>{n.terminate(),n.onmessage=()=>{}},ht=n=>{ge.xb.length==0&&(lr(),ge.Mb(ge.xb[0]));var l=ge.xb.pop();if(!l)return 6;ge.yb.push(l),ge.ub[n.wb]=l,l.wb=n.wb;var f={cmd:"run",start_routine:n.fc,arg:n.Rb,pthread_ptr:n.wb};return P&&l.unref(),l.postMessage(f,n.mc),0},bt=0,Er=n=>{var l=io();return n=n(),fn(l),n},Te=(n,l,...f)=>Er(()=>{for(var b=2*f.length,C=oo(8*b),k=C>>>3,V=0;V>>0]=F)}return gi(n,0,b,C,l)});function dr(n){if(O)return Te(0,1,n);ie=n,0{if(ie=n,O)throw jr(n),"unwind";dr(n)};function ut(){for(var n=d.numThreads;n--;)lr();mt.unshift(()=>{Vt++,Fn(()=>xr())})}function lr(){var n=L("ort-wasm-simd-threaded.worker.js");n=new Worker(n),ge.xb.push(n)}function Fn(n){O?n():Promise.all(ge.xb.map(ge.Mb)).then(n)}var ge={xb:[],yb:[],Qb:[],ub:{},Gb(){O?(ge.receiveObjectTransfer=ge.dc,ge.threadInitTLS=ge.Pb,ge.setExitStatus=ge.Ob):ut()},Ob:n=>ie=n,pc:["$terminateWorker"],hc:()=>{for(var n of ge.yb)Tr(n);for(n of ge.xb)Tr(n);ge.xb=[],ge.yb=[],ge.ub=[]},Nb:n=>{var l=n.wb;delete ge.ub[l],ge.xb.push(n),ge.yb.splice(ge.yb.indexOf(n),1),n.wb=0,ro(l)},dc(){},Pb(){ge.Qb.forEach(n=>n())},Mb:n=>new Promise(l=>{n.onmessage=k=>{k=k.data;var V=k.cmd;if(k.targetThread&&k.targetThread!=pn()){var F=ge.ub[k.targetThread];F?F.postMessage(k,k.transferList):ee(`Internal error! Worker sent a message "${V}" to target pthread ${k.targetThread}, but that thread no longer exists!`)}else V==="checkMailbox"?rt():V==="spawnThread"?ht(k):V==="cleanupThread"?ge.Nb(ge.ub[k.thread]):V==="killThread"?(k=k.thread,V=ge.ub[k],delete ge.ub[k],Tr(V),ro(k),ge.yb.splice(ge.yb.indexOf(V),1),V.wb=0):V==="cancelThread"?ge.ub[k.thread].postMessage({cmd:"cancel"}):V==="loaded"?(n.loaded=!0,P&&!n.wb&&n.unref(),l(n)):V==="alert"?alert(`Thread ${k.threadId}: ${k.text}`):k.target==="setimmediate"?n.postMessage(k):V==="callHandler"?d[k.handler](...k.args):V&&ee(`worker sent an unknown command ${V}`)},n.onerror=k=>{throw ee(`worker sent an error! ${k.filename}:${k.lineno}: ${k.message}`),k},P&&(n.on("message",k=>n.onmessage({data:k})),n.on("error",k=>n.onerror(k)));var f=[],b=["onExit"],C;for(C of b)d.hasOwnProperty(C)&&f.push(C);n.postMessage({cmd:"load",handlers:f,urlOrBlob:d.mainScriptUrlOrBlob||e,wasmMemory:ae,wasmModule:Ae})})};d.PThread=ge;var Yt=n=>{for(;0{var n=pn(),l=c()[n+52>>>2>>>0];n=c()[n+56>>>2>>>0],bi(l,l-n),fn(l)};function jr(n){if(O)return Te(1,0,n);Xe(n)}d.invokeEntryPoint=(n,l)=>{bt=0,n=wi(n,l),0>>2>>>0]=0,c()[this.Ib+4>>>2>>>0]=l,c()[this.Ib+8>>>2>>>0]=f}}var Kr=0,jn=0;function Yr(n,l,f,b){return O?Te(2,1,n,l,f,b):Zr(n,l,f,b)}function Zr(n,l,f,b){if(n>>>=0,l>>>=0,f>>>=0,b>>>=0,typeof SharedArrayBuffer>"u")return ee("Current environment does not support SharedArrayBuffer, pthreads are not available!"),6;var C=[];return O&&C.length===0?Yr(n,l,f,b):(n={fc:f,wb:n,Rb:b,mc:C},O?(n.oc="spawnThread",postMessage(n,C),0):ht(n))}var cr=typeof TextDecoder<"u"?new TextDecoder("utf8"):void 0,Pr=(n,l,f)=>{l>>>=0;var b=l+f;for(f=l;n[f]&&!(f>=b);)++f;if(16C?b+=String.fromCharCode(C):(C-=65536,b+=String.fromCharCode(55296|C>>10,56320|C&1023))}}else b+=String.fromCharCode(C)}return b},He=(n,l)=>(n>>>=0)?Pr(o(),n,l):"";function Xr(n,l,f){return O?Te(3,1,n,l,f):0}function Qr(n,l){if(O)return Te(4,1,n,l)}var gt=n=>{for(var l=0,f=0;f=b?l++:2047>=b?l+=2:55296<=b&&57343>=b?(l+=4,++f):l+=3}return l},dt=(n,l,f,b)=>{if(f>>>=0,!(0=V){var F=n.charCodeAt(++k);V=65536+((V&1023)<<10)|F&1023}if(127>=V){if(f>=b)break;l[f++>>>0]=V}else{if(2047>=V){if(f+1>=b)break;l[f++>>>0]=192|V>>6}else{if(65535>=V){if(f+2>=b)break;l[f++>>>0]=224|V>>12}else{if(f+3>=b)break;l[f++>>>0]=240|V>>18,l[f++>>>0]=128|V>>12&63}l[f++>>>0]=128|V>>6&63}l[f++>>>0]=128|V&63}}return l[f>>>0]=0,f-C},Bt=(n,l,f)=>dt(n,o(),l,f);function Zt(n,l){if(O)return Te(5,1,n,l)}function kr(n,l,f){if(O)return Te(6,1,n,l,f)}function Or(n,l,f){return O?Te(7,1,n,l,f):0}function Jr(n,l){if(O)return Te(8,1,n,l)}function pr(n,l,f){if(O)return Te(9,1,n,l,f)}function en(n,l,f,b){if(O)return Te(10,1,n,l,f,b)}function tn(n,l,f,b){if(O)return Te(11,1,n,l,f,b)}function rn(n,l,f,b){if(O)return Te(12,1,n,l,f,b)}function nn(n){if(O)return Te(13,1,n)}function Rr(n,l){if(O)return Te(14,1,n,l)}function Xt(n,l,f){if(O)return Te(15,1,n,l,f)}var on,nt=n=>{for(var l="";o()[n>>>0];)l+=on[o()[n++>>>0]];return l},mr={},Br={},Kn={},wt;function Yn(n,l,f={}){var b=l.name;if(!n)throw new wt(`type "${b}" must have a positive integer typeid pointer`);if(Br.hasOwnProperty(n)){if(f.Ub)return;throw new wt(`Cannot register type \'${b}\' twice`)}Br[n]=l,delete Kn[n],mr.hasOwnProperty(n)&&(l=mr[n],delete mr[n],l.forEach(C=>C()))}function Je(n,l,f={}){if(!("argPackAdvance"in l))throw new TypeError("registerType registeredInstance requires argPackAdvance");return Yn(n,l,f)}var Dr=(n,l,f)=>{switch(l){case 1:return f?b=>r()[b>>>0]:b=>o()[b>>>0];case 2:return f?b=>i()[b>>>1>>>0]:b=>u()[b>>>1>>>0];case 4:return f?b=>a()[b>>>2>>>0]:b=>c()[b>>>2>>>0];case 8:return f?b=>Be[b>>>3]:b=>Ge[b>>>3];default:throw new TypeError(`invalid integer width (${l}): ${n}`)}},fr=[],lt=[];function hr(n){n>>>=0,9{if(!n)throw new wt("Cannot use deleted val. handle = "+n);return lt[n]},ot=n=>{switch(n){case void 0:return 2;case null:return 4;case!0:return 6;case!1:return 8;default:let l=fr.pop()||lt.length;return lt[l]=n,lt[l+1]=1,l}};function Qt(n){return this.fromWireType(c()[n>>>2>>>0])}var Zn={name:"emscripten::val",fromWireType:n=>{var l=Qe(n);return hr(n),l},toWireType:(n,l)=>ot(l),argPackAdvance:8,readValueFromPointer:Qt,Bb:null},an=(n,l)=>{switch(l){case 4:return function(f){return this.fromWireType(p()[f>>>2>>>0])};case 8:return function(f){return this.fromWireType(h()[f>>>3>>>0])};default:throw new TypeError(`invalid float width (${l}): ${n}`)}},zr=typeof TextDecoder<"u"?new TextDecoder("utf-16le"):void 0,Xn=(n,l)=>{for(var f=n>>1,b=f+l/2;!(f>=b)&&u()[f>>>0];)++f;if(f<<=1,32=l/2);++b){var C=i()[n+2*b>>>1>>>0];if(C==0)break;f+=String.fromCharCode(C)}return f},sn=(n,l,f)=>{if(f??=2147483647,2>f)return 0;f-=2;var b=l;f=f<2*n.length?f/2:n.length;for(var C=0;C>>1>>>0]=k,l+=2}return i()[l>>>1>>>0]=0,l-b},un=n=>2*n.length,gr=(n,l)=>{for(var f=0,b="";!(f>=l/4);){var C=a()[n+4*f>>>2>>>0];if(C==0)break;++f,65536<=C?(C-=65536,b+=String.fromCharCode(55296|C>>10,56320|C&1023)):b+=String.fromCharCode(C)}return b},Qn=(n,l,f)=>{if(l>>>=0,f??=2147483647,4>f)return 0;var b=l;f=b+f-4;for(var C=0;C=k){var V=n.charCodeAt(++C);k=65536+((k&1023)<<10)|V&1023}if(a()[l>>>2>>>0]=k,l+=4,l+4>f)break}return a()[l>>>2>>>0]=0,l-b},pe=n=>{for(var l=0,f=0;f=b&&++f,l+=4}return l},Mr=n=>{if(!me)try{if(n(),!(0>>=0,typeof Atomics.nc=="function"&&(Atomics.nc(a(),n>>>2,n).value.then(rt),n+=128,Atomics.store(a(),n>>>2,1))}d.__emscripten_thread_mailbox_await=Nt;var rt=()=>{var n=pn();n&&(Nt(n),Mr(yi))};d.checkMailbox=rt;var yr=[],br=(n,l)=>{var f=Br[n];if(f===void 0)throw n=fi(n),f=nt(n),At(n),new wt(`${l} has unknown type ${f}`);return f},Ur=(n,l,f)=>{var b=[];return n=n.toWireType(b,f),b.length&&(c()[l>>>2>>>0]=ot(b)),n},Jt=n=>{try{n()}catch(l){Kt(l)}};function dn(){var n=oe,l={};for(let[f,b]of Object.entries(n))l[f]=typeof b=="function"?(...C)=>{Dt.push(f);try{return b(...C)}finally{me||(Dt.pop(),ct&&vt===1&&Dt.length===0&&(vt=0,bt+=1,Jt($i),typeof Fibers<"u"&&Fibers.rc()))}}:b;return l}var vt=0,ct=null,ln=0,Dt=[],Vr={},s={},m=0,g=null,$=[];function T(){return new Promise((n,l)=>{g={resolve:n,reject:l}})}function B(){var n=mn(65548),l=n+12;c()[n>>>2>>>0]=l,c()[n+4>>>2>>>0]=l+65536,l=Dt[0];var f=Vr[l];return f===void 0&&(f=m++,Vr[l]=f,s[f]=l),l=f,a()[n+8>>>2>>>0]=l,n}function H(){var n=a()[ct+8>>>2>>>0];return n=oe[s[n]],--bt,n()}function q(n){if(!me){if(vt===0){var l=!1,f=!1;n((b=0)=>{if(!me&&(ln=b,l=!0,f)){vt=2,Jt(()=>_i(ct)),typeof Browser<"u"&&Browser.Hb.Tb&&Browser.Hb.resume(),b=!1;try{var C=H()}catch(F){C=F,b=!0}var k=!1;if(!ct){var V=g;V&&(g=null,(b?V.reject:V.resolve)(C),k=!0)}if(b&&!k)throw C}}),f=!0,l||(vt=1,ct=B(),typeof Browser<"u"&&Browser.Hb.Tb&&Browser.Hb.pause(),Jt(()=>vi(ct)))}else vt===2?(vt=0,Jt(Si),At(ct),ct=null,$.forEach(Mr)):Kt(`invalid state: ${vt}`);return ln}}function te(n){return q(l=>{n().then(l)})}var X=[],de={},Ee=n=>{var l=de[n];return l===void 0?nt(n):l},Oe=()=>typeof globalThis=="object"?globalThis:Function("return this")(),D=n=>{var l=X.length;return X.push(n),l},be=(n,l)=>{for(var f=Array(n),b=0;b>>2>>>0],"parameter "+b);return f},Ie=(n,l)=>Object.defineProperty(l,"name",{value:n});function zt(n){var l=Function;if(!(l instanceof Function))throw new TypeError(`new_ called with constructor type ${typeof l} which is not a function`);var f=Ie(l.name||"unknownFunctionName",function(){});return f.prototype=l.prototype,f=new f,n=l.apply(f,n),n instanceof Object?n:f}var Mt=n=>n%4===0&&(n%100!==0||n%400===0),Qo=[0,31,60,91,121,152,182,213,244,274,305,335],Jo=[0,31,59,90,120,151,181,212,243,273,304,334];function ei(n,l,f,b,C,k,V){return O?Te(16,1,n,l,f,b,C,k,V):-52}function ti(n,l,f,b,C,k){if(O)return Te(17,1,n,l,f,b,C,k)}var Jn=[],ri=(n,l)=>{Jn.length=0;for(var f;f=o()[n++>>>0];){var b=f!=105;b&=f!=112,l+=b&&l%8?4:0,Jn.push(f==112?c()[l>>>2>>>0]:f==106?Be[l>>>3]:f==105?a()[l>>>2>>>0]:h()[l>>>3>>>0]),l+=b?8:4}return Jn},eo={},ni=()=>{if(!to){var n={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(typeof navigator=="object"&&navigator.languages&&navigator.languages[0]||"C").replace("-","_")+".UTF-8",_:A||"./this.program"},l;for(l in eo)eo[l]===void 0?delete n[l]:n[l]=eo[l];var f=[];for(l in n)f.push(`${l}=${n[l]}`);to=f}return to},to;function oi(n,l){if(O)return Te(18,1,n,l);n>>>=0,l>>>=0;var f=0;return ni().forEach((b,C)=>{var k=l+f;for(C=c()[n+4*C>>>2>>>0]=k,k=0;k>>0]=b.charCodeAt(k);r()[C>>>0]=0,f+=b.length+1}),0}function ii(n,l){if(O)return Te(19,1,n,l);n>>>=0,l>>>=0;var f=ni();c()[n>>>2>>>0]=f.length;var b=0;return f.forEach(C=>b+=C.length+1),c()[l>>>2>>>0]=b,0}function ai(n){return O?Te(20,1,n):52}function si(n,l,f,b){return O?Te(21,1,n,l,f,b):52}function ui(n,l,f,b){return O?Te(22,1,n,l,f,b):70}var Xd=[null,[],[]];function di(n,l,f,b){if(O)return Te(23,1,n,l,f,b);l>>>=0,f>>>=0,b>>>=0;for(var C=0,k=0;k>>2>>>0],F=c()[l+4>>>2>>>0];l+=8;for(var re=0;re>>0],ce=Xd[n];J===0||J===10?((n===1?We:ee)(Pr(ce,0)),ce.length=0):ce.push(J)}C+=F}return c()[b>>>2>>>0]=C,0}var li=[31,29,31,30,31,30,31,31,30,31,30,31],ci=[31,28,31,30,31,30,31,31,30,31,30,31];function Qd(n){var l=Array(gt(n)+1);return dt(n,l,0,l.length),l}var Jd=(n,l)=>{r().set(n,l>>>0)};function pi(n,l,f,b){function C(z,we,Pe){for(z=typeof z=="number"?z.toString():z||"";z.lengthCi?-1:0er-z.getDate())we-=er-z.getDate()+1,z.setDate(1),11>Pe?z.setMonth(Pe+1):(z.setMonth(0),z.setFullYear(z.getFullYear()+1));else{z.setDate(z.getDate()+we);break}}return Pe=new Date(z.getFullYear()+1,0,4),we=F(new Date(z.getFullYear(),0,4)),Pe=F(Pe),0>=V(we,z)?0>=V(Pe,z)?z.getFullYear()+1:z.getFullYear():z.getFullYear()-1}n>>>=0,l>>>=0,f>>>=0,b>>>=0;var J=c()[b+40>>>2>>>0];b={kc:a()[b>>>2>>>0],jc:a()[b+4>>>2>>>0],Eb:a()[b+8>>>2>>>0],Jb:a()[b+12>>>2>>>0],Fb:a()[b+16>>>2>>>0],Ab:a()[b+20>>>2>>>0],vb:a()[b+24>>>2>>>0],zb:a()[b+28>>>2>>>0],qc:a()[b+32>>>2>>>0],ic:a()[b+36>>>2>>>0],lc:J?He(J):""},f=He(f),J={"%c":"%a %b %d %H:%M:%S %Y","%D":"%m/%d/%y","%F":"%Y-%m-%d","%h":"%b","%r":"%I:%M:%S %p","%R":"%H:%M","%T":"%H:%M:%S","%x":"%m/%d/%y","%X":"%H:%M:%S","%Ec":"%c","%EC":"%C","%Ex":"%m/%d/%y","%EX":"%H:%M:%S","%Ey":"%y","%EY":"%Y","%Od":"%d","%Oe":"%e","%OH":"%H","%OI":"%I","%Om":"%m","%OM":"%M","%OS":"%S","%Ou":"%u","%OU":"%U","%OV":"%V","%Ow":"%w","%OW":"%W","%Oy":"%y"};for(var ce in J)f=f.replace(new RegExp(ce,"g"),J[ce]);var Re="Sunday Monday Tuesday Wednesday Thursday Friday Saturday".split(" "),ze="January February March April May June July August September October November December".split(" ");J={"%a":z=>Re[z.vb].substring(0,3),"%A":z=>Re[z.vb],"%b":z=>ze[z.Fb].substring(0,3),"%B":z=>ze[z.Fb],"%C":z=>k((z.Ab+1900)/100|0,2),"%d":z=>k(z.Jb,2),"%e":z=>C(z.Jb,2," "),"%g":z=>re(z).toString().substring(2),"%G":re,"%H":z=>k(z.Eb,2),"%I":z=>(z=z.Eb,z==0?z=12:12{for(var we=0,Pe=0;Pe<=z.Fb-1;we+=(Mt(z.Ab+1900)?li:ci)[Pe++]);return k(z.Jb+we,3)},"%m":z=>k(z.Fb+1,2),"%M":z=>k(z.jc,2),"%n":()=>`\n`,"%p":z=>0<=z.Eb&&12>z.Eb?"AM":"PM","%S":z=>k(z.kc,2),"%t":()=>" ","%u":z=>z.vb||7,"%U":z=>k(Math.floor((z.zb+7-z.vb)/7),2),"%V":z=>{var we=Math.floor((z.zb+7-(z.vb+6)%7)/7);if(2>=(z.vb+371-z.zb-2)%7&&we++,we)we==53&&(Pe=(z.vb+371-z.zb)%7,Pe==4||Pe==3&&Mt(z.Ab)||(we=1));else{we=52;var Pe=(z.vb+7-z.zb-1)%7;(Pe==4||Pe==5&&Mt(z.Ab%400-1))&&we++}return k(we,2)},"%w":z=>z.vb,"%W":z=>k(Math.floor((z.zb+7-(z.vb+6)%7)/7),2),"%y":z=>(z.Ab+1900).toString().substring(2),"%Y":z=>z.Ab+1900,"%z":z=>{z=z.ic;var we=0<=z;return z=Math.abs(z)/60,(we?"+":"-")+("0000"+(z/60*100+z%60)).slice(-4)},"%Z":z=>z.lc,"%%":()=>"%"},f=f.replace(/%%/g,"\\0\\0");for(ce in J)f.includes(ce)&&(f=f.replace(new RegExp(ce,"g"),J[ce](b)));return f=f.replace(/\\0\\0/g,"%"),ce=Qd(f),ce.length>l?0:(Jd(ce,n),ce.length-1)}ge.Gb();for(var mi=Array(256),cn=0;256>cn;++cn)mi[cn]=String.fromCharCode(cn);on=mi,wt=d.BindingError=class extends Error{constructor(n){super(n),this.name="BindingError"}},d.InternalError=class extends Error{constructor(n){super(n),this.name="InternalError"}},lt.push(0,1,void 0,1,null,1,!0,1,!1,1),d.count_emval_handles=()=>lt.length/2-5-fr.length;var el=[dr,jr,Yr,Xr,Qr,Zt,kr,Or,Jr,pr,en,tn,rn,nn,Rr,Xt,ei,ti,oi,ii,ai,si,ui,di],tl={ua:function(n,l,f){return te(async()=>{await d.Zb(n,l,f)})},b:function(n,l,f){throw n>>>=0,new qn(n).Gb(l>>>0,f>>>0),Kr=n,jn++,Kr},ia:function(n){hi(n>>>0,!E,1,!x,131072,!1),ge.Pb()},G:function(n){n>>>=0,O?postMessage({cmd:"cleanupThread",thread:n}):ge.Nb(ge.ub[n])},_:Zr,A:Xr,pa:Qr,W:Zt,Y:kr,qa:Or,na:Jr,fa:pr,ma:en,K:tn,X:rn,U:nn,oa:Rr,V:Xt,E:function(n,l,f){n>>>=0,f>>>=0,l=nt(l>>>0),Je(n,{name:l,fromWireType:b=>b,toWireType:function(b,C){if(typeof C!="bigint"&&typeof C!="number")throw C===null?C="null":(b=typeof C,C=b==="object"||b==="array"||b==="function"?C.toString():""+C),new TypeError(`Cannot convert "${C}" to ${this.name}`);return typeof C=="number"&&(C=BigInt(C)),C},argPackAdvance:8,readValueFromPointer:Dr(l,f,l.indexOf("u")==-1),Bb:null})},O:function(n,l,f,b){n>>>=0,l=nt(l>>>0),Je(n,{name:l,fromWireType:function(C){return!!C},toWireType:function(C,k){return k?f:b},argPackAdvance:8,readValueFromPointer:function(C){return this.fromWireType(o()[C>>>0])},Bb:null})},N:function(n){return Je(n>>>0,Zn)},D:function(n,l,f){n>>>=0,f>>>=0,l=nt(l>>>0),Je(n,{name:l,fromWireType:b=>b,toWireType:(b,C)=>C,argPackAdvance:8,readValueFromPointer:an(l,f),Bb:null})},t:function(n,l,f,b,C){if(n>>>=0,f>>>=0,l=nt(l>>>0),C===-1&&(C=4294967295),C=F=>F,b===0){var k=32-8*f;C=F=>F<>>k}var V=l.includes("unsigned")?function(F,re){return re>>>0}:function(F,re){return re};Je(n,{name:l,fromWireType:C,toWireType:V,argPackAdvance:8,readValueFromPointer:Dr(l,f,b!==0),Bb:null})},p:function(n,l,f){function b(k){var V=c()[k>>>2>>>0];return k=c()[k+4>>>2>>>0],new C(r().buffer,k,V)}n>>>=0;var C=[Int8Array,Uint8Array,Int16Array,Uint16Array,Int32Array,Uint32Array,Float32Array,Float64Array,BigInt64Array,BigUint64Array][l];f=nt(f>>>0),Je(n,{name:f,fromWireType:b,argPackAdvance:8,readValueFromPointer:b},{Ub:!0})},F:function(n,l){n>>>=0,l=nt(l>>>0);var f=l==="std::string";Je(n,{name:l,fromWireType:function(b){var C=c()[b>>>2>>>0],k=b+4;if(f)for(var V=k,F=0;F<=C;++F){var re=k+F;if(F==C||o()[re>>>0]==0){if(V=He(V,re-V),J===void 0)var J=V;else J+=String.fromCharCode(0),J+=V;V=re+1}}else{for(J=Array(C),F=0;F>>0]);J=J.join("")}return At(b),J},toWireType:function(b,C){C instanceof ArrayBuffer&&(C=new Uint8Array(C));var k=typeof C=="string";if(!(k||C instanceof Uint8Array||C instanceof Uint8ClampedArray||C instanceof Int8Array))throw new wt("Cannot pass non-string to std::string");var V=f&&k?gt(C):C.length,F=mn(4+V+1),re=F+4;if(c()[F>>>2>>>0]=V,f&&k)Bt(C,re,V+1);else if(k)for(k=0;k>>0]=J}else for(k=0;k>>0]=C[k];return b!==null&&b.push(At,F),F},argPackAdvance:8,readValueFromPointer:Qt,Bb(b){At(b)}})},z:function(n,l,f){if(n>>>=0,l>>>=0,f>>>=0,f=nt(f),l===2)var b=Xn,C=sn,k=un,V=F=>u()[F>>>1>>>0];else l===4&&(b=gr,C=Qn,k=pe,V=F=>c()[F>>>2>>>0]);Je(n,{name:f,fromWireType:F=>{for(var re=c()[F>>>2>>>0],J,ce=F+4,Re=0;Re<=re;++Re){var ze=F+4+Re*l;(Re==re||V(ze)==0)&&(ce=b(ce,ze-ce),J===void 0?J=ce:(J+=String.fromCharCode(0),J+=ce),ce=ze+l)}return At(F),J},toWireType:(F,re)=>{if(typeof re!="string")throw new wt(`Cannot pass non-string to C++ string type ${f}`);var J=k(re),ce=mn(4+J+l);return c()[ce>>>2>>>0]=J/l,C(re,ce+4,J+l),F!==null&&F.push(At,ce),ce},argPackAdvance:8,readValueFromPointer:Qt,Bb(F){At(F)}})},P:function(n,l){n>>>=0,l=nt(l>>>0),Je(n,{Vb:!0,name:l,argPackAdvance:0,fromWireType:()=>{},toWireType:()=>{}})},ta:()=>1,S:function(n,l){n>>>=0,n==l>>>0?setTimeout(rt):O?postMessage({targetThread:n,cmd:"checkMailbox"}):(n=ge.ub[n])&&n.postMessage({cmd:"checkMailbox"})},$:function(n,l,f,b,C){l>>>=0,f>>>=0,b/=2,yr.length=b,C=C>>>0>>>3;for(var k=0;k>>0];return n=l?Ir[l]:el[n],ge.Sb=f,f=n(...yr),ge.Sb=0,f},ha:Nt,sa:function(n){P&&ge.ub[n>>>0].ref()},w:function(n,l,f){return l>>>=0,f>>>=0,n=Qe(n>>>0),l=br(l,"emval::as"),Ur(l,f,n)},y:function(n){return n>>>=0,te(()=>(n=Qe(n),n.then(ot)))},o:function(n,l,f,b){return f>>>=0,b>>>=0,n=X[n>>>0],l=Qe(l>>>0),n(null,l,f,b)},k:function(n,l,f,b,C){return f>>>=0,b>>>=0,C>>>=0,n=X[n>>>0],l=Qe(l>>>0),f=Ee(f),n(l,l[f],b,C)},c:hr,C:function(n,l){return l>>>=0,n=Qe(n>>>0),l=Qe(l),n==l},n:function(n){return n>>>=0,n===0?ot(Oe()):(n=Ee(n),ot(Oe()[n]))},j:function(n,l,f){l=be(n,l>>>0);var b=l.shift();n--;var C=`return function (obj, func, destructorsRef, args) {\n`,k=0,V=[];f===0&&V.push("obj");for(var F=["retType"],re=[b],J=0;Jce.name).join(", ")}) => ${b.name}>`,D(Ie(f,n))},s:function(n,l){return l>>>=0,n=Qe(n>>>0),l=Qe(l),ot(n[l])},d:function(n){n>>>=0,9>>0);for(var l=Array(n.length),f=0;f>>0))},l:function(){return ot({})},i:function(n){n>>>=0;for(var l=Qe(n);l.length;){var f=l.pop();l.pop()(f)}hr(n)},h:function(n,l,f){l>>>=0,f>>>=0,n=Qe(n>>>0),l=Qe(l),f=Qe(f),n[l]=f},e:function(n,l){return l>>>=0,n=br(n>>>0,"_emval_take_value"),n=n.readValueFromPointer(l),ot(n)},ca:function(n,l){n=-9007199254740992>n||9007199254740992>>=0,n=new Date(1e3*n),a()[l>>>2>>>0]=n.getUTCSeconds(),a()[l+4>>>2>>>0]=n.getUTCMinutes(),a()[l+8>>>2>>>0]=n.getUTCHours(),a()[l+12>>>2>>>0]=n.getUTCDate(),a()[l+16>>>2>>>0]=n.getUTCMonth(),a()[l+20>>>2>>>0]=n.getUTCFullYear()-1900,a()[l+24>>>2>>>0]=n.getUTCDay(),n=(n.getTime()-Date.UTC(n.getUTCFullYear(),0,1,0,0,0,0))/864e5|0,a()[l+28>>>2>>>0]=n},da:function(n,l){n=-9007199254740992>n||9007199254740992>>=0,n=new Date(1e3*n),a()[l>>>2>>>0]=n.getSeconds(),a()[l+4>>>2>>>0]=n.getMinutes(),a()[l+8>>>2>>>0]=n.getHours(),a()[l+12>>>2>>>0]=n.getDate(),a()[l+16>>>2>>>0]=n.getMonth(),a()[l+20>>>2>>>0]=n.getFullYear()-1900,a()[l+24>>>2>>>0]=n.getDay();var f=(Mt(n.getFullYear())?Qo:Jo)[n.getMonth()]+n.getDate()-1|0;a()[l+28>>>2>>>0]=f,a()[l+36>>>2>>>0]=-(60*n.getTimezoneOffset()),f=new Date(n.getFullYear(),6,1).getTimezoneOffset();var b=new Date(n.getFullYear(),0,1).getTimezoneOffset();n=(f!=b&&n.getTimezoneOffset()==Math.min(b,f))|0,a()[l+32>>>2>>>0]=n},ea:function(n){n>>>=0;var l=new Date(a()[n+20>>>2>>>0]+1900,a()[n+16>>>2>>>0],a()[n+12>>>2>>>0],a()[n+8>>>2>>>0],a()[n+4>>>2>>>0],a()[n>>>2>>>0],0),f=a()[n+32>>>2>>>0],b=l.getTimezoneOffset(),C=new Date(l.getFullYear(),6,1).getTimezoneOffset(),k=new Date(l.getFullYear(),0,1).getTimezoneOffset(),V=Math.min(k,C);return 0>f?a()[n+32>>>2>>>0]=+(C!=k&&V==b):0>>2>>>0]=l.getDay(),f=(Mt(l.getFullYear())?Qo:Jo)[l.getMonth()]+l.getDate()-1|0,a()[n+28>>>2>>>0]=f,a()[n>>>2>>>0]=l.getSeconds(),a()[n+4>>>2>>>0]=l.getMinutes(),a()[n+8>>>2>>>0]=l.getHours(),a()[n+12>>>2>>>0]=l.getDate(),a()[n+16>>>2>>>0]=l.getMonth(),a()[n+20>>>2>>>0]=l.getYear(),n=l.getTime(),BigInt(isNaN(n)?-1:n/1e3)},aa:ei,ba:ti,R:function(n,l,f,b){n>>>=0,l>>>=0,f>>>=0,b>>>=0;var C=new Date().getFullYear(),k=new Date(C,0,1),V=new Date(C,6,1);C=k.getTimezoneOffset();var F=V.getTimezoneOffset(),re=Math.max(C,F);c()[n>>>2>>>0]=60*re,a()[l>>>2>>>0]=+(C!=F),n=J=>J.toLocaleTimeString(void 0,{hour12:!1,timeZoneName:"short"}).split(" ")[1],k=n(k),V=n(V),F{Kt("")},f:function(n,l,f){return n>>>=0,l=ri(l>>>0,f>>>0),Ir[n](...l)},M:function(n,l,f){return n>>>=0,l=ri(l>>>0,f>>>0),Ir[n](...l)},H:()=>{},L:()=>Date.now(),ra:()=>{throw bt+=1,"unwind"},T:function(){return 4294901760},u:()=>performance.timeOrigin+performance.now(),x:()=>P?(Ri(),wr(Oi)).cpus().length:navigator.hardwareConcurrency,Q:function(n){n>>>=0;var l=o().length;if(n<=l||4294901760=f;f*=2){var b=l*(1+.2/f);b=Math.min(b,n+100663296);var C=Math;b=Math.max(n,b);e:{C=(C.min.call(C,4294901760,b+(65536-b%65536)%65536)-ae.buffer.byteLength+65535)/65536;try{ae.grow(C),Ne();var k=1;break e}catch{}k=void 0}if(k)return!0}return!1},ja:oi,la:ii,Z:Xe,B:ai,J:si,ga:ui,I:di,a:ae||d.wasmMemory,ka:pi,r:function(n,l,f,b){return pi(n>>>0,l>>>0,f>>>0,b>>>0)}},oe=function(){function n(f,b){return oe=f.exports,oe=dn(),oe=rl(),ge.Qb.push(oe.cb),Rt.unshift(oe.va),Ae=b,xr(),oe}var l={a:tl};if(Vt++,d.instantiateWasm)try{return d.instantiateWasm(l,n)}catch(f){ee(`Module.instantiateWasm callback failed with error: ${f}`),w(f)}return Ar(l,function(f){n(f.instance,f.module)}).catch(w),{}}(),fi=n=>(fi=oe.wa)(n);d.__embind_initialize_bindings=()=>(d.__embind_initialize_bindings=oe.xa)(),d._OrtInit=(n,l)=>(d._OrtInit=oe.ya)(n,l),d._OrtGetLastError=(n,l)=>(d._OrtGetLastError=oe.za)(n,l),d._OrtCreateSessionOptions=(n,l,f,b,C,k,V,F,re,J)=>(d._OrtCreateSessionOptions=oe.Aa)(n,l,f,b,C,k,V,F,re,J),d._OrtAppendExecutionProvider=(n,l)=>(d._OrtAppendExecutionProvider=oe.Ba)(n,l),d._OrtAddFreeDimensionOverride=(n,l,f)=>(d._OrtAddFreeDimensionOverride=oe.Ca)(n,l,f),d._OrtAddSessionConfigEntry=(n,l,f)=>(d._OrtAddSessionConfigEntry=oe.Da)(n,l,f),d._OrtReleaseSessionOptions=n=>(d._OrtReleaseSessionOptions=oe.Ea)(n),d._OrtCreateSession=(n,l,f)=>(d._OrtCreateSession=oe.Fa)(n,l,f),d._OrtReleaseSession=n=>(d._OrtReleaseSession=oe.Ga)(n),d._OrtGetInputOutputCount=(n,l,f)=>(d._OrtGetInputOutputCount=oe.Ha)(n,l,f),d._OrtGetInputName=(n,l)=>(d._OrtGetInputName=oe.Ia)(n,l),d._OrtGetOutputName=(n,l)=>(d._OrtGetOutputName=oe.Ja)(n,l),d._OrtFree=n=>(d._OrtFree=oe.Ka)(n),d._OrtCreateTensor=(n,l,f,b,C,k)=>(d._OrtCreateTensor=oe.La)(n,l,f,b,C,k),d._OrtGetTensorData=(n,l,f,b,C)=>(d._OrtGetTensorData=oe.Ma)(n,l,f,b,C),d._OrtReleaseTensor=n=>(d._OrtReleaseTensor=oe.Na)(n),d._OrtCreateRunOptions=(n,l,f,b)=>(d._OrtCreateRunOptions=oe.Oa)(n,l,f,b),d._OrtAddRunConfigEntry=(n,l,f)=>(d._OrtAddRunConfigEntry=oe.Pa)(n,l,f),d._OrtReleaseRunOptions=n=>(d._OrtReleaseRunOptions=oe.Qa)(n),d._OrtCreateBinding=n=>(d._OrtCreateBinding=oe.Ra)(n),d._OrtBindInput=(n,l,f)=>(d._OrtBindInput=oe.Sa)(n,l,f),d._OrtBindOutput=(n,l,f,b)=>(d._OrtBindOutput=oe.Ta)(n,l,f,b),d._OrtClearBoundOutputs=n=>(d._OrtClearBoundOutputs=oe.Ua)(n),d._OrtReleaseBinding=n=>(d._OrtReleaseBinding=oe.Va)(n),d._OrtRunWithBinding=(n,l,f,b,C)=>(d._OrtRunWithBinding=oe.Wa)(n,l,f,b,C),d._OrtRun=(n,l,f,b,C,k,V,F)=>(d._OrtRun=oe.Xa)(n,l,f,b,C,k,V,F),d._OrtEndProfiling=n=>(d._OrtEndProfiling=oe.Ya)(n),d._JsepOutput=(n,l,f)=>(d._JsepOutput=oe.Za)(n,l,f),d._JsepGetNodeName=n=>(d._JsepGetNodeName=oe._a)(n);var pn=d._pthread_self=()=>(pn=d._pthread_self=oe.$a)(),mn=d._malloc=n=>(mn=d._malloc=oe.ab)(n),At=d._free=n=>(At=d._free=oe.bb)(n);d.__emscripten_tls_init=()=>(d.__emscripten_tls_init=oe.cb)();var hi=d.__emscripten_thread_init=(n,l,f,b,C,k)=>(hi=d.__emscripten_thread_init=oe.eb)(n,l,f,b,C,k);d.__emscripten_thread_crashed=()=>(d.__emscripten_thread_crashed=oe.fb)();var gi=(n,l,f,b,C)=>(gi=oe.gb)(n,l,f,b,C),ro=n=>(ro=oe.hb)(n),no=d.__emscripten_thread_exit=n=>(no=d.__emscripten_thread_exit=oe.ib)(n),yi=()=>(yi=oe.jb)(),bi=(n,l)=>(bi=oe.kb)(n,l),fn=n=>(fn=oe.lb)(n),oo=n=>(oo=oe.mb)(n),io=()=>(io=oe.nb)(),wi=d.dynCall_ii=(n,l)=>(wi=d.dynCall_ii=oe.pb)(n,l),vi=n=>(vi=oe.qb)(n),$i=()=>($i=oe.rb)(),_i=n=>(_i=oe.sb)(n),Si=()=>(Si=oe.tb)();d.___start_em_js=839500,d.___stop_em_js=839661;function rl(){var n=oe;n=Object.assign({},n);var l=b=>C=>b(C)>>>0,f=b=>()=>b()>>>0;return n.wa=l(n.wa),n.$a=f(n.$a),n.ab=l(n.ab),n.emscripten_main_runtime_thread_id=f(n.emscripten_main_runtime_thread_id),n.mb=l(n.mb),n.nb=f(n.nb),n}d.wasmMemory=ae,d.stackSave=()=>io(),d.stackRestore=n=>fn(n),d.stackAlloc=n=>oo(n),d.keepRuntimeAlive=()=>0Bi)});var Mi=Wr((gm,cl)=>{cl.exports=\'"use strict";var Module={},ENVIRONMENT_IS_NODE=typeof process=="object"&&typeof process.versions=="object"&&typeof process.versions.node=="string";if(ENVIRONMENT_IS_NODE){var nodeWorkerThreads=require("worker_threads"),parentPort=nodeWorkerThreads.parentPort;parentPort.on("message",e=>onmessage({data:e}));var fs=require("fs"),vm=require("vm");Object.assign(global,{self:global,require,Module,location:{href:__filename},Worker:nodeWorkerThreads.Worker,importScripts:e=>vm.runInThisContext(fs.readFileSync(e,"utf8"),{filename:e}),postMessage:e=>parentPort.postMessage(e),performance:global.performance||{now:Date.now}})}var initializedJS=!1;function threadPrintErr(...e){var a=e.join(" ");if(ENVIRONMENT_IS_NODE){fs.writeSync(2,a+`\\n`);return}console.error(a)}function threadAlert(...e){var a=e.join(" ");postMessage({cmd:"alert",text:a,threadId:Module._pthread_self()})}var err=threadPrintErr;self.alert=threadAlert,Module.instantiateWasm=(e,a)=>{var r=Module.wasmModule;Module.wasmModule=null;var t=new WebAssembly.Instance(r,e);return a(t)},self.onunhandledrejection=e=>{throw e.reason||e};function handleMessage(e){try{if(e.data.cmd==="load"){let r=[];self.onmessage=t=>r.push(t),self.startWorker=t=>{Module=t,postMessage({cmd:"loaded"});for(let s of r)handleMessage(s);self.onmessage=handleMessage},Module.wasmModule=e.data.wasmModule;for(const t of e.data.handlers)Module[t]=(...s)=>{postMessage({cmd:"callHandler",handler:t,args:s})};if(Module.wasmMemory=e.data.wasmMemory,Module.buffer=Module.wasmMemory.buffer,Module.ENVIRONMENT_IS_PTHREAD=!0,typeof e.data.urlOrBlob=="string")importScripts(e.data.urlOrBlob);else{var a=URL.createObjectURL(e.data.urlOrBlob);importScripts(a),URL.revokeObjectURL(a)}ortWasmThreaded(Module)}else if(e.data.cmd==="run"){Module.__emscripten_thread_init(e.data.pthread_ptr,0,0,1),Module.__emscripten_thread_mailbox_await(e.data.pthread_ptr),Module.establishStackSpace(),Module.PThread.receiveObjectTransfer(e.data),Module.PThread.threadInitTLS(),initializedJS||(initializedJS=!0);try{Module.invokeEntryPoint(e.data.start_routine,e.data.arg)}catch(r){if(r!="unwind")throw r}}else e.data.cmd==="cancel"?Module._pthread_self()&&Module.__emscripten_thread_exit(-1):e.data.target==="setimmediate"||(e.data.cmd==="checkMailbox"?initializedJS&&Module.checkMailbox():e.data.cmd&&(err(`worker.js received unknown command ${e.data.cmd}`),err(e.data)))}catch(r){throw Module.__emscripten_thread_crashed?.(),r}}self.onmessage=handleMessage;\\n\'});var go,Gt,tr,bn,Gr,Hi,yo,ye=Y(()=>{"use strict";go=e=>{switch(e){case"int8":return 3;case"uint8":return 2;case"bool":return 9;case"int16":return 5;case"uint16":return 4;case"int32":return 6;case"uint32":return 12;case"float16":return 10;case"float32":return 1;case"float64":return 11;case"string":return 8;case"int64":return 7;case"uint64":return 13;default:throw new Error(`unsupported data type: ${e}`)}},Gt=e=>{switch(e){case 3:return"int8";case 2:return"uint8";case 9:return"bool";case 5:return"int16";case 4:return"uint16";case 6:return"int32";case 12:return"uint32";case 10:return"float16";case 1:return"float32";case 11:return"float64";case 8:return"string";case 7:return"int64";case 13:return"uint64";default:throw new Error(`unsupported data type: ${e}`)}},tr=e=>[void 0,4,1,1,2,2,4,8,void 0,1,2,8,4,8,void 0,void 0,void 0][e],bn=e=>{switch(e){case"float16":return typeof Float16Array<"u"&&Float16Array.from?Float16Array:Uint16Array;case"float32":return Float32Array;case"uint8":return Uint8Array;case"int8":return Int8Array;case"uint16":return Uint16Array;case"int16":return Int16Array;case"int32":return Int32Array;case"bool":return Uint8Array;case"float64":return Float64Array;case"uint32":return Uint32Array;case"int64":return BigInt64Array;case"uint64":return BigUint64Array;default:throw new Error(`unsupported type: ${e}`)}},Gr=e=>{switch(e){case"verbose":return 0;case"info":return 1;case"warning":return 2;case"error":return 3;case"fatal":return 4;default:throw new Error(`unsupported logging level: ${e}`)}},Hi=e=>e==="float32"||e==="float16"||e==="int32"||e==="int64"||e==="uint32"||e==="uint8"||e==="bool",yo=e=>{switch(e){case"none":return 0;case"cpu":return 1;case"cpu-pinned":return 2;case"texture":return 3;case"gpu-buffer":return 4;default:throw new Error(`unsupported data location: ${e}`)}}});var wn=Y(()=>{"use strict"});var Fi=Y(()=>{"use strict";wn()});var qi,ji=Y(()=>{"use strict";qi="1.18.0"});var Ki,pt,bo=Y(()=>{"use strict";ji();Ki="warning",pt={wasm:{},webgl:{},webgpu:{},versions:{common:qi},set logLevel(e){if(e!==void 0){if(typeof e!="string"||["verbose","info","warning","error","fatal"].indexOf(e)===-1)throw new Error(`Unsupported logging level: ${e}`);Ki=e}},get logLevel(){return Ki}};Object.defineProperty(pt,"logLevel",{enumerable:!0})});var vr,Yi=Y(()=>{"use strict";bo();vr=pt});var Zi=Y(()=>{"use strict"});var Xi=Y(()=>{"use strict";vn()});var Ji=Y(()=>{"use strict"});var ea=Y(()=>{"use strict";vn()});var vn=Y(()=>{"use strict";Zi();Xi();Ji();ea()});var $n=Y(()=>{"use strict";vn()});var wo,ta,rr,Ht,vo=Y(()=>{"use strict";bo();wo=(e,t)=>{(typeof pt.trace>"u"?!pt.wasm.trace:!pt.trace)||console.timeStamp(`${e}::ORT::${t}`)},ta=(e,t)=>{let r=new Error().stack?.split(/\\r\\n|\\r|\\n/g)||[],o=!1;for(let i=0;i{(typeof pt.trace>"u"?!pt.wasm.trace:!pt.trace)||ta("BEGIN",e)},Ht=e=>{(typeof pt.trace>"u"?!pt.wasm.trace:!pt.trace)||ta("END",e)}});var ra=Y(()=>{"use strict";wn();$n();vo()});var na=Y(()=>{"use strict";ra()});var oa=Y(()=>{"use strict"});var ia=Y(()=>{"use strict"});var aa=Y(()=>{"use strict"});var sa=Y(()=>{"use strict"});var ua=Y(()=>{"use strict";wn();$n()});var da=Y(()=>{"use strict";ua()});var $r=Y(()=>{"use strict";Fi();Yi();na();$n();oa();ia();vo();aa();sa();da()});var _l,Sl,la,ca,pa,xl,Ve,Lt=Y(()=>{"use strict";ye();_l=["V","I","W","E","F"],Sl=(e,t)=>{console.log(`[${_l[e]},${new Date().toISOString()}]${t}`)},pa=(e,t)=>{la=e,ca=t},xl=(e,t)=>{let r=Gr(e),o=Gr(la);r>=o&&Sl(r,typeof t=="function"?t():t)},Ve=(...e)=>{ca&&xl(...e)}});var ma,fa=Y(()=>{"use strict";ye();ma=(e,t)=>new(bn(t))(e)});var _n=Y(()=>{"use strict"});var ha,$o,_o,Cl,Al,ga,xo,So,ba,wa=Y(()=>{"use strict";Lt();_n();ha=new Map([[64,250],[128,200],[256,200],[512,200],[2048,230],[4096,200],[8192,50],[16384,50],[32768,50],[65536,50],[131072,50],[262144,50],[524288,50],[1048576,50],[2097152,30],[4194304,20],[8388608,10],[12582912,10],[16777216,10],[26214400,15],[33554432,22],[44236800,2],[58982400,6],[67108864,6],[134217728,6],[167772160,6]]),$o=[],_o=e=>Math.ceil(e/16)*16,Cl=e=>{for(let t=0;t<$o.length;t++){let r=$o[t];if(e<=r)return r}return Math.ceil(e/16)*16},Al=1,ga=()=>Al++,xo=async(e,t,r,o)=>{let i=_o(r),u=e.device.createBuffer({size:i,usage:GPUBufferUsage.COPY_DST|GPUBufferUsage.MAP_READ});try{let a=e.getCommandEncoder();e.endComputePass(),a.copyBufferToBuffer(t,0,u,0,i),e.flush(),await u.mapAsync(GPUMapMode.READ);let c=u.getMappedRange();if(o){let p=o();return p.set(new Uint8Array(c,0,r)),p}else return new Uint8Array(c.slice(0,r))}finally{u.destroy()}},So=class{constructor(t){this.backend=t;this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.buffersForUploadingPending=[],this.buffersPending=[],this.externalBuffers=new Map,this.capturedPendingBuffers=new Map;for(let[r]of ha)$o.push(r),this.freeBuffers.set(r,[]),this.freeUniformBuffers.set(r,[])}upload(t,r){let o=r.buffer,i=r.byteOffset,u=r.byteLength,a=_o(u),c=this.storageCache.get(t);if(!c)throw new Error("gpu data for uploading does not exist");if(c.originalSize!==u)throw new Error(`inconsistent data size. gpu data size=${c.originalSize}, data size=${u}`);let p=this.backend.device.createBuffer({mappedAtCreation:!0,size:a,usage:GPUBufferUsage.MAP_WRITE|GPUBufferUsage.COPY_SRC}),h=p.getMappedRange();new Uint8Array(h).set(new Uint8Array(o,i,u)),p.unmap();let d=this.backend.getCommandEncoder();this.backend.endComputePass(),d.copyBufferToBuffer(p,0,c.gpuData.buffer,0,a),Ve("verbose",()=>`[WebGPU] GpuDataManager.upload(id=${t})`),this.buffersForUploadingPending.push(p)}memcpy(t,r){let o=this.storageCache.get(t);if(!o)throw new Error("source gpu data for memcpy does not exist");let i=this.storageCache.get(r);if(!i)throw new Error("destination gpu data for memcpy does not exist");if(o.originalSize!==i.originalSize)throw new Error("inconsistent source and destination gpu data size");let u=_o(o.originalSize),a=this.backend.getCommandEncoder();this.backend.endComputePass(),a.copyBufferToBuffer(o.gpuData.buffer,0,i.gpuData.buffer,0,u)}registerExternalBuffer(t,r,o){let i;if(o){if(i=this.externalBuffers.get(o),i===void 0)throw new Error("previous buffer is not registered");if(t===o)return Ve("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${r}) => id=${i}, buffer is the same, skip.`),i;if(this.backend.capturedCommandList.has(this.backend.currentSessionId))throw new Error(`Registering a different external buffer under graph capture mode is not supported yet.\n Please use the previous external buffer!`);this.externalBuffers.delete(o)}else i=ga();return this.storageCache.set(i,{gpuData:{id:i,type:0,buffer:t},originalSize:r}),this.externalBuffers.set(t,i),Ve("verbose",()=>`[WebGPU] GpuDataManager.registerExternalBuffer(size=${r}) => id=${i}, registered.`),i}unregisterExternalBuffer(t){let r=this.externalBuffers.get(t);r!==void 0&&(this.storageCache.delete(r),this.externalBuffers.delete(t),Ve("verbose",()=>`[WebGPU] GpuDataManager.unregisterExternalBuffer() => id=${r}`))}create(t,r=GPUBufferUsage.STORAGE|GPUBufferUsage.COPY_SRC|GPUBufferUsage.COPY_DST){let o=Cl(t),i,u=(r&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE,a=(r&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM;if(u||a){let h=(u?this.freeBuffers:this.freeUniformBuffers).get(o);h?h.length>0?i=h.pop():i=this.backend.device.createBuffer({size:o,usage:r}):i=this.backend.device.createBuffer({size:o,usage:r})}else i=this.backend.device.createBuffer({size:o,usage:r});let c={id:ga(),type:0,buffer:i};return this.storageCache.set(c.id,{gpuData:c,originalSize:t}),Ve("verbose",()=>`[WebGPU] GpuDataManager.create(size=${t}) => id=${c.id}`),c}get(t){return this.storageCache.get(t)?.gpuData}release(t){let r=this.storageCache.get(t);if(!r)throw new Error("releasing data does not exist");return Ve("verbose",()=>`[WebGPU] GpuDataManager.release(id=${t}), gpuDataId=${r.gpuData.id}`),this.storageCache.delete(t),this.buffersPending.push(r.gpuData.buffer),r.originalSize}async download(t,r){let o=this.storageCache.get(t);if(!o)throw new Error("data does not exist");await xo(this.backend,o.gpuData.buffer,o.originalSize,r)}refreshPendingBuffers(){for(let t of this.buffersForUploadingPending)t.destroy();if(this.buffersForUploadingPending=[],this.buffersPending.length!==0)if(this.backend.sessionStatus==="default"){for(let t of this.buffersPending){let r=ha.get(t.size);if((t.usage&GPUBufferUsage.STORAGE)===GPUBufferUsage.STORAGE){let o=this.freeBuffers.get(t.size)||[];r===void 0||o.length>=r?t.destroy():o.push(t)}else if((t.usage&GPUBufferUsage.UNIFORM)===GPUBufferUsage.UNIFORM){let o=this.freeUniformBuffers.get(t.size)||[];r===void 0||o.length>=r?t.destroy():o.push(t)}else t.destroy()}this.buffersPending=[]}else{let t=this.capturedPendingBuffers.get(this.backend.currentSessionId);t||(t=[],this.capturedPendingBuffers.set(this.backend.currentSessionId,t));for(let r of this.buffersPending)t.push(r);this.buffersPending=[]}}dispose(){this.freeBuffers.forEach(t=>{t.forEach(r=>{r.destroy()})}),this.freeUniformBuffers.forEach(t=>{t.forEach(r=>{r.destroy()})}),this.storageCache.forEach(t=>{t.gpuData.buffer.destroy()}),this.capturedPendingBuffers.forEach(t=>{t.forEach(r=>{r.destroy()})}),this.storageCache=new Map,this.freeBuffers=new Map,this.freeUniformBuffers=new Map,this.capturedPendingBuffers=new Map}onReleaseSession(t){let r=this.capturedPendingBuffers.get(t);r&&(r.forEach(o=>{o.destroy()}),this.capturedPendingBuffers.delete(t))}},ba=(...e)=>new So(...e)});var Co,ve,Ze=Y(()=>{"use strict";Co=class{constructor(t){Object.assign(this,t)}get cacheKey(){return this.key||(this.key=Object.getOwnPropertyNames(this).sort().map(t=>`${this[t]}`).join(";")),this.key}},ve=e=>new Co(e)});var Ao,It,M,nr,Sn,xn,Cn,Se=Y(()=>{"use strict";Ao=class{static calcMatMulShape(t,r){return t[1]!==r[0]?void 0:[t[0],r[1]]}},It=class{static calcShape(t,r,o=!1){let i=t.length,u=r.length;if(i===0)return r;if(u===0)return t;let a=Math.max(t.length,r.length),c=new Array(a);if(o){if(i<2||u<2)return;let p=Ao.calcMatMulShape([t[i-2],t[i-1]],[r[u-2],r[u-1]]);if(p===void 0)return;[c[a-2],c[a-1]]=p}for(let p=o?3:1;p<=a;p++){let h=i-p<0?1:t[i-p],d=u-p<0?1:r[u-p];if(h!==d&&h>1&&d>1)return;let y=Math.max(h,d);if(h&&d)c[a-p]=Math.max(h,d);else{if(y>1)return;c[a-p]=0}}return c}static isValidBroadcast(t,r){let o=t.length,i=r.length;if(o>i)return!1;for(let u=1;u<=o;u++)if(t[o-u]!==1&&t[o-u]!==r[i-u])return!1;return!0}},M=class e{static size(t){return e.getSizeFromDimensionRange(t,0,t.length)}static convertShape(t,r=4){let o=t.length;if(o===0)return[];let i=new Array(o),u=o-1;for(;u>=0;){if(t[u]%r===0){i[u]=t[u]/r;break}if(r%t[u]!==0)throw new Error("cannot convert shape");i[u]=1,r/=t[u],u--}for(u--;u>=0;u--)i[u]=t[u];return i}static sizeFromDimension(t,r){if(r<0||r>t.length)throw new Error(`invalid dimension of ${r} for sizeFromDimension as Tensor has ${t.length} dimensions.`);return e.getSizeFromDimensionRange(t,r,t.length)}static sizeToDimension(t,r){if(r<0||r>t.length)throw new Error(`invalid dimension of ${r} for sizeToDimension as Tensor has ${t.length} dimensions.`);return e.getSizeFromDimensionRange(t,0,r)}static getSizeFromDimensionRange(t,r,o){let i=1;for(let u=r;u=0;--i)o[i]=o[i+1]*t[i+1];return o}static normalizeAxis(t,r){if(t<-r&&t>=r)throw new Error("unsupported axis for this operation.");return t<0?t+r:t}static normalizeAxes(t,r){return t.map(o=>this.normalizeAxis(o,r??t.length))}static sortBasedOnPerm(t,r){return r?r.map(o=>t[o]):t.slice().reverse()}static padShape(t,r){let o=t.length;return t.map((i,u)=>i+r[u]+r[u+o])}static areEqual(t,r){return t.length!==r.length?!1:t.every((o,i)=>o===r[i])}},nr=class e{static adjustPoolAttributes(t,r,o,i,u,a){if(!t&&o.length!==r.length-2)throw new Error("length of specified kernel shapes should be 2 less than length of input dimensions");if(t)for(let c=0;c=o.length?o.push(r[c+2]):o[c]=r[c+2];for(let c=0;c=o[c]||a[c+o.length]>=o[c])throw new Error("pads should be smaller than kernel")}}static adjustPadsBasedOnAutoPad(t,r,o,i,u,a,c){if(c){if(u.length!==2*(t.length-2))throw new Error("length of pads should be twice the length of data dimensions");if(r.length!==t.length-2)throw new Error("length of strides should be the length of data dimensions");if(i.length!==t.length-2)throw new Error("length of kernel shapes should be the length of data dimensions");for(let p=0;p{"use strict";ye();Se();or=64,To=(e,t)=>{if(t===3)throw new Error("vec3 has same alignment as vec4, use vec4 instead");switch(e){case 10:return t>1?`vec${t}`:"f16";case 1:return t>1?`vec${t}`:"f32";case 6:return t>1?`vec${t}`:"i32";case 12:return t>1?`vec${t}`:"u32";case 7:if(t>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","i32"];case 13:if(t>1)throw new Error("currently not supported vecX of uint64 yet");return["vec2","u32"];case 9:if(t!==4)throw new Error("bool must be vec4");return["u32","vec4"];default:throw new Error(`Unknown data type: ${e}`)}},De=(e,t=1)=>{let r=To(e,t);return typeof r=="string"?r:r[0]},et=(e,t=1)=>{let r=To(e,t);return typeof r=="string"?r:r[1]},Z=(...e)=>{let t=[];return e.forEach(r=>{r.length!==0&&t.push({type:12,data:r},{type:12,data:M.computeStrides(r)})}),t},Me=e=>e%4===0?4:e%2===0?2:1,$t=(e="f32",t,r="0")=>!t||t===1?`${e}(${r})`:`vec${t}<${e}>(${r})`,ir=(e,t,r)=>e==="f32"?r:t===1?`f32(${r})`:`vec${t}(${r})`,_t=(e,t)=>t===4?`(${e}.x + ${e}.y + ${e}.z + ${e}.w)`:t===2?`(${e}.x + ${e}.y)`:t===3?`(${e}.x + ${e}.y + ${e}.z)`:e,fe=(e,t,r,o)=>e.startsWith("uniforms.")&&r>4?typeof t=="string"?o==="f16"?`${e}[(${t}) / 8][(${t}) % 8 / 4][(${t}) % 8 % 4]`:`${e}[(${t}) / 4][(${t}) % 4]`:o==="f16"?`${e}[${Math.floor(t/8)}][${Math.floor(t%8/4)}][${t%8%4}]`:`${e}[${Math.floor(t/4)}][${t%4}]`:r>1?`${e}[${t}]`:e,Eo=(e,t,r,o,i)=>{let u=typeof r=="number",a=u?r:r.length,c=[...new Array(a).keys()],p=a<2?"u32":a<=4?`vec${a}`:`array`,h=To(t,i),d=typeof h=="string"?h:h[1],y=typeof h=="string"?h:h[0],w={indices:p,value:d,storage:y,tensor:t},_=G=>typeof G=="string"?G:`${G}u`,v={offsetToIndices:!1,indicesToOffset:!1,broadcastedIndicesToOffset:!1,set:!1,setByIndices:!1,get:!1,getByIndices:!1},S=u?"uniforms.":"",A=`${S}${e}_shape`,I=`${S}${e}_strides`,x="";for(let G=0;G ${w.indices} {\n var indices: ${w.indices};\n var current = offset;\n ${x}\n return indices;\n }`,P=G=>(v.offsetToIndices=!0,a<2?G:`o2i_${e}(${G})`),O=[];if(a>=2)for(let G=a-1;G>=0;G--)O.push(`${fe(I,G,a)} * (indices[${G}])`);let R=a<2?"":`\n fn i2o_${e}(indices: ${w.indices}) -> u32 {\n return ${O.join("+")};\n }`,L=G=>(v.indicesToOffset=!0,a<2?G:`i2o_${e}(${G})`),N=(...G)=>a===0?"0u":`${w.indices}(${G.map(_).join(",")})`,K=(G,ne)=>a<2?`${G}`:`${fe(G,ne,a)}`,Q=(G,ne,xe)=>a<2?`${G}=${xe};`:`${fe(G,ne,a)}=${xe};`,he={},W=(G,ne)=>{v.broadcastedIndicesToOffset=!0;let xe=`${ne.name}broadcastedIndicesTo${e}Offset`;if(xe in he)return`${xe}(${G})`;let Ke=[];for(let Be=a-1;Be>=0;Be--){let Ge=ne.indicesGet("outputIndices",Be+ne.rank-a);Ke.push(`${K(I,Be)} * (${Ge} % ${K(A,Be)})`)}return he[xe]=`fn ${xe}(outputIndices: ${ne.type.indices}) -> u32 {\n return ${Ke.length>0?Ke.join("+"):"0u"};\n }`,`${xe}(${G})`},se=(G,ne)=>(()=>{if(w.storage===w.value)return`${e}[${G}]=${ne};`;if(w.storage==="vec2"&&w.value==="i32")return`${e}[${G}]=vec2(u32(${ne}), select(0u, 0xFFFFFFFFu, ${ne} < 0));`;if(w.storage==="vec2"&&w.value==="u32")return`${e}[${G}]=vec2(u32(${ne}), 0u);`;if(w.storage==="u32"&&w.value==="vec4")return`${e}[${G}]=dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(${ne}));`;throw new Error(`not supported combination of storage type ${w.storage} and value type ${w.value} yet`)})(),Ce=G=>(()=>{if(w.storage===w.value)return`${e}[${G}]`;if(w.storage==="vec2"&&w.value==="i32")return`i32(${e}[${G}].x)`;if(w.storage==="vec2"&&w.value==="u32")return`u32(${e}[${G}].x)`;if(w.storage==="u32"&&w.value==="vec4")return`vec4(bool(${e}[${G}] & 0xFFu), bool(${e}[${G}] & 0xFF00u), bool(${e}[${G}] & 0xFF0000u), bool(${e}[${G}] & 0xFF000000u))`;throw new Error(`not supported combination of storage type ${w.storage} and value type ${w.value} yet`)})(),We=a<2?"":`\n fn get_${e}ByIndices(indices: ${w.indices}) -> ${d} {\n return ${Ce(`i2o_${e}(indices)`)};\n }`,ee=a<2?"":(()=>{let G=c.map(xe=>`d${xe}: u32`).join(", "),ne=c.map(xe=>`d${xe}`).join(", ");return`\n fn get_${e}(${G}) -> ${d} {\n return get_${e}ByIndices(${N(ne)});\n }`})(),ae=(...G)=>{if(G.length!==a)throw new Error(`indices length must be ${a}`);let ne=G.map(_).join(",");return a===0?Ce("0u"):a===1?Ce(ne[0]):(v.get=!0,v.getByIndices=!0,v.indicesToOffset=!0,`get_${e}(${ne})`)},Ae=G=>a<2?Ce(G):(v.getByIndices=!0,v.indicesToOffset=!0,`get_${e}ByIndices(${G})`),me=a<2?"":`\n fn set_${e}ByIndices(indices: ${w.indices}, value: ${d}) {\n ${se(`i2o_${e}(indices)`,"value")}\n }`,ie=a<2?"":(()=>{let G=c.map(xe=>`d${xe}: u32`).join(", "),ne=c.map(xe=>`d${xe}`).join(", ");return`\n fn set_${e}(${G}, value: ${d}) {\n set_${e}ByIndices(${N(ne)}, value);\n }`})();return{impl:()=>{let G=[],ne=!1;return v.offsetToIndices&&(G.push(E),ne=!0),v.indicesToOffset&&(G.push(R),ne=!0),v.broadcastedIndicesToOffset&&(Object.values(he).forEach(xe=>G.push(xe)),ne=!0),v.set&&(G.push(ie),ne=!0),v.setByIndices&&(G.push(me),ne=!0),v.get&&(G.push(ee),ne=!0),v.getByIndices&&(G.push(We),ne=!0),!u&&ne&&G.unshift(`const ${A} = ${w.indices}(${r.join(",")});`,`const ${I} = ${w.indices}(${M.computeStrides(r).join(",")});`),G.join(`\n`)},type:w,offsetToIndices:P,indicesToOffset:L,broadcastedIndicesToOffset:W,indices:N,indicesGet:K,indicesSet:Q,set:(...G)=>{if(G.length!==a+1)throw new Error(`indices length must be ${a}`);let ne=G[a];if(typeof ne!="string")throw new Error("value must be string");let xe=G.slice(0,a).map(_).join(",");return a===0?se("0u",ne):a===1?se(xe[0],ne):(v.set=!0,v.setByIndices=!0,v.indicesToOffset=!0,`set_${e}(${xe}, ${ne})`)},setByOffset:se,setByIndices:(G,ne)=>a<2?se(G,ne):(v.setByIndices=!0,v.indicesToOffset=!0,`set_${e}ByIndices(${G}, ${ne});`),get:ae,getByOffset:Ce,getByIndices:Ae,usage:o,name:e,strides:I,shape:A,rank:a}},U=(e,t,r,o=1)=>Eo(e,t,r,"input",o),j=(e,t,r,o=1)=>Eo(e,t,r,"output",o),An=(e,t,r,o=1)=>Eo(e,t,r,"internal",o),Io=class{constructor(t,r){this.normalizedDispatchGroup=t;this.limits=r;this.internalVariables=[];this.variables=[];this.uniforms=[];this.variableIndex=0}guardAgainstOutOfBoundsWorkgroupSizes(t){return`if (global_idx >= ${typeof t=="number"?`${t}u`:t}) { return; }`}mainStart(t=or){let r=typeof t=="number"?t:t[0],o=typeof t=="number"?1:t[1],i=typeof t=="number"?1:t[2];if(r>this.limits.maxComputeWorkgroupSizeX||o>this.limits.maxComputeWorkgroupSizeY||i>this.limits.maxComputeWorkgroupSizeZ)throw new Error(`workgroup size [${r}, ${o}, ${i}] exceeds the maximum workgroup size [${this.limits.maxComputeWorkgroupSizeX}, ${this.limits.maxComputeWorkgroupSizeY}, ${this.limits.maxComputeWorkgroupSizeZ}].`);if(r*o*i>this.limits.maxComputeInvocationsPerWorkgroup)throw new Error(`workgroup size [${r}, ${o}, ${i}] exceeds the maximum workgroup invocations ${this.limits.maxComputeInvocationsPerWorkgroup}.`);let u=this.normalizedDispatchGroup[1]===1&&this.normalizedDispatchGroup[2]===1,a=u?`@builtin(global_invocation_id) global_id : vec3,\n @builtin(workgroup_id) workgroup_id : vec3,\n @builtin(local_invocation_id) local_id : vec3`:`@builtin(global_invocation_id) global_id : vec3,\n @builtin(local_invocation_id) local_id : vec3,\n @builtin(local_invocation_index) local_idx : u32,\n @builtin(workgroup_id) workgroup_id : vec3,\n @builtin(num_workgroups) num_workgroups : vec3`,c=u?"let global_idx = global_id.x; let local_idx = local_id.x;":`let global_idx = (workgroup_id.z * num_workgroups[0] * num_workgroups[1] +\n workgroup_id.y * num_workgroups[0] + workgroup_id.x) * ${r*o*i}u + local_idx;`;return`@compute @workgroup_size(${r}, ${o}, ${i})\n fn main(${a}) {\n ${c}\n `}appendVariableUniforms(t){t.rank!==0&&(t.shape.startsWith("uniforms.")&&this.uniforms.push({name:t.shape.replace("uniforms.",""),type:"u32",length:t.rank}),t.strides.startsWith("uniforms.")&&this.uniforms.push({name:t.strides.replace("uniforms.",""),type:"u32",length:t.rank}))}declareVariable(t,r){if(t.usage==="internal")throw new Error("cannot use internal variable with declareVariable(). use registerInternalVariables() instead.");this.variables.push(t),this.appendVariableUniforms(t);let o=t.usage==="input"?"read":"read_write",i=t.type.storage;return`@group(0) @binding(${r}) var ${t.name}: array<${i}>;`}declareVariables(...t){return t.map(r=>this.declareVariable(r,this.variableIndex++)).join(`\n`)}registerInternalVariable(t){if(t.usage!=="internal")throw new Error("cannot use input or output variable with registerInternalVariable(). use declareVariables() instead.");this.internalVariables.push(t),this.appendVariableUniforms(t)}registerInternalVariables(...t){return t.forEach(r=>this.registerInternalVariable(r)),this}registerUniform(t,r,o=1){return this.uniforms.push({name:t,type:r,length:o}),this}registerUniforms(t){return this.uniforms=this.uniforms.concat(t),this}uniformDeclaration(){if(this.uniforms.length===0)return"";let t=[];for(let{name:r,type:o,length:i}of this.uniforms)if(i&&i>4)o==="f16"?t.push(`@align(16) ${r}:array, ${Math.ceil(i/8)}>`):t.push(`${r}:array, ${Math.ceil(i/4)}>`);else{let u=i==null||i===1?o:`vec${i}<${o}>`;t.push(`${r}:${u}`)}return`\n struct Uniforms { ${t.join(", ")} };\n @group(0) @binding(${this.variableIndex}) var uniforms: Uniforms;`}get additionalImplementations(){return this.uniformDeclaration()+this.variables.map(t=>t.impl()).join(`\n`)+this.internalVariables.map(t=>t.impl()).join(`\n`)}get variablesInfo(){if(this.uniforms.length===0)return;let t=r=>[12,10,1,6][["u32","f16","f32","i32"].indexOf(r)];return this.uniforms.map(r=>[t(r.type),r.length??1])}},va=(e,t)=>new Io(e,t),_r=(e,t)=>{let r=e.length,o=[];for(let i=0;i1&&a===1&&o.unshift(u)}return o}});var Il,$a,Tl,El,yt,_a,Sa,Sr=Y(()=>{"use strict";ye();Se();Ze();_e();Il=e=>{if(!e||e.length!==1)throw new Error("Transpose requires 1 input.")},$a=(e,t)=>t&&t.length!==e?[...new Array(e).keys()].reverse():t,Tl=(e,t)=>M.sortBasedOnPerm(e,$a(e.length,t)),El=(e,t,r,o)=>{let i=[];i.push(`fn perm(i: ${o.type.indices}) -> ${r.type.indices} {\n var a: ${r.type.indices};`);for(let u=0;u{let r=e.dataType,o=e.dims.length,i=$a(o,t),u=Tl(e.dims,i),a=j("output",r,u.length),c=U("a",r,o),p=h=>`\n ${h.registerUniform("output_size","u32").declareVariables(c,a)}\n\n ${El(i,o,c,a)}\n\n ${h.mainStart()}\n ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n\n let indices = ${a.offsetToIndices("global_idx")};\n let aIndices = perm(indices);\n\n ${a.setByOffset("global_idx",c.getByIndices("aIndices"))}\n }`;return{name:"Transpose",shaderCache:{hint:`${t}`,inputDependencies:["rank"]},getRunData:h=>{let d=M.size(u);return{outputs:[{dims:u,dataType:h[0].dataType}],dispatchGroup:{x:Math.ceil(d/64)},programUniforms:[{type:12,data:d},...Z(h[0].dims,u)]}},getShaderSource:p}},_a=(e,t)=>{Il(e.inputs),e.compute(yt(e.inputs[0],t.perm))},Sa=e=>ve({perm:e.perm})});var Pl,kl,Ol,Rl,Bl,Dl,zl,Ml,Ul,Vl,Tt,xa,Ca,Aa,Ia,Ta,Ea,Pa,ka,Oa,Ra,Ba=Y(()=>{"use strict";ye();Se();_e();In();Sr();Pl={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate * candidate",logSumExp:"bestValue + exp(candidate)",l1:"bestValue + abs(candidate)",l2:"bestValue + candidate * candidate",logSum:"bestValue + candidate"},kl={max:"select(bestValue, candidate, candidate > bestValue)",min:"select(bestValue, candidate, candidate < bestValue)",mean:"bestValue + candidate",sum:"bestValue + candidate",prod:"bestValue * candidate",sumSquare:"bestValue + candidate",logSumExp:"bestValue + candidate",l1:"bestValue + candidate",l2:"bestValue + candidate",logSum:"bestValue + candidate"},Ol={max:"_A[offset]",min:"_A[offset]",mean:"0",sum:"0",prod:"1",sumSquare:"0",logSumExp:"0",l1:"0",l2:"0",logSum:"0"},Rl={max:"bestValue",min:"bestValue",sum:"bestValue",prod:"bestValue",sumSquare:"bestValue",logSumExp:"log(bestValue)",l1:"bestValue",l2:"sqrt(bestValue)",logSum:"log(bestValue)"},Bl=(e,t)=>{let r=[];for(let o=t-e;o{let r=[],o=e.length;for(let u=0;ue[u]);return[r,i]},zl=(e,t)=>{let r=e.length+t.length,o=[],i=0;for(let u=0;u{for(let r=0;r{let r=[];if(!Ml(e,t)){for(let o=0;or.push(o))}return r},Vl=(e,t,r,o,i,u,a)=>{let c=r[0].dims,p=M.size(u),h=M.size(a),d=U("_A",r[0].dataType,c),y=j("output",i,u),w=32,_=`\n var aBestValues : array;\n `;return{name:e,shaderCache:t,getShaderSource:S=>`\n ${S.registerUniform("reduceSize","u32").declareVariables(d,y)}\n ${_}\n fn DIV_CEIL(a : u32, b : u32) -> u32 {\n return ((a - 1u) / b + 1u);\n }\n ${S.mainStart(w)}\n\n let outputIndex = global_idx / ${w};\n let offset = outputIndex * uniforms.reduceSize;\n\n var bestValue = f32(${Ol[o]});\n let Length = uniforms.reduceSize;\n for (var k = local_idx; k < Length; k = k + ${w}) {\n let candidate = f32(${d.getByOffset("offset + k")});\n bestValue = ${Pl[o]};\n }\n aBestValues[local_idx] = bestValue;\n workgroupBarrier();\n\n var reduceSize = min(Length, ${w}u);\n for (var currentSize = reduceSize / 2u; reduceSize > 1u;\n currentSize = reduceSize / 2u) {\n let interval = DIV_CEIL(reduceSize, 2u);\n if (local_idx < currentSize) {\n let candidate = aBestValues[local_idx + interval];\n bestValue = ${kl[o]};\n aBestValues[local_idx] = bestValue;\n }\n reduceSize = interval;\n workgroupBarrier();\n }\n\n if (local_idx == 0u) {\n ${y.setByOffset("outputIndex",`${o==="mean"?`${y.type.storage}(bestValue / f32(uniforms.reduceSize))`:`${y.type.storage}(${Rl[o]})`}`)};\n }\n }`,getRunData:()=>({outputs:[{dims:u,dataType:i}],dispatchGroup:{x:p},programUniforms:[{type:12,data:h}]})}},Tt=(e,t,r,o)=>{let i=e.inputs.length===1?r:Po(e.inputs,r),u=i.axes;u.length===0&&!i.noopWithEmptyAxes&&(u=e.inputs[0].dims.map((_,v)=>v));let a=M.normalizeAxes(u,e.inputs[0].dims.length),c=a,p=e.inputs[0],h=Ul(c,e.inputs[0].dims.length);h.length>0&&(p=e.compute(yt(e.inputs[0],h),{inputs:[0],outputs:[-1]})[0],c=Bl(c.length,p.dims.length));let[d,y]=Dl(p.dims,c),w=d;i.keepDims&&(w=zl(d,a)),e.compute(Vl(t,{hint:i.cacheKey,inputDependencies:["type"]},[p],o,e.inputs[0].dataType,w,y),{inputs:[p]})},xa=(e,t)=>{Tt(e,"ReduceMeanShared",t,"mean")},Ca=(e,t)=>{Tt(e,"ReduceL1Shared",t,"l1")},Aa=(e,t)=>{Tt(e,"ReduceL2Shared",t,"l2")},Ia=(e,t)=>{Tt(e,"ReduceLogSumExpShared",t,"logSumExp")},Ta=(e,t)=>{Tt(e,"ReduceMaxShared",t,"max")},Ea=(e,t)=>{Tt(e,"ReduceMinShared",t,"min")},Pa=(e,t)=>{Tt(e,"ReduceProdShared",t,"prod")},ka=(e,t)=>{Tt(e,"ReduceSumShared",t,"sum")},Oa=(e,t)=>{Tt(e,"ReduceSumSquareShared",t,"sumSquare")},Ra=(e,t)=>{Tt(e,"ReduceLogSumShared",t,"logSum")}});var Et,Wl,Tn,Po,Pt,Nl,Gl,Hl,Ll,Fl,ql,jl,Kl,Yl,Zl,kt,Da,za,Ma,Ua,Va,Wa,Na,Ga,Ha,La,In=Y(()=>{"use strict";ye();Se();Ze();_e();Ba();Et=e=>{if(!e||e.length===0||e.length>2)throw new Error("Reduce op requires 1 or 2 inputs.");if(e.length===2&&e[1].dims.length!==1)throw new Error("Invalid axes input dims.")},Wl=e=>["","",`var value = ${e.getByIndices("input_indices")};`,""],Tn=(e,t,r,o,i,u,a=!1,c=!1)=>{let p=[],h=r[0].dims,d=h.length,y=M.normalizeAxes(i,d),w=!c&&y.length===0;h.forEach((A,I)=>{w||y.indexOf(I)>=0?a&&p.push(1):p.push(A)});let _=p.length,v=M.size(p);return{name:e,shaderCache:t,getShaderSource:A=>{let I=[],x=U("_A",r[0].dataType,d),E=j("output",u,_),P=o(x,E,y),O=P[2];for(let R=0,L=0;R=0?(a&&L++,O=`for(var j${R}: u32 = 0; j${R} < ${h[R]}; j${R}++) {\n ${P[2].includes("last_index")?`let last_index = j${R};`:""}\n ${x.indicesSet("input_indices",R,`j${R}`)}\n ${O}\n }`):(I.push(`${x.indicesSet("input_indices",R,E.indicesGet("output_indices",L))};`),L++);return`\n\n ${A.registerUniform("output_size","u32").declareVariables(x,E)}\n\n ${A.mainStart()}\n ${A.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n var input_indices: ${x.type.indices};\n let output_indices = ${E.offsetToIndices("global_idx")};\n\n ${I.join(`\n`)}\n ${P[0]} // init ops for reduce max/min\n ${P[1]}\n ${O}\n ${P[3]}\n ${P.length===4?E.setByOffset("global_idx","value"):P.slice(4).join(`\n`)}\n }`},getRunData:()=>({outputs:[{dims:p,dataType:u}],dispatchGroup:{x:Math.ceil(v/64)},programUniforms:[{type:12,data:v},...Z(h,p)]})}},Po=(e,t)=>{let r=[];return e[1].dims[0]>0&&e[1].getBigInt64Array().forEach(o=>r.push(Number(o))),ve({axes:r,keepDims:t.keepDims,noopWithEmptyAxes:t.noopWithEmptyAxes})},Pt=(e,t,r,o)=>{let i=e.inputs,u=i.length===1?r:Po(i,r);e.compute(Tn(t,{hint:u.cacheKey,inputDependencies:["rank"]},[i[0]],u.noopWithEmptyAxes&&u.axes.length===0?Wl:o,u.axes,i[0].dataType,u.keepDims,u.noopWithEmptyAxes),{inputs:[0]})},Nl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceLogSum",t,(o,i)=>[`var value = ${i.type.storage}(0);`,"",`value += ${o.getByIndices("input_indices")};`,"value = log(value);"])},Gl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceL1",t,(o,i)=>[`var value = ${i.type.storage}(0);`,"",`value += abs(${o.getByIndices("input_indices")});`,""])},Hl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceL2",t,(o,i)=>[`var t = ${i.type.value}(0); var value = ${i.type.value}(0);`,"",`t = ${o.getByIndices("input_indices")}; value += (t * t);`,"value = sqrt(value);"])},Ll=(e,t)=>{Et(e.inputs),Pt(e,"ReduceLogSumExp",t,(o,i)=>[`var value = ${i.type.storage}(0);`,"",`value += exp(${o.getByIndices("input_indices")});`,"value = log(value);"])},Fl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceMax",t,(o,i,u)=>{let a=[];for(let c=0;c=0||u.length===0)&&a.push(o.indicesSet("input_indices",c,0));return[`${a.join(`\n`)}`,`var value = ${o.getByIndices("input_indices")};`,`value = max(value, ${o.getByIndices("input_indices")});`,""]})},ql=(e,t)=>{Et(e.inputs),Pt(e,"ReduceMean",t,(o,i,u)=>{let a=1;for(let c=0;c=0||u.length===0)&&(a*=e.inputs[0].dims[c]);return["var sum = f32(0);","",`sum += f32(${o.getByIndices("input_indices")});`,`let value = ${i.type.value}(sum / ${a});`]})},jl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceMin",t,(o,i,u)=>{let a=[];for(let c=0;c=0||u.length===0)&&a.push(`input_indices[${c}] = 0;`);return[`${a.join(`\n`)}`,`var value = ${o.getByIndices("input_indices")};`,`value = min(value, ${o.getByIndices("input_indices")});`,""]})},Kl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceProd",t,(o,i)=>[`var value = ${i.type.storage}(1);`,"",`value *= ${o.getByIndices("input_indices")};`,""])},Yl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceSum",t,(o,i)=>[`var value = ${i.type.storage}(0);`,"",`value += ${o.getByIndices("input_indices")};`,""])},Zl=(e,t)=>{Et(e.inputs),Pt(e,"ReduceSumSquare",t,(o,i)=>[`var t = ${i.type.value}(0); var value = ${i.type.value}(0);`,"",`t = ${o.getByIndices("input_indices")}; value += t * t;`,""])},kt=(e,t,r)=>{if(t.length===0)return r;let o=1,i=1;for(let u=0;u1024},Da=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?ql(e,t):xa(e,t)},za=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Gl(e,t):Ca(e,t)},Ma=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Hl(e,t):Aa(e,t)},Ua=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Ll(e,t):Ia(e,t)},Va=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Fl(e,t):Ta(e,t)},Wa=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?jl(e,t):Ea(e,t)},Na=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Kl(e,t):Pa(e,t)},Ga=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Yl(e,t):ka(e,t)},Ha=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Zl(e,t):Oa(e,t)},La=(e,t)=>{kt(e.inputs[0].dims,t.axes,t.noopWithEmptyAxes)?Nl(e,t):Ra(e,t)}});var Fa,qa,ja,ko,Ka=Y(()=>{"use strict";ye();Ze();In();Fa=e=>{if(!e||e.length===0||e.length>2)throw new Error("ArgMinMaxOp op requires 1 or 2 inputs.");if(e[0].dataType!==1)throw new Error("Invalid input type.")},qa=(e,t)=>{Fa(e.inputs);let r=(o,i,u)=>{let a=[];for(let c=0;c=0||u.length===0)&&a.push(`input_indices[${c}] = 0;`);return[`${a.join(`\n`)}`,`var value = ${o.getByIndices("input_indices")};\nvar best_index : i32 = 0;`,`if (${o.getByIndices("input_indices")} ${t.selectLastIndex>0?"<=":"<"} value) {\n value = ${o.getByIndices("input_indices")};\n best_index = i32(last_index);\n }`,"",i.setByOffset("global_idx","best_index")]};e.compute(Tn("ArgMin",{hint:t.cacheKey,inputDependencies:["rank"]},[e.inputs[0]],r,[t.axis],7,t.keepDims),{inputs:[0]})},ja=(e,t)=>{Fa(e.inputs);let r=(o,i,u)=>{let a=[];for(let c=0;c=0||u.length===0)&&a.push(`input_indices[${c}] = 0;`);return[`${a.join(`\n`)}`,`var value = ${o.getByIndices("input_indices")};\nvar best_index : i32 = 0;`,`if (${o.getByIndices("input_indices")} ${t.selectLastIndex>0?">=":">"} value) {\n value = ${o.getByIndices("input_indices")};\n best_index = i32(last_index);\n }`,"",i.setByOffset("global_idx","best_index")]};e.compute(Tn("argMax",{hint:t.cacheKey,inputDependencies:["rank"]},[e.inputs[0]],r,[t.axis],7,t.keepDims),{inputs:[0]})},ko=e=>ve(e)});var Xl,Ql,Jl,En,Ya,Za,Oo=Y(()=>{"use strict";ye();Se();Ze();_e();Xl=(e,t)=>{if(!e||e.length<1)throw new Error("too few inputs");let r=0,o=e[r],i=o.dataType,u=o.dims.length;e.forEach((a,c)=>{if(c!==r){if(a.dataType!==i)throw new Error("input tensors should be one type");if(a.dims.length!==u)throw new Error("input tensors should have the same shape");a.dims.forEach((p,h)=>{if(h!==t&&p!==o.dims[h])throw new Error("non concat dimensions must match")})}})},Ql=(e,t)=>`\n fn calculateInputIndex(index: u32) -> u32 {\n let sizeInConcatAxis = array(${t});\n for (var i: u32 = 0u; i < ${e}; i += 1u ) {\n if (index < sizeInConcatAxis[i]) {\n return i;\n }\n }\n return ${e}u;\n }`,Jl=(e,t)=>{let r=e.length,o=[];for(let i=0;i{let i=M.size(r),u=new Array(e.length),a=new Array(e.length),c=0,p=[],h=[],d=[{type:12,data:i}];for(let S=0;S`uniforms.sizeInConcatAxis${S}`).join(","),v=S=>`\n\n ${(()=>{S.registerUniform("outputSize","u32");for(let A=0;A(${_});\n ${w} -= sizeInConcatAxis[inputIndex - 1u];\n }\n\n ${Jl(a,y)}\n }`;return{name:"Concat",shaderCache:{hint:`${t}`,inputDependencies:p},getRunData:()=>({outputs:[{dims:r,dataType:o}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:d}),getShaderSource:v}},Ya=(e,t)=>{let r=e.inputs,o=r[0].dims,i=M.normalizeAxis(t.axis,o.length);Xl(r,i);let u=o.slice();u[i]=r.reduce((c,p)=>c+(p.dims.length>i?p.dims[i]:0),0);let a=r.filter(c=>M.size(c.dims)>0);e.compute(En(a,i,u,r[0].dataType),{inputs:a})},Za=e=>ve({axis:e.axis})});var ec,tc,rc,nc,Pn,oc,Xa,Ro=Y(()=>{"use strict";ye();_n();_e();Oo();ec=(e,t)=>{let r=e[0],o=e[1],i=e[2],u=e[3],a=e[4],c=e[5];if(a&&c)throw new Error("Attention cannot have both past and relative_position_bias");if(r.dims.length!==3)throw new Error(\'Input "input" must have 3 dimensions\');let p=r.dims[0],h=r.dims[1],d=r.dims[2];if(i.dims.length!==1)throw new Error(\'Input "bias" is expected to have 1 dimensions\');if(o.dims.length!==2)throw new Error(\'Input "weights" is expected to have 2 dimensions\');if(o.dims[0]!==d)throw new Error("Input 1 dimension 0 should have same length as dimension 2 of input 0");if(i.dims[0]!==o.dims[1])throw new Error(\'Input "bias" dimension 0 should have same length as dimension 1 of input "weights"\');let y=i.dims[0]/3,w=y,_=w;if(t.qkvHiddenSizes.length>0){if(t.qkvHiddenSizes.length!==3)throw new Error("qkv_hidden_sizes attribute should have 3 elements");for(let E of t.qkvHiddenSizes)if(E%t.numHeads!==0)throw new Error("qkv_hidden_sizes should be divisible by num_heads");y=t.qkvHiddenSizes[0],w=t.qkvHiddenSizes[1],_=t.qkvHiddenSizes[2]}let v=h;if(y!==w)throw new Error("qkv_hidden_sizes first element should be same as the second");if(i.dims[0]!==y+w+_)throw new Error(\'Input "bias" dimension 0 should have same length as sum of Q/K/V hidden sizes\');let S=0;if(a){if(w!==_)throw new Error(\'Input "past" expect k_hidden_size == v_hidden_size\');if(a.dims.length!==5)throw new Error(\'Input "past" must have 5 dimensions\');if(a.dims[0]!==2)throw new Error(\'Input "past" first dimension must be 2\');if(a.dims[1]!==p)throw new Error(\'Input "past" second dimension must be batch_size\');if(a.dims[2]!==t.numHeads)throw new Error(\'Input "past" third dimension must be num_heads\');if(a.dims[4]!==w/t.numHeads)throw new Error(\'Input "past" fifth dimension must be k_hidden_size / num_heads\');t.pastPresentShareBuffer||(S=a.dims[3])}let A=v+S,I=-1,x=0;if(u)throw new Error("Mask not supported");if(a)throw new Error("past is not supported");return{batchSize:p,sequenceLength:h,pastSequenceLength:S,kvSequenceLength:v,totalSequenceLength:A,maxSequenceLength:I,inputHiddenSize:d,hiddenSize:y,vHiddenSize:_,headSize:Math.floor(y/t.numHeads),vHeadSize:Math.floor(_/t.numHeads),numHeads:t.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:t.maskFilterValue,maskType:x,scale:t.scale,broadcastResPosBias:!1,passPastInKv:!1,qkvFormat:1}},tc=(e,t,r,o)=>{let i=Me(o),u=64,a=o/i;a{let _=j("x",t.dataType,t.dims,i),S=[{name:"d_inv",type:et(t.dataType)},{name:"d_comp",type:"u32"},{name:"elements_per_thread",type:"u32"}];return`\n var thread_max: array;\n var thread_sum: array;\n ${w.registerUniforms(S).declareVariables(_)}\n ${w.mainStart([u,1,1])}\n let local_offset = local_idx * uniforms.elements_per_thread;\n let offset = workgroup_id.x * uniforms.d_comp + local_offset;\n\n var thread_max_vector = ${d}(-3.402823e+38f);\n for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) {\n thread_max_vector = max(${d}(x[offset + i]), thread_max_vector);\n }\n thread_max[local_idx] = ${(()=>{switch(i){case 1:return"thread_max_vector";case 2:return"max(thread_max_vector.x, thread_max_vector.y)";case 4:return"max(max(thread_max_vector.x, thread_max_vector.y), max(thread_max_vector.z, thread_max_vector.w))";default:throw new Error(`Unsupported components: ${i}`)}})()};\n workgroupBarrier();\n\n var max_value = f32(-3.402823e+38f);\n for (var i = 0u; i < ${u}; i++) {\n max_value = max(thread_max[i], max_value);\n }\n\n var sum_vector = ${d}(0);\n for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) {\n sum_vector += exp(${d}(x[offset + i]) - max_value);\n }\n thread_sum[local_idx] = ${(()=>{switch(i){case 1:return"sum_vector";case 2:return"sum_vector.x + sum_vector.y";case 4:return"sum_vector.x + sum_vector.y + sum_vector.z + sum_vector.w";default:throw new Error(`Unsupported components: ${i}`)}})()};\n workgroupBarrier();\n\n var sum: f32 = 0;\n for (var i = 0u; i < ${u}; i++) {\n sum += thread_sum[i];\n }\n\n if (sum == 0) {\n for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) {\n x[offset + i] = ${_.type.value}(uniforms.d_inv);\n }\n } else {\n for (var i: u32 = 0; i < uniforms.elements_per_thread && i + local_offset < uniforms.d_comp; i++) {\n var f32input = ${d}(x[offset + i]);\n x[offset + i] = ${_.type.value}(exp(f32input - max_value) / sum);\n }\n }\n }`};return{name:"AttentionProbsSoftmax",shaderCache:{hint:`${u};${h};${i}`},getShaderSource:y,getRunData:()=>({outputs:[],dispatchGroup:{x:r},programUniforms:p})}},rc=(e,t,r,o,i,u,a)=>{let c=a+i.kvSequenceLength,p=[i.batchSize,i.numHeads,i.sequenceLength,c],h=u.scale===0?1/Math.sqrt(i.headSize):u.scale,d=Me(i.headSize),y=i.headSize/d,w=12,_={x:Math.ceil(c/w),y:Math.ceil(i.sequenceLength/w),z:i.batchSize*i.numHeads},v=[{type:12,data:i.sequenceLength},{type:12,data:y},{type:12,data:c},{type:12,data:i.numHeads},{type:1,data:h}],S=o?["type","type","type"]:["type","type"],A=I=>{let x=U("q",t.dataType,t.dims,d),E=U("key",r.dataType,r.dims,d),P=[x,E];o&&P.push(U("relative_position_bias",o.dataType,o.dims));let O=j("output",t.dataType,p),R=et(1,d),L=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"alpha",type:"f32"}];return`\n const TILE_SIZE = ${w}u;\n\n var tileQ: array<${x.type.storage}, ${w*w}>;\n var tileK: array<${x.type.storage}, ${w*w}>;\n ${I.registerUniforms(L).declareVariables(...P,O)}\n ${I.mainStart([w,w,1])}\n // x holds the N and y holds the M\n let headIdx = workgroup_id.z;\n let m = workgroup_id.y * TILE_SIZE;\n let n = workgroup_id.x * TILE_SIZE;\n let qOffset = uniforms.M * uniforms.K * headIdx + m * uniforms.K;\n let kOffset = uniforms.N * uniforms.K * headIdx + n * uniforms.K;\n\n var value = ${R}(0);\n for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) {\n if (global_id.y < uniforms.M && w + local_id.x < uniforms.K) {\n tileQ[TILE_SIZE * local_id.y + local_id.x] = q[qOffset + local_id.y * uniforms.K + w + local_id.x];\n }\n if (n + local_id.y < uniforms.N && w + local_id.x < uniforms.K) {\n tileK[TILE_SIZE * local_id.y + local_id.x] = key[kOffset + local_id.y * uniforms.K + w + local_id.x];\n }\n workgroupBarrier();\n\n for (var k: u32 = 0u; k < TILE_SIZE && w+k < uniforms.K; k++) {\n value += ${R}(tileQ[TILE_SIZE * local_id.y + k] * tileK[TILE_SIZE * local_id.x + k]);\n }\n\n workgroupBarrier();\n }\n\n let headOffset = headIdx * uniforms.M * uniforms.N;\n if (global_id.y < uniforms.M && global_id.x < uniforms.N) {\n let outputIdx = headOffset + global_id.y * uniforms.N + global_id.x;\n var sum: f32 = ${(()=>{switch(d){case 1:return"value";case 2:return"value.x + value.y";case 4:return"value.x + value.y + value.z + value.w";default:throw new Error(`Unsupported components: ${d}`)}})()};\n output[outputIdx] = ${O.type.value} (sum * uniforms.alpha) + ${o?"relative_position_bias[outputIdx]":"0.0"};\n }\n }`};return{name:"AttentionProbs",shaderCache:{hint:`${d}`,inputDependencies:S},getRunData:()=>({outputs:[{dims:p,dataType:t.dataType,gpuDataType:0}],dispatchGroup:_,programUniforms:v}),getShaderSource:A}},nc=(e,t,r,o,i)=>{let u=i+o.kvSequenceLength,a=[o.batchSize,o.sequenceLength,o.vHiddenSize],c=12,p={x:Math.ceil(o.vHeadSize/c),y:Math.ceil(o.sequenceLength/c),z:o.batchSize*o.numHeads},h=[{type:12,data:o.sequenceLength},{type:12,data:u},{type:12,data:o.vHeadSize},{type:12,data:o.numHeads},{type:12,data:o.vHiddenSize}];return{name:"AttentionScore",shaderCache:{inputDependencies:["type","type"]},getRunData:()=>({outputs:[{dims:a,dataType:t.dataType,gpuDataType:0}],dispatchGroup:p,programUniforms:h}),getShaderSource:w=>{let _=U("probs",t.dataType,t.dims),v=U("v",r.dataType,r.dims),S=j("output",t.dataType,a),A=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"v_hidden_size",type:"u32"}];return`\n const TILE_SIZE = ${c}u;\n var tileQ: array<${_.type.value}, ${c*c}>;\n var tileK: array<${_.type.value}, ${c*c}>;\n ${w.registerUniforms(A).declareVariables(_,v,S)}\n ${w.mainStart([c,c,1])}\n let headIdx = workgroup_id.z;\n let m = global_id.y;\n let n = global_id.x;\n\n let offsetA = headIdx * (uniforms.M * uniforms.K) + m * uniforms.K;\n let offsetB = headIdx * (uniforms.N * uniforms.K) + n;\n\n var value = ${_.type.storage}(0);\n for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) {\n if (m < uniforms.M && w + local_id.x < uniforms.K) {\n tileQ[TILE_SIZE * local_id.y + local_id.x] = probs[offsetA + w + local_id.x];\n }\n if (n < uniforms.N && w + local_id.y < uniforms.K) {\n tileK[TILE_SIZE * local_id.y + local_id.x] = v[offsetB + (w + local_id.y) * uniforms.N];\n }\n workgroupBarrier();\n for (var k: u32 = 0u; k < TILE_SIZE && w+k < uniforms.K; k++) {\n value += tileQ[TILE_SIZE * local_id.y + k] * tileK[TILE_SIZE * k + local_id.x];\n }\n workgroupBarrier();\n }\n\n // we need to transpose output from BNSH_v to BSND_v\n let batchIdx = workgroup_id.z / uniforms.num_heads;\n let currentBatchHeadNumber = workgroup_id.z % uniforms.num_heads;\n if (m < uniforms.M && n < uniforms.N) {\n let outputIdx = batchIdx * uniforms.M * uniforms.v_hidden_size + m * uniforms.v_hidden_size\n + currentBatchHeadNumber * uniforms.N + n;\n output[outputIdx] = value;\n }\n }`}}},Pn=(e,t,r,o,i,u,a,c,p,h,d)=>{let y=e.outputCount>1,w=e.outputCount>2,_=y&&w?h.pastSequenceLength:0,v=_+h.kvSequenceLength,S=[h.batchSize,h.numHeads,v,h.headSize],A=a?[a,r]:[r],I=y?e.compute(En(A,2,S,r.dataType),{inputs:A,outputs:[1]})[0]:r,x=[h.batchSize,h.numHeads,v,h.headSize],E=c?[c,o]:[o],P=w?e.compute(En(E,2,x,o.dataType),{inputs:E,outputs:[2]})[0]:o,O=[t,I];p&&O.push(p);let R=e.compute(rc(e,t,I,p,h,d,_),{inputs:O,outputs:[-1]})[0];e.compute(tc(e,R,h.batchSize*h.numHeads*h.sequenceLength,v),{inputs:[R],outputs:[]});let L=[R,P];e.compute(nc(e,R,P,h,_),{inputs:L,outputs:[0]})},oc=(e,t)=>{let r=[t.batchSize,t.numHeads,t.sequenceLength,t.headSize],o=t.sequenceLength,i=t.inputHiddenSize,u=t.headSize,a=12,c={x:Math.ceil(t.headSize/a),y:Math.ceil(t.sequenceLength/a),z:t.batchSize*t.numHeads},p=[e.inputs[0],e.inputs[1],e.inputs[2]],h=[{type:12,data:o},{type:12,data:i},{type:12,data:u},{type:12,data:t.numHeads},{type:12,data:t.headSize},{type:12,data:t.hiddenSize},{type:12,data:t.hiddenSize+t.hiddenSize+t.vHiddenSize}],d=y=>{let w=j("output_q",p[0].dataType,r),_=j("output_k",p[0].dataType,r),v=j("output_v",p[0].dataType,r),S=U("input",p[0].dataType,p[0].dims),A=U("weight",p[1].dataType,p[1].dims),I=U("bias",p[2].dataType,p[2].dims),x=S.type.storage,E=[{name:"M",type:"u32"},{name:"K",type:"u32"},{name:"N",type:"u32"},{name:"num_heads",type:"u32"},{name:"head_size",type:"u32"},{name:"hidden_size",type:"u32"},{name:"ldb",type:"u32"}];return`\n const TILE_SIZE = ${a}u;\n var tileInput: array<${x}, ${a*a}>;\n var tileWeightQ: array<${x}, ${a*a}>;\n var tileWeightK: array<${x}, ${a*a}>;\n var tileWeightV: array<${x}, ${a*a}>;\n ${y.registerUniforms(E).declareVariables(S,A,I,w,_,v)}\n ${y.mainStart([a,a,1])}\n let batchIndex = workgroup_id.z / uniforms.num_heads;\n let headNumber = workgroup_id.z % uniforms.num_heads;\n let m = global_id.y;\n let n = global_id.x;\n\n let inputOffset = batchIndex * (uniforms.M * uniforms.K) + m * uniforms.K;\n let biasOffsetQ = headNumber * uniforms.head_size;\n let biasOffsetK = uniforms.hidden_size + biasOffsetQ;\n let biasOffsetV = uniforms.hidden_size + biasOffsetK;\n\n var valueQ = ${x}(0);\n var valueK = ${x}(0);\n var valueV = ${x}(0);\n for (var w: u32 = 0u; w < uniforms.K; w += TILE_SIZE) {\n if (m < uniforms.M && w + local_id.x < uniforms.K) {\n tileInput[TILE_SIZE * local_id.y + local_id.x] = input[inputOffset + w + local_id.x];\n }\n if (n < uniforms.N && w + local_id.y < uniforms.K) {\n let offset = n + (w + local_id.y) * uniforms.ldb;\n tileWeightQ[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetQ + offset];\n tileWeightK[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetK + offset];\n tileWeightV[TILE_SIZE * local_id.y + local_id.x] = weight[biasOffsetV + offset];\n }\n workgroupBarrier();\n for (var k: u32 = 0u; k({outputs:[{dims:r,dataType:e.inputs[0].dataType,gpuDataType:0},{dims:r,dataType:e.inputs[0].dataType,gpuDataType:0},{dims:r,dataType:e.inputs[0].dataType,gpuDataType:0}],dispatchGroup:c,programUniforms:h}),getShaderSource:d},{inputs:p,outputs:[-1,-1,-1]})},Xa=(e,t)=>{let r=ec(e.inputs,t),[o,i,u]=oc(e,r);return Pn(e,o,i,u,e.inputs[4],void 0,void 0,void 0,e.inputs[5],r,t)}});var ic,ac,sc,Qa,Ja=Y(()=>{"use strict";$r();ye();Se();Ze();_e();ic=(e,t)=>{if(!e||e.length!==5)throw new Error("BatchNormalization requires 5 inputs");let r=(o,i,u)=>{let a=i.length;if(a!==o.length)throw new Error(`${u}: num dimensions != ${a}`);i.forEach((c,p)=>{if(c!==o[p])throw new Error(`${u}: dim[${p}] do not match`)})};if(e[0].dims.length>1){let o=t.format==="NHWC"?t.spatial?e[0].dims.slice(-1):e[0].dims.slice(-1).concat(e[0].dims.slice(1,e[0].dims.length-1)):e[0].dims.slice(1,t.spatial?2:void 0);r(e[1].dims,o,"Invalid input scale"),r(e[2].dims,o,"Invalid input B"),r(e[3].dims,o,"Invalid input mean"),r(e[4].dims,o,"Invalid input var")}else r(e[1].dims,[1],"Invalid input scale"),r(e[2].dims,[1],"Invalid input B"),r(e[3].dims,[1],"Invalid input mean"),r(e[4].dims,[1],"Invalid input var")},ac=(e,t)=>{let{epsilon:r,spatial:o,format:i}=t,u=e[0].dims,a=o?Me(u[u.length-1]):1,c=i==="NHWC"&&u.length>1?a:1,p=M.size(u)/a,h=o,d=h?u.length:u,y=U("x",e[0].dataType,e[0].dims,a),w=U("scale",e[1].dataType,e[1].dims,c),_=U("bias",e[2].dataType,e[2].dims,c),v=U("inputMean",e[3].dataType,e[3].dims,c),S=U("inputVar",e[4].dataType,e[4].dims,c),A=j("y",e[0].dataType,d,a),I=()=>{let E="";if(o)E=`let cOffset = ${u.length===1?"0u":i==="NHWC"?`outputIndices[${u.length-1}] / ${a}`:"outputIndices[1]"};`;else if(i==="NCHW")E=`\n ${A.indicesSet("outputIndices","0","0")}\n let cOffset = ${A.indicesToOffset("outputIndices")};`;else{E=`var cIndices = ${w.type.indices}(0);\n cIndices[0] = outputIndices[${u.length-1}];`;for(let P=1;P`\n const epsilon = ${r};\n ${E.registerUniform("outputSize","u32").declareVariables(y,w,_,v,S,A)}\n ${E.mainStart()}\n ${E.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n var outputIndices = ${A.offsetToIndices(`global_idx * ${a}`)};\n ${I()}\n let scale = ${w.getByOffset("cOffset")};\n let bias = ${_.getByOffset("cOffset")};\n let inputMean = ${v.getByOffset("cOffset")};\n let inputVar = ${S.getByOffset("cOffset")};\n let x = ${y.getByOffset("global_idx")};\n let value = (x - inputMean) * inverseSqrt(inputVar + epsilon) * scale + bias;\n ${A.setByOffset("global_idx","value")}\n }`;return{name:"BatchNormalization",shaderCache:{hint:`${t.epsilon}_${t.format}_${o}_${a}`,inputDependencies:h?["rank","type","type","type","type"]:void 0},getShaderSource:x,getRunData:()=>({outputs:[{dims:e[0].dims,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:h?[{type:12,data:p},...Z(u)]:[{type:12,data:p}]})}},sc=e=>ve(e),Qa=(e,t)=>{let{inputs:r,outputCount:o}=e,i=sc({...t,outputCount:o});if(vr.webgpu.validateInputContent&&ic(r,i),t.trainingMode)throw new Error("BatchNormalization trainingMode is not supported yet.");e.compute(ac(r,i))}});var uc,dc,es,ts=Y(()=>{"use strict";Se();_e();uc=e=>{if(e[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![320,640,1280].includes(e[0].dims[2]))throw new Error("number of channels should be 320, 640 or 1280");if(e[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(e[0].dims[2]!==e[1].dims[0])throw new Error("last dimension of input and bias are not the same")},dc=e=>{let t=e[0].dims,r=e[0].dims[2],o=M.size(t)/4,i=e[0].dataType,u=U("input",i,t,4),a=U("bias",i,[r],4),c=U("residual",i,t,4),p=j("output",i,t,4);return{name:"BiasAdd",getRunData:()=>({outputs:[{dims:t,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(o/64)}}),getShaderSource:d=>`\n const channels = ${r}u / 4;\n ${d.declareVariables(u,a,c,p)}\n\n ${d.mainStart()}\n ${d.guardAgainstOutOfBoundsWorkgroupSizes(o)}\n let value = ${u.getByOffset("global_idx")}\n + ${a.getByOffset("global_idx % channels")} + ${c.getByOffset("global_idx")};\n ${p.setByOffset("global_idx","value")}\n }`}},es=e=>{uc(e.inputs),e.compute(dc(e.inputs))}});var lc,ke,rs,ns,os,is,as,ss,us,ds,ls,cc,cs,ps,ms,fs,kn,hs,On,gs,ys,bs,ws,vs,$s,_s,Ss,xs,Cs,As,Is,Ts,Es,Ps,ks,Os,Rs,Bo,Do,Bs,Ds,zs,Rn=Y(()=>{"use strict";ye();Se();Ze();_e();lc=(e,t,r,o,i,u)=>{let a=Math.ceil(t/4),c="";typeof i=="string"?c=`${i}(a)`:c=i("a");let p=U("inputData",r,[a],4),h=j("outputData",o,[a],4);return`\n ${e.registerUniform("vec_size","u32").declareVariables(p,h)}\n\n ${u??""}\n\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")}\n\n let a = ${p.getByOffset("global_idx")};\n ${h.setByOffset("global_idx",c)}\n }`},ke=(e,t,r,o,i,u=e.dataType)=>({name:t,shaderCache:{hint:i,inputDependencies:["type"]},getShaderSource:a=>lc(a,M.size(e.dims),e.dataType,u,r,o),getRunData:a=>({outputs:[{dims:e.dims,dataType:u}],dispatchGroup:{x:Math.ceil(M.size(a[0].dims)/64/4)},programUniforms:[{type:12,data:Math.ceil(M.size(e.dims)/4)}]})}),rs=e=>{e.compute(ke(e.inputs[0],"Abs","abs"))},ns=e=>{e.compute(ke(e.inputs[0],"Acos","acos"))},os=e=>{e.compute(ke(e.inputs[0],"Acosh","acosh"))},is=e=>{e.compute(ke(e.inputs[0],"Asin","asin"))},as=e=>{e.compute(ke(e.inputs[0],"Asinh","asinh"))},ss=e=>{e.compute(ke(e.inputs[0],"Atan","atan"))},us=e=>{e.compute(ke(e.inputs[0],"Atanh","atanh"))},ds=e=>ve(e),ls=(e,t)=>{let r;switch(t.to){case 10:r="vec4";break;case 1:r="vec4";break;case 12:r="vec4";break;case 6:r="vec4";break;case 9:r="vec4";break;default:throw new RangeError(`not supported type (specified in attribute \'to\' from \'Cast\' operator): ${t.to}`)}e.compute(ke(e.inputs[0],"Cast",r,void 0,t.cacheKey,t.to))},cc=e=>{let t=e.length>=2&&e[1].data!==0?e[1].getFloat32Array()[0]:xn,r=e.length>=3&&e[2].data!==0?e[2].getFloat32Array()[0]:Cn;return ve({min:t,max:r})},cs=(e,t)=>{let r=e.inputs.length===1?t:cc(e.inputs),o=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"Clip",i=>`clamp(${i}, clip_min_, clip_max_)`,`\n const clip_min_: vec4<${o}> = vec4(${o}(${r.min}));\n const clip_max_: vec4<${o}> = vec4(${o}(${r.max}));\n`,r.cacheKey),{inputs:[0]})},ps=e=>{e.compute(ke(e.inputs[0],"Ceil","ceil"))},ms=e=>{e.compute(ke(e.inputs[0],"Cos","cos"))},fs=e=>{e.compute(ke(e.inputs[0],"Cosh","cosh"))},kn=e=>ve(e),hs=(e,t)=>{let r=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"Elu",o=>`elu_vf32(${o})`,`\n const elu_alpha_ = ${r}(${t.alpha});\n\n fn elu_f32(a: ${r}) -> ${r} {\n return select((exp(a) - 1.0) * elu_alpha_, a, a >= 0.0);\n }\n\n fn elu_vf32(v: vec4<${r}>) -> vec4<${r}> {\n return vec4(elu_f32(v.x), elu_f32(v.y), elu_f32(v.z), elu_f32(v.w));\n }`,t.cacheKey))},On=(e="f32")=>`\nconst r0: ${e} = 0.3275911;\nconst r1: ${e} = 0.254829592;\nconst r2: ${e} = -0.284496736;\nconst r3: ${e} = 1.421413741;\nconst r4: ${e} = -1.453152027;\nconst r5: ${e} = 1.061405429;\n\nfn erf_vf32(v: vec4<${e}>) -> vec4<${e}> {\n let absv = abs(v);\n let x = 1.0 / (1.0 + r0 * absv);\n return sign(v) * (1.0 - ((((r5 * x + r4) * x + r3) * x + r2) * x + r1) * x * exp(-absv * absv));\n}`,gs=e=>{let t=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"Erf",r=>`erf_vf32(${r})`,On(t)))},ys=e=>{e.compute(ke(e.inputs[0],"Exp","exp"))},bs=e=>{e.compute(ke(e.inputs[0],"Floor","floor"))},ws=e=>{let t=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"Gelu",r=>`0.5 * ${r} * (1.0 + erf_vf32(${r} * 0.7071067811865475))`,On(t)))},vs=(e,t)=>{let r=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"LeakyRelu",o=>`select(leaky_relu_alpha_ * ${o}, ${o}, ${o} >= vec4<${r}>(0.0))`,`const leaky_relu_alpha_ = ${r}(${t.alpha});`,t.cacheKey))},$s=e=>{e.compute(ke(e.inputs[0],"Not",t=>`!${t}`))},_s=e=>{e.compute(ke(e.inputs[0],"Neg",t=>`-${t}`))},Ss=e=>{e.compute(ke(e.inputs[0],"Reciprocal",t=>`1.0/${t}`))},xs=e=>{let t=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"Relu",r=>`select(vec4<${t}>(0.0), ${r}, ${r} > vec4<${t}>(0.0))`))},Cs=e=>{e.compute(ke(e.inputs[0],"Sigmoid",t=>`(1.0 / (1.0 + exp(-${t})))`))},As=e=>ve(e),Is=(e,t)=>{let r=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"HardSigmoid",o=>`max(vec4<${r}>(0.0), min(vec4<${r}>(1.0), ${t.alpha} * ${o} + vec4<${r}>(${t.beta})))`,void 0,t.cacheKey))},Ts=e=>{e.compute(ke(e.inputs[0],"Sin","sin"))},Es=e=>{e.compute(ke(e.inputs[0],"Sinh","sinh"))},Ps=e=>{e.compute(ke(e.inputs[0],"Sqrt","sqrt"))},ks=e=>{e.compute(ke(e.inputs[0],"Tan","tan"))},Os=e=>`sign(${e}) * (1 - exp(-2 * abs(${e}))) / (1 + exp(-2 * abs(${e})))`,Rs=e=>{e.compute(ke(e.inputs[0],"Tanh",Os))},Bo=(e="f32")=>`\nconst fast_gelu_a: ${e} = 0.5;\nconst fast_gelu_b: ${e} = 0.7978845608028654;\nconst fast_gelu_c: ${e} = 0.035677408136300125;\n\nfn tanh_v(v: vec4<${e}>) -> vec4<${e}> {\n return ${Os("v")};\n}\n`,Do=e=>`(fast_gelu_a + fast_gelu_a * tanh_v(${e} * (fast_gelu_c * ${e} * ${e} + fast_gelu_b))) * ${e}`,Bs=e=>{let t=et(e.inputs[0].dataType);e.compute(ke(e.inputs[0],"FastGelu",Do,Bo(t),void 0,e.inputs[0].dataType))},Ds=(e,t)=>{let r=et(e.inputs[0].dataType);return e.compute(ke(e.inputs[0],"ThresholdedRelu",o=>`select(vec4<${r}>(0.0), ${o}, ${o} > thresholded_relu_alpha_)`,`const thresholded_relu_alpha_ = vec4<${r}>(${t.alpha});`,t.cacheKey)),0},zs=e=>{e.compute(ke(e.inputs[0],"Log","log"))}});var pc,mc,Us,Vs=Y(()=>{"use strict";Se();_e();Rn();pc=e=>{if(e[0].dims.length!==3)throw new Error("input should have 3 dimensions");if(![2560,5120,10240].includes(e[0].dims[2]))throw new Error("hidden state should be 2560, 5120 or 10240");if(e[1].dims.length!==1)throw new Error("bias is expected to have 1 dimensions");if(e[0].dims[2]!==e[1].dims[0])throw new Error("last dimension of input and bias are not the same")},mc=e=>{let t=e[0].dims.slice();t[2]=t[2]/2;let r=U("input",e[0].dataType,e[0].dims,4),o=U("bias",e[0].dataType,[e[0].dims[2]],4),i=j("output",e[0].dataType,t,4),u=M.size(t)/4,a=De(e[0].dataType);return{name:"BiasSplitGelu",getRunData:()=>({outputs:[{dims:t,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(u/64)}}),getShaderSource:p=>`\n const M_SQRT2 = sqrt(2.0);\n const halfChannels = ${e[0].dims[2]/4/2}u;\n\n ${p.declareVariables(r,o,i)}\n\n ${On(a)}\n\n ${p.mainStart()}\n ${p.guardAgainstOutOfBoundsWorkgroupSizes(u)}\n let biasIdx = global_idx % halfChannels;\n let batchIndex = global_idx / halfChannels;\n let inputOffset = biasIdx + batchIndex * halfChannels * 2;\n let valueLeft = input[inputOffset] + bias[biasIdx];\n let valueRight = input[inputOffset + halfChannels] + bias[biasIdx + halfChannels];\n let geluRight = valueRight * 0.5 * (erf_vf32(valueRight / M_SQRT2) + 1);\n\n ${i.setByOffset("global_idx","valueLeft * geluRight")}\n }`}},Us=e=>{pc(e.inputs),e.compute(mc(e.inputs))}});var fc,hc,Ot,Ws,Ns,Gs,Hs,Ls,Fs,qs,js,Ks,Ys,Zs=Y(()=>{"use strict";ye();Se();_e();fc=(e,t,r,o,i,u,a,c,p,h,d,y)=>{let w,_;typeof c=="string"?w=_=(x,E)=>`${c}((${x}),(${E}))`:typeof c=="function"?w=_=c:(w=c.scalar,_=c.vector);let v=j("outputData",d,o.length,4),S=U("aData",p,t.length,4),A=U("bData",h,r.length,4),I;if(i)if(u){let x=M.size(t)===1,E=M.size(r)===1,P=t.length>0&&t[t.length-1]%4===0,O=r.length>0&&r[r.length-1]%4===0;x||E?I=v.setByOffset("global_idx",_(x?`${S.type.value}(${S.getByOffset("0")}.x)`:S.getByOffset("global_idx"),E?`${A.type.value}(${A.getByOffset("0")}.x)`:A.getByOffset("global_idx"))):I=`\n let outputIndices = ${v.offsetToIndices("global_idx * 4u")};\n let offsetA = ${S.broadcastedIndicesToOffset("outputIndices",v)};\n let offsetB = ${A.broadcastedIndicesToOffset("outputIndices",v)};\n ${v.setByOffset("global_idx",_(a||P?S.getByOffset("offsetA / 4u"):`${S.type.value}(${S.getByOffset("offsetA / 4u")}[offsetA % 4u])`,a||O?A.getByOffset("offsetB / 4u"):`${A.type.value}(${A.getByOffset("offsetB / 4u")}[offsetB % 4u])`))}\n `}else I=v.setByOffset("global_idx",_(S.getByOffset("global_idx"),A.getByOffset("global_idx")));else{if(!u)throw new Error("no necessary to use scalar implementation for element-wise binary op implementation.");let x=(E,P,O="")=>{let R=`aData[indexA${P}][componentA${P}]`,L=`bData[indexB${P}][componentB${P}]`;return`\n let outputIndices${P} = ${v.offsetToIndices(`global_idx * 4u + ${P}u`)};\n let offsetA${P} = ${S.broadcastedIndicesToOffset(`outputIndices${P}`,v)};\n let offsetB${P} = ${A.broadcastedIndicesToOffset(`outputIndices${P}`,v)};\n let indexA${P} = offsetA${P} / 4u;\n let indexB${P} = offsetB${P} / 4u;\n let componentA${P} = offsetA${P} % 4u;\n let componentB${P} = offsetB${P} % 4u;\n ${E}[${P}] = ${O}(${w(R,L)});\n `};d===9?I=`\n var data = vec4(0);\n ${x("data",0,"u32")}\n ${x("data",1,"u32")}\n ${x("data",2,"u32")}\n ${x("data",3,"u32")}\n outputData[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:I=`\n ${x("outputData[global_idx]",0)}\n ${x("outputData[global_idx]",1)}\n ${x("outputData[global_idx]",2)}\n ${x("outputData[global_idx]",3)}\n `}return`\n ${e.registerUniform("vec_size","u32").declareVariables(S,A,v)}\n\n ${y??""}\n\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")}\n ${I}\n }`},hc=(e,t,r,o,i,u,a=r.dataType)=>{let c=!M.areEqual(r.dims,o.dims),p=r.dims,h=M.size(r.dims),d=!1,y=!1,w=[c];if(c){let _=It.calcShape(r.dims,o.dims,!1);if(!_)throw new Error("Can\'t perform binary op on the given tensors");p=_,h=M.size(p);let v=M.size(r.dims)===1,S=M.size(o.dims)===1,A=r.dims.length>0&&r.dims[r.dims.length-1]%4===0,I=o.dims.length>0&&o.dims[o.dims.length-1]%4===0;w.push(v),w.push(S),w.push(A),w.push(I);let x=1;for(let E=1;E_.toString()).join("_"),inputDependencies:["rank","rank"]},getShaderSource:_=>fc(_,r.dims,o.dims,p,d,c,y,i,r.dataType,o.dataType,a,u),getRunData:()=>({outputs:[{dims:p,dataType:a}],dispatchGroup:{x:Math.ceil(h/64/4)},programUniforms:[{type:12,data:Math.ceil(M.size(p)/4)},...Z(r.dims,o.dims,p)]})}},Ot=(e,t,r,o,i,u)=>{e.compute(hc(t,i??"",e.inputs[0],e.inputs[1],r,o,u))},Ws=e=>{Ot(e,"Add",(t,r)=>`${t}+${r}`)},Ns=e=>{Ot(e,"Div",(t,r)=>`${t}/${r}`)},Gs=e=>{Ot(e,"Equal",{scalar:(t,r)=>`u32(${t}==${r})`,vector:(t,r)=>`vec4(${t}==${r})`},void 0,void 0,9)},Hs=e=>{Ot(e,"Mul",(t,r)=>`${t}*${r}`)},Ls=e=>{let t=U("input",e.inputs[0].dataType,e.inputs[0].dims).type.value;Ot(e,"Pow",{scalar:(o,i)=>`pow_custom(${o},${i})`,vector:(o,i)=>`pow_vector_custom(${o},${i})`},`\n fn pow_custom(a : ${t}, b : ${t}) -> ${t} {\n if (b == ${t}(0.0)) {\n return ${t}(1.0);\n } else if (a < ${t}(0.0) && f32(b) != floor(f32(b))) {\n return ${t}(pow(f32(a), f32(b))); // NaN\n }\n return select(sign(a), ${t}(1.0), round(f32(abs(b) % ${t}(2.0))) != 1.0) * ${t}(${t==="i32"?"round":""}(pow(f32(abs(a)), f32(b))));\n }\n fn pow_vector_custom(a : vec4<${t}>, b : vec4<${t}>) -> vec4<${t}> {\n // TODO: implement vectorized pow\n return vec4<${t}>(pow_custom(a.x, b.x), pow_custom(a.y, b.y), pow_custom(a.z, b.z), pow_custom(a.w, b.w));\n }\n `)},Fs=e=>{Ot(e,"Sub",(t,r)=>`${t}-${r}`)},qs=e=>{Ot(e,"Greater",{scalar:(t,r)=>`u32(${t}>${r})`,vector:(t,r)=>`vec4(${t}>${r})`},void 0,void 0,9)},js=e=>{Ot(e,"Less",{scalar:(t,r)=>`u32(${t}<${r})`,vector:(t,r)=>`vec4(${t}<${r})`},void 0,void 0,9)},Ks=e=>{Ot(e,"GreaterOrEqual",{scalar:(t,r)=>`u32(${t}>=${r})`,vector:(t,r)=>`vec4(${t}>=${r})`},void 0,void 0,9)},Ys=e=>{Ot(e,"LessOrEqual",{scalar:(t,r)=>`u32(${t}<=${r})`,vector:(t,r)=>`vec4(${t}<=${r})`},void 0,void 0,9)}});var St,xt,Ct,Bn,Ft=Y(()=>{"use strict";ye();Se();St=(e,t,r="f32")=>{switch(e.activation){case"Relu":return`value = max(value, ${t}(0.0));`;case"Sigmoid":return`value = (${t}(1.0) / (${t}(1.0) + exp(-value)));`;case"Clip":return`value = clamp(value, ${t}(${r}(uniforms.clip_min)), ${t}(${r}(uniforms.clip_max)));`;case"HardSigmoid":return`value = max(${t}(0.0), min(${t}(1.0), ${r}(uniforms.alpha) * value + ${r}(uniforms.beta)));`;case"LeakyRelu":return`value = select(${r}(uniforms.alpha) * value, value, value >= ${t}(0.0));`;case"":return"";default:throw new Error(`Unsupported activation ${e.activation}`)}},xt=(e,t)=>{e.activation==="Clip"?t.push({type:1,data:e.clipMax},{type:1,data:e.clipMin}):e.activation==="HardSigmoid"?t.push({type:1,data:e.alpha},{type:1,data:e.beta}):e.activation==="LeakyRelu"&&t.push({type:1,data:e.alpha})},Ct=(e,t)=>{e.activation==="Clip"?t.push({name:"clip_max",type:"f32"},{name:"clip_min",type:"f32"}):e.activation==="HardSigmoid"?t.push({name:"alpha",type:"f32"},{name:"beta",type:"f32"}):e.activation==="LeakyRelu"&&t.push({name:"alpha",type:"f32"})},Bn=e=>{let t=e?.activation||"";if(t==="HardSigmoid"){let[r,o]=e?.activation_params||[.2,.5];return{activation:t,alpha:r,beta:o}}else if(t==="Clip"){let[r,o]=e?.activation_params||[xn,Cn];return{activation:t,clipMax:o,clipMin:r}}else if(t==="LeakyRelu"){let[r]=e?.activation_params||[.01];return{activation:t,alpha:r}}return{activation:t}}});var tt,Dn,zn=Y(()=>{"use strict";tt=(e,t)=>{switch(e){case 1:return t;case 2:return`vec2<${t}>`;case 3:return`vec3<${t}>`;case 4:return`vec4<${t}>`;default:throw new Error(`${e}-component is not supported.`)}},Dn=e=>`\n ${e?"value = value + getBiasByOutputCoords(coords);":""}\n `});var Mn,zo=Y(()=>{"use strict";Mn=e=>`\nfn getIndexFromCoords4D(coords : vec4, shape : vec4) -> i32 {\n return dot(coords, vec4(\n shape.y * shape.z * shape.w, shape.z * shape.w, shape.w, 1));\n}\nfn getOutputIndexFromCoords(coords : vec4) -> i32 {\n return dot(coords, vec4(\n i32(${e}.x), i32(${e}.y), i32(${e}.z), 1));\n}\n`});var yc,bc,Hr,Xs,wc,Lr,vc,Un,Fr=Y(()=>{"use strict";ye();Se();_e();Ft();zn();yc=(e,t)=>e?`\n mm_Asub[inputRow][inputCol] = mm_readA(batch,\n kStart + inputRow,\n globalRowStart / innerElementSize + inputCol${t?", batchIndices":""});\n `:`\n mm_Asub[inputRow][inputCol] = mm_readA(batch,\n globalRow + innerRow,\n kStart / innerElementSize + inputCol${t?", batchIndices":""});\n `,bc=(e,t)=>e?`\n let ACached0 = mm_Asub[k * innerElementSize][localRow];\n let ACached1 = mm_Asub[k * innerElementSize + 1][localRow];\n let ACached2 = mm_Asub[k * innerElementSize + 2][localRow];\n ${t===3?"":"let ACached3 = mm_Asub[k * innerElementSize + 3][localRow];"}\n for (var i = 0; i < rowPerThread; i = i + 1) {\n acc[i] = BCached0 * ACached0[i] + acc[i];\n acc[i] = BCached1 * ACached1[i] + acc[i];\n acc[i] = BCached2 * ACached2[i] + acc[i];\n ${t===3?"":"acc[i] = BCached3 * ACached3[i] + acc[i];"}\n }`:`\n for (var i = 0; i < rowPerThread; i = i + 1) {\n let ACached = mm_Asub[tileRow + i][k];\n acc[i] = BCached0 * ACached.x + acc[i];\n acc[i] = BCached1 * ACached.y + acc[i];\n acc[i] = BCached2 * ACached.z + acc[i];\n ${t===3?"":"acc[i] = BCached3 * ACached.w + acc[i];"}\n }`,Hr=(e,t,r="f32",o,i=!1,u=32,a=!1,c=32)=>{let p=t[1]*e[1],h=t[0]*e[0],d=i?p:u,y=i?u:p,w=d/t[0],_=u/t[1];if(!((i&&w===4&&e[1]===4||!i&&(w===3||w===4))&&d%t[0]===0&&u%t[1]===0&&e[0]===4))throw new Error(`If transposeA ${i} is true, innerElementSize ${w} and workPerThread[1] ${e[1]} must be 4.\n Otherwise, innerElementSize ${w} must be 3 or 4.\n tileAWidth ${d} must be divisible by workgroupSize[0]${t[0]}. tileInner ${u} must be divisible by workgroupSize[1] ${t[1]}. colPerThread ${e[0]} must be 4.`);return`\nvar mm_Asub: array, ${d/w}>, ${y}>;\nvar mm_Bsub: array, ${h/e[0]}>, ${u}>;\n\nconst rowPerThread = ${e[1]};\nconst colPerThread = ${e[0]};\nconst innerElementSize = ${w};\nconst tileInner = ${u};\n\n@compute @workgroup_size(${t[0]}, ${t[1]}, ${t[2]})\nfn main(@builtin(local_invocation_id) localId : vec3,\n @builtin(global_invocation_id) globalId : vec3,\n @builtin(workgroup_id) workgroupId : vec3) {\n let localRow = i32(localId.y);\n let tileRow = localRow * rowPerThread;\n let tileCol = i32(localId.x);\n\n let globalRow =i32(globalId.y) * rowPerThread;\n let globalCol = i32(globalId.x);\n let batch = ${a?"0":"i32(globalId.z)"};\n ${o?`let batchIndices = ${o.offsetToIndices("u32(batch)")};`:""}\n let globalRowStart = i32(workgroupId.y) * ${p};\n\n let num_tiles = ${a?`${Math.ceil(c/u)}`:"(uniforms.dim_inner - 1) / tileInner + 1"};\n var kStart = ${a?`i32(globalId.z) * ${c}`:"0"};\n\n var acc: array, rowPerThread>;\n\n // Loop over shared dimension.\n let tileRowB = localRow * ${_};\n for (var t = 0; t < num_tiles; t = t + 1) {\n // Load one tile of A into local memory.\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n let inputRow = tileRow + innerRow;\n let inputCol = tileCol;\n ${yc(i,o)}\n }\n\n // Load one tile of B into local memory.\n for (var innerRow = 0; innerRow < ${_}; innerRow = innerRow + 1) {\n let inputRow = tileRowB + innerRow;\n let inputCol = tileCol;\n mm_Bsub[inputRow][inputCol] = mm_readB(batch, kStart + inputRow, globalCol${o?", batchIndices":""});\n }\n kStart = kStart + tileInner;\n workgroupBarrier();\n\n // Compute acc values for a single thread.\n for (var k = 0; k < tileInner / innerElementSize; k = k + 1) {\n let BCached0 = mm_Bsub[k * innerElementSize][tileCol];\n let BCached1 = mm_Bsub[k * innerElementSize + 1][tileCol];\n let BCached2 = mm_Bsub[k * innerElementSize + 2][tileCol];\n ${w===3?"":"let BCached3 = mm_Bsub[k * innerElementSize + 3][tileCol];"}\n\n ${bc(i,w)}\n }\n\n workgroupBarrier();\n }\n\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n mm_write(batch, globalRow + innerRow, globalCol, acc[innerRow]);\n }\n}`},Xs=(e,t)=>e?`\n mm_Asub[inputRow][inputCol] = mm_readA(batch,\n kStart + inputRow,\n globalRowStart + inputCol${t?", batchIndices":""});\n `:`\n mm_Asub[inputRow][inputCol] = mm_readA(batch,\n globalRowStart + inputRow,\n kStart + inputCol${t?", batchIndices":""});\n `,wc=e=>e?"let ACached = mm_Asub[k][tileRow + innerRow];":"let ACached = mm_Asub[tileRow + innerRow][k];",Lr=(e,t,r="f32",o,i=!1,u=32,a=!1,c=32,p=!1)=>{let h=e[1]*t[1],d=e[0]*t[0],y=i?h:u,w=i?u:h;if(!(w%t[1]===0&&y%t[0]===0&&u%t[1]===0))throw new Error(`tileAHight ${w} must be divisible by workgroupSize[1]${t[1]}, tileAWidth ${y} must be divisible by workgroupSize[0]${t[0]}, tileInner ${u} must be divisible by workgroupSize[1]${t[1]}`);let _=w/t[1],v=y/t[0],S=u/t[1],A=p?`\n let localRow = i32(localId.y);\n let localCol = i32(localId.x);\n let globalRowStart = i32(workgroupId.y) * ${h};\n let globalColStart = i32(workgroupId.x) * ${d};\n\n // Loop over shared dimension.\n for (var t = 0; t < num_tiles; t = t + 1) {\n // Load one tile of A into local memory.\n for (var inputRow = localRow; inputRow < ${w}; inputRow = inputRow + ${t[1]}) {\n for (var inputCol = localCol; inputCol < ${y}; inputCol = inputCol + ${t[0]}) {\n ${Xs(i,o)}\n }\n }\n // Load one tile of B into local memory.\n for (var inputRow = localRow; inputRow < ${u}; inputRow = inputRow + ${t[1]}) {\n for (var inputCol = localCol; inputCol < ${d}; inputCol = inputCol + ${t[0]}) {\n mm_Bsub[inputRow][inputCol] = mm_readB(batch,\n kStart + inputRow,\n globalColStart + inputCol${o?", batchIndices":""});\n }\n }\n kStart = kStart + tileInner;\n workgroupBarrier();\n\n // Compute acc values for a single thread.\n var BCached : array<${r}, colPerThread>;\n for (var k = 0; k < tileInner; k = k + 1) {\n for (var inner = 0; inner < colPerThread; inner = inner + 1) {\n BCached[inner] = mm_Bsub[k][localCol + inner * ${t[0]}];\n }\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n let ACached = ${i?`mm_Asub[k][localRow + innerRow * ${t[1]}];`:`mm_Asub[localRow + innerRow * ${t[1]}][k];`}\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n acc[innerRow][innerCol] = acc[innerRow][innerCol] +\n ACached * BCached[innerCol];\n }\n }\n }\n workgroupBarrier();\n }\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n let gRow = globalRowStart + localRow + innerRow * ${t[1]};\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n let gCol = globalColStart + localCol + innerCol * ${t[0]};\n mm_write(batch, gRow, gCol, acc[innerRow][innerCol]);\n }\n }\n `:`\nlet tileRow = i32(localId.y) * rowPerThread;\nlet tileCol = i32(localId.x) * colPerThread;\n\nlet globalRow = i32(globalId.y) * rowPerThread;\nlet globalCol = i32(globalId.x) * colPerThread;\nlet globalRowStart = i32(workgroupId.y) * ${h};\n\nlet tileRowA = i32(localId.y) * ${_};\nlet tileColA = i32(localId.x) * ${v};\nlet tileRowB = i32(localId.y) * ${S};\n// Loop over shared dimension.\nfor (var t = 0; t < num_tiles; t = t + 1) {\n // Load one tile of A into local memory.\n for (var innerRow = 0; innerRow < ${_}; innerRow = innerRow + 1) {\n for (var innerCol = 0; innerCol < ${v}; innerCol = innerCol + 1) {\n let inputRow = tileRowA + innerRow;\n let inputCol = tileColA + innerCol;\n ${Xs(i,o)}\n }\n }\n\n // Load one tile of B into local memory.\n for (var innerRow = 0; innerRow < ${S}; innerRow = innerRow + 1) {\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n let inputRow = tileRowB + innerRow;\n let inputCol = tileCol + innerCol;\n mm_Bsub[inputRow][inputCol] = mm_readB(batch,\n kStart + inputRow,\n globalCol + innerCol${o?", batchIndices":""});\n }\n }\n kStart = kStart + tileInner;\n workgroupBarrier();\n\n // Compute acc values for a single thread.\n var BCached : array<${r}, colPerThread>;\n for (var k = 0; k < tileInner; k = k + 1) {\n for (var inner = 0; inner < colPerThread; inner = inner + 1) {\n BCached[inner] = mm_Bsub[k][tileCol + inner];\n }\n\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n ${wc(i)}\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n acc[innerRow][innerCol] = acc[innerRow][innerCol] + ACached * BCached[innerCol];\n }\n }\n }\n\n workgroupBarrier();\n}\n\nfor (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n mm_write(batch, globalRow + innerRow, globalCol + innerCol,\n acc[innerRow][innerCol]);\n }\n}\n`;return`\n var mm_Asub : array, ${w}>;\n var mm_Bsub : array, ${u}>;\n const rowPerThread = ${e[1]};\n const colPerThread = ${e[0]};\n const tileInner = ${u};\n\n@compute @workgroup_size(${t[0]}, ${t[1]}, ${t[2]})\nfn main(@builtin(local_invocation_id) localId : vec3,\n @builtin(global_invocation_id) globalId : vec3,\n @builtin(workgroup_id) workgroupId : vec3) {\n let batch = ${a?"0":"i32(globalId.z)"};\n ${o?`let batchIndices = ${o.offsetToIndices("u32(batch)")};`:""}\n let num_tiles = ${a?`${Math.ceil(c/u)}`:"(uniforms.dim_inner - 1) / tileInner + 1"};\n var kStart = ${a?`i32(globalId.z) * ${c}`:"0"};\n\n var acc : array, rowPerThread>;\n\n // Without this initialization strange values show up in acc.\n for (var innerRow = 0; innerRow < rowPerThread; innerRow = innerRow + 1) {\n for (var innerCol = 0; innerCol < colPerThread; innerCol = innerCol + 1) {\n acc[innerRow][innerCol] = 0.0;\n }\n }\n ${A}\n }\n`},vc=(e,t,r,o,i,u=!1)=>{let[a,c,p]=i,[h,d,y,w]=o,_=_r(a,p),v=_r(c,p),S=De(o[0].type.tensor),A=()=>{let E=d.rank,P=h.rank,O=`var aIndices: ${d.type.indices};`;for(let R=E-2-1,L=P-1;R>=0;R--,L--)O+=`\naIndices[${R}] = ${P>1?`batchIndices[${L}]`:"batchIndices"};`;return _.forEach(R=>{O+=`\naIndices[${R}] = 0;`}),O+=`\naIndices[${E-2}] = u32(row);\n aIndices[${E-1}] = u32(colIn);`,O},I=()=>{let E=y.rank,P=h.rank,O=`var bIndices: ${y.type.indices};`;for(let R=E-2-1,L=P-1;R>=0;R--,L--)O+=`\nbIndices[${R}] = ${P>1?`batchIndices[${L}]`:"batchIndices"};`;return v.forEach(R=>{O+=`\nbIndices[${R}] = 0;`}),O+=`\nbIndices[${E-2}] = u32(row);\n bIndices[${E-1}] = u32(colIn);`,O};return`\n fn mm_readA(batch: i32, row: i32, colIn: i32, batchIndices: ${h.type.indices}) -> ${tt(e,S)} {\n var value = ${tt(e,S)}(0.0);\n let col = colIn * ${e};\n if(row < uniforms.dim_a_outer && col < uniforms.dim_inner)\n {\n ${A()}\n value = ${d.getByIndices("aIndices")};\n }\n return value;\n }\n\n fn mm_readB(batch: i32, row: i32, colIn: i32, batchIndices: ${h.type.indices}) -> ${tt(e,S)} {\n var value = ${tt(e,S)}(0.0);\n let col = colIn * ${e};\n if(row < uniforms.dim_inner && col < uniforms.dim_b_outer)\n {\n ${I()}\n value = ${y.getByIndices("bIndices")};\n }\n return value;\n }\n\n fn mm_write(batch: i32, row: i32, colIn: i32, valueIn: ${tt(e,S)}) {\n let col = colIn * ${e};\n if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) {\n var value = valueIn;\n let coords = vec3(batch, row, colIn);\n ${t?`value = value + ${u?"bias[colIn]":`${tt(e,S)}(bias[row])`};`:""}\n ${r}\n ${w.setByIndices("vec3(coords)","value")}\n }\n }\n `},Un=(e,t,r,o,i=!1)=>{let u=e[0].dims,a=e[1].dims,c=u.slice(0,-2),p=a.slice(0,-2),h=o?o.slice(0,-2):r.slice(0,-2),d=M.size(h),y=u[u.length-2],w=u[u.length-1],_=a[a.length-1],v=w%4===0&&_%4===0,S=y<=8?[4,1,1]:[4,4,1],A=[8,8,1],I=[Math.ceil(_/A[0]/S[0]),Math.ceil(y/A[1]/S[1]),Math.ceil(d/A[2]/S[2])],x=v?4:1,E=[...c,y,w/x],P=E.length,O=[...p,w,_/x],R=O.length,L=[d,y,_/x],N=[{type:6,data:y},{type:6,data:_},{type:6,data:w}];xt(t,N),N.push(...Z(h,E,O));let K=["rank","rank"],Q=e.length>2;Q&&(N.push(...Z(e[2].dims)),K.push("rank")),N.push(...Z(L));let he=W=>{let se=h.length,Ce=An("batchDims",e[0].dataType,se,1),We=De(e[0].dataType),ee=U("a",e[0].dataType,P,x),ae=U("b",e[1].dataType,R,x),Ae=j("result",e[0].dataType,L.length,x),me=[ee,ae];if(Q){let G=i?x:1;me.push(U("bias",e[2].dataType,e[2].dims.length,G))}let ie=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"}];Ct(t,ie);let ue=De(Ae.type.tensor),le=St(t,Ae.type.value,ue),qe=vc(x,Q,le,[Ce,ee,ae,Ae],[c,p,h],i);return`\n ${W.registerUniforms(ie).registerInternalVariables(Ce).declareVariables(...me,Ae)}\n ${qe}\n ${v?Hr(S,A,We,Ce):Lr(S,A,We,Ce)}\n `};return{name:"MatMul",shaderCache:{hint:`${S};${t.activation};${v};${i}`,inputDependencies:K},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:I[0],y:I[1],z:I[2]},programUniforms:N}),getShaderSource:he}}});var $c,Qs,Js=Y(()=>{"use strict";ye();Lt();_e();Ft();zn();zo();Fr();$c=(e,t,r,o,i=!1,u,a=4,c=4,p=4,h="f32")=>{let d=Q=>{switch(Q){case 1:return"resData = x[xIndex];";case 3:return`resData = vec3<${h}>(x[xIndex], x[xIndex + 1], x[xIndex + 2]);`;case 4:return"resData = x[xIndex / 4];";default:throw new Error(`innerElementSize ${Q} is not supported.`)}},y=Q=>{switch(Q){case 1:return"return w[row * i32(uniforms.w_shape[3]) + colIn];";case 4:return"return w[row * i32(uniforms.w_shape[3]) / 4 + colIn];";default:throw new Error(`innerElementSize ${Q} is not supported.`)}},w=e?`\n let coord = vec4(batch, xRow, xCol, xCh);\n `:`\n let coord = vec4(batch, xCh, xRow, xCol);\n `,_=e?`\n let coords = vec4(\n batch,\n row / outWidth,\n row % outWidth,\n col);\n `:`\n let coords = vec4(\n batch,\n row,\n col / outWidth,\n col % outWidth);\n `,v=e?"i32(uniforms.x_shape[1])":"i32(uniforms.x_shape[2])",S=e?"i32(uniforms.x_shape[2])":"i32(uniforms.x_shape[3])",A=e?"row":"col",I=e?"col":"row",x=`\n let inChannels = i32(uniforms.w_shape[2]);\n let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"};\n let outRow = ${A} / outWidth;\n let outCol = ${A} % outWidth;\n\n let WRow = ${I} / (i32(uniforms.w_shape[1]) * inChannels);\n let WCol = ${I} / inChannels % i32(uniforms.w_shape[1]);\n let xRow = outRow * uniforms.stride[0] + uniforms.dilation[0] * WRow - uniforms.pad[0];\n let xCol = outCol * uniforms.stride[1] + uniforms.dilation[1] * WCol - uniforms.pad[1];\n let xCh = ${I} % inChannels;\n var resData = ${tt(a,h)}(0.0);\n // The bounds checking is always needed since we use it to pad zero for\n // the \'same\' padding type.\n if (xRow >= 0 && xRow < ${v} && xCol >= 0 && xCol < ${S}) {\n ${w}\n let xIndex = getIndexFromCoords4D(coord, vec4(uniforms.x_shape));\n ${d(a)}\n }\n return resData;`,E=e?t&&o?`\n let col = colIn * ${a};\n ${x}`:`\n let col = colIn * ${a};\n if (row < uniforms.dim_a_outer && col < uniforms.dim_inner) {\n ${x}\n }\n return ${tt(a,h)}(0.0);`:o&&r?`\n let col = colIn * ${a};\n ${x}`:`\n let col = colIn * ${a};\n if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) {\n ${x}\n }\n return ${tt(a,h)}(0.0);`,P=`${y(c)}`,O=tt(p,h),R=e?tt(a,h):tt(c,h),L=e?tt(c,h):tt(a,h),N=St(u,O,h);return`\n fn mm_readA(batch: i32, row : i32, colIn : i32) -> ${R} {\n ${e?E:P}\n }\n\n fn mm_readB(batch: i32, row : i32, colIn : i32) -> ${L} {\n ${e?P:E}\n }\n\n fn mm_write(batch: i32, row : i32, colIn : i32, valueIn : ${O}) {\n let col = colIn * ${p};\n if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer)\n {\n var value = valueIn;\n let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"};\n ${_}\n ${Dn(i)}\n ${N}\n setOutputAtCoords(coords[0], coords[1], coords[2], coords[3], value);\n }\n }`},Qs=(e,t,r,o,i,u,a,c)=>{let p=t.format==="NHWC",h=p?e[0].dims[3]:e[0].dims[1],d=r[0],y=p?r[2]:r[3],w=p?r[1]:r[2],_=p?r[3]:r[1],v=p&&(h%4===0||h%3===0)&&_%4===0,S=p?_:y*w,A=p?y*w:_,I=[8,8,1],x=o<=8?[4,1,1]:[4,4,1],E=[Math.ceil(S/I[0]/x[0]),Math.ceil(A/I[1]/x[1]),Math.ceil(d/I[2]/x[2])];Ve("verbose",()=>`[conv2d_mm_webgpu] dispatch = ${E}`);let P=v?p&&h%4!==0?3:4:1,O=I[1]*x[1],R=I[0]*x[0],L=Math.max(I[0]*P,I[1]),N=o%O===0,K=i%R===0,Q=u%L===0,he=v?[P,4,4]:[1,1,1],W=[{type:6,data:o},{type:6,data:i},{type:6,data:u},{type:6,data:[t.pads[0],t.pads[1]]},{type:6,data:t.strides},{type:6,data:t.dilations}];xt(t,W),W.push(...Z(e[0].dims,e[1].dims));let se=["rank","rank"];a&&(W.push(...Z(e[2].dims)),se.push("rank")),W.push(...Z(r));let Ce=We=>{let ee=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"},{name:"pad",type:"i32",length:2},{name:"stride",type:"i32",length:2},{name:"dilation",type:"i32",length:2}];Ct(t,ee);let ae=v?4:1,Ae=De(e[0].dataType),me=`\n fn setOutputAtIndex(flatIndex : i32, value : ${v?`vec4<${Ae}>`:Ae}) {\n result[flatIndex] = ${v?`vec4<${Ae}>`:Ae}(value);\n }\n fn setOutputAtCoords(d0 : i32, d1 : i32, d2 : i32, d3 : i32, value : ${v?`vec4<${Ae}>`:Ae}) {\n let flatIndex = getOutputIndexFromCoords(vec4(d0, d1, d2, d3));\n setOutputAtIndex(flatIndex ${v?"/ 4":""}, value);\n }`,ie=U("x",e[0].dataType,e[0].dims.length,P===3?1:P),ue=U("w",e[1].dataType,e[1].dims.length,ae),le=[ie,ue],qe=j("result",e[0].dataType,r.length,ae);if(a){let G=U("bias",e[2].dataType,e[2].dims.length,ae);le.push(G),me+=`\n fn getBiasByOutputCoords(coords : vec4) -> ${v?`vec4<${Ae}>`:Ae} {\n return bias[coords.${p?"w":"y"}${v?"/ 4":""}];\n }`}return`\n ${Mn("uniforms.result_strides")}\n //struct Uniforms { xShape : vec4, wShape : vec4, outShape : vec4,\n // outShapeStrides: vec3, filterDims : vec2, pad : vec2, stride : vec2,\n // dilation : vec2, dimAOuter : i32, dimBOuter : i32, dimInner : i32 };\n ${We.registerUniforms(ee).declareVariables(...le,qe)}\n ${me}\n ${$c(p,N,K,Q,a,t,he[0],he[1],he[2],Ae)}\n ${v?Hr(x,I,Ae,void 0,!p,L):Lr(x,I,Ae,void 0,!p,L,!1,void 0,c)}`};return{name:"Conv2DMatMul",shaderCache:{hint:`${t.cacheKey};${P};${v};${N};${K};${Q};${O};${R};${L}`,inputDependencies:se},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:E[0],y:E[1],z:E[2]},programUniforms:W}),getShaderSource:Ce}}});var Mo,eu,tu=Y(()=>{"use strict";ye();Se();_e();Uo();Ft();Mo=(e,t,r)=>{let o=e.length>2,i=o?"value += b[output_channel];":"",u=e[0].dims,a=e[1].dims,c=a[0]/t.group,p=t.format==="NHWC",h=Vn(u,a,t.dilations,t.pads,t.strides,p),d=M.size(h),y=[{type:12,data:d},{type:12,data:t.dilations},{type:12,data:[t.strides[0],t.strides[1]]},{type:12,data:[t.pads[0],t.pads[1]]},{type:12,data:c}];xt(t,y),y.push(...Z(u,a));let w=["rank","rank"];o&&(y.push(...Z(e[2].dims)),w.push("rank")),y.push(...Z(h));let _=v=>{let S=j("output",e[0].dataType,h.length),A=De(S.type.tensor),I=St(t,S.type.value,A),x=U("x",e[0].dataType,u.length),E=U("w",e[1].dataType,a.length),P=[x,E];o&&P.push(U("b",e[2].dataType,e[2].dims.length));let O=[{name:"output_size",type:"u32"},{name:"dilations",type:"u32",length:t.dilations.length},{name:"strides",type:"u32",length:2},{name:"pads",type:"u32",length:2},{name:"output_channels_per_group",type:"u32"}];return Ct(t,O),`\n ${v.registerUniforms(O).declareVariables(...P,S)}\n\n ${v.mainStart()}\n ${v.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n\n let outputIndices = ${S.offsetToIndices("global_idx")};\n let batch: u32 = outputIndices[0];\n let output_channel: u32 = outputIndices[${p?3:1}];\n let xRCCorner: vec2 = vec2(outputIndices[${p?1:2}], outputIndices[${p?2:3}]) * uniforms.strides - uniforms.pads;\n let group_id: u32 = output_channel / uniforms.output_channels_per_group;\n\n var value: ${S.type.value} = ${S.type.value}(0);\n for (var wInChannel: u32 = 0u; wInChannel < uniforms.w_shape[1]; wInChannel++) {\n let input_channel = group_id * uniforms.w_shape[1] + wInChannel;\n for (var wHeight: u32 = 0u; wHeight < uniforms.w_shape[2]; wHeight++) {\n let xHeight = xRCCorner.x + wHeight * uniforms.dilations[0];\n\n if (xHeight < 0u || xHeight >= uniforms.x_shape[${p?1:2}]) {\n continue;\n }\n\n for (var wWidth: u32 = 0u; wWidth < uniforms.w_shape[3]; wWidth++) {\n let xWidth = xRCCorner.y + wWidth * uniforms.dilations[1];\n if (xWidth < 0u || xWidth >= uniforms.x_shape[${p?2:3}]) {\n continue;\n }\n\n let xVal = ${p?x.get("batch","xHeight","xWidth","input_channel"):x.get("batch","input_channel","xHeight","xWidth")};\n let wVal = ${E.get("output_channel","wInChannel","wHeight","wWidth")};\n value += xVal*wVal;\n }\n }\n }\n ${i}\n ${I}\n ${S.setByOffset("global_idx","value")}\n }`};return{name:"GroupedConv",shaderCache:{hint:t.cacheKey,inputDependencies:w},getRunData:()=>({outputs:[{dims:r?r(h):h,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(d/64)},programUniforms:y}),getShaderSource:_}},eu=(e,t,r)=>{let o=e.length>2,i=Me(r[3]),u=Me(r[2]),a=M.size(r)/i/u,c=[e[0].dims[0],e[0].dims[1],e[0].dims[2],e[0].dims[3]/i],p=[e[1].dims[0],e[1].dims[1],e[1].dims[2],e[1].dims[3]/i],h=[r[0],r[1],r[2],r[3]/i],d=[{type:12,data:a},{type:6,data:[t.strides[0],t.strides[1]]},{type:6,data:[t.pads[0],t.pads[1]]}];xt(t,d),d.push(...Z(c,p,h));let y=(u-1)*t.strides[1]+p[1],w=_=>{let v=j("output",e[0].dataType,h.length,i),S=De(v.type.tensor),A=St(t,v.type.value,S),I=U("x",e[0].dataType,c.length,i),x=U("w",e[1].dataType,p.length,i),E=[I,x];o&&E.push(U("b",e[2].dataType,e[2].dims,i));let P=o?"value += b[output_channel];":"",O=[{name:"output_size",type:"u32"},{name:"strides",type:"i32",length:2},{name:"pads",type:"i32",length:2}];return Ct(t,O),`\n ${_.registerUniforms(O).declareVariables(...E,v)}\n ${_.mainStart()}\n ${_.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n let width0 = uniforms.output_shape[3];\n let output_channel = global_idx % width0;\n var index1 = global_idx / width0;\n let width1 = uniforms.output_shape[2] / ${u}u;\n let col = (index1 % width1) * ${u}u;\n index1 = index1 / width1;\n let row = index1 % uniforms.output_shape[1];\n let batch = index1 / uniforms.output_shape[1];\n\n let x_corner = vec2(i32(row), i32(col)) * uniforms.strides - uniforms.pads;\n\n var x_vals: array<${I.type.value}, ${y}>;\n var values: array<${v.type.value}, ${u}>;\n let input_channel = output_channel;\n // Use constant instead of uniform can give better performance for w\'s height/width.\n for (var w_height: u32 = 0u; w_height < ${p[0]}; w_height++) {\n let x_height = x_corner.x + i32(w_height);\n if (x_height >= 0 && u32(x_height) < uniforms.x_shape[1]) {\n for (var i = 0; i < ${y}; i++) {\n let x_width = x_corner.y + i;\n if (x_width >= 0 && u32(x_width) < uniforms.x_shape[2]) {\n x_vals[i] = ${I.get("batch","u32(x_height)","u32(x_width)","input_channel")};\n } else {\n x_vals[i] = ${I.type.value}(0);\n }\n }\n for (var w_width: u32 = 0u; w_width < ${p[1]}; w_width++) {\n let w_val = ${x.get("w_height","w_width","0","output_channel")};\n for (var i = 0u; i < ${u}u; i++) {\n values[i] = fma(x_vals[i * u32(uniforms.strides[1]) + w_width], w_val, values[i]);\n }\n }\n }\n }\n\n for (var i = 0u; i < ${u}u; i++) {\n var value = values[i];\n ${P}\n ${A}\n ${v.set("batch","row","col + i","output_channel","value")};\n }\n }`};return{name:"GroupedConv-Vectorize",shaderCache:{hint:`${t.cacheKey};${i};${u};${y};${p[0]};${p[1]}`,inputDependencies:o?["rank","rank","type"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:d}),getShaderSource:w}}});var Vo,_c,ru,Wo=Y(()=>{"use strict";ye();Se();Fr();_e();Ft();Vo=(e,t,r,o,i=!1)=>{let u=e[0].dims,a=e[1].dims,c=u[u.length-2],p=a[a.length-1],h=u[u.length-1],d=Me(p),y=Me(h),w=Me(c),_=M.size(r)/d/w,v=e.length>2,S=o?o.slice(0,-2):r.slice(0,-2),I=[M.size(S),c,p],x=[{type:12,data:_},{type:12,data:c},{type:12,data:p},{type:12,data:h}];xt(t,x),x.push(...Z(S,u,a)),v&&x.push(...Z(e[2].dims)),x.push(...Z(I));let E=P=>{let O=An("batch_dims",e[0].dataType,S.length),R=U("a",e[0].dataType,u.length,y),L=U("b",e[1].dataType,a.length,d),N=j("output",e[0].dataType,I.length,d),K=De(N.type.tensor),Q=St(t,N.type.value,K),he=[R,L],W="";if(v){let ie=i?d:1;he.push(U("bias",e[2].dataType,e[2].dims.length,ie)),W=`${i?`value += bias[col / ${ie}];`:`value += ${N.type.value}(bias[row + i]);`}`}let se=u.slice(0,-2),Ce=a.slice(0,-2),We=_r(se,S),ee=_r(Ce,S),ae=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"}];Ct(t,ae);let Ae=(ie,ue)=>{let le=ie.rank,qe=ie.name;if(le===2)return`var ${qe}_indices = ${ie.type.indices}(0u, 0u);`;let G=O.rank,ne=`var ${qe}_indices: ${ie.type.indices};`;for(let xe=le-2-1,Ke=G-1;xe>=0;xe--,Ke--)ne+=`\n${qe}_indices[${xe}] = ${G>1?`batch_indices[${Ke}]`:"batch_indices"};`;return ue.forEach(xe=>{ne+=`\n${qe}_indices[${xe}] = 0;`}),ne+=`${qe}_indices[${le-2}] = 0u;\n ${qe}_indices[${le-1}] = 0u;`,ne},me=()=>{let ie=`var a_data: ${R.type.value};`;for(let ue=0;ue;\n for (var k: u32 = 0u; k < uniforms.K; k = k + ${y}) {\n ${me()}\n }\n for (var i = 0u; i < ${w}u; i++) {\n var value = values[i];\n ${W}\n ${Q}\n let cur_indices = ${N.type.indices}(batch, row + i, col);\n let offset = ${N.indicesToOffset("cur_indices")};\n ${N.setByOffset(`offset / ${d}`,"value")};\n }\n }\n `};return{name:"MatMulNaive",shaderCache:{hint:`${t.activation};${d};${y};${w};${i}`,inputDependencies:v?["rank","rank","rank"]:["rank","rank"]},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(_/64)},programUniforms:x}),getShaderSource:E}},_c=e=>{if(!e||e.length!==2)throw new Error("MatMul requires 2 inputs.");if(e[0].dims[e[0].dims.length-1]!==e[1].dims[e[1].dims.length-2])throw new Error("shared dimension does not match.")},ru=e=>{_c(e.inputs);let t=It.calcShape(e.inputs[0].dims,e.inputs[1].dims,!0);if(!t)throw new Error("Can\'t use matmul on the given tensors");let r=t[t.length-1],o=e.inputs[0].dims[e.inputs[0].dims.length-1];r<8&&o<8?e.compute(Vo(e.inputs,{activation:""},t)):e.compute(Un(e.inputs,{activation:""},t))}});var Vn,No,Sc,nu,Go,xc,Cc,Ho,Uo=Y(()=>{"use strict";Se();Js();Fr();tu();Ft();Wo();Sr();Vn=(e,t,r,o,i,u)=>{let a=e[0],c=e.slice(u?1:2,u?3:4),p=c.length,h=t[0],y=t.slice(2).map((v,S)=>v+(v-1)*(r[S]-1)),_=c.map((v,S)=>v+o[S]+o[S+p]).map((v,S)=>Math.floor((v-y[S]+i[S])/i[S]));return _.splice(0,0,a),_.splice(u?3:1,0,h),_},No=[2,3,1,0],Sc=(e,t)=>{if(!e||e.length!==2&&e.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(e[0].dims.length!==4&&e[0].dims.length!==3)throw new Error("currently only support conv 1D and 2D");if(e[0].dims.length!==e[1].dims.length)throw new Error("filter does not have same dimension as input");let r=e[0].dims[t.format==="NHWC"?e[0].dims.length-1:1],o=e[1].dims[1]*t.group;if(r!==o)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");if(e.length===3&&(e[2].dims.length!==1||e[1].dims[0]!==e[2].dims[0]))throw new Error("invalid bias");let i=e[0].dims.length-2;if(t.dilations.length!==i)throw new Error(`dilations should be ${i}D`);if(t.strides.length!==i)throw new Error(`strides should be ${i}D`);if(t.pads.length!==i*2)throw new Error(`pads should be ${i*2}D`);if(t.kernelShape.length!==0&&t.kernelShape.length!==e[1].dims.length-2)throw new Error("invalid kernel shape")},nu=(e,t)=>{let r=e.kernelShape.slice();for(let u=2;u{let t=Bn(e),r=e.format,o=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][e.auto_pad],i=e.dilations,u=e.group,a=e.kernel_shape,c=e.pads,p=e.strides,h=e.w_is_const();return{autoPad:o,format:r,dilations:i,group:u,kernelShape:a,pads:c,strides:p,wIsConst:h,...t,cacheKey:`${e.format};${t.activation};`}},xc=(e,t,r)=>{let o=nu(r,t),i=r.format==="NHWC";if(r.group!==1){if(!e.adapterInfo.isArchitecture("ampere")&&i&&t[1].dims[0]===r.group&&t[1].dims[1]===1&&r.dilations[0]===1&&r.dilations[1]===1){let L=Vn(t[0].dims,t[1].dims,r.dilations,o.pads,r.strides,i),N=e.kernelCustomData.wT??e.compute(yt(t[1],No),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=N);let K=[t[0],N];t.length===3&&K.push(t[2]),e.compute(eu(K,o,L),{inputs:K})}else e.compute(Mo(t,o));return}let u=t.length===3,a=t[0].dims[i?1:2],c=t[0].dims[i?2:3],p=t[0].dims[i?3:1],h=t[1].dims[2],d=t[1].dims[3],y=Vn(t[0].dims,t[1].dims,r.dilations,o.pads,r.strides,i),w=y[i?1:2],_=y[i?2:3],v=y[i?3:1],S=i&&h===a&&d===c&&r.pads[0]===0&&r.pads[1]===0;if(S||h===1&&d===1&&r.dilations[0]===1&&r.dilations[1]===1&&r.strides[0]===1&&r.strides[1]===1&&r.pads[0]===0&&r.pads[1]===0){let R=y[0],L,N,K,Q=[];if(i){let se=e.kernelCustomData.wT??e.compute(yt(t[1],No),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];if(r.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=se),S){let Ce=a*c*p;L=t[0].reshape([1,R,Ce]),N=se.reshape([1,Ce,v]),K=[1,R,v]}else L=t[0].reshape([R,a*c,p]),N=se.reshape([1,p,v]),K=[R,w*_,v];Q.push(L),Q.push(N)}else L=t[0].reshape([R,p,a*c]),N=t[1].reshape([1,v,p]),K=[R,v,w*_],Q.push(N),Q.push(L);u&&Q.push(t[2]);let he=K[2],W=Q[0].dims[Q[0].dims.length-1];he<8&&W<8?e.compute(Vo(Q,o,y,K,i),{inputs:Q}):e.compute(Un(Q,o,y,K,i),{inputs:Q});return}let A=!0,I=e.kernelCustomData.wT??e.compute(yt(t[1],No),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=I);let x=[t[0],I];u&&x.push(t[2]);let E=i?w*_:v,P=i?v:w*_,O=h*d*p;e.compute(Qs(x,o,y,E,P,O,u,A),{inputs:x})},Cc=(e,t)=>{let r=t.format==="NHWC",o=[e.inputs[0].reshape(r?[e.inputs[0].dims[0],1,e.inputs[0].dims[1],e.inputs[0].dims[2]]:[e.inputs[0].dims[0],e.inputs[0].dims[1],1,e.inputs[0].dims[2]]),e.inputs[1].reshape([e.inputs[1].dims[0],e.inputs[1].dims[1],1,e.inputs[1].dims[2]])];e.inputs.length===3&&o.push(e.inputs[2]);let i=[0,t.pads[0],0,t.pads[1]],u=[1].concat(t.strides),a=[1].concat(t.dilations),c=[1].concat(t.kernelShape),p=nu({...t,pads:i,strides:u,dilations:a,kernelShape:c},o);e.compute(Mo(o,p,h=>r?[h[0],h[2],h[3]]:[]))},Ho=(e,t)=>{Sc(e.inputs,t),e.inputs[0].dims.length===3?Cc(e,t):xc(e,e.inputs,t)}});var Ac,ou,iu=Y(()=>{"use strict";ye();Lt();_e();Ft();zn();zo();Fr();Ac=(e,t=!1,r,o,i=4)=>{let u=I=>{switch(I){case 1:return"return w[getIndexFromCoords4D(coord, vec4(uniforms.w_shape))];";case 4:return`\n let coord1 = vec4(coordX, coordY, col + 1, rowInner);\n let coord2 = vec4(coordX, coordY, col + 2, rowInner);\n let coord3 = vec4(coordX, coordY, col + 3, rowInner);\n let v0 = w[getIndexFromCoords4D(coord, vec4(uniforms.w_shape))];\n let v1 = w[getIndexFromCoords4D(coord1, vec4(uniforms.w_shape))];\n let v2 = w[getIndexFromCoords4D(coord2, vec4(uniforms.w_shape))];\n let v3 = w[getIndexFromCoords4D(coord3, vec4(uniforms.w_shape))];\n return ${o}(v0, v1, v2, v3);\n `;default:throw new Error(`innerElementSize ${I} is not supported.`)}},a=e?`\n let coord = vec4(batch, iXR, iXC, xCh);\n `:`\n let coord = vec4(batch, xCh, iXR, iXC);\n `,c=e?`\n let coords = vec4(\n batch,\n row / outWidth,\n row % outWidth,\n col);\n `:`\n let coords = vec4(\n batch,\n row,\n col / outWidth,\n col % outWidth);\n `,p=e?"i32(uniforms.x_shape[1])":"i32(uniforms.x_shape[2])",h=e?"i32(uniforms.x_shape[2])":"i32(uniforms.x_shape[3])",d=e?"row":"col",y=e?"col":"row",w=`\n let inChannels = ${e?"i32(uniforms.x_shape[3])":"i32(uniforms.x_shape[1])"};\n let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"};\n let outRow = ${d} / outWidth;\n let outCol = ${d} % outWidth;\n\n let WRow = ${y} / (uniforms.filter_dims[1] * inChannels);\n let WCol = ${y} / inChannels % uniforms.filter_dims[1];\n let xR = f32(outRow - uniforms.pads[0] + uniforms.dilations[0] * WRow) / f32(uniforms.strides[0]);\n let xC = f32(outCol - uniforms.pads[1] + uniforms.dilations[1] * WCol) / f32(uniforms.strides[1]);\n if (xR < 0.0 || xR >= f32(${p}) || fract(xR) > 0.0) {\n return ${o}(0.0);\n }\n if (xC < 0.0 || xC >= f32(${h}) || fract(xC) > 0.0) {\n return ${o}(0.0);\n }\n let iXR = i32(xR);\n let iXC = i32(xC);\n let xCh = ${y} % inChannels;\n ${a}\n return x[getIndexFromCoords4D(coord, vec4(uniforms.x_shape))/${i}];`,_=e?`\n let col = colIn * ${i};\n if (row < uniforms.dim_a_outer && col < uniforms.dim_inner) {\n ${w}\n }\n return ${o}(0.0);`:`\n let col = colIn * ${i};\n if (row < uniforms.dim_inner && col < uniforms.dim_b_outer) {\n ${w}\n }\n return ${o}(0.0);`,v=`\n let col = colIn * ${i};\n let inChannels = ${e?"i32(uniforms.x_shape[3])":"i32(uniforms.x_shape[1])"};\n let coordX = uniforms.filter_dims[0] - 1 - row / (uniforms.filter_dims[1] * inChannels);\n let coordY = uniforms.filter_dims[1] - 1 - (row / inChannels) % uniforms.filter_dims[1];\n if (${e?"row < uniforms.dim_inner && col < uniforms.dim_b_outer":"row < uniforms.dim_inner && col < uniforms.dim_a_outer"} && coordX >= 0 && coordY >= 0) {\n let rowInner = row % inChannels;\n let coord = vec4(coordX, coordY, col, rowInner);\n ${u(i)}\n }\n return ${o}(0.0);\n `,S=St(r,o);return`\n fn mm_readA(batch: i32, row : i32, colIn : i32) -> ${o} {\n ${e?_:v}\n }\n\n fn mm_readB(batch: i32, row : i32, colIn : i32) -> ${o} {\n ${e?v:_}\n }\n\n fn mm_write(batch: i32, row : i32, colIn : i32, valueInput : ${o}) {\n let col = colIn * ${i};\n if (row < uniforms.dim_a_outer && col < uniforms.dim_b_outer) {\n var value = valueInput;\n let outWidth = ${e?"i32(uniforms.result_shape[2])":"i32(uniforms.result_shape[3])"};\n ${c}\n ${Dn(t)}\n ${S}\n result[getIndexFromCoords4D(coords, vec4(uniforms.result_shape))/${i}] = value;\n }\n }`},ou=(e,t,r,o,i,u,a,c)=>{let p=t.format==="NHWC",h=p?e[0].dims[3]:e[0].dims[1],d=r[0],y=p?r[2]:r[3],w=p?r[1]:r[2],_=p?r[3]:r[1],v=p&&h%4===0&&h%3&&_%4===0,S=p?_:y*w,A=p?y*w:_,I=[8,8,1],x=o<=8?[4,1,1]:[4,4,1],E=[Math.ceil(S/I[0]/x[0]),Math.ceil(A/I[1]/x[1]),Math.ceil(d/I[2]/x[2])];Ve("verbose",()=>`[conv_backprop_mm_webgpu] dispatch = ${E}`);let P=v?4:1,O=Math.max(I[0]*P,I[1]),R=v?4:1,L=[t.kernelShape[p?1:2],t.kernelShape[p?2:3]],N=[L[0]+(t.dilations[0]<=1?0:(L[0]-1)*(t.dilations[0]-1)),L[1]+(t.dilations[1]<=1?0:(L[1]-1)*(t.dilations[1]-1))],K=[N[0]-1-Math.floor((t.pads[0]+t.pads[2])/2),N[1]-1-Math.floor((t.pads[1]+t.pads[3])/2)],Q=[{type:6,data:o},{type:6,data:i},{type:6,data:u},{type:6,data:t.strides},{type:6,data:t.dilations},{type:6,data:L},{type:6,data:K}];xt(t,Q),Q.push(...Z(e[0].dims,e[1].dims));let he=["rank","rank"];a&&(Q.push(...Z(e[2].dims)),he.push("rank")),Q.push(...Z(r));let W=se=>{let Ce=U("x",e[0].dataType,e[0].dims.length,R),We=U("w",e[1].dataType,e[1].dims.length,1),ee=j("result",e[0].dataType,r.length,R),ae=[Ce,We],Ae="";if(a){let ue=U("bias",e[2].dataType,e[2].dims.length,R);ae.push(ue),Ae+=`\n fn getBiasByOutputCoords(coords : vec4) -> ${ue.type.value} {\n return bias[coords.${p?"w":"y"}${v?"/ 4":""}];\n }`}let me=[{name:"dim_a_outer",type:"i32"},{name:"dim_b_outer",type:"i32"},{name:"dim_inner",type:"i32"},{name:"strides",type:"i32",length:2},{name:"dilations",type:"i32",length:2},{name:"filter_dims",type:"i32",length:L.length},{name:"pads",type:"i32",length:K.length}];Ct(t,me);let ie=De(e[0].dataType,1);if(ie!=="f16"&&ie!=="f32")throw new Error(`elemType ${ie} is not supported.`);return`\n ${Mn("uniforms.result_strides")}\n ${se.registerUniforms(me).declareVariables(...ae,ee)};\n ${Ae}\n ${Ac(p,a,t,Ce.type.value,P)}\n ${v?Hr(x,I,ie,void 0,!p,O):Lr(x,I,ie,void 0,!p,O,!1,void 0,c)}`};return{name:"Conv2DTransposeMatMul",shaderCache:{hint:`${t.cacheKey};${x};${I};${v}`,inputDependencies:he},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:E[0],y:E[1],z:E[2]},programUniforms:Q}),getShaderSource:W}}});var Ic,Lo,au=Y(()=>{"use strict";ye();Lt();Se();_e();Ic=(e,t,r,o,i,u=!1,a,c,p=!1)=>{let h=p?1:2,d=p?2:3,y=p?3:1,w=u?2:1,_=`\n fn setOutputAtIndex(flatIndex : u32, value : ${u?`vec4<${a}>`:a}) {\n result[flatIndex] = ${u?`vec4<${a}>`:a}(value);\n }`;o&&(_+=`\n fn getBiasByOutputCoords(coords : vec4) -> ${u?`vec4<${a}>`:a} {\n return bias[coords.${p?"w":"y"}${u?"/ 4":""}];\n }`);let v=u?4:1,S=U("W",t[1].dataType,t[1].dims.length,v),A=U("Dy",t[0].dataType,t[0].dims.length,v),I=[A,S];o&&I.push(U("bias",t[2].dataType,[r[y]].length,v));let x=j("result",t[0].dataType,r.length,v),E=`{\n let batch: u32 = ${i?"global_id.z":"workgroup_id.z"} / uniforms.result_shape[1];\n let r = ${i?"global_id.z":"workgroup_id.z"} % uniforms.result_shape[1];\n let c = ${i?"global_id.y":"workgroup_id.y"} * ${w};\n let d1: u32 = ${i?"global_id.x":"workgroup_id.x"} * 4;\n\n let dyCorner = vec2(i32(r), i32(c)) - vec2(uniforms.pads);\n\n // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1).\n // ? = to be determined. : = across all values in that axis.\n var dotProd: array, ${w}>;\n for (var i = 0; i < ${w}; i++) {\n dotProd[i] = vec4<${a}>(0.0);\n }\n for (var wR: u32 = 0; wR < uniforms.filter_dims[0]; wR = wR + 1) {\n var dyR = (${a}(dyCorner.x) + ${a}(wR)) / ${a}(uniforms.strides.x);\n let wRPerm = uniforms.filter_dims[0] - 1 - wR;\n if (dyR < 0.0 || dyR >= ${a}(uniforms.Dy_shape[1]) ||\n fract(dyR) > 0.0 || wRPerm < 0) {\n continue;\n }\n let idyR: u32 = u32(dyR);\n\n for (var wC: u32 = 0; wC < uniforms.filter_dims[1]; wC = wC + 1) {\n let dyC = (${a}(dyCorner.y) + ${a}(wC)) / ${a}(uniforms.strides.y);\n let dyC2 = (${a}(dyCorner.y) + 1.0 + ${a}(wC)) / ${a}(uniforms.strides.y);\n let wCPerm = uniforms.filter_dims[1] - 1 - wC;\n if (wCPerm < 0) {\n continue;\n }\n var bDyCVal = true;\n var bDyCVal2 = true;\n if (dyC < 0.0 || dyC >= ${a}(uniforms.Dy_shape[2]) ||\n fract(dyC) > 0.0) {\n bDyCVal = false;\n }\n if (dyC2 < 0.0 || dyC2 >= ${a}(uniforms.Dy_shape[2]) ||\n fract(dyC2) > 0.0) {\n bDyCVal2 = false;\n }\n\n let idyC: u32 = u32(dyC);\n let idyC2: u32 = u32(dyC2);\n if (bDyCVal && bDyCVal2) {\n let d2Length = uniforms.Dy_shape[3];\n for (var d2 :u32 = 0; d2 < d2Length; d2 = d2 + 4) {\n let wValue0 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1","d2")};\n let wValue1 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")};\n let wValue2 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")};\n let wValue3 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")};\n\n var xValue = ${A.get("batch","idyR","idyC","d2")};\n let tmpval = vec4<${a}>(dot(xValue, wValue0),\n dot(xValue, wValue1),\n dot(xValue, wValue2),\n dot(xValue, wValue3));\n dotProd[0] = dotProd[0] + tmpval;\n\n xValue = ${A.get("batch","idyR","idyC2","d2")};\n\n dotProd[1] = dotProd[1] + vec4<${a}>(dot(xValue, wValue0),\n dot(xValue, wValue1),\n dot(xValue, wValue2),\n dot(xValue, wValue3));\n }\n } else if (bDyCVal) {\n let d2Length = uniforms.Dy_shape[${y}];\n for (var d2: u32 = 0; d2 < d2Length; d2 = d2 + 4) {\n let wValue0 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1","d2")};\n let wValue1 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")};\n let wValue2 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")};\n let wValue3 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")};\n\n var xValue = ${A.get("batch","idyR","idyC","d2")};\n let tmpval = vec4<${a}>(dot(xValue, wValue0),\n dot(xValue, wValue1),\n dot(xValue, wValue2),\n dot(xValue, wValue3));\n dotProd[0] = dotProd[0] + tmpval;\n }\n } else if (bDyCVal2) {\n let d2Length = uniforms.Dy_shape[3];\n for (var d2: u32 = 0; d2 < d2Length; d2 = d2 + 4) {\n let wValue0 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1","d2")};\n let wValue1 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 1","d2")};\n let wValue2 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 2","d2")};\n let wValue3 = ${S.get("u32(wRPerm)","u32(wCPerm)","d1 + 3","d2")};\n\n var xValue = ${A.get("batch","idyR","idyC2","d2")};\n let tmpval = vec4<${a}>(dot(xValue, wValue0),\n dot(xValue, wValue1),\n dot(xValue, wValue2),\n dot(xValue, wValue3));\n dotProd[1] = dotProd[1] + tmpval;\n }\n }\n }\n }\n\n for (var i: u32 = 0; i < ${w}; i = i + 1) {\n let value = dotProd[i] + ${o?"bias[c+i]":`vec4<${a}>(0.0)`};\n ${x.set("batch","r","c + i","d1","value")};\n }\n }`,P=`\n let outputIndices = ${x.offsetToIndices("global_idx")};\n let batch = ${x.indicesGet("outputIndices",0)};\n let d1 = ${x.indicesGet("outputIndices",y)};\n let r = ${x.indicesGet("outputIndices",h)};\n let c = ${x.indicesGet("outputIndices",d)};\n let dyCorner = vec2(i32(r), i32(c)) - uniforms.pads;\n let dyRCorner = dyCorner.x;\n let dyCCorner = dyCorner.y;\n let groupId = d1 / uniforms.output_channels_per_group;\n let wOutChannel = d1 - groupId * uniforms.output_channels_per_group;\n // Convolve dy(?, ?, d2) with w(:, :, d1, d2) to compute dx(xR, xC, d1).\n // ? = to be determined. : = across all values in that axis.\n var dotProd = ${a}(0.0);\n for (var wR: u32 = 0; wR < uniforms.effective_filter_dims.x; wR = wR + 1) {\n if (wR % uniforms.dilations.x != 0) {\n continue;\n }\n let dyR = (${a}(dyRCorner) + ${a}(wR)) / ${a}(uniforms.strides[0]);\n let wRPerm = uniforms.filter_dims.x - 1 - wR / uniforms.dilations.x;\n if (dyR < 0.0 || dyR >= ${a}(uniforms.Dy_shape[${h}]) || fract(dyR) > 0.0 ||\n wRPerm < 0) {\n continue;\n }\n let idyR: u32 = u32(dyR);\n\n for (var wC: u32 = 0; wC < uniforms.effective_filter_dims.y; wC = wC + 1) {\n if (wC % uniforms.dilations.y != 0) {\n continue;\n }\n let dyC = (${a}(dyCCorner) + ${a}(wC)) / ${a}(uniforms.strides.y);\n let wCPerm = uniforms.filter_dims.y - 1 - wC / uniforms.dilations.y;\n if (dyC < 0.0 || dyC >= ${a}(uniforms.Dy_shape[${d}]) ||\n fract(dyC) > 0.0 || wCPerm < 0) {\n continue;\n }\n let idyC: u32 = u32(dyC);\n var inputChannel = groupId * uniforms.input_channels_per_group;\n for (var d2: u32 = 0; d2 < uniforms.input_channels_per_group; d2 = d2 + 1) {\n let xValue = ${p?A.get("batch","idyR","idyC","inputChannel"):A.get("batch","inputChannel","idyR","idyC")};\n let wValue = ${S.get("inputChannel","wOutChannel","u32(wRPerm)","u32(wCPerm)")};\n dotProd = dotProd + xValue * wValue;\n inputChannel = inputChannel + 1;\n }\n }\n }\n let value = dotProd + ${o?"bias[d1]":`${a}(0.0)`};\n ${x.setByOffset("global_idx","value")};\n `;return`\n ${e.registerUniforms(c).declareVariables(...I,x)}\n ${_}\n\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")};\n ${u?E:P}}`},Lo=(e,t,r)=>{let o=e.length>2,i=t.outputShape,u=M.size(i),a=[Math.ceil(u/64),1,1];Ve("verbose",()=>`[conv2d_backprop_webgpu] dispatch = ${a}`);let c=t.format==="NHWC",p=["rank","rank"],h=[t.strides[0],t.strides[1]],d=[t.kernelShape[c?1:2],t.kernelShape[c?2:3]],y=[t.dilations[0],t.dilations[1]],w=[d[0]+(t.dilations[0]<=1?0:(t.kernelShape[c?1:2]-1)*(t.dilations[0]-1)),d[1]+(t.dilations[1]<=1?0:(t.kernelShape[c?2:3]-1)*(t.dilations[1]-1))],_=[w[0]-1-Math.floor((t.pads[0]+t.pads[2])/2),w[1]-1-Math.floor(t.pads[1]+t.pads[3])/2],v=!1,S=t.group,A=e[1].dims,I=A[0]/S,x=A[1],E=[{type:12,data:u},{type:12,data:h},{type:12,data:d},{type:12,data:y},{type:12,data:w},{type:6,data:_},{type:12,data:I},{type:12,data:x},...Z(e[0].dims,e[1].dims)];o&&(E.push(...Z(e[2].dims)),p.push("rank")),E.push(...Z(i));let P=a[1]===1&&a[2]===1,O=R=>{let L=[{name:"output_size",type:"u32"},{name:"strides",type:"u32",length:h.length},{name:"filter_dims",type:"u32",length:d.length},{name:"dilations",type:"u32",length:d.length},{name:"effective_filter_dims",type:"u32",length:w.length},{name:"pads",type:"i32",length:_.length},{name:"input_channels_per_group",type:"u32"},{name:"output_channels_per_group",type:"u32"}],N=De(e[0].dataType);return`${Ic(R,e,i,o,P,v,N,L,c)}`};return{name:"ConvTranspose2D",shaderCache:{hint:`${t.cacheKey};`,inputDependencies:p},getRunData:()=>({dispatchGroup:{x:a[0],y:a[1],z:a[2]},outputs:[{dims:r?r(i):i,dataType:e[0].dataType}],programUniforms:E}),getShaderSource:O}}});var Tc,Ec,Pc,su,uu,kc,Oc,Rc,Bc,du,lu=Y(()=>{"use strict";iu();au();Ft();Sr();Tc=(e,t,r,o,i,u)=>(e-1)*t+r+(o-1)*i+1-u,Ec=(e,t,r,o,i)=>{let u=Math.floor(e/2);t==="SAME_UPPER"?(r[o]=u,r[i]=e-u):t==="SAME_LOWER"&&(r[o]=e-u,r[i]=u)},Pc=(e,t,r,o,i,u,a,c,p,h)=>{let d=e.length-2,y=h.length===0;if(p.length===0)for(let v=0;v{let r=e.kernelShape.slice();if(e.kernelShape.length===0||e.kernelShape.reduce((y,w)=>y*w,1)===0){r.length=0;for(let y=2;yy+w,0)===0){let y=t[0].dims.length-2;p=new Array(y).fill(1)}let h=e.strides.slice();if(h.reduce((y,w)=>y+w,0)===0){let y=t[0].dims.length-2;h=new Array(y).fill(1)}Pc(c,r,p,e.autoPad,e.group,i,h,o,a,u);let d=Object.assign({},e);return Object.assign(d,{kernelShape:r,pads:i,outputPadding:a,outputShape:u,dilations:p,strides:h}),d},uu=e=>{let t=Bn(e),r=e.format,o=["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][typeof e.autoPad>"u"?0:e.autoPad],i=e.dilations,u=e.group,a=e.kernelShape,c=e.pads,p=e.strides,h=e.wIsConst(),d=e.outputPadding,y=e.outputShape;return{autoPad:o,format:r,dilations:i,group:u,kernelShape:a,outputPadding:d,outputShape:y,pads:c,strides:p,wIsConst:h,...t,cacheKey:`${e.format};${t.activation};`}},kc=(e,t)=>{if(!e||e.length!==2&&e.length!==3)throw new Error("Conv requires 2 or 3 inputs");if(e[0].dims.length!==4&&e[0].dims.length!==3)throw new Error("currently only support 2-dimensional conv");if(e[0].dims.length!==e[1].dims.length)throw new Error("filter does not have same dimension as input");let r=e[0].dims[t.format==="NHWC"?e[0].dims.length-1:1],o=e[1].dims[0];if(r!==o)throw new Error("FILTER_IN_CHANNEL should be equal to DATA_CHANNEL");let i=e[1].dims[1]*t.group;if(e.length===3&&(e[2].dims.length!==1||e[2].dims[0]!==i))throw new Error("invalid bias");let u=e[0].dims.length-2;if(t.dilations.reduce((d,y)=>d+y,0)>0&&t.dilations.length!==u)throw new Error(`dilations should be ${u}D`);if(t.strides.reduce((d,y)=>d+y,0)>0&&t.strides.length!==u)throw new Error(`strides should be ${u}D`);if(t.pads.reduce((d,y)=>d+y,0)>0&&t.pads.length!==u*2)throw new Error(`pads should be ${u*2}D`);if(t.outputPadding.length!==u&&t.outputPadding.length!==0)throw new Error(`output_padding should be ${u}D`);if(t.kernelShape.reduce((d,y)=>d+y,0)>0&&t.kernelShape.length!==0&&t.kernelShape.length!==e[1].dims.length-2)throw new Error("invalid kernel shape");if(t.outputShape.length!==0&&t.outputShape.length!==e[0].dims.length-2)throw new Error("invalid output shape")},Oc=[2,3,1,0],Rc=(e,t,r)=>{let o=su(r,t),i=r.format==="NHWC",u=o.outputShape,a=u[i?3:1],c=t[0].dims[i?3:1];if(o.group!==1||a===1&&c===1){e.compute(Lo(t,o));return}let p=u[i?1:2],h=u[i?2:3],d=t[1].dims[2],y=t[1].dims[3],w=i?p*h:a,_=i?a:p*h,v=d*y*c,S=!0,A=e.kernelCustomData.wT??e.compute(yt(t[1],Oc),{inputs:[1],outputs:[r.wIsConst?-2:-1]})[0];r.wIsConst&&!e.kernelCustomData.wT&&(e.kernelCustomData.wT=A);let I=[t[0],A],x=t.length===3;x&&(!i&&t[2].dims.length===1?I.push(t[2].reshape([t[2].dims[0],1,1])):I.push(t[2])),e.compute(ou(I,o,u,w,_,v,x,S),{inputs:I})},Bc=(e,t)=>{let r=t.format==="NHWC",o=[e.inputs[0].reshape(r?[e.inputs[0].dims[0],1,e.inputs[0].dims[1],e.inputs[0].dims[2]]:[e.inputs[0].dims[0],e.inputs[0].dims[1],1,e.inputs[0].dims[2]]),e.inputs[1].reshape([e.inputs[1].dims[0],e.inputs[1].dims[1],1,e.inputs[1].dims[2]])];e.inputs.length===3&&o.push(e.inputs[2]);let i=t.kernelShape;(i.length===0||i[0]===0)&&(i=[e.inputs[1].dims[2]]);let u=t.dilations;(u.length===0||u[0]===0)&&(u=[1]);let a=t.strides;(a.length===0||a[0]===0)&&(a=[1]);let c=t.pads;c.length===0&&(c=[0,0]),c=[0,c[0],0,c[1]],a=[1].concat(a),u=[1].concat(u),i=[1].concat(i);let p=su({...t,pads:c,strides:a,dilations:u,kernelShape:i},o);e.compute(Lo(o,p,h=>r?[h[0],h[2],h[3]]:[h[0],h[1],h[3]]))},du=(e,t)=>{kc(e.inputs,t),e.inputs[0].dims.length===3?Bc(e,t):Rc(e,e.inputs,t)}});var Dc,cu,pu,mu=Y(()=>{"use strict";ye();Se();Ze();_e();Dc=(e,t,r,o)=>{let i=M.size(t),u=t.length,a=U("input",e,u),c=j("output",e,u),p=r.dataType===6?r.getInt32Array()[0]:Number(r.getBigInt64Array()[0]),h=M.normalizeAxis(p,u),d=y=>{let w=` i32(${a.indicesGet("inputIndices","uniforms.axis")}) `,_=fe("uniforms.input_shape","uniforms.axis",u),v=o.reverse?w+(o.exclusive?" + 1":""):"0",S=o.reverse?_:w+(o.exclusive?"":" + 1");return`\n ${y.registerUniform("outputSize","u32").registerUniform("axis","u32").declareVariables(a,c)}\n ${y.mainStart()}\n ${y.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n var inputIndices = ${c.offsetToIndices("global_idx")};\n var sum = ${c.type.value}(0);\n let first : i32 = ${v};\n let last : i32 = ${S};\n for (var i : i32 = first; i < last; i++) {\n ${a.indicesSet("inputIndices","uniforms.axis","u32(i)")};\n sum = sum + ${a.getByIndices("inputIndices")};\n }\n ${c.setByOffset("global_idx","sum")};\n }`};return{name:"CumSum",shaderCache:{hint:o.cacheKey,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:t,dataType:e}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:[{type:12,data:i},{type:12,data:h},...Z(t,t)]}),getShaderSource:d}},cu=(e,t)=>{let r=e.inputs[0].dims,o=e.inputs[0].dataType,i=e.inputs[1];e.compute(Dc(o,r,i,t),{inputs:[0]})},pu=e=>{let t=e.exclusive===1,r=e.reverse===1;return ve({exclusive:t,reverse:r})}});var zc,Mc,Uc,fu,hu,gu=Y(()=>{"use strict";ye();Se();Ze();_e();zc=e=>{if(!e||e.length!==1)throw new Error("DepthToSpace requires 1 input.");if(e[0].dims.length!==4)throw new Error("DepthToSpace requires 4D input.")},Mc=(e,t,r,o)=>{let i=[];i.push(`fn perm(i: ${o.type.indices}) -> ${r.type.indices} {\n var a: ${r.type.indices};`);for(let u=0;u{let r,o,i,u,a,c,p=t.format==="NHWC",h=t.blocksize,d=t.mode==="DCR";p?([r,o,i,u]=e.dims,a=d?[r,o,i,h,h,u/h**2]:[r,o,i,u/h**2,h,h],c=d?[0,1,3,2,4,5]:[0,1,4,2,5,3]):([r,o,i,u]=[e.dims[0],e.dims[2],e.dims[3],e.dims[1]],a=d?[r,h,h,u/h**2,o,i]:[r,u/h**2,h,h,o,i],c=d?[0,3,4,1,5,2]:[0,1,4,2,5,3]);let y=e.reshape(a),w=y.dims.length,_=e.dataType,v=U("a",_,w),S=j("output",_,w),A=I=>`\n ${I.registerUniform("output_size","u32").declareVariables(v,S)}\n\n ${Mc(c,w,v,S)}\n\n ${I.mainStart()}\n ${I.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n\n let indices = ${S.offsetToIndices("global_idx")};\n let aIndices = perm(indices);\n\n ${S.setByOffset("global_idx",v.getByIndices("aIndices"))}\n }`;return{name:"DepthToSpace",shaderCache:{hint:`${e.dims};${t.blocksize};${t.mode}`,inputDependencies:["rank"]},getRunData:I=>{let x=p?[r,o*h,i*h,u/h**2]:[r,u/h**2,o*h,i*h],E=M.size(x),P=y.dims,O=M.sortBasedOnPerm(P,c);return{outputs:[{dims:x,dataType:I[0].dataType}],dispatchGroup:{x:Math.ceil(E/64)},programUniforms:[{type:12,data:E},...Z(P,O)]}},getShaderSource:A}},fu=(e,t)=>{zc(e.inputs),e.compute(Uc(e.inputs[0],t))},hu=e=>ve({blocksize:e.blocksize,mode:e.mode,format:e.format})});var Fo,Wn,yu,Vc,Wc,qo,jo,bu,Nc,wu,vu,$u=Y(()=>{"use strict";ye();Se();Ze();_e();Fo="[a-zA-Z]|\\\\.\\\\.\\\\.",Wn="("+Fo+")+",yu="^"+Wn+"$",Vc="("+Wn+",)*"+Wn,Wc="^"+Vc+"$",qo=class{constructor(t=-1){this.symbolToIndices=new Map,this.inputIndex=t}addSymbol(t,r){let o=this.symbolToIndices.get(t);o===void 0?o=[r]:o.push(r),this.symbolToIndices.set(t,o)}},jo=class{constructor(t,r){this.equation=r;this.hasEllipsis=!1,this.symbolToInfo=new Map,this.lhs=new Array,this.outputDims=[];let[o,i]=r.includes("->")?r.split("->",2):[r,""];if(!o.match(RegExp(Wc)))throw new Error("Invalid LHS term");if(o.split(",").forEach((c,p)=>{let h=t[p].dims.slice();if(!c.match(RegExp(yu)))throw new Error("Invalid LHS term");let d=this.processTerm(c,!0,h,p);this.lhs.push(d)}),i==="")i+=[...this.symbolToInfo.entries()].filter(([c,p])=>p.count===1||c==="...").map(([c])=>c).join("");else if(!i.match(RegExp(Wn)))throw new Error("Invalid RHS");i.match(RegExp(Fo,"g"))?.forEach(c=>{if(c==="...")this.outputDims=this.outputDims.concat(this.ellipsisDims);else{let p=this.symbolToInfo.get(c);if(p===void 0)throw new Error("Invalid RHS symbol");this.outputDims.push(p.dimValue)}}),this.rhs=this.processTerm(i,!1,this.outputDims)}addSymbol(t,r,o){let i=this.symbolToInfo.get(t);if(i!==void 0){if(i.dimValue!==r&&i.count!==1)throw new Error("Dimension mismatch");i.count++,i.inputIndices.push(o)}else i={count:1,dimValue:r,inputIndices:[o]};this.symbolToInfo.set(t,i)}processTerm(t,r,o,i=-1){let u=o.length,a=!1,c=[],p=0;if(!t.match(RegExp(yu))&&!r&&t!=="")throw new Error("Invalid LHS term");let h=t.match(RegExp(Fo,"g")),d=new qo(i);return h?.forEach((y,w)=>{if(y==="..."){if(a)throw new Error("Only one ellipsis is allowed per input term");a=!0;let _=u-h.length+1;if(_<0)throw new Error("Ellipsis out of bounds");if(c=o.slice(p,p+_),this.hasEllipsis){if(this.ellipsisDims.length!==c.length||this.ellipsisDims.toString()!==c.toString())throw new Error("Ellipsis dimensions mismatch")}else if(r)this.hasEllipsis=!0,this.ellipsisDims=c;else throw new Error("Ellipsis must be specified in the LHS");for(let v=0;ve+"_max",Nc=(e,t,r,o)=>{let u=e.map(d=>d.length).map((d,y)=>U(`input${y}`,t,d)),a=M.size(o),c=j("output",t,o.length),p=[...r.symbolToInfo.keys()].filter(d=>!r.rhs.symbolToIndices.has(d)),h=d=>{let y=[],w="var prod = 1.0;",_="var sum = 0.0;",v="sum += prod;",S=[],A=[],I=[],x=[],E=r.symbolToInfo.size===r.rhs.symbolToIndices.size;r.symbolToInfo.forEach((O,R)=>{if(r.rhs.symbolToIndices.has(R)){let L=r.rhs.symbolToIndices.get(R)?.[0];L!==void 0&&r.lhs.forEach((N,K)=>{if(O.inputIndices.includes(K)){let Q=N.symbolToIndices.get(R);if(Q===void 0)throw new Error("Invalid symbol error");Q.forEach(he=>{y.push(`${u[K].indicesSet(`input${K}Indices`,he,c.indicesGet("outputIndices",L))}`)})}})}else r.lhs.forEach((L,N)=>{if(O.inputIndices.includes(N)){let K=L.symbolToIndices.get(R);if(K===void 0)throw new Error("Invalid symbol error");K.forEach(Q=>{S.push(`${u[N].indicesSet(`input${N}Indices`,Q,`${R}`)}`)}),x.push(`prod *= ${u[N].getByIndices(`input${N}Indices`)};`)}}),A.push(`for(var ${R}: u32 = 0; ${R} < uniforms.${bu(R)}; ${R}++) {`),I.push("}")});let P=E?[...y,`let sum = ${u.map((O,R)=>O.getByIndices(`input${R}Indices`)).join(" * ")};`]:[...y,_,...A,...S,w,...x,v,...I];return`\n ${d.registerUniforms(p.map(O=>({name:`${bu(O)}`,type:"u32"}))).registerUniform("outputSize","u32").declareVariables(...u,c)}\n\n ${d.mainStart()}\n ${d.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n var outputIndices = ${c.offsetToIndices("global_idx")};\n ${u.map((O,R)=>`var input${R}Indices: ${u[R].type.indices};`).join(`\n`)}\n ${P.join(`\n`)};\n ${c.setByOffset("global_idx","sum")};\n }`};return{name:"Einsum",shaderCache:{hint:r.equation,inputDependencies:e.map(()=>"rank")},getRunData:()=>{let d=p.filter(w=>r.symbolToInfo.has(w)).map(w=>({type:12,data:r.symbolToInfo.get(w)?.dimValue||0}));d.push({type:12,data:a});let y=e.map((w,_)=>[...Z(w)]).reduce((w,_)=>w.concat(_),d);return y.push(...Z(o)),{outputs:[{dims:o,dataType:t}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:y}},getShaderSource:h}},wu=(e,t)=>{let r=new jo(e.inputs,t.equation),o=r.outputDims,i=e.inputs.map((u,a)=>u.dims);e.compute(Nc(i,e.inputs[0].dataType,r,o))},vu=e=>{let t=e.equation.replace(/\\s+/g,"");return ve({equation:t})}});var Gc,_u,Hc,Lc,Su,xu=Y(()=>{"use strict";ye();Se();_e();Gc=e=>{if(!e||e.length!==2)throw new Error("Expand requires 2 input.");let t=e[0].dims,r=Array.from(e[1].getBigInt64Array(),Number),o=r.length{let r=e.length-t.length,o=[];for(let i=0;ie.length>t.length?_u(e,t):_u(t,e),Lc=e=>{let t=e[0].dims,r=Array.from(e[1].getBigInt64Array(),Number),o=Hc(t,r),i=e[0].dataType,u=i===9?4:1,a=Math.ceil(M.size(o)/u),c=h=>{let d=U("input",i,t.length,u),y=j("output",i,o.length,u),w;if(i===9){let _=(v,S,A="")=>`\n let outputIndices${S} = ${y.offsetToIndices(`outputOffset + ${S}u`)};\n let offset${S} = ${d.broadcastedIndicesToOffset(`outputIndices${S}`,y)};\n let index${S} = offset${S} / 4u;\n let component${S} = offset${S} % 4u;\n ${v}[${S}] = ${A}(${d.getByOffset(`index${S}`)}[component${S}]);\n `;w=`\n let outputOffset = global_idx * ${u};\n var data = vec4(0);\n ${_("data",0,"u32")}\n ${_("data",1,"u32")}\n ${_("data",2,"u32")}\n ${_("data",3,"u32")}\n ${y.setByOffset("global_idx","data")}\n }`}else w=`\n let outputIndices = ${y.offsetToIndices("global_idx")};\n let inputOffset = ${d.broadcastedIndicesToOffset("outputIndices",y)};\n ${y.setByOffset("global_idx",d.getByOffset("inputOffset"))}\n }`;return`\n ${h.registerUniform("vec_size","u32").declareVariables(d,y)}\n ${h.mainStart()}\n ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")}\n ${w}`},p=[{type:12,data:a},...Z(t,o)];return{name:"Expand",shaderCache:{hint:`${o.length}`,inputDependencies:["rank"]},getShaderSource:c,getRunData:()=>({outputs:[{dims:o,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:p})}},Su=e=>{Gc(e.inputs),e.compute(Lc(e.inputs),{inputs:[0]})}});var Fc,Cu,Au=Y(()=>{"use strict";ye();Se();_e();Rn();Fc=e=>{let t=e[0].dataType,r=M.size(e[0].dims),o=M.size(e[1].dims),i=o%4===0,u=a=>{let c=U("x",t,[1],4),p=U("bias",t,[1],4),h=j("y",t,[1],4),d=[{name:"output_vec_size",type:"u32"},{name:"bias_size",type:"u32"}],y=_=>`\n let bias${_}_offset: u32 = (global_idx * 4 + ${_}) % uniforms.bias_size;\n let bias${_} = ${p.getByOffset(`bias${_}_offset / 4`)}[bias${_}_offset % 4];`,w=i?`\n let bias = ${p.getByOffset("global_idx % (uniforms.bias_size / 4)")};`:`${y(0)}${y(1)}${y(2)}${y(3)}\n let bias = ${c.type.value}(bias0, bias1, bias2, bias3);`;return`${a.registerUniforms(d).declareVariables(c,p,h)}\n\n ${Bo(et(t))}\n\n ${a.mainStart(or)}\n ${a.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_vec_size")}\n\n let x = ${c.getByOffset("global_idx")};\n ${w}\n let x_in = x + bias;\n ${h.setByOffset("global_idx",Do("x_in"))}\n }`};return{name:"FastGeluWithBias",shaderCache:{hint:`${i}`,inputDependencies:["type","type"]},getShaderSource:u,getRunData:a=>({outputs:[{dims:a[0].dims,dataType:a[0].dataType}],programUniforms:[{type:12,data:Math.ceil(r/4)},{type:12,data:o}],dispatchGroup:{x:Math.ceil(r/or/4)}})}},Cu=e=>{e.inputs.length<2||M.size(e.inputs[1].dims)===0?Bs(e):e.compute(Fc(e.inputs))}});var qc,jc,Iu,Tu,Eu=Y(()=>{"use strict";ye();Se();Ze();_e();qc=e=>{if(!e||e.length!==2)throw new Error("Gather requires 2 inputs.")},jc=(e,t)=>{let r=e[0].dims,o=e[1].dims,i=r.length,u=M.normalizeAxis(t.axis,i),a=r.slice(0);a.splice(u,1,...o);let c=r[u],p=e[0].dataType===9?4:1,h=Math.ceil(M.size(a)/p),d=[{type:12,data:h},{type:6,data:c},{type:12,data:u},...Z(e[0].dims,e[1].dims,a)],y=w=>{let _=U("data",e[0].dataType,e[0].dims.length,p),v=U("inputIndices",e[1].dataType,e[1].dims.length),S=j("output",e[0].dataType,a.length,p),A=x=>{let E=o.length,P=`var indicesIndices${x} = ${v.type.indices}(0);`;for(let O=0;O1?`indicesIndices${x}[${O}]`:`indicesIndices${x}`} = ${a.length>1?`outputIndices${x}[uniforms.axis + ${O}]`:`outputIndices${x}`};`;P+=`\n var idx${x} = ${v.getByIndices(`indicesIndices${x}`)};\n if (idx${x} < 0) {\n idx${x} = idx${x} + uniforms.axisDimLimit;\n }\n var dataIndices${x} : ${_.type.indices};\n `;for(let O=0,R=0;O1?`dataIndices${x}[${O}]`:`dataIndices${x}`} = u32(idx${x});`,R+=E):(P+=`${i>1?`dataIndices${x}[${O}]`:`dataIndices${x}`} = ${a.length>1?`outputIndices${x}[${R}]`:`outputIndices${x}`};`,R++);return P},I;if(e[0].dataType===9){let x=(E,P,O="")=>`\n let outputIndices${P} = ${S.offsetToIndices(`outputOffset + ${P}u`)};\n ${A(P)};\n let offset${P} = ${_.indicesToOffset(`dataIndices${P}`)};\n let index${P} = offset${P} / 4u;\n let component${P} = offset${P} % 4u;\n ${E}[${P}] = ${O}(${_.getByOffset(`index${P}`)}[component${P}]);\n `;I=`\n let outputOffset = global_idx * ${p};\n var value = vec4(0);\n ${x("value",0,"u32")}\n ${x("value",1,"u32")}\n ${x("value",2,"u32")}\n ${x("value",3,"u32")}\n ${S.setByOffset("global_idx","value")}\n `}else I=`\n let outputIndices = ${S.offsetToIndices("global_idx")};\n ${A("")};\n let value = ${_.getByIndices("dataIndices")};\n ${S.setByOffset("global_idx","value")};\n `;return`\n ${w.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(_,v,S)}\n ${w.mainStart()}\n ${w.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n ${I}\n }`};return{name:"Gather",shaderCache:{hint:t.cacheKey,inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:a,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(h/64)},programUniforms:d}),getShaderSource:y}},Iu=e=>ve({axis:e.axis}),Tu=(e,t)=>{let r=e.inputs;qc(r),e.compute(jc(e.inputs,t))}});var Kc,Yc,Pu,ku,Ou=Y(()=>{"use strict";ye();Se();Ze();_e();Kc=e=>{if(!e||e.length!==2)throw new Error("GatherElements requires 2 inputs.");if(e[0].dims.length<1)throw new Error("GatherElements requires that the data input be rank >= 1.");if(e[0].dims.length!==e[1].dims.length)throw new Error(`GatherElements requires that the data input and\n indices input tensors be of same rank.`)},Yc=(e,t)=>{let r=e[0].dims,o=e[0].dataType,i=r.length,u=e[1].dims,a=e[1].dataType,c=M.normalizeAxis(t.axis,i),p=r[c],h=u.slice(0),d=M.size(h),y=U("input",o,i),w=U("indicesInput",a,u.length),_=j("output",o,h.length),v=[{type:12,data:d},{type:6,data:p},{type:12,data:c}];return v.push(...Z(r,u,h)),{name:"GatherElements",shaderCache:{inputDependencies:["rank","rank"]},getRunData:()=>({outputs:[{dims:h,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(d/64)},programUniforms:v}),getShaderSource:I=>`\n ${I.registerUniform("outputSize","u32").registerUniform("axisDimLimit","i32").registerUniform("axis","u32").declareVariables(y,w,_)}\n ${I.mainStart()}\n ${I.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n\n let outputIndices = ${_.offsetToIndices("global_idx")};\n\n var idx = ${w.getByOffset("global_idx")};\n if (idx < 0) {\n idx = idx + uniforms.axisDimLimit;\n }\n var inputIndices = ${y.type.indices}(outputIndices);\n ${y.indicesSet("inputIndices","uniforms.axis","u32(idx)")};\n let value = ${y.getByIndices("inputIndices")};\n\n ${_.setByOffset("global_idx","value")};\n }`}},Pu=e=>ve({axis:e.axis}),ku=(e,t)=>{let r=e.inputs;Kc(r),e.compute(Yc(e.inputs,t))}});var Zc,Xc,Ru,Bu,Du=Y(()=>{"use strict";ye();Se();_e();Zc=e=>{if(!e)throw new Error("Input is missing");if(e.length<2||e.length>3)throw new Error("Invaid input number.");if(e.length===3&&e[2].dims.length>2)throw new Error("Invalid input shape of C");if(e[0].dataType!==e[1].dataType||e.length===3&&e[0].dataType!==e[2].dataType)throw new Error("Input types are mismatched")},Xc=(e,t)=>{let r=e[0].dims.slice(),o=e[1].dims.slice(),[i,u,a]=Sn.getShapeOfGemmResult(r,t.transA,o,t.transB,e.length===3?e[2].dims:void 0),c=[i,u];if(!c)throw new Error("Can\'t use gemm on the given tensors");let p=M.size(c),h=[{type:12,data:p},{type:12,data:i},{type:12,data:u},{type:12,data:a},{type:1,data:t.alpha},{type:1,data:t.beta}],d=["type","type"];e.length===3&&(h.push(...Z(e[2].dims)),d.push("rank")),h.push(...Z(c));let y=w=>{let _="";t.transA&&t.transB?_="value += a[k * uniforms.M + m] * b[n * uniforms.K + k];":t.transA&&!t.transB?_="value += a[k * uniforms.M + m] * b[k * uniforms.N + n];":!t.transA&&t.transB?_="value += a[m * uniforms.K + k] * b[n * uniforms.K + k];":!t.transA&&!t.transB&&(_="value += a[m * uniforms.K + k] * b[k * uniforms.N + n];");let v=t.alpha===1?"":"value *= uniforms.alpha;",S=U("a",e[0].dataType,e[0].dims),A=U("b",e[1].dataType,e[1].dims),I=S.type.value,x=null,E=[S,A];e.length===3&&(x=U("c",e[2].dataType,e[2].dims.length),E.push(x));let P=j("output",e[0].dataType,c.length);E.push(P);let O=[{name:"output_size",type:"u32"},{name:"M",type:"u32"},{name:"N",type:"u32"},{name:"K",type:"u32"},{name:"alpha",type:"f32"},{name:"beta",type:"f32"}];return`\n ${w.registerUniforms(O).declareVariables(...E)}\n\n ${w.mainStart()}\n ${w.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n\n let m = global_idx / uniforms.N;\n let n = global_idx % uniforms.N;\n\n var value = ${I}(0);\n for (var k: u32 = 0u; k < uniforms.K; k++) {\n ${_}\n }\n\n ${v}\n ${(()=>x!=null?`let cOffset = ${x.broadcastedIndicesToOffset("vec2(m, n)",P)}; value += ${I}(uniforms.beta) * ${x.getByOffset("cOffset")};`:"")()}\n output[global_idx] = value;\n }`};return{name:"Gemm",shaderCache:{hint:`${t.cacheKey}`,inputDependencies:d},getRunData:()=>({outputs:[{dims:c,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:h}),getShaderSource:y}},Ru=e=>{let t=e.transA,r=e.transB,o=e.alpha,i=e.beta;return{transA:t,transB:r,alpha:o,beta:i,cacheKey:`${e.transA};${e.transB};${e.alpha===1}`}},Bu=(e,t)=>{Zc(e.inputs),e.compute(Xc(e.inputs,t))}});var Qc,Jc,ep,zu,Mu=Y(()=>{"use strict";ye();Se();_e();Qc=(e,t)=>{let r=e[0].dims,o=r,i=2,u=M.sizeToDimension(r,i),a=M.sizeFromDimension(r,i),c=Me(a),p=a/c,h=[r[0],r[1],p],d=["rank","type","type"],y=[{type:12,data:a},{type:12,data:p}];y.push(...Z(h,h));let w=_=>{let v=U("x",e[0].dataType,h.length,c),S=U("scale",e[1].dataType,e[1].dims),A=U("bias",e[2].dataType,e[2].dims),I=j("output",e[0].dataType,h.length,c),x=[v,S,A,I],E=v.type.value,P=c===1?"f32":`vec${c}`,O=64,R=[{name:"normSize",type:"u32"},{name:"normPackedSize",type:"u32"}];return`\n var meanShared : f32;\n var squaredNormShared : f32;\n var workgroupShared : array<${P}, ${O}>;\n const workgroupSize = ${O}u;\n ${_.registerUniforms(R).declareVariables(...x)}\n ${_.mainStart(O)}\n let norm = global_idx / workgroupSize;\n let batch = norm / uniforms.x_shape[1];\n let channel = norm % uniforms.x_shape[1];\n let localIndex = local_id.x;\n\n // initialize workgroup memory\n var initial = ${P}(0);\n for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) {\n initial = initial + ${P}(${v.get("batch","channel","h")});\n }\n workgroupShared[localIndex] = initial;\n workgroupBarrier();\n\n // Calculate the mean of current channel data.\n for (var currSize = workgroupSize >> 1; currSize > 0; currSize = currSize >> 1) {\n if (localIndex < currSize) {\n workgroupShared[localIndex] = workgroupShared[localIndex] + workgroupShared[localIndex + currSize];\n }\n workgroupBarrier();\n }\n if (localIndex == 0) {\n meanShared = ${_t("workgroupShared[0]",c)} / f32(uniforms.normSize);\n }\n workgroupBarrier();\n\n // reinitialize workgroup memory.\n initial = ${P}(0);\n for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) {\n let deviation = ${P}(${v.get("batch","channel","h")}) - ${P}(meanShared);\n initial = initial + deviation * deviation;\n }\n workgroupShared[localIndex] = initial;\n workgroupBarrier();\n\n // Calculate the sum of square of deviation of current channel data.\n for (var currSize = workgroupSize >> 1; currSize > 0; currSize = currSize >> 1) {\n if (localIndex < currSize) {\n workgroupShared[localIndex] = workgroupShared[localIndex] + workgroupShared[localIndex + currSize];\n }\n workgroupBarrier();\n }\n if (localIndex == 0) {\n squaredNormShared = ${_t("workgroupShared[0]",c)};\n }\n workgroupBarrier();\n\n let invStdDev = inverseSqrt(squaredNormShared / f32(uniforms.normSize) + f32(${t.epsilon}));\n let channelScale = invStdDev * f32(${S.getByOffset("channel")});\n let channelShift = f32(${A.getByOffset("channel")}) - meanShared * channelScale;\n for (var h = localIndex; h < uniforms.normPackedSize; h += workgroupSize) {\n let value = ${v.get("batch","channel","h")} * ${E}(${P}(channelScale)) + ${E}(${P}(channelShift));\n ${I.set("batch","channel","h","value")};\n }\n }`};return{name:"InstanceNormalization",shaderCache:{hint:`${t.epsilon};${c}`,inputDependencies:d},getRunData:()=>({outputs:[{dims:o,dataType:e[0].dataType}],dispatchGroup:{x:u},programUniforms:y}),getShaderSource:w}},Jc=(e,t,r,o,i,u,a,c)=>{let p=Me(a),h=64,d=p===1?"vec2f":`mat2x${p}f`,y=p===1?"f32":`vec${p}f`,w=(R,L)=>`${d}(${R}, ${L})`,_=i*a/p,v=Math.ceil(u/h),S=["type"],A=[{type:12,data:v},{type:12,data:u},{type:12,data:Math.floor(a/p)},{type:12,data:Math.floor(u*a/p)}],I=R=>{let L=U("input",t.dataType,t.dims,p);return`\n ${R.declareVariables(L)}\n @group(0) @binding(1) var output : array<${d}>;\n struct Uniforms {wg_size:u32, H:u32, C:u32, image_size:u32};\n @group(0) @binding(2) var uniforms: Uniforms;\n\n ${R.mainStart(h)}\n let currentImageNumber = global_idx / ${h} / uniforms.C;\n let currentChannelNumber = (global_idx / ${h}) % uniforms.C;\n let wgOffset = local_id.x * uniforms.wg_size;\n if (wgOffset >= uniforms.H) {\n return;\n }\n let wgMax = min(wgOffset + uniforms.wg_size, uniforms.H);\n\n let offset = currentImageNumber * uniforms.image_size + currentChannelNumber;\n var sum = ${$t("f32",p)};\n var squaredSum = ${$t("f32",p)};\n for (var i: u32 = wgOffset; i < wgMax; i++) {\n let value = ${y}(input[offset + i * uniforms.C]);\n sum += value;\n squaredSum += value * value;\n }\n output[global_idx] = ${w("sum","squaredSum")};\n }`},x=e.compute({name:"InstanceNormComputeMean",shaderCache:{hint:`${p}`,inputDependencies:S},getRunData:()=>({outputs:[{dims:[i,a,h,2],dataType:1}],dispatchGroup:{x:i*a/p},programUniforms:A}),getShaderSource:I},{inputs:[t],outputs:[-1]})[0],E=[{type:12,data:_},{type:12,data:u},{type:12,data:Math.floor(a/p)},{type:12,data:Math.floor(h*a/p)}],P=["type","type","type"],O=R=>{let L=U("scale",r.dataType,r.dims,p),N=U("bias",o.dataType,o.dims,p);return`\n @group(0) @binding(0) var input : array<${d}>;\n @group(0) @binding(1) var scale : array<${L.type.storage}>;\n @group(0) @binding(2) var bias : array<${N.type.storage}>;\n @group(0) @binding(3) var output : array<${d}>;\n struct Uniforms {units_of_work : u32, H: u32, C : u32, image_size : u32};\n @group(0) @binding(4) var uniforms: Uniforms;\n\n ${R.mainStart()}\n ${R.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.units_of_work")}\n let currentImageNumber = global_idx / uniforms.C;\n let currentChannelNumber = global_idx % uniforms.C;\n\n let offset = currentImageNumber * uniforms.image_size;\n var sum = ${$t("f32",p)};\n var squaredSum = ${$t("f32",p)};\n for (var i: u32 = 0; i < min(${h}, uniforms.H); i++) {\n let value = input[offset + i + currentChannelNumber * ${h}];\n sum += value[0];\n squaredSum += value[1];\n }\n sum = sum / f32(uniforms.H);\n squaredSum = squaredSum / f32(uniforms.H);\n let invStdDev = inverseSqrt(squaredSum - sum * sum + f32(${c}));\n let channelScale = invStdDev * ${y}(scale[currentChannelNumber]);\n let channelShift = ${y}(bias[currentChannelNumber]) - sum * channelScale;\n\n output[global_idx] = ${w("channelScale","channelShift")};\n }`};return e.compute({name:"InstanceNormComputeChannelScaleShift",shaderCache:{hint:`${p};${c}`,inputDependencies:P},getRunData:()=>({outputs:[{dims:[i,a,2],dataType:1}],dispatchGroup:{x:Math.ceil(_/64)},programUniforms:E}),getShaderSource:O},{inputs:[x,r,o],outputs:[-1]})[0]},ep=(e,t,r)=>{let o=t[0].dims,i=o,u=o[0],a=o[o.length-1],c=M.sizeFromDimension(o,1)/a,p=Me(a),h=M.size(i)/p,d=[{type:12,data:c},{type:12,data:Math.floor(a/p)}],y=["type","type"],w=Jc(e,t[0],t[1],t[2],u,c,a,r.epsilon),_=v=>{let S=De(t[0].dataType),A=p===1?"vec2f":`mat2x${p}f`,I=p===1?S:`vec${p}<${S}>`,x=U("input",t[0].dataType,t[0].dims,p),E=j("output",t[0].dataType,i,p);return`\n @group(0) @binding(0) var input : array<${x.type.storage}>;\n @group(0) @binding(1) var scaleInput : array<${A}>;\n @group(0) @binding(2) var output : array<${E.type.storage}>;\n struct Uniforms {H: u32, C : u32};\n @group(0) @binding(3) var uniforms: Uniforms;\n\n ${v.mainStart()}\n let currentImageNumber = global_idx / (uniforms.C * uniforms.H);\n let currentChannelNumber = global_idx % uniforms.C;\n\n let scaleOffset = currentImageNumber * uniforms.C + currentChannelNumber;\n let scale = scaleInput[scaleOffset];\n output[global_idx] = fma(input[global_idx], ${I}(scale[0]), ${I}(scale[1]));\n }`};e.compute({name:"InstanceNormalizationNHWC",shaderCache:{hint:`${p}`,inputDependencies:y},getRunData:()=>({outputs:[{dims:i,dataType:t[0].dataType}],dispatchGroup:{x:Math.ceil(h/64)},programUniforms:d}),getShaderSource:_},{inputs:[t[0],w]})},zu=(e,t)=>{t.format==="NHWC"?ep(e,e.inputs,t):e.compute(Qc(e.inputs,t))}});var tp,rp,Uu,Vu=Y(()=>{"use strict";ye();Se();_e();tp=e=>{if(!e||e.length<2)throw new Error("layerNorm requires at least 2 inputs.")},rp=(e,t,r)=>{let o=t.simplified,i=e[0].dims,u=e[1],a=!o&&e[2],c=i,p=M.normalizeAxis(t.axis,i.length),h=M.sizeToDimension(i,p),d=M.sizeFromDimension(i,p),y=M.size(u.dims),w=a?M.size(a.dims):0;if(y!==d||a&&w!==d)throw new Error(`Size of X.shape()[axis:] == ${d}.\n Size of scale and bias (if provided) must match this.\n Got scale size of ${y} and bias size of ${w}`);let _=[];for(let O=0;O1,x=r>2,E=O=>{let R=De(e[0].dataType),L=[U("x",e[0].dataType,e[0].dims,v),U("scale",u.dataType,u.dims,v)];a&&L.push(U("bias",a.dataType,a.dims,v)),L.push(j("output",e[0].dataType,c,v)),I&&L.push(j("mean_data_output",1,_)),x&&L.push(j("inv_std_output",1,_));let N=[{name:"norm_count",type:"u32"},{name:"norm_size",type:"f32"},{name:"norm_size_vectorized",type:"u32"},{name:"epsilon",type:"f32"}];return`\n ${O.registerUniforms(N).declareVariables(...L)}\n ${O.mainStart()}\n ${O.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.norm_count")}\n let offset = global_idx * uniforms.norm_size_vectorized;\n var mean_vector = ${$t("f32",v)};\n var mean_square_vector = ${$t("f32",v)};\n\n for (var h: u32 = 0u; h < uniforms.norm_size_vectorized; h++) {\n let value = ${ir(R,v,"x[h + offset]")};\n mean_vector += value;\n mean_square_vector += value * value;\n }\n let mean = ${_t("mean_vector",v)} / uniforms.norm_size;\n let inv_std_dev = inverseSqrt(${_t("mean_square_vector",v)} / uniforms.norm_size ${o?"":"- mean * mean"} + uniforms.epsilon);\n\n for (var j: u32 = 0; j < uniforms.norm_size_vectorized; j++) {\n let f32input = ${ir(R,v,"x[j + offset]")};\n let f32scale = ${ir(R,v,"scale[j]")};\n output[j + offset] = ${L[0].type.value}((f32input ${o?"":"- mean"}) * inv_std_dev * f32scale\n ${a?`+ ${ir(R,v,"bias[j]")}`:""}\n );\n }\n\n ${I?"mean_data_output[global_idx] = mean":""};\n ${x?"inv_std_output[global_idx] = inv_std_dev":""};\n }`},P=[{dims:c,dataType:e[0].dataType}];return I&&P.push({dims:_,dataType:1}),x&&P.push({dims:_,dataType:1}),{name:"LayerNormalization",shaderCache:{hint:`${v};${r};${o}`,inputDependencies:S},getRunData:()=>({outputs:P,dispatchGroup:{x:Math.ceil(h/64)},programUniforms:A}),getShaderSource:E}},Uu=(e,t)=>{tp(e.inputs),e.compute(rp(e.inputs,t,e.outputCount))}});var np,op,Wu,Nu,Gu=Y(()=>{"use strict";ye();Se();Ze();_e();np=(e,t)=>{if(e.length<3||e.length>4)throw new Error("MatMulNBits requires 3 or 4 inputs");let r=e[0],o=r.dims.length;if(r.dims[o-1]!==t.k)throw new Error("The last dim of input shape does not match the k value");let i=Math.floor((t.k+t.blockSize-1)/t.blockSize),u=t.blockSize/8*t.bits,a=e[1];if(!M.areEqual(a.dims,[t.n,i,u]))throw new Error("The second inputs must be 3D tensor with shape N X nBlocksPerCol X blobSize");let p=e[2].dims;if(M.size(p)!==t.n*i)throw new Error("scales input size error.");if(e.length===4){let d=e[3].dims,y=t.bits>4?t.n*i:t.n*Math.floor((i+1)/2);if(M.size(d)!==y)throw new Error("zeroPoints input size error.")}},op=(e,t,r,o)=>{let i=e[0].dims,u=i.length,a=Math.floor((t.k+t.blockSize-1)/t.blockSize),c=i[u-2],p=t.k,h=t.n,d=i.slice(0,u-2),y=M.size(d),_=t.blockSize/8*t.bits/4,v=e[0].dataType,S=Me(c),A=Me(t.k),I=Me(_),x=tr(v),E=c*a*x,P=Math.floor(o/E),O=a<=r[0]&&P>0,R=!O||P>=4?Me(h):P>=2&&Me(h)>=2?2:1,L=d.concat([c,h]),N=M.size(L)/R/S,K=O?[]:[{type:12,data:N},{type:12,data:t.blockSize}],Q=[y,c,p/A],he=M.convertShape(e[1].dims).slice();he.splice(-1,1,_/I),K.push(...Z(Q)),K.push(...Z(he)),K.push(...Z(e[2].dims)),e.length===4&&K.push(...Z(M.convertShape(e[3].dims)));let W=[y,c,h/R];K.push(...Z(W));let se=Ce=>{let We=Q.length,ee=U("a",e[0].dataType,We,A),ae=U("b",12,he.length,I),Ae=U("scales",e[2].dataType,e[2].dims.length),me=[ee,ae,Ae],ie=e.length===4?U("zero_points",12,e[3].dims.length):void 0;ie&&me.push(ie);let ue=W.length,le=j("output",e[0].dataType,ue,R),qe=[{name:"output_size",type:"u32"},{name:"block_size",type:"u32"}],G=De(e[0].dataType),ne=(()=>{switch(A){case 1:return`array<${G}, 8>`;case 2:return`mat4x2<${G}>`;case 4:return`mat2x4<${G}>`;default:throw new Error(`${A}-component is not supported.`)}})(),xe=`\n for (var word: u32 = 0; word < ${_}; word += ${I}) {\n ${ae.indicesSet("b_indices","2","word")};\n let b_data = ${ae.getByIndices("b_indices")};\n for (var i: u32 = 0; i < ${I}; i++) {\n let b_value: u32 = ${I===1?"b_data":"b_data[word + i]"};\n let b_mask: u32 = 0x0F0F0F0Fu;\n let b_value_lower: vec4 = unpack4xU8(b_value & b_mask);\n let b_value_upper: vec4 = unpack4xU8((b_value >> 4) & b_mask);\n let b_quantized_values = ${ne}(${Array.from({length:4},(Be,Ge)=>`${G}(b_value_lower[${Ge}]), ${G}(b_value_upper[${Ge}])`).join(", ")});\n let b_dequantized_values = ${(()=>A===1?`${ne}(${Array.from({length:8},(Be,Ge)=>`(b_quantized_values[${Ge}] - zero_point) * scale`).join(", ")});`:`(b_quantized_values - ${ne}(${Array(8).fill("zero_point").join(",")})) * scale;`)()};\n // Number of B elements per 32-bit word is 32/bits = 32/4 = 8\n for (var m: u32 = 0; m < ${O?c:S}u; m++) {\n ${ee.indicesSet("a_indices",We-2,O?"m":`row * ${S} + m`)};\n ${ee.indicesSet("a_indices",We-1,"word_offset")};\n var input_offset = ${ee.indicesToOffset("a_indices")};\n var a_data: ${ne};\n for (var j: u32 = 0; j < ${8/A}; j++) {\n a_data[j] = ${ee.getByOffset("input_offset")};\n input_offset++;\n }\n ${O?"workgroup_shared[workgroup_shared_offset + m]":"output_values[m]"}${R>1?"[c]":""} += ${Array.from({length:8/A},(Be,Ge)=>`${A===1?`a_data[${Ge}] * b_dequantized_values[${Ge}]`:`dot(a_data[${Ge}], b_dequantized_values[${Ge}])`}`).join(" + ")};\n }\n word_offset += ${8/A};\n }\n }`,Ke=ie?`\n zero_point_offset += 4;\n if (zero_point_offset == 32) {\n zero_point_offset = 0;\n zero_point_index++;\n zero_point_word = ${ie.getByOffset("zero_point_index")};\n }`:"";return O?`\n var workgroup_shared: array<${le.type.value}, ${c*a}>;\n ${Ce.declareVariables(...me,le)}\n ${Ce.mainStart([a,1,1])}\n var a_indices: ${ee.type.indices};\n var block = local_id.x;\n var col = workgroup_id.y;\n var batch = workgroup_id.z;\n ${ee.indicesSet("a_indices","0","batch")};\n // Two zero points are packed into one byte when uniforms.bits is 4.\n for (var c: u32 = 0; c < ${R}; c++) {\n let col_times_components_plus_c = col * ${R} + c;\n ${ie?`\n var zero_point_bytes_per_col: u32 = (${a} + 1) / 2;\n var zero_point_byte_count: u32 = col_times_components_plus_c * zero_point_bytes_per_col + (block >> 0x1u);\n var zero_point_word_index: u32 = zero_point_byte_count >> 0x2u;\n var zero_point_byte_offset: u32 = zero_point_byte_count & 0x3u;\n var zero_point_nibble_offset: u32 = block & 0x1u;\n var zero_point_bits_offset: u32 = (zero_point_byte_offset << 3) + (zero_point_nibble_offset << 2);\n var zero_point_word: u32 = ${ie.getByOffset("zero_point_word_index")} >> zero_point_bits_offset;`:""}\n var b_indices: ${ae.type.indices};\n ${ae.indicesSet("b_indices","0","col_times_components_plus_c")};\n // The scale and zero points are computed per block.\n var scales_index = col_times_components_plus_c * ${a} + block;\n let scale = ${Ae.getByOffset("scales_index")};\n // The default zero point is 8 for unsigned 4-bit quantization.\n let zero_point = ${G}(${ie?"(zero_point_word) & 0xFu":8});\n ${ae.indicesSet("b_indices","1","block")};\n var word_offset: u32 = block * ${t.blockSize/A};\n var workgroup_shared_offset: u32 = block * ${c};\n ${xe}\n }\n workgroupBarrier();\n if (local_id.x == 0u) {\n var output_indices: ${le.type.indices};\n ${le.indicesSet("output_indices","0","batch")};\n ${le.indicesSet("output_indices",ue-1,"col")};\n ${le.indicesSet("output_indices",ue-2,"0")};\n var output_offset = ${le.indicesToOffset("output_indices")};\n for (var m: u32 = 0u; m < ${c}u; m++) {\n var output_value: ${le.type.value} = ${le.type.value}(0);\n var workgroup_shared_offset: u32 = m;\n for (var b: u32 = 0u; b < ${a}u; b++) {\n output_value += workgroup_shared[workgroup_shared_offset];\n workgroup_shared_offset += ${c};\n }\n ${le.setByOffset("output_offset","output_value")};\n output_offset += ${h/R};\n }\n }\n }`:`\n ${Ce.registerUniforms(qe).declareVariables(...me,le)}\n ${Ce.mainStart()}\n ${Ce.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n var output_values: array<${le.type.value}, ${S}>;\n var output_indices = ${le.offsetToIndices("global_idx")};\n var col = ${le.indicesGet("output_indices",ue-1)};\n var row = ${le.indicesGet("output_indices",ue-2)};\n var a_indices: ${ee.type.indices} = output_indices;\n // Two zero points are packed into one byte because uniforms.bits <= 4.\n // zero_point_offset is either 0 or 4. It is bit offset within one byte.\n // TODO support zero_point_offset for bits > 4\n ${ie?`\n var zero_point_abs_offset = col * ${R} * ((${a} + 1) / 2);\n var zero_point_index: u32 = zero_point_abs_offset / 4;\n var zero_point_word: u32 = ${ie.getByOffset("zero_point_index")};\n var zero_point_offset: u32 = (zero_point_abs_offset % 4) * 8;`:""}\n var scale_index = col * ${a*R};\n var b_indices: ${ae.type.indices};\n for (var c: u32 = 0; c < ${R}; c++) {\n ${ae.indicesSet("b_indices","0",`col * ${R} + c`)};\n var block_offset: u32 = 0;\n for (var block: u32 = 0; block < ${a}; block++) {\n // The scale and zero points are computed per block.\n let scale = ${Ae.getByOffset("scale_index")};\n // The default zero point is 8 for unsigned 4-bit quantization.\n let zero_point = ${G}(${ie?"extractBits(zero_point_word, zero_point_offset, 4)":8});\n ${ae.indicesSet("b_indices","1","block")};\n var word_offset: u32 = block_offset;\n ${xe}\n scale_index++;\n ${Ke}\n block_offset += uniforms.block_size / ${A};\n }\n // Drop the trailing 4 bits if the zero_poit_offset is not a byte boundary to align with the next byte.\n ${ie?`if (zero_point_offset % 8 > 0) {\n ${Ke}\n }`:""}\n }\n for (var k: u32 = 0u; k < ${S}u; k++) {\n ${le.indicesSet("output_indices",ue-2,`${S} * row + k`)};\n ${le.setByIndices("output_indices","output_values[k]")}\n }\n }`};return{name:O?"BlockwiseMatMulNBits":"MatMulNBits",shaderCache:{hint:`${t.cacheKey};${c};${v};${e.length}`,inputDependencies:Array(e.length).fill("rank")},getRunData:()=>({outputs:[{dims:L,dataType:v}],name:O?"BlockwiseMatMulNBits":"MatMulNBits",dispatchGroup:O?{x:1,y:Math.ceil(h/R),z:y}:{x:Math.ceil(N/64)},programUniforms:K}),getShaderSource:se}},Wu=(e,t)=>{np(e.inputs,t);let r=e.getMaxComputeWorkgroupSizes(),o=e.getMaxComputeWorkgroupStoragesize();e.compute(op(e.inputs,t,r,o))},Nu=e=>ve(e)});var it,ip,Lu,Hu,ap,Ko,Fu,qu=Y(()=>{"use strict";ye();Se();Ze();_n();Ro();_e();Sr();it=(e,t)=>e.length>t&&e[t].dims.length>0&&M.size(e[t].dims)>0?e[t]:void 0,ip=(e,t)=>{let r=e[0],o=it(e,1),i=it(e,2),u=it(e,3),a=it(e,4),c=it(e,5),p=it(e,6),h=it(e,7);if(r.dims.length!==3&&r.dims.length!==5)throw new Error("Input query is expected to have 3 or 5 dimensions");let d=!1,y=r.dims[0],w=r.dims[1],_=r.dims.length===3?d?r.dims[2]/3:r.dims[2]:t.numHeads*r.dims[4],v=w,S=0,A=0,I=Math.floor(_/t.numHeads);if(p&&h){if(p.dims.length!==4)throw new Error(\'Input "past_key" is expected to have 4 dimensions\');if(p.dims[0]!==y||p.dims[1]!==t.numHeads||p.dims[3]!==I)throw new Error(\'Input "past_key" shape (batch_size, num_heads, past_sequence_length, head_size)\');if(h.dims[0]!==y||h.dims[1]!==t.numHeads||h.dims[3]!==I)throw new Error(\'Input "past_value" shape (batch_size, num_heads, past_sequence_length, head_size)\');if(p.dims[2]!==h.dims[2])throw new Error(\'Input "past_key" and "past_value" shall have same dim 2 (past_sequence_length)\');if(h.dims.length!==4)throw new Error(\'Input "past_value" is expected to have 4 dimensions\');S=p.dims[2],A=p.dims[2]}else if(p||h)throw new Error(\'Input "past_key" and "past_value" shall be both present or both absent\');let x;if(o){if(r.dims.length!==3)throw new Error(\'Input "query" is expected to have 3 dimensions when key is given\');if(o.dims.length<3||o.dims.length>5)throw new Error(\'Input "key" is expected to have 3, 4, or 5 dimensions\');if(r.dims[0]!==o.dims[0])throw new Error(\'Input "query" and "key" shall have same dim 0 (batch size)\');if(o.dims.length===3){if(o.dims[2]!==r.dims[2])throw new Error(\'Input "query" and "key" shall have same dim 2 (hidden_size)\');x=2,v=o.dims[1]}else if(o.dims.length===5){if(o.dims[2]!==t.numHeads||o.dims[3]!==2||o.dims[4]!==I)throw new Error(\'Expect "key" shape (batch_size, kv_sequence_length, num_heads, 2, head_size) for packed kv\');if(i)throw new Error(\'Expect "value" be none when "key" has packed kv format.\');x=5,v=o.dims[1]}else{if(o.dims[1]!==t.numHeads||o.dims[3]!==I)throw new Error(\'Expect "key" shape (batch_size, num_heads, kv_sequence_length, head_size) for past_key\');x=0,v=o.dims[2]}}else{if(r.dims.length!==3&&r.dims.length!==5)throw new Error(\'Input "query" is expected to have 3 or 5 dimensions when key is empty\');if(r.dims.length===5&&(r.dims[2]!==t.numHeads||r.dims[3]!==3))throw new Error(\'Expect "query" shape (batch_size, kv_sequence_length, num_heads, 3, head_size) for packed kv\');x=3}if(u){if(u.dims.length!==1)throw new Error(\'Input "bias" is expected to have 1 dimension\');if(i&&r.dims.length===5&&r.dims[3]===2)throw new Error("bias is not allowed for packed kv.")}let E=0;if(a){E=8;let N=a.dims;throw N.length===1?N[0]===y?E=1:N[0]===3*y+2&&(E=3):N.length===2&&N[0]===y&&N[1]===v&&(E=5),E===8?new Error(\'Input "key_padding_mask" shape shall be (batch_size) or (batch_size, kv_sequence_length)\'):new Error("Mask not supported")}let P=!1,O=_;if(i){if(i.dims.length!==3&&i.dims.length!==4)throw new Error(\'Input "value" is expected to have 3 or 4 dimensions\');if(r.dims[0]!==i.dims[0])throw new Error(\'Input "query" and "value" shall have same dim 0 (batch_size)\');if(i.dims.length===3){if(v!==i.dims[1])throw new Error(\'Input "key" and "value" shall have the same dim 1 (kv_sequence_length)\');O=i.dims[2]}else{if(v!==i.dims[2])throw new Error(\'Input "past_key" and "past_value" shall have the same dim 2 (kv_sequence_length)\');O=i.dims[1]*i.dims[3],P=!0}}let R=S+v,L=!1;if(a)throw new Error("Key padding mask is not supported");if(c){if(c.dims.length!==4)throw new Error(\'Input "relative_position_bias" is expected to have 4 dimensions\');if(c.dims[0]!==y&&c.dims[0]!==1||c.dims[1]!==t.numHeads||c.dims[2]!==w||c.dims[3]!==R)throw new Error(\'Input "relative_position_bias" shape (batch_size, 1, sequence_length, kv_sequence_length)\')}return{batchSize:y,sequenceLength:w,pastSequenceLength:S,kvSequenceLength:v,totalSequenceLength:R,maxSequenceLength:A,inputHiddenSize:0,hiddenSize:_,vHiddenSize:O,headSize:I,vHeadSize:Math.floor(O/t.numHeads),numHeads:t.numHeads,isUnidirectional:!1,pastPresentShareBuffer:!1,maskFilterValue:t.maskFilterValue,maskType:E,scale:t.scale,broadcastResPosBias:L,passPastInKv:P,qkvFormat:x}},Lu=e=>ve({...e}),Hu=ve({perm:[0,2,1,3]}),ap=(e,t,r,o,i,u,a)=>{let c=[o,i,u],p=M.size(c),h=[{type:12,data:p},{type:12,data:a},{type:12,data:u}],d=y=>{let w=j("qkv_with_bias",t.dataType,c),_=U("qkv",t.dataType,c),v=U("bias",r.dataType,c),S=[{name:"output_size",type:"u32"},{name:"bias_offset",type:"u32"},{name:"hidden_size",type:"u32"}];return`\n ${y.registerUniforms(S).declareVariables(_,v,w)}\n ${y.mainStart()}\n ${y.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n let bias_offset_idx = (global_idx % uniforms.hidden_size) + uniforms.bias_offset;\n\n qkv_with_bias[global_idx] = qkv[global_idx] + bias[bias_offset_idx];\n }`};return e.compute({name:"MultiHeadAttentionAddBias",shaderCache:{inputDependencies:["type","type"]},getRunData:()=>({outputs:[{dims:c,dataType:t.dataType,gpuDataType:0}],dispatchGroup:{x:Math.ceil(p/64)},programUniforms:h}),getShaderSource:d},{inputs:[t,r],outputs:[-1]})[0]},Ko=(e,t,r,o,i,u,a,c)=>{let p=u;if(a){if(o===1)throw new Error("AddBiasReshape is not implemented. Please export your model with packed QKV or KV");return p=ap(e,u,a,t,o,r*i,c),p=p.reshape([t,o,r,i]),e.compute(yt(p,Hu.perm),{inputs:[p],outputs:[-1]})[0]}else return u.dims.length===3&&(p=u.reshape([t,o,r,i])),e.compute(yt(p,Hu.perm),{inputs:[p],outputs:[-1]})[0]},Fu=(e,t)=>{let r=ip(e.inputs,t),o=e.inputs[0],i=it(e.inputs,1),u=it(e.inputs,2),a=it(e.inputs,3),c=it(e.inputs,4),p=it(e.inputs,5),h=it(e.inputs,6),d=it(e.inputs,7);if(o.dims.length===5)throw new Error("Packed QKV is not implemented");if(i?.dims.length===5)throw new Error("Packed KV is not implemented");let y=i&&u&&i.dims.length===4&&u.dims.length===4,w=Ko(e,r.batchSize,r.numHeads,r.sequenceLength,r.headSize,o,a,0);if(y)return Pn(e,w,i,u,c,void 0,h,d,p,r,t);if(!i||!u)throw new Error("key and value must be provided");let _=Ko(e,r.batchSize,r.numHeads,r.kvSequenceLength,r.headSize,i,a,r.hiddenSize),v=Ko(e,r.batchSize,r.numHeads,r.kvSequenceLength,r.vHeadSize,u,a,2*r.hiddenSize);Pn(e,w,_,v,c,void 0,h,d,p,r,t)}});var sp,up,dp,lp,cp,pp,mp,fp,ju,Ku=Y(()=>{"use strict";ye();Se();_e();sp=e=>{if(!e||e.length<1)throw new Error("Too few inputs");if(e[0].dataType!==1&&e[0].dataType!==10)throw new Error("Input type must be float or float16.");if(e.length>=2){let t=e[0].dims.length*2===e[1].dims[0];if(e.length===4&&(t=e[3].dims[0]*2===e[1].dims[0]),!t)throw new Error("The pads should be a 1D tensor of shape [2 * input_rank] or [2 * num_axes].")}},up=(e,t,r)=>{let o="";for(let i=t-1;i>=0;--i)o+=`\n k = i32(${e.indicesGet("indices",i)}) - ${fe("uniforms.pads",i,r)};\n if (k < 0) {\n break;\n }\n if (k >= i32(${fe("uniforms.x_shape",i,t)})) {\n break;\n }\n offset += k * i32(${fe("uniforms.x_strides",i,t)});\n `;return`\n value = ${e.type.value}(uniforms.constant_value);\n for (var i = 0; i < 1; i++) {\n var offset = 0;\n var k = 0;\n ${o}\n value = x[offset];\n }\n `},dp=(e,t,r)=>{let o="";for(let i=t-1;i>=0;--i)o+=`\n k = i32(${e.indicesGet("indices",i)}) - ${fe("uniforms.pads",i,r)};\n if (k < 0) {\n k = -k;\n }\n {\n let _2n_1 = 2 * (i32(${fe("uniforms.x_shape",i,t)}) - 1);\n k = k % _2n_1;\n if(k >= i32(${fe("uniforms.x_shape",i,t)})) {\n k = _2n_1 - k;\n }\n }\n offset += k * i32(${fe("uniforms.x_strides",i,t)});\n `;return`\n var offset = 0;\n var k = 0;\n ${o}\n value = x[offset];\n `},lp=(e,t,r)=>{let o="";for(let i=t-1;i>=0;--i)o+=`\n k = i32(${e.indicesGet("indices",i)}) - ${fe("uniforms.pads",i,r)};\n if (k < 0) {\n k = 0;\n }\n if (k >= i32(${fe("uniforms.x_shape",i,t)})) {\n k = i32(${fe("uniforms.x_shape",i,t)}) - 1;\n }\n offset += k * i32(${fe("uniforms.x_strides",i,t)});\n `;return`\n var offset = 0;\n var k = 0;\n ${o}\n value = x[offset];\n `},cp=(e,t,r)=>{let o="";for(let i=t-1;i>=0;--i)o+=`\n k = i32(${e.indicesGet("indices",i)}) - ${fe("uniforms.pads",i,r)};\n if (k < 0) {\n k += i32(${fe("uniforms.x_shape",i,t)}]);\n }\n if (k >= i32(${fe("uniforms.x_shape",i,t)})) {\n k -= i32(${fe("uniforms.x_shape",i,t)});\n }\n offset += k * i32(${fe("uniforms.x_strides",i,t)});\n `;return`\n var offset = 0;\n var k = 0;\n ${o}\n value = x[offset];\n `},pp=(e,t,r)=>{switch(r.mode){case 0:return up(e,t,r.pads.length);case 1:return dp(e,t,r.pads.length);case 2:return lp(e,t,r.pads.length);case 3:return cp(e,t,r.pads.length);default:throw new Error("Invalid mode")}},mp=(e,t)=>{let r=M.padShape(e[0].dims.slice(),t.pads),o=e[0].dims,i=M.size(r),u=[{type:12,data:i},{type:6,data:t.pads}];t.mode===0&&u.push({type:e[0].dataType,data:t.value}),u.push(...Z(e[0].dims,r));let a=["rank"],c=p=>{let h=j("output",e[0].dataType,r.length),d=U("x",e[0].dataType,o.length),y=d.type.value,w=pp(h,o.length,t),_=[{name:"output_size",type:"u32"},{name:"pads",type:"i32",length:t.pads.length}];return t.mode===0&&_.push({name:"constant_value",type:y}),`\n ${p.registerUniforms(_).declareVariables(d,h)}\n ${p.mainStart()}\n ${p.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n\n let indices = ${h.offsetToIndices("global_idx")};\n\n var value = ${y}(0);\n ${w}\n output[global_idx] = value;\n }`};return{name:"Pad",shaderCache:{hint:`${t.mode}`,inputDependencies:a},getRunData:()=>({outputs:[{dims:r,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(M.size(r)/64)},programUniforms:u}),getShaderSource:c}},fp=(e,t)=>{if(e.length>1){let r=e[1].getBigInt64Array(),o=e.length>=3&&e[2].data?e[2].getFloat32Array()[0]:0,i=e[0].dims.length,u=new Int32Array(2*i).fill(0);if(e.length>=4){let c=e[3].getBigInt64Array();for(let p=0;pu[Number(p)]=Number(c));let a=[];return u.forEach(c=>a.push(c)),{mode:t.mode,value:o,pads:a}}else return t},ju=(e,t)=>{sp(e.inputs);let r=fp(e.inputs,t);e.compute(mp(e.inputs,r),{inputs:[0]})}});var Nn,Yu,Zu,Xu,Qu,hp,gp,Ju,ed,td,rd,nd,od,id,ad,sd,ud,dd,ld,cd=Y(()=>{"use strict";$r();ye();Se();_e();Nn=e=>{if(vr.webgpu.validateInputContent&&(!e||e.length!==1))throw new Error("Pool ops requires 1 input.")},Yu=(e,t,r)=>{let o=t.format==="NHWC",i=e.dims.slice();o&&i.splice(1,0,i.pop());let u=Object.hasOwnProperty.call(t,"dilations"),a=t.kernelShape.slice(),c=t.strides.slice(),p=u?t.dilations.slice():[],h=t.pads.slice();nr.adjustPoolAttributes(r,i,a,c,p,h);let d=nr.computePoolOutputShape(r,i,c,p,a,h,t.autoPad),y=Object.assign({},t);u?Object.assign(y,{kernelShape:a,strides:c,pads:h,dilations:p,cacheKey:t.cacheKey}):Object.assign(y,{kernelShape:a,strides:c,pads:h,cacheKey:t.cacheKey});let w=d.slice();return w.push(w.splice(1,1)[0]),[y,o?w:d]},Zu=(e,t)=>{let r=t.format==="NHWC",o=M.size(e),i=M.size(t.kernelShape),u=[{type:12,data:o},{type:12,data:i}],a=[{name:"outputSize",type:"u32"},{name:"kernelSize",type:"u32"}];if(t.kernelShape.length<=2){let c=t.kernelShape[t.kernelShape.length-1],p=t.strides[t.strides.length-1],h=t.pads[t.pads.length/2-1],d=t.pads[t.pads.length-1],y=!!(h+d);u.push({type:12,data:c},{type:12,data:p},{type:12,data:h},{type:12,data:d}),a.push({name:"kw",type:"u32"},{name:"sw",type:"u32"},{name:"pwStart",type:"u32"},{name:"pwEnd",type:"u32"});let w=!1;if(t.kernelShape.length===2){let _=t.kernelShape[t.kernelShape.length-2],v=t.strides[t.strides.length-2],S=t.pads[t.pads.length/2-2],A=t.pads[t.pads.length-2];w=!!(S+A),u.push({type:12,data:_},{type:12,data:v},{type:12,data:S},{type:12,data:A}),a.push({name:"kh",type:"u32"},{name:"sh",type:"u32"},{name:"phStart",type:"u32"},{name:"phEnd",type:"u32"})}return[u,a,!0,y,w]}else{if(r)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let c=M.computeStrides(t.kernelShape);u.push({type:12,data:c},{type:12,data:t.pads},{type:12,data:t.strides}),a.push({name:"kernelStrides",type:"u32",length:c.length},{name:"pads",type:"u32",length:t.pads.length},{name:"strides",type:"u32",length:t.strides.length});let p=t.pads.reduce((h,d)=>h+d);return[u,a,!!p,!1,!1]}},Xu=(e,t,r,o,i,u,a,c,p,h,d,y)=>{let w=i.format==="NHWC",_=t.type.value,v=j("output",t.type.tensor,o);if(i.kernelShape.length<=2){let S="",A="",I="",x=r-(w?2:1);if(d?S=`\n for (var i: u32 = 0u; i < uniforms.kw; i++) {\n xIndices[${x}] = indices[${x}] * uniforms.sw - uniforms.pwStart + i;\n if (xIndices[${x}] < 0 || xIndices[${x}]\n >= uniforms.x_shape[${x}]) {\n pad++;\n continue;\n }\n let x_val = x[${t.indicesToOffset("xIndices")}];\n ${u}\n }`:S=`\n for (var i: u32 = 0u; i < uniforms.kw; i++) {\n xIndices[${x}] = indices[${x}] * uniforms.sw - uniforms.pwStart + i;\n let x_val = x[${t.indicesToOffset("xIndices")}];\n ${u}\n }`,i.kernelShape.length===2){let P=r-(w?3:2);y?A=`\n for (var j: u32 = 0u; j < uniforms.kh; j++) {\n xIndices[${P}] = indices[${P}] * uniforms.sh - uniforms.phStart + j;\n if (xIndices[${P}] < 0 || xIndices[${P}] >= uniforms.x_shape[${P}]) {\n pad += i32(uniforms.kw);\n continue;\n }\n `:A=`\n for (var j: u32 = 0u; j < uniforms.kh; j++) {\n xIndices[${P}] = indices[${P}] * uniforms.sh - uniforms.phStart + j;\n `,I=`\n }\n `}return`\n ${e.registerUniforms(p).declareVariables(t,v)}\n\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n\n let indices = ${v.offsetToIndices("global_idx")};\n var xIndices = ${v.offsetToIndices("global_idx")};\n\n var value = ${_}(${c});\n var pad = 0;\n ${A}\n ${S}\n ${I}\n ${a}\n\n output[global_idx] = value;\n }`}else{if(w)throw new Error("Pooling with kernelShape.length > 2 is not supported for NHWC format.");let S=i.kernelShape.length,A=i.pads.length,I="";return h?I=`\n if (xIndices[j] >= uniforms.x_shape[j]) {\n pad++;\n isPad = true;\n break;\n }\n }\n if (!isPad) {\n let x_val = x[${t.indicesToOffset("xIndices")}];\n ${u}\n }`:I=`\n }\n let x_val = x[${t.indicesToOffset("xIndices")}];\n ${u}\n `,`\n ${e.registerUniforms(p).declareVariables(t,v)}\n\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n let indices = ${v.offsetToIndices("global_idx")};\n var xIndices = ${v.offsetToIndices("global_idx")};\n\n var offsets: array;\n\n var value = ${_}(${c});\n var pad = 0;\n var isPad = false;\n\n for (var i: u32 = 0u; i < uniforms.kernelSize; i++) {\n var offset = i;\n for (var j = 0u; j < ${S-1}u; j++) {\n offsets[j] = offset / ${fe("uniforms.kernelStrides","j",S)};\n offset -= offsets[j] * ${fe("uniforms.kernelStrides","j",S)};\n }\n offsets[${S-1}] = offset;\n\n isPad = false;\n for (var j = ${r-S}u; j < ${r}u; j++) {\n xIndices[j] = indices[j] * ${fe("uniforms.strides",`j - ${r-S}u`,S)}\n + offsets[j - ${r-S}u] - ${fe("uniforms.pads","j - 2u",A)};\n ${I}\n }\n ${a}\n\n output[global_idx] = value;\n }`}},Qu=e=>`${e.format};${e.ceilMode};${e.autoPad};${e.kernelShape.length}`,hp=e=>`${Qu(e)};${e.countIncludePad}`,gp=e=>`${Qu(e)};${e.storageOrder};${e.dilations}`,Ju=e=>({format:e.format,autoPad:["NOTSET","VALID","SAME_UPPER","SAME_LOWER"][e.auto_pad],ceilMode:e.ceil_mode,kernelShape:e.kernel_shape,strides:e.strides,pads:e.pads}),ed=(e,t,r,o)=>{let[i,u]=Yu(t,o,r),a=U("x",t.dataType,t.dims.length),c=a.type.value,p="value += x_val;",h="";i.countIncludePad?h+=`value /= ${c}(uniforms.kernelSize);`:h+=`value /= ${c}(i32(uniforms.kernelSize) - pad);`;let[d,y,w,_,v]=Zu(u,i);d.push(...Z(t.dims,u));let S=["rank"];return{name:e,shaderCache:{hint:`${o.cacheKey};${w};${_};${v}`,inputDependencies:S},getRunData:()=>({outputs:[{dims:u,dataType:t.dataType}],dispatchGroup:{x:Math.ceil(M.size(u)/64)},programUniforms:d}),getShaderSource:A=>Xu(A,a,t.dims.length,u.length,i,p,h,0,y,w,_,v)}},td=e=>{let t=e.count_include_pad!==0,r=Ju(e);if(r.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for AveragePool");let o={countIncludePad:t,...r,cacheKey:""};return{...o,cacheKey:hp(o)}},rd=(e,t)=>{Nn(e.inputs),e.compute(ed("AveragePool",e.inputs[0],!1,t))},nd={autoPad:"",ceilMode:0,countIncludePad:!1,kernelShape:[],strides:[],pads:[],storageOrder:0,dilations:[]},od=e=>{let t=e.format;return{format:t,...nd,cacheKey:t}},id=(e,t)=>{Nn(e.inputs),e.compute(ed("GlobalAveragePool",e.inputs[0],!0,t))},ad=(e,t,r,o)=>{let[i,u]=Yu(t,o,r),a=`\n value = max(x_val, value);\n `,c="",p=U("x",t.dataType,t.dims.length),h=["rank"],[d,y,w,_,v]=Zu(u,i);return d.push(...Z(t.dims,u)),{name:e,shaderCache:{hint:`${o.cacheKey};${w};${_};${v}`,inputDependencies:h},getRunData:()=>({outputs:[{dims:u,dataType:t.dataType}],dispatchGroup:{x:Math.ceil(M.size(u)/64)},programUniforms:d}),getShaderSource:S=>Xu(S,p,t.dims.length,u.length,i,a,c,t.dataType===10?-65504:-1e5,y,w,_,v)}},sd=(e,t)=>{Nn(e.inputs),e.compute(ad("MaxPool",e.inputs[0],!1,t))},ud=e=>{let t=e.storage_order,r=e.dilations,o=Ju(e);if(t!==0)throw new Error("column major storage order is not yet supported for MaxPool");if(o.ceilMode!==0)throw new Error("using ceil() in shape computation is not yet supported for MaxPool");let i={storageOrder:t,dilations:r,...o,cacheKey:""};return{...i,cacheKey:gp(i)}},dd=e=>{let t=e.format;return{format:t,...nd,cacheKey:t}},ld=(e,t)=>{Nn(e.inputs),e.compute(ad("GlobalMaxPool",e.inputs[0],!0,t))}});var bp,wp,pd,md=Y(()=>{"use strict";$r();ye();_e();bp=(e,t,r)=>{let o=e===t,i=et&&r>0;if(o||i||u)throw new Error("Range these inputs\' contents are invalid.")},wp=(e,t,r,o)=>{let i=Math.abs(Math.ceil((t-e)/r)),u=[i],a=i,c=[{type:12,data:a},{type:o,data:e},{type:o,data:r},...Z(u)],p=h=>{let d=j("output",o,u.length),y=d.type.value,w=[{name:"outputSize",type:"u32"},{name:"start",type:y},{name:"delta",type:y}];return`\n ${h.registerUniforms(w).declareVariables(d)}\n ${h.mainStart()}\n ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n output[global_idx] = uniforms.start + ${y}(global_idx) * uniforms.delta;\n }`};return{name:"Range",shaderCache:{hint:`${o}`},getShaderSource:p,getRunData:()=>({outputs:[{dims:u,dataType:o}],dispatchGroup:{x:Math.ceil(a/64)},programUniforms:c})}},pd=e=>{let t=0,r=0,o=0;e.inputs[0].dataType===6?(t=e.inputs[0].getInt32Array()[0],r=e.inputs[1].getInt32Array()[0],o=e.inputs[2].getInt32Array()[0]):e.inputs[0].dataType===1&&(t=e.inputs[0].getFloat32Array()[0],r=e.inputs[1].getFloat32Array()[0],o=e.inputs[2].getFloat32Array()[0]),vr.webgpu.validateInputContent&&bp(t,r,o),e.compute(wp(t,r,o,e.inputs[0].dataType),{inputs:[]})}});var vp,$p,_p,Sp,xp,Cp,Ap,Ip,Tp,Ep,Pp,fd,kp,Op,Rp,Bp,Dp,hd,gd,yd=Y(()=>{"use strict";ye();Se();Ze();_e();vp=(e,t)=>{if(e.every(r=>r>0||(()=>{throw new Error("Resize requires scales input values to be positive")})),e.length>0){if(t.mode==="linear"){if(!(e.length===2||e.length===3||e.length===4&&e[0]===1&&e[1]===1||e.length===4&&e[0]===1&&e[3]===1||e.length===5&&e[0]===1&&e[1]===1))throw new Error(`For linear mode, Resize requires scales to be 2D, 3D, 4D with either two outermost or one innermost and\n one outermost scale values equal to 1, or 5D with two outermost scale values equal to 1`)}else if(t.mode==="cubic"&&!(e.length===2||e.length===4&&e[0]===1&&e[1]===1||e.length===4&&e[0]===1&&e[3]===1))throw new Error("Resize requires scales input size to be 2 or 4 for cubic mode")}},$p=(e,t,r)=>{t.every(i=>i>=0&&i{throw new Error("Resize requires axes input values to be positive and less than rank")}));let o=new Array(r).fill(1);return t.forEach((i,u)=>o[i]=e[u]),o},_p=(e,t,r,o,i,u)=>{let[a,c,p]=r>10?[1,2,3]:[-1,e.length>1?1:-1,-1],h=e[0].dims.length;if(a>0&&e.length>a&&e[a].dims.length>0)e[a].getFloat32Array().forEach(d=>u.push(d));else if(t.coordinateTransformMode==="tf_crop_and_resize")throw new Error("Resize requires RoI input to be specified when coordinateTransformMode is tfCropAndResize");if(c>0&&e.length>c&&e[c].dims.length>0){if(e[c].getFloat32Array().forEach(d=>o.push(d)),o.length!==0&&o.length!==h&&r>=18&&o.length!==t.axes.length)throw new Error("Resize requires scales input size to be same as input rank or axes size for opset 18 and up");vp(o,t),t.axes.length>0&&$p(o,t.axes,h).forEach((d,y)=>o[y]=d)}if(p>0&&e.length>p&&(e[p].getBigInt64Array().forEach(d=>i.push(Number(d))),i.length!==h||r>=18&&i.length===t.axes.length))throw new Error("Resize requires sizes input size to be same as input rank or axes size for opset 18 and up");if(t.axes.length>0){if(o.length!==t.axes.length)throw new Error(\'Resize requires "scales" input size to be of axes rank when axes attributes is specified\');if(i.length!==t.axes.length)throw new Error(\'Resize requires "sizes" input size to be of rank axes rank when axes attributes is specified\')}if(typeof o<"u"&&typeof i<"u"&&o.length>0&&i.length>h)throw new Error("Resize requires only of scales or sizes to be specified")},Sp=(e,t)=>`fn getOriginalCoordinateFromResizedCoordinate(xResized: u32, xScale: f32, lengthResized: u32,\n lengthOriginal: u32, roiStart: f32, roiEnd: f32) -> ${t} { `+(()=>{switch(e){case"asymmetric":return`return ${t}(xResized) / ${t}(xScale);`;case"pytorch_half_pixel":return`if (lengthResized > 1) {\n return (${t}(xResized) + 0.5) / ${t}(xScale) - 0.5;\n } else {\n return 0.0;\n }`;case"tf_half_pixel_for_nn":return`return (${t}(xResized) + 0.5) / ${t}(xScale);`;case"align_corners":return`if (lengthResized == 1) {\n return 0.0;\n } else {\n // The whole part and the fractional part are calculated separately due to inaccuracy of floating\n // point division. As an example, f32(21) / f32(7) may evaluate to 2.99... instead of 3, causing an\n // offset-by-one error later in floor().\n let whole = ${t}(xResized * (lengthOriginal - 1) / (lengthResized - 1));\n let fract =\n ${t}(xResized * (lengthOriginal - 1) % (lengthResized - 1)) / ${t}(lengthResized - 1);\n return whole + fract;\n }`;case"tf_crop_and_resize":return`if (lengthResized > 1) {\n return ${t}(roiStart) * ${t}(lengthOriginal - 1) +\n (${t}(xResized) * ${t}(roiEnd - roiStart) * ${t}(lengthOriginal - 1)) /\n ${t}(lengthResized - 1);\n } else {\n return 0.5 * ${t}(roiStart + roiEnd) * ${t}(lengthOriginal - 1);\n }`;case"half_pixel_symmetric":return`const outputWidth = ${t}xScale * ${t}(lengthResized);\n const adjustment = ${t}(lengthResized) / outputWidth;\n const center = ${t}(lengthOriginal) / 2;\n const offset = center * (1 - adjustment);\n return offset + ((${t}(xResized) + 0.5) / ${t}(xScale)) - 0.5;`;case"half_pixel":return`return ((${t}(xResized) + 0.5) / ${t}(xScale)) - 0.5;`;default:throw new Error(`Coordinate transform mode ${e} is not supported`)}})()+"}",xp=(e,t,r)=>`fn getNearestPixelFromOriginal(xOriginal: ${r}, isDownSample: bool) -> ${r} {`+(()=>{switch(e){case"round_prefer_ceil":return"if (fract(xOriginal) == 0.5) { return ceil(xOriginal); } else { return round(xOriginal); }";case"floor":return"return floor(xOriginal);";case"ceil":return"return ceil(xOriginal);";case"round_prefer_floor":return"if (fract(xOriginal) == 0.5) { return floor(xOriginal); } else { return round(xOriginal); }";case"simple":default:if(t<11)return"if (isDownSample) { return ceil(xOriginal); } else { return xOriginal; }";throw new Error(`Nearest mode ${e} is not supported`)}})()+"}",Cp=(e,t,r)=>{let o=new Array(r).fill(0).concat(new Array(r).fill(1)),i=e.length===0?o:e.slice();return t.length>0?(t.forEach((u,a)=>{o[u]=i[a],o[a+r]=i[t.length+a]}),o):i},Ap=(e,t,r,o)=>{let i=[];if(r.length>0)if(o.length>0){if(e.forEach(u=>i.push(u)),Math.max(...o)>e.length)throw new Error("axes is out of bound");o.forEach((u,a)=>i[u]=r[a])}else r.forEach(u=>i.push(u));else{if(t.length===0)throw new Error("Resize requires either scales or sizes.");i=e.map((u,a)=>Math.round(u*t[a]))}return i},Ip=(e,t,r)=>{let o=(()=>{switch(r.keepAspectRatioPolicy){case"not_larger":return r.axes.length>0?Math.min(...r.axes.map(u=>t[u]),Number.MAX_VALUE):Math.min(...t,Number.MAX_VALUE);case"not_smaller":return r.axes.length>0?Math.max(...r.axes.map(u=>t[u]),Number.MIN_VALUE):Math.max(...t,Number.MIN_VALUE);default:throw new Error(`Keep aspect ratio policy ${r.keepAspectRatioPolicy} is not supported`)}})();t.fill(1,0,t.length);let i=e.slice();return r.axes.length>0?(r.axes.forEach(u=>t[u]=o),r.axes.forEach(u=>i[u]=Math.round(e[u]*t[u]))):(t.fill(o,0,t.length),i.forEach((u,a)=>i[a]=Math.round(u*t[a]))),i},Tp=(e,t,r,o,i)=>`\n fn calculateOriginalIndicesFromOutputIndices(output_indices: ${e.type.indices}) -> array<${e.type.value}, ${r.length}> {\n var original_indices: array<${e.type.value}, ${r.length}>;\n for (var i:u32 = 0; i < ${r.length}; i++) {\n var output_index = ${e.indicesGet("output_indices","i")};\n var scale = ${fe("uniforms.scales","i",o)};\n var roi_low = ${fe("uniforms.roi","i",i)};\n var roi_hi = ${fe("uniforms.roi",`i + ${t.length}`,i)};\n if (scale == 1.0) {\n original_indices[i] = ${e.type.value}(output_index);\n } else {\n var input_shape_i = ${fe("uniforms.input_shape","i",t.length)};\n var output_shape_i = ${fe("uniforms.output_shape","i",r.length)};\n original_indices[i] = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i,\n input_shape_i, roi_low, roi_hi);\n }\n }\n return original_indices;\n }`,Ep=(e,t,r,o,i,u,a)=>`\n fn calculateInputIndicesFromOutputIndices(output_indices: ${t.type.indices}) -> ${e.type.indices} {\n var input_indices: ${e.type.indices};\n for (var i:u32 = 0; i < ${o.length}; i++) {\n var output_index = ${t.indicesGet("output_indices","i")};\n var input_index: u32;\n var scale = ${fe("uniforms.scales","i",i)};\n if (scale == 1.0) {\n input_index = output_index;\n } else {\n var roi_low = ${fe("uniforms.roi","i",u)};\n var roi_hi = ${fe("uniforms.roi",`i + ${r.length}`,u)};\n var input_shape_i = ${fe("uniforms.input_shape","i",r.length)};\n var output_shape_i = ${fe("uniforms.output_shape","i",o.length)};\n var original_idx = getOriginalCoordinateFromResizedCoordinate(output_index, scale, output_shape_i,\n input_shape_i, roi_low, roi_hi);\n if (!${a} || (original_idx >= 0 && original_idx < ${t.type.value}(input_shape_i))) {\n if (original_idx < 0) {\n input_index = 0;\n } else if (original_idx > ${t.type.value}(input_shape_i - 1)) {\n input_index = input_shape_i - 1;\n } else {\n input_index = u32(getNearestPixelFromOriginal(original_idx, scale < 1));\n }\n } else {\n input_index = u32(original_idx);\n }\n }\n ${e.indicesSet("input_indices","i"," input_index")}\n }\n return input_indices;\n }`,Pp=(e,t)=>`\n fn checkInputIndices(input_indices: ${e.type.indices}) -> bool {\n for (var i:u32 = 0; i < ${t.length}; i++) {\n var input_index = ${e.indicesGet("input_indices","i")};\n if (input_index < 0 || input_index >= ${fe("uniforms.input_shape","i",t.length)}) {\n return false;\n }\n }\n return true;\n }`,fd=(e,t,r,o)=>e.rank>o?`\n ${e.indicesSet("input_indices",t,"channel")};\n ${e.indicesSet("input_indices",r,"batch")};\n`:"",kp=(e,t,r,o,i)=>{let[a,c,p,h]=r.length===2?[-1,0,1,-1]:[0,2,3,1],d=e.type.value;return`\n fn getInputValue(batch: u32, channel: u32, row: u32, col: u32) -> ${d} {\n var input_indices: ${e.type.indices};\n ${e.indicesSet("input_indices",c,`max(0, min(row, ${r[c]} - 1))`)};\n ${e.indicesSet("input_indices",p,`max(0, min(col, ${r[p]} - 1))`)};\n ${fd(e,h,a,2)}\n return ${e.getByIndices("input_indices")};\n }\n\n fn bilinearInterpolation(output_indices: ${t.type.indices}) -> ${d} {\n var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices);\n var row:${d} = originalIndices[${c}];\n var col:${d} = originalIndices[${p}];\n ${o?`if (row < 0 || row > (${r[c]} - 1) || col < 0 || col > (${r[p]} - 1)) {\n return ${i};\n }`:""};\n row = max(0, min(row, ${r[c]} - 1));\n col = max(0, min(col, ${r[p]} - 1));\n var row1: u32 = u32(row);\n var col1: u32 = u32(col);\n var row2: u32 = u32(row + 1);\n var col2: u32 = u32(col + 1);\n var channel: u32 = ${r.length>2?`u32(originalIndices[${h}])`:"0"};\n var batch: u32 = ${r.length>2?`u32(originalIndices[${a}])`:"0"};\n var x11: ${d} = getInputValue(batch, channel, row1, col1);\n var x12: ${d} = getInputValue(batch, channel, row1, col2);\n var x21: ${d} = getInputValue(batch, channel, row2, col1);\n var x22: ${d} = getInputValue(batch, channel, row2, col2);\n var dx1: ${d} = abs(row - ${d}(row1));\n var dx2: ${d} = abs(${d}(row2) - row);\n var dy1: ${d} = abs(col - ${d}(col1));\n var dy2: ${d} = abs(${d}(col2) - col);\n if (row1 == row2) {\n dx1 = 0.5;\n dx2 = 0.5;\n }\n if (col1 == col2) {\n dy1 = 0.5;\n dy2 = 0.5;\n }\n return (x11 * dx2 * dy2 + x12 * dx2 * dy1 + x21 * dx1 * dy2 + x22 * dx1 * dy1);\n }`},Op=(e,t,r,o,i,u,a,c,p,h)=>{let d=r.length===2,y=!0,[w,_]=d?[0,1]:y?[2,3]:[1,2],v=e.type.value,S=A=>{let I=A===w?"row":"col";return`\n fn ${I}CubicInterpolation(input_indices: ${e.type.indices}, output_indices: ${t.type.indices}) -> ${v} {\n var output_index = ${t.indicesGet("output_indices",A)};\n var originalIdx: ${v} = getOriginalCoordinateFromResizedCoordinate(output_index, ${i[A]},\n ${o[A]}, ${r[A]}, ${u[A]}, ${u[A]} + ${r.length});\n var fractOriginalIdx: ${v} = originalIdx - floor(originalIdx);\n var coefs = getCubicInterpolationCoefs(fractOriginalIdx);\n\n if (${c} && (originalIdx < 0 || originalIdx > (${r[A]} - 1))) {\n return ${p};\n }\n var data: array<${v}, 4> = array<${v}, 4>(0.0, 0.0, 0.0, 0.0);\n for (var i: i32 = -1; i < 3; i++) {\n var ${I}: ${v} = originalIdx + ${v}(i);\n if (${I} < 0 || ${I} >= ${r[A]}) {\n ${(()=>h?`coefs[i + 1] = 0.0;\n continue;`:c?`return ${p};`:`${I} = max(0, min(${I}, ${r[A]} - 1));`)()};\n }\n var input_indices_copy: ${e.type.indices} = input_indices;\n ${e.indicesSet("input_indices_copy",A,`u32(${I})`)};\n data[i + 1] = ${A===w?e.getByIndices("input_indices_copy"):"rowCubicInterpolation(input_indices_copy, output_indices)"};\n }\n return cubicInterpolation1D(data, coefs);\n }`};return`\n ${S(w)};\n ${S(_)};\n fn getCubicInterpolationCoefs(s: ${v}) -> array<${v}, 4> {\n var absS = abs(s);\n var coeffs: array<${v}, 4> = array<${v}, 4>(0.0, 0.0, 0.0, 0.0);\n var oneMinusAbsS: ${v} = 1.0 - absS;\n var twoMinusAbsS: ${v} = 2.0 - absS;\n var onePlusAbsS: ${v} = 1.0 + absS;\n coeffs[0] = ((${a} * onePlusAbsS - 5 * ${a}) * onePlusAbsS + 8 * ${a}) * onePlusAbsS - 4 * ${a};\n coeffs[1] = ((${a} + 2) * absS - (${a} + 3)) * absS * absS + 1;\n coeffs[2] = ((${a} + 2) * oneMinusAbsS - (${a} + 3)) * oneMinusAbsS * oneMinusAbsS + 1;\n coeffs[3] = ((${a} * twoMinusAbsS - 5 * ${a}) * twoMinusAbsS + 8 * ${a}) * twoMinusAbsS - 4 * ${a};\n return coeffs;\n }\n\n fn cubicInterpolation1D(x: array<${v}, 4>, coefs: array<${v}, 4>) -> ${v} {\n var coefsSum: ${v} = coefs[0] + coefs[1] + coefs[2] + coefs[3];\n return (x[0] * coefs[0] + x[1] * coefs[1]+ x[2] * coefs[2]+ x[3] * coefs[3]) / coefsSum;\n }\n\n fn bicubicInterpolation(output_indices: ${t.type.indices}) -> ${v} {\n var input_indices: ${e.type.indices} = output_indices;\n return colCubicInterpolation(input_indices, output_indices);\n }\n `},Rp=(e,t,r,o,i)=>{let[a,c,p,h,d]=r.length===3?[-1,0,1,2,-1]:[0,2,3,4,1],y=e.type.value;return`\n fn getInputValue(batch: u32, channel: u32, depth:u32, height: u32, width: u32) -> ${y} {\n var input_indices: ${e.type.indices};\n ${e.indicesSet("input_indices",c,`max(0, min(depth, ${r[c]} - 1))`)};\n ${e.indicesSet("input_indices",p,`max(0, min(height, ${r[p]} - 1))`)};\n ${e.indicesSet("input_indices",h,`max(0, min(width, ${r[h]} - 1))`)};\n ${fd(e,d,a,3)}\n return ${e.getByIndices("input_indices")};\n }\n\n fn trilinearInterpolation(output_indices: ${t.type.indices}) -> ${y} {\n var originalIndices = calculateOriginalIndicesFromOutputIndices(output_indices);\n var depth:${y} = originalIndices[${c}];\n var height:${y} = originalIndices[${p}];\n var width:${y} = originalIndices[${h}];\n ${o?`if (depth < 0 || depth > (${r[c]} - 1) || height < 0 || height > (${r[p]} - 1) || width < 0 || (width > ${r[h]} - 1)) {\n return ${i};\n }`:""};\n\n depth = max(0, min(depth, ${r[c]} - 1));\n height = max(0, min(height, ${r[p]} - 1));\n width = max(0, min(width, ${r[h]} - 1));\n var depth1: u32 = u32(depth);\n var height1: u32 = u32(height);\n var width1: u32 = u32(width);\n var depth2: u32 = u32(depth + 1);\n var height2: u32 = u32(height + 1);\n var width2: u32 = u32(width + 1);\n var channel: u32 = ${r.length>3?`u32(originalIndices[${d}])`:"0"};\n var batch: u32 = ${r.length>3?`u32(originalIndices[${a}])`:"0"};\n\n var x111: ${y} = getInputValue(batch, channel, depth1, height1, width1);\n var x112: ${y} = getInputValue(batch, channel, depth1, height1, width2);\n var x121: ${y} = getInputValue(batch, channel, depth1, height2, width1);\n var x122: ${y} = getInputValue(batch, channel, depth1, height2, width2);\n var x211: ${y} = getInputValue(batch, channel, depth2, height1, width1);\n var x212: ${y} = getInputValue(batch, channel, depth2, height1, width2);\n var x221: ${y} = getInputValue(batch, channel, depth2, height2, width1);\n var x222: ${y} = getInputValue(batch, channel, depth2, height2, width2);\n var dx1: ${y} = abs(depth - ${y}(depth1));\n var dx2: ${y} = abs(${y}(depth2) - depth);\n var dy1: ${y} = abs(height - ${y}(height1));\n var dy2: ${y} = abs(${y}(height2) - height);\n var dz1: ${y} = abs(width - ${y}(width1));\n var dz2: ${y} = abs(${y}(width2) - width);\n if (depth1 == depth2) {\n dx1 = 0.5;\n dx2 = 0.5;\n }\n if (height1 == height2) {\n dy1 = 0.5;\n dy2 = 0.5;\n }\n if (width1 == width2) {\n dz1 = 0.5;\n dz2 = 0.5;\n }\n return (x111 * dx2 * dy2 * dz2 + x112 * dx2 * dy2 * dz1 + x121 * dx2 * dy1 *dz2 + x122 * dx2 * dy1 * dz1 +\n x211 * dx1 * dy2 * dz2 + x212 * dx1 * dy2 * dz1 + x221 * dx1 * dy1 *dz2 + x222 * dx1 * dy1 * dz1);\n }`},Bp=(e,t,r,o,i,u)=>{let a=e.dims,c=Cp(u,t.axes,a.length),p=Ap(a,o,i,t.axes),h=o.slice();o.length===0&&(h=a.map((x,E)=>x===0?1:p[E]/x),t.keepAspectRatioPolicy!=="stretch"&&(p=Ip(a,h,t)));let d=j("output",e.dataType,p.length),y=U("input",e.dataType,a.length),w=M.size(p),_=a.length===p.length&&a.every((x,E)=>x===p[E]),v=t.coordinateTransformMode==="tf_crop_and_resize",S=t.extrapolationValue,A=y.type.value,I=x=>`\n ${_?"":`\n ${Sp(t.coordinateTransformMode,A)};\n ${(()=>{switch(t.mode){case"nearest":return`\n ${Pp(y,a)};\n ${xp(t.nearestMode,r,A)};\n ${Ep(y,d,a,p,h.length,c.length,v)};\n `;case"linear":return`\n ${Tp(d,a,p,h.length,c.length)};\n ${(()=>{if(a.length===2||a.length===4)return`${kp(y,d,a,v,S)}`;if(a.length===3||a.length===5)return`${Rp(y,d,a,v,S)}`;throw Error("Linear mode only supports input dims 2, 3, 4 and 5 are supported in linear mode.")})()};\n `;case"cubic":return`\n ${(()=>{if(a.length===2||a.length===4)return`${Op(y,d,a,p,h,c,t.cubicCoeffA,v,t.extrapolationValue,t.excludeOutside)}`;throw Error("Cubic mode only supports input dims 2 and 4 are supported in linear mode.")})()};\n `;default:throw Error("Invalid resize mode")}})()};\n `}\n ${x.registerUniform("output_size","u32").registerUniform("scales","f32",h.length).registerUniform("roi","f32",c.length).declareVariables(y,d)}\n ${x.mainStart()}\n ${x.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n ${_?"output[global_idx] = input[global_idx];":`\n let output_indices = ${d.offsetToIndices("global_idx")};\n var input_indices: ${y.type.indices};\n ${(()=>{switch(t.mode){case"nearest":return`input_indices = calculateInputIndicesFromOutputIndices(output_indices);\n if (checkInputIndices(input_indices)) {\n output[global_idx] = ${y.getByIndices("input_indices")};\n } else {\n output[global_idx] = ${t.extrapolationValue};\n }`;case"linear":return`output[global_idx] = ${a.length===2||a.length===4?"bilinearInterpolation":"trilinearInterpolation"}(output_indices);`;case"cubic":return"output[global_idx] = bicubicInterpolation(output_indices);";default:throw Error(`Unsupported resize mode: ${t.mode}`)}})()};\n`}\n }`;return{name:"Resize",shaderCache:{hint:`${t.cacheKey}|${r}|${h.length>0?h:""}|${i.length>0?i:""}|${c.length>0?c:""}|${_}|${a}`,inputDependencies:["rank"]},getShaderSource:I,getRunData:()=>({outputs:[{dims:p,dataType:e.dataType}],dispatchGroup:{x:Math.ceil(w/64)},programUniforms:[{type:12,data:w},{type:1,data:h},{type:1,data:c},...Z(a,p)]})}},Dp=e=>{let t=e.customDataBuffer;return new Uint32Array(t,t.byteOffset,1)[0]},hd=(e,t)=>{let r=[],o=[],i=[],u=Dp(e);if(t.antialias!==0)throw Error("Only default value (0) for Antialias attribute is supported");_p(e.inputs,t,u,r,o,i),e.compute(Bp(e.inputs[0],t,u,r,o,i),{inputs:[0]})},gd=e=>{let t=e.antialias,r=e.axes,o=e.coordinateTransformMode,i=e.cubicCoeffA,u=e.excludeOutside!==0,a=e.extrapolationValue,c=e.keepAspectRatioPolicy,p=e.mode,h=e.nearestMode===""?"simple":e.nearestMode;return ve({antialias:t,axes:r,coordinateTransformMode:o,cubicCoeffA:i,excludeOutside:u,extrapolationValue:a,keepAspectRatioPolicy:c,mode:p,nearestMode:h})}});var zp,Mp,bd,wd=Y(()=>{"use strict";ye();Se();Ze();_e();zp=(e,t)=>{let[r,o,i,u]=e,{numHeads:a,rotaryEmbeddingDim:c}=t;if(r.dims.length!==3&&r.dims.length!==4)throw new Error(`Input \'x\' is expected to have 3 or 4 dimensions, got ${r.dims.length}`);if(!M.areEqual(o.dims,[])&&!M.areEqual(o.dims,[1])&&o.dims.length!==2)throw new Error(`Input \'position_ids\' is expected to have 0, 1, or 2 dimensions, got ${o.dims.length}`);if(i.dims.length!==2)throw new Error(`Input \'cos_cache\' is expected to have 2 dimensions, got ${i.dims.length}`);if(u.dims.length!==2)throw new Error(`Input \'sin_cache\' is expected to have 2 dimensions, got ${u.dims.length}`);if(!M.areEqual(i.dims,u.dims))throw new Error("Inputs \'cos_cache\' and \'sin_cache\' are expected to have the same shape");if(c>0&&a===0)throw new Error("num_heads must be provided if rotary_embedding_dim is specified");let p=r.dims[0],h=r.dims[r.dims.length-2],d=i.dims[0],y=M.sizeFromDimension(r.dims,1)/h,w=c===0?i.dims[1]*2:y/a;if(c>w)throw new Error("rotary_embedding_dim must be less than or equal to head_size");if(o.dims.length===2){if(p!==o.dims[0])throw new Error(`Input \'position_ids\' dimension 0 should be of size batch_size, got ${o.dims[0]}`);if(h!==o.dims[1])throw new Error(`Input \'position_ids\' dimension 1 should be of size sequence_length, got ${o.dims[1]}`)}if(w/2!==i.dims[1]&&c/2!==i.dims[1])throw new Error(`Input \'cos_cache\' dimension 1 should be same as head_size / 2 or rotary_embedding_dim / 2, got ${i.dims[1]}`);if(h>d)throw new Error("Updating cos_cache and sin_cache in RotaryEmbedding is not currently supported")},Mp=(e,t)=>{let{interleaved:r,numHeads:o,rotaryEmbeddingDim:i,scale:u}=t,a=e[0].dims[0],c=M.sizeFromDimension(e[0].dims,1),p=e[0].dims[e[0].dims.length-2],h=c/p,d=e[2].dims[1],y=i===0?d*2:h/o,w=new Array(a,p,h/y,y-d),_=M.computeStrides(w),v=[{type:1,data:u},{type:12,data:w},{type:12,data:_},...e[0].dims.length===3?new Array({type:12,data:[c,h,y,1]}):[],...e[0].dims.length===4?new Array({type:12,data:[c,y,p*y,1]}):[],...Z(e[0].dims,e[1].dims,e[2].dims,e[3].dims,e[0].dims)],S=A=>{let I=U("input",e[0].dataType,e[0].dims.length),x=U("position_ids",e[1].dataType,e[1].dims.length),E=U("cos_cache",e[2].dataType,e[2].dims.length),P=U("sin_cache",e[3].dataType,e[3].dims.length),O=j("output",e[0].dataType,e[0].dims.length);return A.registerUniforms([{name:"scale",type:"f32"},{name:"global_shape",type:"u32",length:w.length},{name:"global_strides",type:"u32",length:_.length},{name:"input_output_strides",type:"u32",length:_.length}]),`\n ${A.declareVariables(I,x,E,P,O)}\n\n ${A.mainStart(or)}\n let half_rotary_emb_dim = uniforms.${E.name}_shape[1];\n let bsnh = global_idx / uniforms.global_strides % uniforms.global_shape;\n let size = uniforms.global_shape[0] * uniforms.global_strides[0];\n ${A.guardAgainstOutOfBoundsWorkgroupSizes("size")}\n\n if (bsnh[3] < half_rotary_emb_dim) {\n let position_ids_idx =\n ${x.broadcastedIndicesToOffset("bsnh.xy",j("",x.type.tensor,2))};\n let position_id =\n u32(${x.getByOffset("position_ids_idx")}) + select(0, bsnh[1], position_ids_idx == 0);\n let i = dot(bsnh, uniforms.input_output_strides) + select(0, bsnh[3], ${r});\n let j = i + select(half_rotary_emb_dim, 1, ${r});\n let re = ${I.getByOffset("i")} * ${E.get("position_id","bsnh[3]")} -\n ${I.getByOffset("j")} * ${P.get("position_id","bsnh[3]")};\n ${O.setByOffset("i","re")}\n let im = ${I.getByOffset("i")} * ${P.get("position_id","bsnh[3]")} +\n ${I.getByOffset("j")} * ${E.get("position_id","bsnh[3]")};\n ${O.setByOffset("j","im")}\n } else {\n let k = dot(bsnh, uniforms.input_output_strides) + half_rotary_emb_dim;\n ${O.setByOffset("k",I.getByOffset("k"))}\n }\n }`};return{name:"RotaryEmbedding",shaderCache:{hint:ve({interleaved:r}).cacheKey,inputDependencies:["rank","rank","rank","rank"]},getShaderSource:S,getRunData:()=>({outputs:[{dims:e[0].dims,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(M.size(w)/or)},programUniforms:v})}},bd=(e,t)=>{zp(e.inputs,t),e.compute(Mp(e.inputs,t))}});var Up,Vp,vd,$d=Y(()=>{"use strict";ye();Se();_e();Up=e=>{if(!e||e.length<3)throw new Error("layerNorm requires at least 3 inputs.");let t=e[0],r=e[1],o=e[2];if(t.dataType!==r.dataType||t.dataType!==o.dataType)throw new Error("All inputs must have the same data type");if(t.dims.length!==3&&t.dims.length!==2)throw new Error("Input must be 2D or 3D");if(r.dims.length!==3&&r.dims.length!==2)throw new Error("Skip must be 2D or 3D");let i=t.dims[t.dims.length-1],u=t.dims[t.dims.length-2];if(r.dims[r.dims.length-1]!==i)throw new Error("Skip must have the same hidden size as input");if(r.dims[r.dims.length-2]!==u)throw new Error("Skip must have the same sequence length as input");if(o.dims.length!==1)throw new Error("Gamma must be 1D");if(o.dims[o.dims.length-1]!==i)throw new Error("Gamma must have the same hidden size as input");if(e.length>3){let a=e[3];if(a.dims.length!==1)throw new Error("Beta must be 1D");if(a.dims[a.dims.length-1]!==i)throw new Error("Beta must have the same hidden size as input")}if(e.length>4){let a=e[4];if(a.dims.length!==1)throw new Error("Bias must be 1D");if(a.dims[a.dims.length-1]!==i)throw new Error("Bias must have the same hidden size as input")}},Vp=(e,t,r,o)=>{let i=t.simplified,u=e[0].dims,a=M.size(u),c=u,p=a,h=u.slice(-1)[0],d=o?u.slice(0,-1).concat(1):[],y=!i&&e.length>3,w=e.length>4,_=o&&r>1,v=o&&r>2,S=r>3,A=Me(h),I=[{type:12,data:p},{type:12,data:A},{type:12,data:h},{type:1,data:t.epsilon}],x=P=>{let O=[{name:"output_size",type:"u32"},{name:"components",type:"u32"},{name:"hidden_size",type:"u32"},{name:"epsilon",type:"f32"}],R=[U("x",e[0].dataType,e[0].dims,A),U("skip",e[1].dataType,e[1].dims,A),U("gamma",e[2].dataType,e[2].dims,A)];y&&R.push(U("beta",e[3].dataType,e[3].dims,A)),w&&R.push(U("bias",e[4].dataType,e[4].dims,A)),R.push(j("output",e[0].dataType,c,A)),_&&R.push(j("mean_output",1,d)),v&&R.push(j("inv_std_output",1,d)),S&&R.push(j("input_skip_bias_sum",e[0].dataType,c,A));let L=De(e[0].dataType);return`\n\n ${P.registerUniforms(O).declareVariables(...R)}\n\n ${P.mainStart()}\n ${P.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size / uniforms.hidden_size")}\n let hidden_size_vectorized: u32 = uniforms.hidden_size / uniforms.components;\n let offset = global_idx * hidden_size_vectorized;\n var sum = ${$t("f32",A)};\n var squareSum = ${$t("f32",A)};\n for (var i: u32 = 0; i < hidden_size_vectorized; i++) {\n let skip_value = skip[offset + i];\n let bias_value = ${w?"bias[i]":L+"(0.0)"};\n let input_value = x[offset + i];\n let value = input_value + skip_value + bias_value;\n ${S?"input_skip_bias_sum[offset + i] = value;":""}\n output[offset + i] = value;\n let f32_value = ${ir(L,A,"value")};\n sum += f32_value;\n squareSum += f32_value * f32_value;\n }\n let mean = ${_t("sum",A)} / f32(uniforms.hidden_size);\n let inv_std_dev = inverseSqrt(${_t("squareSum",A)} / f32(uniforms.hidden_size) ${i?"":"- mean * mean"} + uniforms.epsilon);\n ${_?"mean_output[global_idx] = mean;":""}\n ${v?"inv_std_output[global_idx] = inv_std_dev;":""}\n for (var i: u32 = 0; i < hidden_size_vectorized; i++) {\n output[offset + i] = (output[offset + i] ${i?"":`- ${L}(mean)`}) * ${L}(inv_std_dev) * gamma[i] ${y?"+ beta[i]":""};\n }\n }`},E=[{dims:c,dataType:e[0].dataType}];return r>1&&E.push({dims:d,dataType:1}),r>2&&E.push({dims:d,dataType:1}),r>3&&E.push({dims:u,dataType:e[0].dataType}),{name:"SkipLayerNormalization",shaderCache:{hint:`${A};${_};${v};${S}`,inputDependencies:e.map((P,O)=>"type")},getShaderSource:x,getRunData:()=>({outputs:E,dispatchGroup:{x:Math.ceil(p/h/64)},programUniforms:I})}},vd=(e,t)=>{Up(e.inputs);let o=[0];e.outputCount>1&&o.push(-3),e.outputCount>2&&o.push(-3),e.outputCount>3&&o.push(3),e.compute(Vp(e.inputs,t,e.outputCount,!1),{outputs:o})}});var Wp,Gn,Np,_d,Gp,Hp,Sd,xd,Cd=Y(()=>{"use strict";ye();Se();Ze();_e();Wp=(e,t)=>{if(!e||e.length<1)throw new Error("too few inputs");if(t.axes.length!==0){if(t.axes.length!==t.starts.length||t.axes.length!==t.ends.length)throw new Error("axes, starts and ends must have the same length")}else if(t.starts.length!==t.ends.length)throw new Error("starts and ends must have the same length");e.slice(1).forEach((r,o)=>{if(e[o+1].dataType!==6&&e[o+1].dataType!==7)throw new Error(`Input ${o} must be an array of int32 or int64`)})},Gn=(e,t)=>{let r=[];if(e.length>t)if(e[t].dataType===7)e[t].getBigInt64Array().forEach(o=>r.push(Number(o)));else if(e[t].dataType===6)e[t].getInt32Array().forEach(o=>r.push(Number(o)));else throw new Error(`Input ${t} must be an array of int32 or int64`);return r},Np=(e,t)=>{if(e.length>1){let r=Gn(e,1),o=Gn(e,2),i=Gn(e,3);return i.length===0&&(i=[...Array(e[0].dims.length).keys()]),ve({starts:r,ends:o,axes:i})}else return t},_d=(e,t,r,o,i)=>{let u=e;return e<0&&(u+=r[o[t]]),i[t]<0?Math.max(0,Math.min(u,r[o[t]]-1)):Math.max(0,Math.min(u,r[o[t]]))},Gp=(e,t,r)=>`fn calculateInputIndices(output_indices: ${t.type.indices}) -> ${e.type.indices} {\n var input_indices: ${e.type.indices};\n var carry = 0u;\n for (var i = ${r.length}; i >= 0; i--) {\n let input_shape_i = ${fe("uniforms.input_shape","i",r.length)};\n let steps_i = ${fe("uniforms.steps","i",r.length)};\n let signs_i = ${fe("uniforms.signs","i",r.length)};\n let starts_i = ${fe("uniforms.starts","i",r.length)};\n var output_index = ${t.indicesGet("output_indices","i")};\n var input_index = output_index * steps_i + starts_i + carry;\n carry = input_index / input_shape_i;\n input_index = input_index % input_shape_i;\n if (signs_i < 0) {\n input_index = input_shape_i - input_index - 1u + starts_i;\n }\n ${e.indicesSet("input_indices","i","input_index")};\n }\n return input_indices;\n }`,Hp=(e,t)=>{let r=e[0].dims,o=M.size(r),i=t.axes.length>0?M.normalizeAxes(t.axes,r.length):[...Array(r.length).keys()],u=Gn(e,4);u.forEach(I=>I!==0||(()=>{throw new Error("step cannot be 0")})),u.length===0&&(u=Array(i.length).fill(1));let a=t.starts.map((I,x)=>_d(I,x,r,i,u)),c=t.ends.map((I,x)=>_d(I,x,r,i,u));if(i.length!==a.length||i.length!==c.length)throw new Error("start, ends and axes should have the same number of elements");if(i.length!==r.length)for(let I=0;IMath.sign(I));u.forEach((I,x,E)=>{if(I<0){let P=(c[x]-a[x])/I,O=a[x],R=O+P*u[x];a[x]=R,c[x]=O,E[x]=-I}});let h=r.slice(0);i.forEach((I,x)=>{h[I]=Math.ceil((c[I]-a[I])/u[I])});let d={dims:h,dataType:e[0].dataType},y=j("output",e[0].dataType,h.length),w=U("input",e[0].dataType,e[0].dims.length),_=M.size(h),v=[{name:"outputSize",type:"u32"},{name:"starts",type:"u32",length:a.length},{name:"signs",type:"i32",length:p.length},{name:"steps",type:"u32",length:u.length}],S=[{type:12,data:_},{type:12,data:a},{type:6,data:p},{type:12,data:u},...Z(e[0].dims,h)],A=I=>`\n ${I.registerUniforms(v).declareVariables(w,y)}\n ${Gp(w,y,r)}\n ${I.mainStart()}\n ${I.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.outputSize")}\n let output_indices = ${y.offsetToIndices("global_idx")};\n let input_indices = calculateInputIndices(output_indices);\n ${y.setByOffset("global_idx",w.getByIndices("input_indices"))}\n }`;return{name:"Slice",shaderCache:{hint:`${p.length}_${a.length}_${u.length}`,inputDependencies:["rank"]},getShaderSource:A,getRunData:()=>({outputs:[d],dispatchGroup:{x:Math.ceil(o/64)},programUniforms:S})}},Sd=(e,t)=>{Wp(e.inputs,t);let r=Np(e.inputs,t);e.compute(Hp(e.inputs,r),{inputs:[0]})},xd=e=>{let t=e.starts,r=e.ends,o=e.axes;return ve({starts:t,ends:r,axes:o})}});var Lp,Fp,Ad,Id,Td=Y(()=>{"use strict";ye();Se();Ze();_e();Lp=e=>{if(!e||e.length!==1)throw new Error("Softmax op requires 1 input.")},Fp=(e,t)=>{let r=e.dims,o=M.size(r),i=64,u=t.axis;if(u<0&&(u=r.length+u),uI===4?`max(max(${A}.x, ${A}.y), max(${A}.z, ${A}.w))`:I===2?`max(${A}.x, ${A}.y)`:I===3?`max(max(${A}.x, ${A}.y), ${A}.z)`:A,y=U("x",e.dataType,e.dims,p),w=j("result",e.dataType,e.dims,p),_=y.type.value,v=De(e.dataType)==="f32"?`var threadMax = ${_}(-3.402823e+38f);`:`var threadMax = ${_}(-65504.0h);`,S=A=>`\n var rowMaxShared : ${_};\n var rowSumShared : ${_};\n var threadShared : array<${_}, ${i}>;\n\n fn getValue(row: i32, col: i32, row_stride: i32) -> ${_} {\n let index = row * row_stride + col;\n return x[index];\n }\n\n fn setValue(row: i32, col: i32, row_stride: i32, value: ${_}) {\n let index = row * row_stride + col;\n result[index] = value;\n }\n ${A.registerUniform("packedCols","i32").declareVariables(y,w)}\n ${A.mainStart()}\n let gindex = i32(global_idx);\n let lindex = i32(local_idx);\n const wg = ${i};\n let row = gindex / wg;\n let cols = uniforms.packedCols;\n let row_stride : i32 = uniforms.packedCols;\n\n // find the rows max\n ${v}\n for (var col = lindex; col < cols; col += wg) {\n let value = getValue(row, col, row_stride);\n threadMax = max(threadMax, value);\n }\n if (lindex < cols) {\n threadShared[lindex] = threadMax;\n }\n workgroupBarrier();\n\n var reduceSize = min(cols, wg);\n for (var currSize = reduceSize >> 1; currSize > 0; currSize = reduceSize >> 1) {\n reduceSize = currSize + (reduceSize & 1);\n if (lindex < currSize) {\n threadShared[lindex] = max(threadShared[lindex], threadShared[lindex + reduceSize]);\n }\n workgroupBarrier();\n }\n if (lindex == 0) {\n rowMaxShared = ${_}(${d("threadShared[0]",p)});\n }\n workgroupBarrier();\n\n // find the rows sum\n var threadSum = ${_}(0.0);\n for (var col = lindex; col < cols; col += wg) {\n let subExp = exp(getValue(row, col, row_stride) - rowMaxShared);\n threadSum += subExp;\n }\n threadShared[lindex] = threadSum;\n workgroupBarrier();\n\n for (var currSize = wg >> 1; currSize > 0; currSize = currSize >> 1) {\n if (lindex < currSize) {\n threadShared[lindex] = threadShared[lindex] + threadShared[lindex + currSize];\n }\n workgroupBarrier();\n }\n if (lindex == 0) {\n rowSumShared = ${_}(${_t("threadShared[0]",p)});\n }\n workgroupBarrier();\n\n // calculate final value for each element in the row\n for (var col = lindex; col < cols; col += wg) {\n let value = exp(getValue(row, col, row_stride) - rowMaxShared) / rowSumShared;\n setValue(row, col, row_stride, value);\n }\n }`;return{name:"Softmax",shaderCache:{hint:`${p}`,inputDependencies:["type"]},getRunData:()=>({outputs:[{dims:r,dataType:e.dataType}],dispatchGroup:{x:c},programUniforms:[{type:6,data:h}]}),getShaderSource:S}},Ad=(e,t)=>{Lp(e.inputs),e.compute(Fp(e.inputs[0],t))},Id=e=>ve({axis:e.axis})});var qp,jp,Kp,Yp,Zp,Ed,Pd,kd=Y(()=>{"use strict";ye();Se();Ze();_e();qp=e=>{if(!e||e.length<1)throw new Error("too few inputs")},jp=(e,t)=>{let r=[],o=t.numOutputs;return e[1].dims[0]>0&&(e[1].getBigInt64Array().forEach(i=>r.push(Number(i))),o=r.length),ve({numOutputs:o,axis:t.axis,splitSizes:r})},Kp=e=>`\nfn calculateOutputIndex(index: u32) -> u32 {\n for (var i: u32 = 0u; i < ${e}u; i += 1u ) {\n if (index < ${fe("uniforms.size_in_split_axis","i",e)}) {\n return i;\n }\n }\n return ${e}u;\n}`,Yp=e=>{let t=e.length,r=[];for(let o=0;o{let r=e[0].dims,o=M.size(r),i=e[0].dataType,u=M.normalizeAxis(t.axis,r.length),a=new Array(t.numOutputs),c=U("input",i,r.length),p=new Array(t.numOutputs),h=[],d=[],y=0,w=[{type:12,data:o}];for(let v=0;v`\n ${v.registerUniform("input_size","u32").registerUniform("size_in_split_axis","u32",p.length).declareVariables(c,...a)}\n ${Kp(p.length)}\n ${Yp(a)}\n\n ${v.mainStart()}\n ${v.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.input_size")}\n\n var indices = ${c.offsetToIndices("global_idx")};\n var index = ${c.indicesGet("indices",u)};\n let output_number = calculateOutputIndex(index);\n if (output_number != 0) {\n index -= ${fe("uniforms.size_in_split_axis","output_number - 1u",p.length)};\n ${c.indicesSet("indices",u,"index")};\n }\n writeBufferData(output_number, indices, global_idx);\n }`;return{name:"Split",shaderCache:{hint:t.cacheKey,inputDependencies:["rank"]},getShaderSource:_,getRunData:()=>({outputs:h,dispatchGroup:{x:Math.ceil(o/64)},programUniforms:w})}},Ed=(e,t)=>{qp(e.inputs);let r=e.inputs.length===1?t:jp(e.inputs,t);e.compute(Zp(e.inputs,r),{inputs:[0]})},Pd=e=>{let t=e.axis,r=e.splitSizes,o=e.numOutputs<0?r.length:e.numOutputs;if(o!==r.length)throw new Error("numOutputs and splitSizes lengh must be equal");return ve({axis:t,numOutputs:o,splitSizes:r})}});var Od,Xp,Qp,Jp,Rd,Bd=Y(()=>{"use strict";ye();Se();_e();Od=e=>Array.from(e.getBigInt64Array(),Number),Xp=e=>{if(!e||e.length!==2)throw new Error("Tile requires 2 inputs.");if(e[0].dataType!==1&&e[0].dataType!==6&&e[0].dataType!==12)throw new Error("Tile only support float, int32, and uint32 data types");if(e[1].dataType!==7)throw new Error("Tile `repeats` input should be of int64 data type");if(e[1].dims.length!==1)throw new Error("Tile `repeats` input should be 1-D");if(Od(e[1]).length!==e[0].dims.length)throw new Error("Tile `repeats` input should have same number of elements as rank of input data tensor")},Qp=(e,t)=>{let r=[];for(let o=0;o{let t=e[0].dims,r=Od(e[1]),o=Qp(t,r),i=M.size(o),u=e[0].dataType,a=U("input",u,t.length),c=j("output",u,o.length),p=h=>`\n const inputShape = ${a.indices(...t)};\n ${h.registerUniform("output_size","u32").declareVariables(a,c)}\n ${h.mainStart()}\n ${h.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.output_size")}\n let output_indices = ${c.offsetToIndices("global_idx")};\n var input_indices: ${a.type.indices};\n for (var i = 0; i < ${t.length}; i++) {\n let input_dim_i = ${a.indicesGet("uniforms.input_shape","i")};\n let input_dim_value = ${c.indicesGet("output_indices","i")} % input_dim_i;\n\n ${a.indicesSet("input_indices","i","input_dim_value")}\n }\n ${c.setByOffset("global_idx",a.getByIndices("input_indices"))}\n }`;return{name:"Tile",shaderCache:{hint:`${r}`,inputDependencies:["rank"]},getRunData:()=>({outputs:[{dims:o,dataType:e[0].dataType}],dispatchGroup:{x:Math.ceil(i/64)},programUniforms:[{type:12,data:i},...Z(e[0].dims,o)]}),getShaderSource:p}},Rd=e=>{Xp(e.inputs),e.compute(Jp(e.inputs),{inputs:[0]})}});var em,tm,Dd,zd=Y(()=>{"use strict";ye();Se();_e();em=(e,t,r,o,i)=>{let u=j("output_data",i,r.length,4),a=U("a_data",t[1].dataType,t[1].dims.length,4),c=U("b_data",t[2].dataType,t[2].dims.length,4),p=U("c_data",t[0].dataType,t[0].dims.length,4),h,d=(y,w,_)=>`select(${w}, ${y}, ${_})`;if(!o)h=u.setByOffset("global_idx",d(a.getByOffset("global_idx"),c.getByOffset("global_idx"),p.getByOffset("global_idx")));else{let y=(w,_,v="")=>{let S=`a_data[index_a${_}][component_a${_}]`,A=`b_data[index_b${_}][component_b${_}]`,I=`bool(c_data[index_c${_}] & (0xffu << (component_c${_} * 8)))`;return`\n let output_indices${_} = ${u.offsetToIndices(`global_idx * 4u + ${_}u`)};\n let offset_a${_} = ${a.broadcastedIndicesToOffset(`output_indices${_}`,u)};\n let offset_b${_} = ${c.broadcastedIndicesToOffset(`output_indices${_}`,u)};\n let offset_c${_} = ${p.broadcastedIndicesToOffset(`output_indices${_}`,u)};\n let index_a${_} = offset_a${_} / 4u;\n let index_b${_} = offset_b${_} / 4u;\n let index_c${_} = offset_c${_} / 4u;\n let component_a${_} = offset_a${_} % 4u;\n let component_b${_} = offset_b${_} % 4u;\n let component_c${_} = offset_c${_} % 4u;\n ${w}[${_}] = ${v}(${d(S,A,I)});\n `};i===9?h=`\n var data = vec4(0);\n ${y("data",0,"u32")}\n ${y("data",1,"u32")}\n ${y("data",2,"u32")}\n ${y("data",3,"u32")}\n output_data[global_idx] = dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(data));`:h=`\n ${y("output_data[global_idx]",0)}\n ${y("output_data[global_idx]",1)}\n ${y("output_data[global_idx]",2)}\n ${y("output_data[global_idx]",3)}\n `}return`\n ${e.registerUniform("vec_size","u32").declareVariables(p,a,c,u)}\n ${e.mainStart()}\n ${e.guardAgainstOutOfBoundsWorkgroupSizes("uniforms.vec_size")}\n ${h}\n }`},tm=e=>{let t=e[1].dims,r=e[2].dims,o=e[0].dims,i=e[1].dataType,u=!(M.areEqual(t,r)&&M.areEqual(r,o)),a=t,c=M.size(t);if(u){let h=It.calcShape(It.calcShape(t,r,!1),o,!1);if(!h)throw new Error("Can\'t perform where op on the given tensors");a=h,c=M.size(a)}let p=Math.ceil(c/4);return{name:"Where",shaderCache:{inputDependencies:["rank","rank","rank"]},getShaderSource:h=>em(h,e,a,u,i),getRunData:()=>({outputs:[{dims:a,dataType:i}],dispatchGroup:{x:Math.ceil(c/64/4)},programUniforms:[{type:12,data:p},...Z(o,t,r,a)]})}},Dd=e=>{e.compute(tm(e.inputs))}});var Md,Ud=Y(()=>{"use strict";Ka();Ro();Ja();ts();Vs();Zs();Oo();Uo();lu();mu();gu();$u();xu();Au();Eu();Ou();Du();Mu();Vu();Wo();Gu();qu();Ku();cd();md();In();yd();wd();$d();Cd();Td();kd();Bd();Sr();Rn();zd();Md=new Map([["Abs",[rs]],["Acos",[ns]],["Acosh",[os]],["Add",[Ws]],["ArgMax",[ja,ko]],["ArgMin",[qa,ko]],["Asin",[is]],["Asinh",[as]],["Atan",[ss]],["Atanh",[us]],["Attention",[Xa]],["AveragePool",[rd,td]],["BatchNormalization",[Qa]],["BiasAdd",[es]],["BiasSplitGelu",[Us]],["Cast",[ls,ds]],["Ceil",[ps]],["Clip",[cs]],["Concat",[Ya,Za]],["Conv",[Ho,Go]],["ConvTranspose",[du,uu]],["Cos",[ms]],["Cosh",[fs]],["CumSum",[cu,pu]],["DepthToSpace",[fu,hu]],["Div",[Ns]],["Einsum",[wu,vu]],["Elu",[hs,kn]],["Equal",[Gs]],["Erf",[gs]],["Exp",[ys]],["Expand",[Su]],["FastGelu",[Cu]],["Floor",[bs]],["FusedConv",[Ho,Go]],["Gather",[Tu,Iu]],["GatherElements",[ku,Pu]],["Gelu",[ws]],["Gemm",[Bu,Ru]],["GlobalAveragePool",[id,od]],["GlobalMaxPool",[ld,dd]],["Greater",[qs]],["GreaterOrEqual",[Ks]],["HardSigmoid",[Is,As]],["InstanceNormalization",[zu]],["LayerNormalization",[Uu]],["LeakyRelu",[vs,kn]],["Less",[js]],["LessOrEqual",[Ys]],["Log",[zs]],["MatMul",[ru]],["MatMulNBits",[Wu,Nu]],["MaxPool",[sd,ud]],["Mul",[Hs]],["MultiHeadAttention",[Fu,Lu]],["Neg",[_s]],["Not",[$s]],["Pad",[ju]],["Pow",[Ls]],["Range",[pd]],["Reciprocal",[Ss]],["ReduceMin",[Wa]],["ReduceMean",[Da]],["ReduceMax",[Va]],["ReduceSum",[Ga]],["ReduceProd",[Na]],["ReduceL1",[za]],["ReduceL2",[Ma]],["ReduceLogSum",[La]],["ReduceLogSumExp",[Ua]],["ReduceSumSquare",[Ha]],["Relu",[xs]],["Resize",[hd,gd]],["RotaryEmbedding",[bd]],["Sigmoid",[Cs]],["Sin",[Ts]],["Sinh",[Es]],["Slice",[Sd,xd]],["SkipLayerNormalization",[vd]],["Split",[Ed,Pd]],["Sqrt",[Ps]],["Softmax",[Ad,Id]],["Sub",[Fs]],["Tan",[ks]],["Tanh",[Rs]],["ThresholdedRelu",[Ds,kn]],["Tile",[Rd]],["Transpose",[_a,Sa]],["Where",[Dd]]])});var Hn,Vd=Y(()=>{"use strict";$r();Lt();_e();Hn=class{constructor(t){this.backend=t;this.repo=new Map,this.attributesBound=!1}getArtifact(t){return this.repo.get(t)}setArtifact(t,r){this.repo.set(t,r)}run(t,r,o,i,u){rr(t.programInfo.name);let a=this.backend.device,c=this.backend.getComputePassEncoder();this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2);let p=[];for(let d of r)p.push({binding:p.length,resource:{buffer:d.buffer}});for(let d of o)p.push({binding:p.length,resource:{buffer:d.buffer}});u&&p.push({binding:p.length,resource:u});let h=a.createBindGroup({layout:t.computePipeline.getBindGroupLayout(0),entries:p,label:t.programInfo.name});if(this.backend.sessionStatus==="capturing"){let d={kernelId:this.backend.currentKernelId,computePipeline:t.computePipeline,bindGroup:h,dispatchGroup:i};this.backend.capturedCommandList.get(this.backend.currentSessionId).push(d)}c.setPipeline(t.computePipeline),c.setBindGroup(0,h),c.dispatchWorkgroups(...i),this.backend.writeTimestamp(this.backend.pendingDispatchNumber*2+1),this.backend.pendingDispatchNumber++,(this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber||this.backend.queryType==="at-passes")&&this.backend.endComputePass(),this.backend.pendingDispatchNumber>=this.backend.maxDispatchNumber&&this.backend.flush(),Ht(t.programInfo.name)}dispose(){}build(t,r){rr(t.name);let o=this.backend.device,i=[];o.features.has("shader-f16")&&i.push("enable f16;");let u=va(r,this.backend.device.limits),a=t.getShaderSource(u),c=`${i.join(`\n`)}\n${u.additionalImplementations}\n${a}`,p=o.createShaderModule({code:c,label:t.name});Ve("verbose",()=>`[WebGPU] ${t.name} shader code: ${c}`);let h=o.createComputePipeline({compute:{module:p,entryPoint:"main"},layout:"auto",label:t.name});return Ht(t.name),{programInfo:t,computePipeline:h,uniformVariablesInfo:u.variablesInfo}}normalizeDispatchGroupSize(t){let r=typeof t=="number"?t:t.x,o=typeof t=="number"?1:t.y||1,i=typeof t=="number"?1:t.z||1,u=this.backend.device.limits.maxComputeWorkgroupsPerDimension;if(r<=u&&o<=u&&i<=u)return[r,o,i];let a=r*o*i,c=Math.ceil(Math.sqrt(a));if(c>u){if(c=Math.ceil(Math.cbrt(a)),c>u)throw new Error("Total dispatch size exceeds WebGPU maximum.");return[c,c,c]}else return[c,c,1]}}});var rm,nm,Yo,Ln,Wd=Y(()=>{"use strict";$r();ye();Lt();fa();wa();Ud();Vd();rm=(e,t)=>{if(t.length!==e.length)throw new Error(`inputDependencies length ${t.length} is not equal to inputTensors length ${e.length}.`);let r=[];for(let o=0;o{let o=e.name;return e.shaderCache?.hint&&(o+="["+e.shaderCache.hint+"]"),o+=":"+r+`:${rm(t,e.shaderCache?.inputDependencies??new Array(t.length).fill("dims"))}`,o},Yo=class{constructor(t){t&&(this.architecture=t.architecture,this.vendor=t.vendor)}isArchitecture(t){return this.architecture===t}isVendor(t){return this.vendor===t}},Ln=class{constructor(){this.currentSessionId=null;this.currentKernelId=null;this.commandEncoder=null;this.computePassEncoder=null;this.maxDispatchNumber=16;this.pendingDispatchNumber=0;this.pendingKernels=[];this.pendingQueries=new Map;this.sessionStatus="default";this.capturedCommandList=new Map;this.capturedPendingKernels=new Map;this.sessionExternalDataMapping=new Map}get currentKernelCustomData(){if(this.currentKernelId===null)throw new Error("currentKernelCustomData(): currentKernelId is null. (should not happen)");let t=this.kernelCustomData.get(this.currentKernelId);return t||(t={},this.kernelCustomData.set(this.currentKernelId,t)),t}async initialize(t,r){this.env=t;let o=[],i={requiredLimits:{maxComputeWorkgroupStorageSize:r.limits.maxComputeWorkgroupStorageSize,maxComputeWorkgroupsPerDimension:r.limits.maxComputeWorkgroupsPerDimension,maxStorageBufferBindingSize:r.limits.maxStorageBufferBindingSize,maxBufferSize:r.limits.maxBufferSize,maxComputeInvocationsPerWorkgroup:r.limits.maxComputeInvocationsPerWorkgroup,maxComputeWorkgroupSizeX:r.limits.maxComputeWorkgroupSizeX,maxComputeWorkgroupSizeY:r.limits.maxComputeWorkgroupSizeY,maxComputeWorkgroupSizeZ:r.limits.maxComputeWorkgroupSizeZ},requiredFeatures:o};r.features.has("chromium-experimental-timestamp-query-inside-passes")?o.push("chromium-experimental-timestamp-query-inside-passes"):r.features.has("timestamp-query")&&o.push("timestamp-query"),r.features.has("shader-f16")&&o.push("shader-f16"),this.device=await r.requestDevice(i),this.adapterInfo=new Yo(await r.requestAdapterInfo()),this.gpuDataManager=ba(this),this.programManager=new Hn(this),this.kernels=new Map,this.kernelPersistentData=new Map,this.kernelCustomData=new Map,pa(t.logLevel,!!t.debug),this.device.onuncapturederror=u=>{u.error instanceof GPUValidationError&&console.error(`An uncaught WebGPU validation error was raised: ${u.error.message}`)},Object.defineProperty(this.env.webgpu,"device",{value:this.device,writable:!1,enumerable:!0,configurable:!1}),Object.defineProperty(this.env.webgpu,"adapter",{value:r,writable:!1,enumerable:!0,configurable:!1}),this.setQueryType()}dispose(){typeof this.querySet<"u"&&this.querySet.destroy(),this.gpuDataManager.dispose()}getCommandEncoder(){return this.commandEncoder||(this.commandEncoder=this.device.createCommandEncoder()),this.commandEncoder}getComputePassEncoder(){if(!this.computePassEncoder){let t=this.getCommandEncoder(),r={};this.queryType==="at-passes"&&(r.timestampWrites={querySet:this.querySet,beginningOfPassWriteIndex:this.pendingDispatchNumber*2,endOfPassWriteIndex:this.pendingDispatchNumber*2+1}),this.computePassEncoder=t.beginComputePass(r)}return this.computePassEncoder}endComputePass(){this.computePassEncoder&&(this.computePassEncoder.end(),this.computePassEncoder=null)}flush(){if(!this.commandEncoder)return;rr(),this.endComputePass();let t;this.queryType!=="none"&&(this.commandEncoder.resolveQuerySet(this.querySet,0,this.pendingDispatchNumber*2,this.queryResolveBuffer,0),t=this.device.createBuffer({size:this.pendingDispatchNumber*2*8,usage:GPUBufferUsage.MAP_READ|GPUBufferUsage.COPY_DST}),this.pendingQueries.set(t,this.pendingKernels),this.pendingKernels=[],this.commandEncoder.copyBufferToBuffer(this.queryResolveBuffer,0,t,0,this.pendingDispatchNumber*2*8)),this.device.queue.submit([this.commandEncoder.finish()]),this.gpuDataManager.refreshPendingBuffers(),this.commandEncoder=null,this.pendingDispatchNumber=0,this.queryType!=="none"&&t.mapAsync(GPUMapMode.READ).then(()=>{let r=new BigUint64Array(t.getMappedRange()),o=this.pendingQueries.get(t);for(let i=0;i"u"&&(this.queryTimeBase=_);let S=Number(_-this.queryTimeBase),A=Number(v-this.queryTimeBase);if(!Number.isSafeInteger(S)||!Number.isSafeInteger(A))throw new RangeError("incorrect timestamp range");if(this.env.webgpu.profiling?.ondata)this.env.webgpu.profiling.ondata({version:1,inputsMetadata:y.map(I=>({dims:I.dims,dataType:Gt(I.dataType)})),outputsMetadata:w.map(I=>({dims:I.dims,dataType:Gt(I.dataType)})),kernelId:a,kernelType:p,kernelName:h,programName:d,startTime:S,endTime:A});else{let I="";y.forEach((E,P)=>{I+=`input[${P}]: [${E.dims}] | ${Gt(E.dataType)}, `});let x="";w.forEach((E,P)=>{x+=`output[${P}]: [${E.dims}] | ${Gt(E.dataType)}, `}),console.log(`[profiling] kernel "${a}|${p}|${h}|${d}" ${I}${x}execution time: ${A-S} ns`)}wo("GPU",`${d}::${_}::${v}`)}t.unmap(),this.pendingQueries.delete(t)}),Ht()}run(t,r,o,i,u,a){rr(t.name);let c=[];for(let E=0;EP):o;if(y.length!==p.length)throw new Error(`Output size ${y.length} must be equal to ${p.length}.`);let w=[],_=[];for(let E=0;E=a)throw new Error(`Invalid output index: ${y[E]}`);if(y[E]===-3)continue;let P=y[E]===-1,O=y[E]===-2,R=P||O?u(p[E].dataType,p[E].dims):i(y[E],p[E].dataType,p[E].dims);if(w.push(R),R.data===0)continue;let L=this.gpuDataManager.get(R.data);if(!L)throw new Error(`no GPU data for output: ${R.data}`);if(P&&this.temporaryData.push(L),O){let N=this.kernelPersistentData.get(this.currentKernelId);N||(N=[],this.kernelPersistentData.set(this.currentKernelId,N)),N.push(L)}_.push(L)}if(c.length!==r.length||_.length!==w.length){if(_.length===0)return Ht(t.name),w;throw new Error(`Program ${t.name} has zero-sized tensor(s) in inputs or outputs. This is not supported now.`)}let v;if(d){let E=0,P=[];d.forEach(N=>{let K=typeof N.data=="number"?[N.data]:N.data;if(K.length===0)return;let Q=N.type===10?2:4,he,W;N.type===10?(W=K.length>4?16:K.length>2?8:K.length*Q,he=K.length>4?16:Q*K.length):(W=K.length<=2?K.length*Q:16,he=16),E=Math.ceil(E/W)*W,P.push(E);let se=N.type===10?8:4;E+=K.length>4?Math.ceil(K.length/se)*he:K.length*Q});let O=16;E=Math.ceil(E/O)*O;let R=new ArrayBuffer(E);d.forEach((N,K)=>{let Q=P[K],he=typeof N.data=="number"?[N.data]:N.data;if(N.type===6)new Int32Array(R,Q,he.length).set(he);else if(N.type===12)new Uint32Array(R,Q,he.length).set(he);else if(N.type===10)new Uint16Array(R,Q,he.length).set(he);else if(N.type===1)new Float32Array(R,Q,he.length).set(he);else throw new Error(`Unsupported uniform type: ${Gt(N.type)}`)});let L=this.gpuDataManager.create(E,GPUBufferUsage.COPY_DST|GPUBufferUsage.UNIFORM);this.device.queue.writeBuffer(L.buffer,0,R,0,E),this.gpuDataManager.release(L.id),v={offset:0,size:E,buffer:L.buffer}}let S=this.programManager.normalizeDispatchGroupSize(h),A=S[1]===1&&S[2]===1,I=nm(t,r,A),x=this.programManager.getArtifact(I);if(x||(x=this.programManager.build(t,S),this.programManager.setArtifact(I,x),Ve("info",()=>`[artifact] key: ${I}, programName: ${t.name}`)),d&&x.uniformVariablesInfo){if(d.length!==x.uniformVariablesInfo.length)throw new Error(`Uniform variables count mismatch: expect ${x.uniformVariablesInfo.length}, got ${d.length} in program "${x.programInfo.name}".`);for(let E=0;E`[ProgramManager] run "${t.name}" (key=${I}) with ${S[0]}x${S[1]}x${S[2]}`),this.queryType!=="none"||this.sessionStatus==="capturing"){let E={kernelId:this.currentKernelId,programName:x.programInfo.name,inputTensorViews:r,outputTensorViews:w};this.pendingKernels.push(E),this.sessionStatus==="capturing"&&this.capturedPendingKernels.get(this.currentSessionId).push(E)}return this.programManager.run(x,c,_,S,v),Ht(t.name),w}upload(t,r){this.gpuDataManager.upload(t,r)}memcpy(t,r){this.gpuDataManager.memcpy(t,r)}async download(t,r){await this.gpuDataManager.download(t,r)}alloc(t){return this.gpuDataManager.create(t).id}free(t){return this.gpuDataManager.release(t)}createKernel(t,r,o,i){let u=Md.get(t);if(!u)throw new Error(`kernel not implemented: ${t}`);let a={kernelType:t,kernelName:i,kernelEntry:u[0],attributes:[u[1],o]};this.kernels.set(r,a)}releaseKernel(t){let r=this.kernelPersistentData.get(t);if(r){for(let o of r)this.gpuDataManager.release(o.id);this.kernelPersistentData.delete(t)}this.kernelCustomData.delete(t),this.kernels.delete(t)}computeKernel(t,r,o){let i=this.kernels.get(t);if(!i)throw new Error(`kernel not created: ${t}`);let u=i.kernelType,a=i.kernelName,c=i.kernelEntry,p=i.attributes;if(this.currentKernelId!==null)throw new Error(`kernel "[${u}] ${a}" is not allowed to be called recursively`);this.currentKernelId=t,p[0]&&(p[1]=p[0](p[1]),p[0]=void 0),Ve("info",()=>`[WebGPU] Start to run kernel "[${u}] ${a}"...`);let h=this.env.debug;this.temporaryData=[];try{return h&&this.device.pushErrorScope("validation"),c(r,p[1]),0}catch(d){return o.push(Promise.resolve(`[WebGPU] Kernel "[${u}] ${a}" failed. ${d}`)),1}finally{h&&o.push(this.device.popErrorScope().then(d=>d?`GPU validation error for kernel "[${u}] ${a}": ${d.message}`:null));for(let d of this.temporaryData)this.gpuDataManager.release(d.id);this.temporaryData=[],this.currentKernelId=null}}registerBuffer(t,r,o,i){let u=this.sessionExternalDataMapping.get(t);u||(u=new Map,this.sessionExternalDataMapping.set(t,u));let a=u.get(r),c=this.gpuDataManager.registerExternalBuffer(o,i,a?.[1]);return u.set(r,[c,o]),c}unregisterBuffers(t){let r=this.sessionExternalDataMapping.get(t);r&&(r.forEach(o=>this.gpuDataManager.unregisterExternalBuffer(o[1])),this.sessionExternalDataMapping.delete(t))}getBuffer(t){let r=this.gpuDataManager.get(t);if(!r)throw new Error(`no GPU data for buffer: ${t}`);return r.buffer}createDownloader(t,r,o){return async()=>{let i=await xo(this,t,r);return ma(i.buffer,o)}}writeTimestamp(t){this.queryType==="inside-passes"&&this.computePassEncoder.writeTimestamp(this.querySet,t)}setQueryType(){this.queryType="none",(this.env.webgpu.profiling?.mode==="default"||(typeof this.env.trace>"u"?this.env.wasm.trace:this.env.trace))&&(this.device.features.has("chromium-experimental-timestamp-query-inside-passes")?this.queryType="inside-passes":this.device.features.has("timestamp-query")&&(this.queryType="at-passes"),this.queryType!=="none"&&typeof this.querySet>"u"&&(this.querySet=this.device.createQuerySet({type:"timestamp",count:this.maxDispatchNumber*2}),this.queryResolveBuffer=this.device.createBuffer({size:this.maxDispatchNumber*2*8,usage:GPUBufferUsage.COPY_SRC|GPUBufferUsage.QUERY_RESOLVE})))}captureBegin(){Ve("info","captureBegin"),this.capturedCommandList.get(this.currentSessionId)||this.capturedCommandList.set(this.currentSessionId,[]),this.capturedPendingKernels.get(this.currentSessionId)||this.capturedPendingKernels.set(this.currentSessionId,[]),this.flush(),this.sessionStatus="capturing"}captureEnd(){Ve("info","captureEnd"),this.flush(),this.sessionStatus="default"}replay(){Ve("info","replay"),this.sessionStatus="replaying";let t=this.capturedCommandList.get(this.currentSessionId),r=this.capturedPendingKernels.get(this.currentSessionId),o=t.length;this.pendingKernels=[];for(let i=0;i=this.maxDispatchNumber||this.queryType==="at-passes")&&this.endComputePass(),this.pendingDispatchNumber>=this.maxDispatchNumber&&this.flush()}this.flush(),this.sessionStatus="default"}onReleaseSession(t){this.unregisterBuffers(t),this.capturedCommandList.has(t)&&this.capturedCommandList.delete(t),this.capturedPendingKernels.has(t)&&this.capturedPendingKernels.delete(t),this.gpuDataManager.onReleaseSession(t)}onRunStart(t){this.currentSessionId=t,this.setQueryType()}}});var Nd={};gn(Nd,{init:()=>om});var qr,Zo,om,Gd=Y(()=>{"use strict";ye();Wd();Lt();Se();qr=class e{constructor(t,r,o,i){this.module=t;this.dataType=r;this.data=o;this.dims=i}getFloat32Array(){if(this.dataType!==1)throw new Error("Invalid data type");let t=M.size(this.dims);return t===0?new Float32Array:new Float32Array(this.module.HEAP8.buffer,this.data,t)}getBigInt64Array(){if(this.dataType!==7)throw new Error("Invalid data type");let t=M.size(this.dims);return t===0?new BigInt64Array:new BigInt64Array(this.module.HEAP8.buffer,this.data,t)}getInt32Array(){if(this.dataType!==6)throw new Error("Invalid data type");let t=M.size(this.dims);return t===0?new Int32Array:new Int32Array(this.module.HEAP8.buffer,this.data,t)}reshape(t){if(M.size(t)!==M.size(this.dims))throw new Error("Invalid new shape");return new e(this.module,this.dataType,this.data,t)}},Zo=class{constructor(t,r,o){this.module=t;this.backend=r;this.customDataOffset=0;this.customDataSize=0;this.adapterInfo=r.adapterInfo;let i=t.HEAPU32,u=o>>>2;this.opKernelContext=i[u++];let a=i[u++];this.outputCount=i[u++],this.customDataOffset=i[u++],this.customDataSize=i[u++];let c=[];for(let p=0;ptypeof c=="number"?this.inputs[c]:c)??this.inputs,i=r?.outputs??[],u=(c,p,h)=>new qr(this.module,p,this.output(c,h),h),a=(c,p)=>{let h=tr(c);if(!h)throw new Error(`Unsupported data type: ${c}`);let d=h*M.size(p),y=d>0?this.backend.gpuDataManager.create(d).id:0;return new qr(this.module,c,y,p)};return this.backend.run(t,o,i,u,a,this.outputCount)}output(t,r){let o=this.module.stackSave();try{let i=this.module.stackAlloc((1+r.length)*4),u=i>>2;this.module.HEAPU32[u++]=r.length;for(let a=0;a{let i=t.jsepInit;if(!i)throw new Error("Failed to initialize JSEP. The WebAssembly module is not built with JSEP support.");if(e==="webgpu"){let u=new Ln;await u.initialize(r,o),i("webgpu",[u,a=>u.alloc(a),a=>u.free(a),(a,c,p,h=!1)=>{if(h)Ve("verbose",()=>`[WebGPU] jsepCopyGpuToGpu: src=${a}, dst=${c}, size=${p}`),u.memcpy(a,c);else{Ve("verbose",()=>`[WebGPU] jsepCopyCpuToGpu: dataOffset=${a}, gpuDataId=${c}, size=${p}`);let d=t.HEAPU8.subarray(a>>>0,(a>>>0)+p);u.upload(c,d)}},async(a,c,p)=>{Ve("verbose",()=>`[WebGPU] jsepCopyGpuToCpu: gpuDataId=${a}, dataOffset=${c}, size=${p}`),await u.download(a,()=>t.HEAPU8.subarray(c>>>0,(c>>>0)+p))},(a,c,p)=>u.createKernel(a,c,p,t.UTF8ToString(t._JsepGetNodeName(c))),a=>u.releaseKernel(a),(a,c,p,h)=>{Ve("verbose",()=>`[WebGPU] jsepRun: sessionHandle=${p}, kernel=${a}, contextDataOffset=${c}`);let d=new Zo(t,u,c);return u.computeKernel(a,d,h)},()=>u.captureBegin(),()=>u.captureEnd(),()=>u.replay()])}else i("webnn")}});var Vi;Vi=Ei();var pl=zi(),fo,ho=!1,yn=!1,Ui=!1,ml=e=>{if(e===1)return!1;if(typeof SharedArrayBuffer>"u")return typeof self<"u"&&!self.crossOriginIsolated&&console.warn("env.wasm.numThreads is set to "+e+", but this will not work unless you enable crossOriginIsolated mode. See https://web.dev/cross-origin-isolation-guide/ for more info."),!1;typeof process<"u"&&process.versions&&process.versions.node&&console.warn("env.wasm.numThreads is set to "+e+", however, currently onnxruntime-web does not support multi-threads in Node.js. Please consider using onnxruntime-node for performance critical scenarios.");try{return typeof MessageChannel<"u"&&new MessageChannel().port1.postMessage(new SharedArrayBuffer(1)),WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,5,4,1,3,1,1,10,11,1,9,0,65,0,254,16,2,0,26,11]))}catch{return!1}},fl=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,10,30,1,28,0,65,0,253,15,253,12,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,253,186,1,26,11]))}catch{return!1}},hl=(e,t)=>e?t?"ort-wasm-simd-threaded.wasm":"ort-wasm-simd.wasm":t?"ort-wasm-threaded.wasm":"ort-wasm.wasm",Wi=async e=>{if(ho)return Promise.resolve();if(yn)throw new Error("multiple calls to \'initializeWebAssembly()\' detected.");if(Ui)throw new Error("previous call to \'initializeWebAssembly()\' failed.");yn=!0;let t=e.initTimeout,r=e.numThreads,o=e.simd,i=ml(r),u=o&&fl(),a=e.wasmPaths,c=typeof a=="string"?a:void 0,p=hl(u,i),h=typeof a=="object"?a[p]:void 0,d=!1,y=[];if(t>0&&y.push(new Promise(w=>{setTimeout(()=>{d=!0,w()},t)})),y.push(new Promise((w,_)=>{let v=i?pl:Vi,S={locateFile:(A,I)=>{if(i&&A.endsWith(".worker.js")&&typeof Blob<"u")return URL.createObjectURL(new Blob([Mi()],{type:"text/javascript"}));if(A.endsWith(".wasm")){if(h)return h;let x=c??I;return p==="ort-wasm-simd.wasm"?x+"ort-wasm-simd.jsep.wasm":p==="ort-wasm-simd-threaded.wasm"?x+"ort-wasm-simd-threaded.jsep.wasm":x+p}return I+A}};if(i)if(S.numThreads=r,typeof Blob>"u")S.mainScriptUrlOrBlob=(void 0)(__dirname,"ort-wasm-threaded.js");else{let A=`var ortWasmThreaded=${v.toString()};`;S.mainScriptUrlOrBlob=new Blob([A],{type:"text/javascript"})}v(S).then(A=>{yn=!1,ho=!0,fo=A,w()},A=>{yn=!1,Ui=!0,_(A)})})),await Promise.race(y),d)throw new Error(`WebAssembly backend initializing failed due to timeout: ${t}ms`)},Le=()=>{if(ho&&fo)return fo;throw new Error("WebAssembly is not initialized yet.")};var Fe=(e,t)=>{let r=Le(),o=r.lengthBytesUTF8(e)+1,i=r._malloc(o);return r.stringToUTF8(e,i,o),t.push(i),i},Nr=(e,t,r,o)=>{if(typeof e=="object"&&e!==null){if(r.has(e))throw new Error("Circular reference in options");r.add(e)}Object.entries(e).forEach(([i,u])=>{let a=t?t+i:i;if(typeof u=="object")Nr(u,a+".",r,o);else if(typeof u=="string"||typeof u=="number")o(a,u.toString());else if(typeof u=="boolean")o(a,u?"1":"0");else throw new Error(`Can\'t handle extra config type: ${typeof u}`)})},Ue=e=>{let t=Le(),r=t.stackSave();try{let o=t.stackAlloc(8);t._OrtGetLastError(o,o+4);let i=t.HEAP32[o/4],u=t.HEAPU32[o/4+1],a=u?t.UTF8ToString(u):"";throw new Error(`${e} ERROR_CODE: ${i}, ERROR_MESSAGE: ${a}`)}finally{t.stackRestore(r)}};var Ni=e=>{let t=Le(),r=0,o=[],i=e||{};try{if(e?.logSeverityLevel===void 0)i.logSeverityLevel=2;else if(typeof e.logSeverityLevel!="number"||!Number.isInteger(e.logSeverityLevel)||e.logSeverityLevel<0||e.logSeverityLevel>4)throw new Error(`log serverity level is not valid: ${e.logSeverityLevel}`);if(e?.logVerbosityLevel===void 0)i.logVerbosityLevel=0;else if(typeof e.logVerbosityLevel!="number"||!Number.isInteger(e.logVerbosityLevel))throw new Error(`log verbosity level is not valid: ${e.logVerbosityLevel}`);e?.terminate===void 0&&(i.terminate=!1);let u=0;return e?.tag!==void 0&&(u=Fe(e.tag,o)),r=t._OrtCreateRunOptions(i.logSeverityLevel,i.logVerbosityLevel,!!i.terminate,u),r===0&&Ue("Can\'t create run options."),e?.extra!==void 0&&Nr(e.extra,"",new WeakSet,(a,c)=>{let p=Fe(a,o),h=Fe(c,o);t._OrtAddRunConfigEntry(r,p,h)!==0&&Ue(`Can\'t set a run config entry: ${a} - ${c}.`)}),[r,o]}catch(u){throw r!==0&&t._OrtReleaseRunOptions(r),o.forEach(a=>t._free(a)),u}};var gl=e=>{switch(e){case"disabled":return 0;case"basic":return 1;case"extended":return 2;case"all":return 99;default:throw new Error(`unsupported graph optimization level: ${e}`)}},yl=e=>{switch(e){case"sequential":return 0;case"parallel":return 1;default:throw new Error(`unsupported execution mode: ${e}`)}},bl=e=>{e.extra||(e.extra={}),e.extra.session||(e.extra.session={});let t=e.extra.session;t.use_ort_model_bytes_directly||(t.use_ort_model_bytes_directly="1"),e.executionProviders&&e.executionProviders.some(r=>(typeof r=="string"?r:r.name)==="webgpu")&&(e.enableMemPattern=!1)},wl=(e,t,r)=>{for(let o of t){let i=typeof o=="string"?o:o.name;switch(i){case"webnn":if(i="WEBNN",typeof o!="string"){let a=o;if(a?.deviceType){let c=Fe("deviceType",r),p=Fe(a.deviceType,r);Le()._OrtAddSessionConfigEntry(e,c,p)!==0&&Ue(`Can\'t set a session config entry: \'deviceType\' - ${a.deviceType}.`)}if(a?.numThreads){let c=a.numThreads;(typeof c!="number"||!Number.isInteger(c)||c<0)&&(c=0);let p=Fe("numThreads",r),h=Fe(c.toString(),r);Le()._OrtAddSessionConfigEntry(e,p,h)!==0&&Ue(`Can\'t set a session config entry: \'numThreads\' - ${a.numThreads}.`)}if(a?.powerPreference){let c=Fe("powerPreference",r),p=Fe(a.powerPreference,r);Le()._OrtAddSessionConfigEntry(e,c,p)!==0&&Ue(`Can\'t set a session config entry: \'powerPreference\' - ${a.powerPreference}.`)}}break;case"webgpu":if(i="JS",typeof o!="string"){let a=o;if(a?.preferredLayout){if(a.preferredLayout!=="NCHW"&&a.preferredLayout!=="NHWC")throw new Error(`preferredLayout must be either \'NCHW\' or \'NHWC\': ${a.preferredLayout}`);let c=Fe("preferredLayout",r),p=Fe(a.preferredLayout,r);Le()._OrtAddSessionConfigEntry(e,c,p)!==0&&Ue(`Can\'t set a session config entry: \'preferredLayout\' - ${a.preferredLayout}.`)}}break;case"wasm":case"cpu":continue;default:throw new Error(`not supported execution provider: ${i}`)}let u=Fe(i,r);Le()._OrtAppendExecutionProvider(e,u)!==0&&Ue(`Can\'t append execution provider: ${i}.`)}},Gi=e=>{let t=Le(),r=0,o=[],i=e||{};bl(i);try{let u=gl(i.graphOptimizationLevel??"all"),a=yl(i.executionMode??"sequential"),c=typeof i.logId=="string"?Fe(i.logId,o):0,p=i.logSeverityLevel??2;if(!Number.isInteger(p)||p<0||p>4)throw new Error(`log serverity level is not valid: ${p}`);let h=i.logVerbosityLevel??0;if(!Number.isInteger(h)||h<0||h>4)throw new Error(`log verbosity level is not valid: ${h}`);let d=typeof i.optimizedModelFilePath=="string"?Fe(i.optimizedModelFilePath,o):0;if(r=t._OrtCreateSessionOptions(u,!!i.enableCpuMemArena,!!i.enableMemPattern,a,!!i.enableProfiling,0,c,p,h,d),r===0&&Ue("Can\'t create session options."),i.executionProviders&&wl(r,i.executionProviders,o),i.enableGraphCapture!==void 0){if(typeof i.enableGraphCapture!="boolean")throw new Error(`enableGraphCapture must be a boolean value: ${i.enableGraphCapture}`);let y=Fe("enableGraphCapture",o),w=Fe(i.enableGraphCapture.toString(),o);t._OrtAddSessionConfigEntry(r,y,w)!==0&&Ue(`Can\'t set a session config entry: \'enableGraphCapture\' - ${i.enableGraphCapture}.`)}if(i.freeDimensionOverrides)for(let[y,w]of Object.entries(i.freeDimensionOverrides)){if(typeof y!="string")throw new Error(`free dimension override name must be a string: ${y}`);if(typeof w!="number"||!Number.isInteger(w)||w<0)throw new Error(`free dimension override value must be a non-negative integer: ${w}`);let _=Fe(y,o);t._OrtAddFreeDimensionOverride(r,_,w)!==0&&Ue(`Can\'t set a free dimension override: ${y} - ${w}.`)}return i.extra!==void 0&&Nr(i.extra,"",new WeakSet,(y,w)=>{let _=Fe(y,o),v=Fe(w,o);t._OrtAddSessionConfigEntry(r,_,v)!==0&&Ue(`Can\'t set a session config entry: ${y} - ${w}.`)}),[r,o]}catch(u){throw r!==0&&t._OrtReleaseSessionOptions(r),o.forEach(a=>t._free(a)),u}};ye();var Li=async e=>{if(typeof e=="string")if(typeof process<"u"&&process.versions&&process.versions.node)try{return new Uint8Array(await(void 0)(e))}catch(t){if(t.code==="ERR_FS_FILE_TOO_LARGE"){let r=(void 0)(e),o=[];for await(let i of r)o.push(i);return new Uint8Array(Buffer.concat(o))}throw t}else{let t=await fetch(e);if(!t.ok)throw new Error(`failed to load external data file: ${e}`);let r=t.headers.get("Content-Length"),o=r?parseInt(r,10):0;if(o<1073741824)return new Uint8Array(await t.arrayBuffer());{if(!t.body)throw new Error(`failed to load external data file: ${e}, no response body.`);let i=t.body.getReader(),u;try{u=new ArrayBuffer(o)}catch(c){if(c instanceof RangeError){let p=Math.ceil(o/65536);u=new WebAssembly.Memory({initial:p,maximum:p}).buffer}else throw c}let a=0;for(;;){let{done:c,value:p}=await i.read();if(c)break;let h=p.byteLength;new Uint8Array(u,a,h).set(p),a+=h}return new Uint8Array(u,0,o)}}else return e instanceof Blob?new Uint8Array(await e.arrayBuffer()):e instanceof Uint8Array?e:new Uint8Array(e)};var im=(e,t)=>{Le()._OrtInit(e,t)!==0&&Ue("Can\'t initialize onnxruntime.")},Ld=async e=>{im(e.wasm.numThreads,Gr(e.logLevel))},Fd=async(e,t)=>{{let r=(Gd(),wr(Nd)).init;if(t==="webgpu"){if(typeof navigator>"u"||!navigator.gpu)throw new Error("WebGPU is not supported in current environment");let o=e.webgpu.adapter;if(o){if(typeof o.limits!="object"||typeof o.features!="object"||typeof o.requestDevice!="function")throw new Error("Invalid GPU adapter set in `env.webgpu.adapter`. It must be a GPUAdapter object.")}else{let i=e.webgpu.powerPreference;if(i!==void 0&&i!=="low-power"&&i!=="high-performance")throw new Error(`Invalid powerPreference setting: "${i}"`);let u=e.webgpu.forceFallbackAdapter;if(u!==void 0&&typeof u!="boolean")throw new Error(`Invalid forceFallbackAdapter setting: "${u}"`);if(o=await navigator.gpu.requestAdapter({powerPreference:i,forceFallbackAdapter:u}),!o)throw new Error(\'Failed to get GPU adapter. You may need to enable flag "--enable-unsafe-webgpu" if you are using Chrome.\')}if(!e.wasm.simd)throw new Error("Not supported for WebGPU=ON and SIMD=OFF. Please set `env.wasm.simd` to true when using `webgpu` EP");await r("webgpu",Le(),e,o)}if(t==="webnn"){if(typeof navigator>"u"||!navigator.ml)throw new Error("WebNN is not supported in current environment");await r("webnn",Le(),e)}}},ar=new Map,am=e=>{let t=Le(),r=t.stackSave();try{let o=t.stackAlloc(8);return t._OrtGetInputOutputCount(e,o,o+4)!==0&&Ue("Can\'t get session input/output count."),[t.HEAP32[o/4],t.HEAP32[o/4+1]]}finally{t.stackRestore(r)}},Xo=e=>{let t=Le(),r=t._malloc(e.byteLength);if(r===0)throw new Error(`Can\'t create a session. failed to allocate a buffer of size ${e.byteLength}.`);return t.HEAPU8.set(e,r),[r,e.byteLength]},qd=async(e,t)=>{let r,o,i=Le();Array.isArray(e)?[r,o]=e:e.buffer===i.HEAPU8.buffer?[r,o]=[e.byteOffset,e.byteLength]:[r,o]=Xo(e);let u=0,a=0,c=0,p=[],h=[],d=[];try{if([a,p]=Gi(t),t?.externalData&&i.mountExternalData){let x=[];for(let E of t.externalData){let P=typeof E=="string"?E:E.path;x.push(Li(typeof E=="string"?E:E.data).then(O=>{i.mountExternalData(P,O)}))}await Promise.all(x)}u=await i._OrtCreateSession(r,o,a),u===0&&Ue("Can\'t create a session.");let[y,w]=am(u),_=!!t?.enableGraphCapture,v=[],S=[],A=[];for(let x=0;xx==="gpu-buffer")&&(c=i._OrtCreateBinding(u),c===0&&Ue("Can\'t create IO binding."),I={handle:c,outputPreferredLocations:A,outputPreferredLocationsEncoded:A.map(x=>yo(x))}),ar.set(u,[u,h,d,I,_,!1]),[u,v,S]}catch(y){throw h.forEach(w=>i._OrtFree(w)),d.forEach(w=>i._OrtFree(w)),c!==0&&i._OrtReleaseBinding(c),u!==0&&i._OrtReleaseSession(u),y}finally{i._free(r),a!==0&&i._OrtReleaseSessionOptions(a),p.forEach(y=>i._free(y)),i.unmountExternalData?.()}},jd=e=>{let t=Le(),r=ar.get(e);if(!r)throw new Error(`cannot release session. invalid session id: ${e}`);let[o,i,u,a,c]=r;a&&(c&&t._OrtClearBoundOutputs(a.handle),t._OrtReleaseBinding(a.handle)),t.jsepOnReleaseSession?.(e),i.forEach(p=>t._OrtFree(p)),u.forEach(p=>t._OrtFree(p)),t._OrtReleaseSession(o),ar.delete(e)},Hd=(e,t,r,o,i,u=!1)=>{if(!e){t.push(0);return}let a=Le(),c=e[0],p=e[1],h=e[3],d,y;if(c==="string"&&h==="gpu-buffer")throw new Error("String tensor is not supported on GPU.");if(u&&h!=="gpu-buffer")throw new Error(`External buffer must be provided for input/output index ${i} when enableGraphCapture is true.`);if(h==="gpu-buffer"){let v=e[2].gpuBuffer,S=tr(go(c));y=p.reduce((I,x)=>I*x,1)*S;let A=a.jsepRegisterBuffer;if(!A)throw new Error(\'Tensor location "gpu-buffer" is not supported without using WebGPU.\');d=A(o,i,v,y)}else{let v=e[2];if(Array.isArray(v)){y=4*v.length,d=a._malloc(y),r.push(d);let S=d/4;for(let A=0;Aa.HEAP32[v++]=A);let S=a._OrtCreateTensor(go(c),d,y,_,p.length,yo(h));S===0&&Ue(`Can\'t create tensor for input/output. session=${o}, index=${i}.`),t.push(S)}finally{a.stackRestore(w)}},Kd=async(e,t,r,o,i,u)=>{let a=Le(),c=ar.get(e);if(!c)throw new Error(`cannot run inference. invalid session id: ${e}`);let p=c[0],h=c[1],d=c[2],y=c[3],w=c[4],_=c[5],v=t.length,S=o.length,A=0,I=[],x=[],E=[],P=[],O=a.stackSave(),R=a.stackAlloc(v*4),L=a.stackAlloc(v*4),N=a.stackAlloc(S*4),K=a.stackAlloc(S*4);try{[A,I]=Ni(u);for(let ee=0;eeNe*Ye,1);ue=Gt(ne);let Ut=y?.outputPreferredLocations[o[ee]];if(ue==="string"){if(Ut==="gpu-buffer")throw new Error("String tensor is not supported on GPU.");let Ne=[],Ye=le/4;for(let mt=0;mt0){let Ne=a.jsepGetBuffer;if(!Ne)throw new Error(\'preferredLocation "gpu-buffer" is not supported without using WebGPU.\');let Ye=Ne(le),mt=tr(ne);if(mt===void 0||!Hi(ue))throw new Error(`Unsupported data type: ${ue}`);ie=!0,We.push([ue,Be,{gpuBuffer:Ye,download:a.jsepCreateDownloader(Ye,Ge*mt,ue),dispose:()=>{a._OrtReleaseTensor(ae)}},"gpu-buffer"])}else{let Ne=bn(ue),Ye=new Ne(Ge);new Uint8Array(Ye.buffer,Ye.byteOffset,Ye.byteLength).set(a.HEAPU8.subarray(le,le+Ye.byteLength)),We.push([ue,Be,Ye,"cpu"])}}finally{a.stackRestore(Ae),ue==="string"&&le&&a._free(le),ie||a._OrtReleaseTensor(ae)}}return y&&!w&&(a._OrtClearBoundOutputs(y.handle),ar.set(e,[p,h,d,y,w,!1])),We}finally{a.stackRestore(O),x.forEach(Q=>a._OrtReleaseTensor(Q)),E.forEach(Q=>a._OrtReleaseTensor(Q)),P.forEach(Q=>a._free(Q)),A!==0&&a._OrtReleaseRunOptions(A),I.forEach(Q=>a._free(Q))}},Yd=e=>{let t=Le(),r=ar.get(e);if(!r)throw new Error("invalid session id");let o=r[0],i=t._OrtEndProfiling(o);i===0&&Ue("Can\'t get an profile file name."),t._OrtFree(i)},Zd=e=>{let t=[];for(let r of e){let o=r[2];!Array.isArray(o)&&"buffer"in o&&t.push(o.buffer)}return t};self.onmessage=e=>{let{type:t,in:r}=e.data;try{switch(t){case"init-wasm":Wi(r.wasm).then(()=>{Ld(r).then(()=>{postMessage({type:t})},o=>{postMessage({type:t,err:o})})},o=>{postMessage({type:t,err:o})});break;case"init-ep":{let{epName:o,env:i}=r;Fd(i,o).then(()=>{postMessage({type:t})},u=>{postMessage({type:t,err:u})});break}case"copy-from":{let{buffer:o}=r,i=Xo(o);postMessage({type:t,out:i});break}case"create":{let{model:o,options:i}=r;qd(o,i).then(u=>{postMessage({type:t,out:u})},u=>{postMessage({type:t,err:u})});break}case"release":jd(r),postMessage({type:t});break;case"run":{let{sessionId:o,inputIndices:i,inputs:u,outputIndices:a,options:c}=r;Kd(o,i,u,a,new Array(a.length).fill(null),c).then(p=>{p.some(h=>h[3]!=="cpu")?postMessage({type:t,err:"Proxy does not support non-cpu tensor location."}):postMessage({type:t,out:p},Zd([...u,...p]))},p=>{postMessage({type:t,err:p})});break}case"end-profiling":Yd(r),postMessage({type:t});break;default:}}catch(o){postMessage({type:t,err:o})}};})();\n/**\n * @license\n * Copyright 2021 Google LLC. All Rights Reserved.\n * Licensed under the Apache License, Version 2.0 (the "License");\n * you may not use this file except in compliance with the License.\n * You may obtain a copy of the License at\n *\n * http://www.apache.org/licenses/LICENSE-2.0\n *\n * Unless required by applicable law or agreed to in writing, software\n * distributed under the License is distributed on an "AS IS" BASIS,\n * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n * See the License for the specific language governing permissions and\n * limitations under the License.\n * =============================================================================\n */\n/**\n * @license\n * Copyright 2020 Google LLC. All Rights Reserved.\n * Licensed under the Apache License, Version 2.0 (the "License");\n * you may not use this file except in compliance with the License.\n * You may obtain a copy of the License at\n *\n * http://www.apache.org/licenses/LICENSE-2.0\n *\n * Unless required by applicable law or agreed to in writing, software\n * distributed under the License is distributed on an "AS IS" BASIS,\n * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n * See the License for the specific language governing permissions and\n * limitations under the License.\n * =============================================================================\n */\n/**\n * @license\n * Copyright 2019 Google LLC. All Rights Reserved.\n * Licensed under the Apache License, Version 2.0 (the "License");\n * you may not use this file except in compliance with the License.\n * You may obtain a copy of the License at\n *\n * http://www.apache.org/licenses/LICENSE-2.0\n *\n * Unless required by applicable law or agreed to in writing, software\n * distributed under the License is distributed on an "AS IS" BASIS,\n * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n * See the License for the specific language governing permissions and\n * limitations under the License.\n * =============================================================================\n */\n'}),Ir,Dt,vn,aa,ia,eo,bi,Ur,Wr,Qc,sa,Km,Ym,Xm,Qm,Jm,Zm,eg,tg=Z(()=>{ar(),Dy(),xa(),Ir=()=>!!Ue.wasm.proxy&&typeof document<"u",vn=!1,aa=!1,ia=!1,bi=new Map,Ur=(t,e)=>{let r=bi.get(t);r?r.push(e):bi.set(t,[e])},Wr=()=>{if(vn||!aa||ia||!Dt)throw new Error("worker not ready")},Qc=t=>{switch(t.data.type){case"init-wasm":vn=!1,t.data.err?(ia=!0,eo[1](t.data.err)):(aa=!0,eo[0]());break;case"init-ep":case"copy-from":case"create":case"release":case"run":case"end-profiling":{let e=bi.get(t.data.type);t.data.err?e.shift()[1](t.data.err):e.shift()[0](t.data.out);break}}},sa=typeof document<"u"?document?.currentScript?.src:void 0,Km=async()=>{if(!aa){if(vn)throw new Error("multiple calls to 'initWasm()' detected.");if(ia)throw new Error("previous call to 'initWasm()' failed.");if(vn=!0,Ir())return Ue.wasm.wasmPaths===void 0&&sa&&sa.indexOf("blob:")!==0&&(Ue.wasm.wasmPaths=sa.substr(0,+sa.lastIndexOf("/")+1)),new Promise((t,e)=>{Dt?.terminate();let r=URL.createObjectURL(new Blob([Ny()],{type:"text/javascript"}));Dt=new Worker(r,{name:"ort-wasm-proxy-worker"}),Dt.onerror=a=>e(a),Dt.onmessage=Qc,URL.revokeObjectURL(r),eo=[t,e];let n={type:"init-wasm",in:Ue};Dt.postMessage(n)});try{await sh(Ue.wasm),await Um(Ue),aa=!0}catch(t){throw ia=!0,t}finally{vn=!1}}},Ym=async t=>{if(Ir())return Wr(),new Promise((e,r)=>{Ur("init-ep",[e,r]);let n={type:"init-ep",in:{epName:t,env:Ue}};Dt.postMessage(n)});await Wm(Ue,t)},Xm=async t=>Ir()?(Wr(),new Promise((e,r)=>{Ur("copy-from",[e,r]);let n={type:"copy-from",in:{buffer:t}};Dt.postMessage(n,[t.buffer])})):Eo(t),Qm=async(t,e)=>{if(Ir()){if(e?.preferredOutputLocation)throw new Error('session option "preferredOutputLocation" is not supported for proxy.');return Wr(),new Promise((r,n)=>{Ur("create",[r,n]);let a={type:"create",in:{model:t,options:{...e}}},i=[];t instanceof Uint8Array&&i.push(t.buffer),Dt.postMessage(a,i)})}else return Vm(t,e)},Jm=async t=>{if(Ir())return Wr(),new Promise((e,r)=>{Ur("release",[e,r]);let n={type:"release",in:t};Dt.postMessage(n)});Gm(t)},Zm=async(t,e,r,n,a,i)=>{if(Ir()){if(r.some(s=>s[3]!=="cpu"))throw new Error("input tensor on GPU is not supported for proxy.");if(a.some(s=>s))throw new Error("pre-allocated output tensor is not supported for proxy.");return Wr(),new Promise((s,o)=>{Ur("run",[s,o]);let u=r,l={type:"run",in:{sessionId:t,inputIndices:e,inputs:u,outputIndices:n,options:i}};Dt.postMessage(l,qm(u))})}else return Hm(t,e,r,n,a,i)},eg=async t=>{if(Ir())return Wr(),new Promise((e,r)=>{Ur("end-profiling",[e,r]);let n={type:"end-profiling",in:t};Dt.postMessage(n)});jm(t)}}),to,Jc,rg,Fy=Z(()=>{ar(),tg(),$e(),lh(),to=(t,e)=>{switch(t.location){case"cpu":return[t.type,t.dims,t.data,"cpu"];case"gpu-buffer":return[t.type,t.dims,{gpuBuffer:t.gpuBuffer},"gpu-buffer"];default:throw new Error(`invalid data location: ${t.location} for ${e()}`)}},Jc=t=>{switch(t[3]){case"cpu":return new bt(t[0],t[2],t[1]);case"gpu-buffer":{let e=t[0];if(!Go(e))throw new Error(`not supported data type: ${e} for deserializing GPU tensor`);let{gpuBuffer:r,download:n,dispose:a}=t[2];return bt.fromGpuBuffer(r,{dataType:e,dims:t[1],download:n,dispose:a})}default:throw new Error(`invalid data location: ${t[3]}`)}},rg=class{async fetchModelAndCopyToWasmMemory(t){return Xm(await Ni(t))}async loadModel(t,e){nr();let r;typeof t=="string"?typeof process<"u"&&process.versions&&process.versions.node?r=await Ni(t):r=await this.fetchModelAndCopyToWasmMemory(t):r=t,[this.sessionId,this.inputNames,this.outputNames]=await Qm(r,e),Lt()}async dispose(){return Jm(this.sessionId)}async run(t,e,r){nr();let n=[],a=[];Object.entries(t).forEach(f=>{let m=f[0],c=f[1],y=this.inputNames.indexOf(m);if(y===-1)throw new Error(`invalid input '${m}'`);n.push(c),a.push(y)});let i=[],s=[];Object.entries(e).forEach(f=>{let m=f[0],c=f[1],y=this.outputNames.indexOf(m);if(y===-1)throw new Error(`invalid output '${m}'`);i.push(c),s.push(y)});let o=n.map((f,m)=>to(f,()=>`input "${this.inputNames[a[m]]}"`)),u=i.map((f,m)=>f?to(f,()=>`output "${this.outputNames[s[m]]}"`):null),l=await Zm(this.sessionId,a,o,s,u,r),p={};for(let f=0;f{ar(),tg(),Fy(),Zc=()=>{if((typeof Ue.wasm.initTimeout!="number"||Ue.wasm.initTimeout<0)&&(Ue.wasm.initTimeout=0),typeof Ue.wasm.simd!="boolean"&&(Ue.wasm.simd=!0),typeof Ue.wasm.proxy!="boolean"&&(Ue.wasm.proxy=!1),typeof Ue.wasm.trace!="boolean"&&(Ue.wasm.trace=!1),typeof Ue.wasm.numThreads!="number"||!Number.isInteger(Ue.wasm.numThreads)||Ue.wasm.numThreads<=0){(typeof self<"u"&&!self.crossOriginIsolated||typeof process<"u"&&process.versions&&process.versions.node)&&(Ue.wasm.numThreads=1);let t=typeof navigator>"u"?(void 0)().length:navigator.hardwareConcurrency;Ue.wasm.numThreads=Math.min(4,Math.ceil((t||1)/2))}},ng=class{async init(t){Zc(),await Km(),await Ym(t)}async createInferenceSessionHandler(t,e){let r=new rg;return await r.loadModel(t,e),Promise.resolve(r)}}}),ag={};Mn(ag,{wasmBackend:()=>ig});var ig,Uy=Z(()=>{Ly(),ig=new ng});ar();ar();ar();var Wy="1.18.0",Vy=Qp;{let t=(Uy(),Jr(ag)).wasmBackend;Xr("webgpu",t,5),Xr("webnn",t,5),Xr("cpu",t,10),Xr("wasm",t,10)}Object.defineProperty(Ue.versions,"web",{value:Wy,enumerable:!0});/** -* @license -* Copyright 2021 Google LLC. All Rights Reserved. -* Licensed under the Apache License, Version 2.0 (the "License"); -* you may not use this file except in compliance with the License. -* You may obtain a copy of the License at -* -* http://www.apache.org/licenses/LICENSE-2.0 -* -* Unless required by applicable law or agreed to in writing, software -* distributed under the License is distributed on an "AS IS" BASIS, -* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -* See the License for the specific language governing permissions and -* limitations under the License. -* ============================================================================= -*//** - * @license - * Copyright 2020 Google LLC. All Rights Reserved. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - * ============================================================================= - *//** - * @license - * Copyright 2019 Google LLC. All Rights Reserved. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - * ============================================================================= - */const Gy=Object.freeze(Object.defineProperty({__proto__:null,get InferenceSession(){return No},get TRACE(){return ma},get TRACE_FUNC_BEGIN(){return nr},get TRACE_FUNC_END(){return Lt},get Tensor(){return bt},get TrainingSession(){return Fo},default:Vy,get env(){return Ue},get registerBackend(){return Xr}},Symbol.toStringTag,{value:"Module"})),Hy=(t,e)=>{const r=typeof document<"u"?document.createElement("canvas"):new OffscreenCanvas(1,1);r.width=t.dims[3],r.height=t.dims[2];const n=r.getContext("2d");if(n!=null){let a,i;e?.tensorLayout!==void 0&&e.tensorLayout==="NHWC"?(a=t.dims[2],i=t.dims[3]):(a=t.dims[3],i=t.dims[2]);const s=e?.format!==void 0?e.format:"RGB",o=e?.norm;let u,l;o===void 0||o.mean===void 0?u=[255,255,255,255]:typeof o.mean=="number"?u=[o.mean,o.mean,o.mean,o.mean]:(u=[o.mean[0],o.mean[1],o.mean[2],0],o.mean[3]!==void 0&&(u[3]=o.mean[3])),o===void 0||o.bias===void 0?l=[0,0,0,0]:typeof o.bias=="number"?l=[o.bias,o.bias,o.bias,o.bias]:(l=[o.bias[0],o.bias[1],o.bias[2],0],o.bias[3]!==void 0&&(l[3]=o.bias[3]));const p=i*a;let f=0,m=p,c=p*2,y=-1;s==="RGBA"?(f=0,m=p,c=p*2,y=p*3):s==="RGB"?(f=0,m=p,c=p*2):s==="RBG"&&(f=0,c=p,m=p*2);for(let w=0;w{const r=typeof document<"u"?document.createElement("canvas").getContext("2d"):new OffscreenCanvas(1,1).getContext("2d");let n;if(r!=null){let a,i,s;e?.tensorLayout!==void 0&&e.tensorLayout==="NHWC"?(a=t.dims[2],i=t.dims[1],s=t.dims[3]):(a=t.dims[3],i=t.dims[2],s=t.dims[1]);const o=e!==void 0&&e.format!==void 0?e.format:"RGB",u=e?.norm;let l,p;u===void 0||u.mean===void 0?l=[255,255,255,255]:typeof u.mean=="number"?l=[u.mean,u.mean,u.mean,u.mean]:(l=[u.mean[0],u.mean[1],u.mean[2],255],u.mean[3]!==void 0&&(l[3]=u.mean[3])),u===void 0||u.bias===void 0?p=[0,0,0,0]:typeof u.bias=="number"?p=[u.bias,u.bias,u.bias,u.bias]:(p=[u.bias[0],u.bias[1],u.bias[2],0],u.bias[3]!==void 0&&(p[3]=u.bias[3]));const f=i*a;if(e!==void 0&&(e.format!==void 0&&s===4&&e.format!=="RGBA"||s===3&&e.format!=="RGB"&&e.format!=="BGR"))throw new Error("Tensor format doesn't match input tensor dims");const m=4;let c=0,y=1,w=2,v=3,k=0,$=f,C=f*2,T=-1;o==="RGBA"?(k=0,$=f,C=f*2,T=f*3):o==="RGB"?(k=0,$=f,C=f*2):o==="RBG"&&(k=0,C=f,$=f*2),n=r.createImageData(a,i);for(let A=0;A{if(t===void 0)throw new Error("Image buffer must be defined");if(e.height===void 0||e.width===void 0)throw new Error("Image height and width must be defined");if(e.tensorLayout==="NHWC")throw new Error("NHWC Tensor layout is not supported yet");const{height:r,width:n}=e,a=e.norm??{mean:255,bias:0};let i,s;typeof a.mean=="number"?i=[a.mean,a.mean,a.mean,a.mean]:i=[a.mean[0],a.mean[1],a.mean[2],a.mean[3]??255],typeof a.bias=="number"?s=[a.bias,a.bias,a.bias,a.bias]:s=[a.bias[0],a.bias[1],a.bias[2],a.bias[3]??0];const o=e.format!==void 0?e.format:"RGBA",u=e.tensorFormat!==void 0&&e.tensorFormat!==void 0?e.tensorFormat:"RGB",l=r*n,p=u==="RGBA"?new Float32Array(l*4):new Float32Array(l*3);let f=4,m=0,c=1,y=2,w=3,v=0,k=l,$=l*2,C=-1;o==="RGB"&&(f=3,m=0,c=1,y=2,w=-1),u==="RGBA"?C=l*3:u==="RBG"?(v=0,$=l,k=l*2):u==="BGR"&&($=0,k=l,v=l*2);for(let A=0;A{const r=typeof HTMLImageElement<"u"&&t instanceof HTMLImageElement,n=typeof ImageData<"u"&&t instanceof ImageData,a=typeof ImageBitmap<"u"&&t instanceof ImageBitmap,i=typeof t=="string";let s,o=e??{};const u=()=>{if(typeof document<"u")return document.createElement("canvas");if(typeof OffscreenCanvas<"u")return new OffscreenCanvas(1,1);throw new Error("Canvas is not supported")},l=p=>p instanceof HTMLCanvasElement||p instanceof OffscreenCanvas?p.getContext("2d"):null;if(r){const p=u();p.width=t.width,p.height=t.height;const f=l(p);if(f!=null){let m=t.height,c=t.width;if(e!==void 0&&e.resizedHeight!==void 0&&e.resizedWidth!==void 0&&(m=e.resizedHeight,c=e.resizedWidth),e!==void 0){if(o=e,e.tensorFormat!==void 0)throw new Error("Image input config format must be RGBA for HTMLImageElement");o.tensorFormat="RGBA",o.height=m,o.width=c}else o.tensorFormat="RGBA",o.height=m,o.width=c;f.drawImage(t,0,0),s=f.getImageData(0,0,c,m).data}else throw new Error("Can not access image data")}else if(n){let p,f;if(e!==void 0&&e.resizedWidth!==void 0&&e.resizedHeight!==void 0?(p=e.resizedHeight,f=e.resizedWidth):(p=t.height,f=t.width),e!==void 0&&(o=e),o.format="RGBA",o.height=p,o.width=f,e!==void 0){const m=u();m.width=f,m.height=p;const c=l(m);if(c!=null)c.putImageData(t,0,0),s=c.getImageData(0,0,f,p).data;else throw new Error("Can not access image data")}else s=t.data}else if(a){if(e===void 0)throw new Error("Please provide image config with format for Imagebitmap");const p=u();p.width=t.width,p.height=t.height;const f=l(p);if(f!=null){const m=t.height,c=t.width;return f.drawImage(t,0,0,c,m),s=f.getImageData(0,0,c,m).data,o.height=m,o.width=c,ro(s,o)}else throw new Error("Can not access image data")}else{if(i)return new Promise((p,f)=>{const m=u(),c=l(m);if(!t||!c)return f();const y=new Image;y.crossOrigin="Anonymous",y.src=t,y.onload=()=>{m.width=y.width,m.height=y.height,c.drawImage(y,0,0,m.width,m.height);const w=c.getImageData(0,0,m.width,m.height);o.height=m.height,o.width=m.width,p(ro(w.data,o))}});throw new Error("Input data provided is not supported - aborted tensor creation")}if(s!==void 0)return ro(s,o);throw new Error("Input data provided is not supported - aborted tensor creation")},Ky=(t,e)=>{const{width:r,height:n,download:a,dispose:i}=e,s=[1,n,r,4];return new lr({location:"texture",type:"float32",texture:t,dims:s,download:a,dispose:i})},Yy=(t,e)=>{const{dataType:r,dims:n,download:a,dispose:i}=e;return new lr({location:"gpu-buffer",type:r??"float32",gpuBuffer:t,dims:n,download:a,dispose:i})},Xy=(t,e,r)=>new lr({location:"cpu-pinned",type:t,data:e,dims:r??[e.length]}),kn=new Map([["float32",Float32Array],["uint8",Uint8Array],["int8",Int8Array],["uint16",Uint16Array],["int16",Int16Array],["int32",Int32Array],["bool",Uint8Array],["float64",Float64Array],["uint32",Uint32Array]]),Ai=new Map([[Float32Array,"float32"],[Uint8Array,"uint8"],[Int8Array,"int8"],[Uint16Array,"uint16"],[Int16Array,"int16"],[Int32Array,"int32"],[Float64Array,"float64"],[Uint32Array,"uint32"]]);let ep=!1;const Qy=()=>{if(!ep){ep=!0;const t=typeof BigInt64Array<"u"&&BigInt64Array.from,e=typeof BigUint64Array<"u"&&BigUint64Array.from,r=typeof Float16Array<"u"&&Float16Array.from;t&&(kn.set("int64",BigInt64Array),Ai.set(BigInt64Array,"int64")),e&&(kn.set("uint64",BigUint64Array),Ai.set(BigUint64Array,"uint64")),r?(kn.set("float16",Float16Array),Ai.set(Float16Array,"float16")):kn.set("float16",Uint16Array)}},Jy=t=>{let e=1;for(let r=0;r{switch(t.location){case"cpu":return new lr(t.type,t.data,e);case"cpu-pinned":return new lr({location:"cpu-pinned",data:t.data,type:t.type,dims:e});case"texture":return new lr({location:"texture",texture:t.texture,type:t.type,dims:e});case"gpu-buffer":return new lr({location:"gpu-buffer",gpuBuffer:t.gpuBuffer,type:t.type,dims:e});default:throw new Error(`tensorReshape: tensor location ${t.location} is not supported`)}};let lr=class{constructor(e,r,n){Qy();let a,i;if(typeof e=="object"&&"location"in e)switch(this.dataLocation=e.location,a=e.type,i=e.dims,e.location){case"cpu-pinned":{const o=kn.get(a);if(!o)throw new TypeError(`unsupported type "${a}" to create tensor from pinned buffer`);if(!(e.data instanceof o))throw new TypeError(`buffer should be of type ${o.name}`);this.cpuData=e.data;break}case"texture":{if(a!=="float32")throw new TypeError(`unsupported type "${a}" to create tensor from texture`);this.gpuTextureData=e.texture,this.downloader=e.download,this.disposer=e.dispose;break}case"gpu-buffer":{if(a!=="float32"&&a!=="float16"&&a!=="int32"&&a!=="int64"&&a!=="uint32"&&a!=="uint8"&&a!=="bool")throw new TypeError(`unsupported type "${a}" to create tensor from gpu buffer`);this.gpuBufferData=e.gpuBuffer,this.downloader=e.download,this.disposer=e.dispose;break}default:throw new Error(`Tensor constructor: unsupported location '${this.dataLocation}'`)}else{let o,u;if(typeof e=="string")if(a=e,u=n,e==="string"){if(!Array.isArray(r))throw new TypeError("A string tensor's data must be a string array.");o=r}else{const l=kn.get(e);if(l===void 0)throw new TypeError(`Unsupported tensor type: ${e}.`);if(Array.isArray(r)){if(e==="float16"&&l===Uint16Array)throw new TypeError("Creating a float16 tensor from number array is not supported. Please use Uint16Array as data.");e==="uint64"||e==="int64"?o=l.from(r,BigInt):o=l.from(r)}else if(r instanceof l)o=r;else throw new TypeError(`A ${a} tensor's data must be type of ${l}`)}else if(u=r,Array.isArray(e)){if(e.length===0)throw new TypeError("Tensor type cannot be inferred from an empty array.");const l=typeof e[0];if(l==="string")a="string",o=e;else if(l==="boolean")a="bool",o=Uint8Array.from(e);else throw new TypeError(`Invalid element type of data array: ${l}.`)}else{const l=Ai.get(e.constructor);if(l===void 0)throw new TypeError(`Unsupported type for tensor data: ${e.constructor}.`);a=l,o=e}if(u===void 0)u=[o.length];else if(!Array.isArray(u))throw new TypeError("A tensor's dims must be a number array");i=u,this.cpuData=o,this.dataLocation="cpu"}const s=Jy(i);if(this.cpuData&&s!==this.cpuData.length)throw new Error(`Tensor's size(${s}) does not match data length(${this.cpuData.length}).`);this.type=a,this.dims=i,this.size=s}static async fromImage(e,r){return qy(e,r)}static fromTexture(e,r){return Ky(e,r)}static fromGpuBuffer(e,r){return Yy(e,r)}static fromPinnedBuffer(e,r,n){return Xy(e,r,n)}toDataURL(e){return Hy(this,e)}toImageData(e){return jy(this,e)}get data(){if(this.ensureValid(),!this.cpuData)throw new Error("The data is not on CPU. Use `getData()` to download GPU data to CPU, or use `texture` or `gpuBuffer` property to access the GPU data directly.");return this.cpuData}get location(){return this.dataLocation}get texture(){if(this.ensureValid(),!this.gpuTextureData)throw new Error("The data is not stored as a WebGL texture.");return this.gpuTextureData}get gpuBuffer(){if(this.ensureValid(),!this.gpuBufferData)throw new Error("The data is not stored as a WebGPU buffer.");return this.gpuBufferData}async getData(e){switch(this.ensureValid(),this.dataLocation){case"cpu":case"cpu-pinned":return this.data;case"texture":case"gpu-buffer":{if(!this.downloader)throw new Error("The current tensor is not created with a specified data downloader.");if(this.isDownloading)throw new Error("The current tensor is being downloaded.");try{this.isDownloading=!0;const r=await this.downloader();return this.downloader=void 0,this.dataLocation="cpu",this.cpuData=r,e&&this.disposer&&(this.disposer(),this.disposer=void 0),r}finally{this.isDownloading=!1}}default:throw new Error(`cannot get data from location: ${this.dataLocation}`)}}dispose(){if(this.isDownloading)throw new Error("The current tensor is being downloaded.");this.disposer&&(this.disposer(),this.disposer=void 0),this.cpuData=void 0,this.gpuTextureData=void 0,this.gpuBufferData=void 0,this.downloader=void 0,this.isDownloading=void 0,this.dataLocation="none"}ensureValid(){if(this.dataLocation==="none")throw new Error("The tensor is disposed.")}reshape(e){if(this.ensureValid(),this.downloader||this.disposer)throw new Error("Cannot reshape a tensor that owns GPU resource.");return Zy(this,e)}};const ew=lr,ca=[];let Co,ya;Zr.IS_NODE_ENV?(ya=Ze??n_,ca.push("cpu"),Co=["cpu"]):(ya=Gy,Zr.IS_WEBGPU_AVAILABLE&&ca.push("webgpu"),ca.push("wasm"),Co=["wasm"]);const tw=ya.InferenceSession;function rw(t){let e=Co;if(t){if(!ca.includes(t))throw new Error(`Unsupported device: "${t}". Should be one of: ${ca.join(", ")}.`);e=[t]}return e}async function sg(t,e){return await tw.create(t,e)}function og(t){return t instanceof ya.Tensor}const Yr=ya?.env;Yr?.wasm&&(Yr.wasm.wasmPaths="https://cdn.jsdelivr.net/npm/onnxruntime-web@1.18.0/dist/",Yr.wasm.proxy=!Zr.IS_WEBWORKER_ENV,(typeof crossOriginIsolated>"u"||!crossOriginIsolated)&&(Yr.wasm.numThreads=1),typeof navigator<"u"&&/iP(hone|od|ad).+16_4.+AppleWebKit/.test(navigator.userAgent)&&(Yr.wasm.simd=!1));function nw(){return Yr?.wasm?.proxy}Ct.backends.onnx=Yr;const no=async(t,e,r)=>{const n=await sg(t,e);return async a=>{const i=Object.fromEntries(Object.entries(a).map(([o,u])=>[o,u.ort_tensor])),s=await n.run(i);return new pe(s[r])}};class tp{static session_options={};static get bilinear_interpolate_4d(){return this._bilinear_interpolate_4d||(this._bilinear_interpolate_4d=no(new Uint8Array([8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20]),this.session_options,"y")),this._bilinear_interpolate_4d}static get bicubic_interpolate_4d(){return this._bicubic_interpolate_4d||(this._bicubic_interpolate_4d=no(new Uint8Array([8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20]),this.session_options,"y")),this._bicubic_interpolate_4d}static get matmul(){return this._matmul||(this._matmul=no(new Uint8Array([8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20]),this.session_options,"c")),this._matmul}}const rp=Object.freeze({float32:Float32Array,float16:Uint16Array,float64:Float64Array,string:Array,int8:Int8Array,uint8:Uint8Array,int16:Int16Array,uint16:Uint16Array,int32:Int32Array,uint32:Uint32Array,int64:BigInt64Array,uint64:BigUint64Array,bool:Uint8Array});class pe{get dims(){return this.ort_tensor.dims}set dims(e){this.ort_tensor.dims=e}get type(){return this.ort_tensor.type}get data(){return this.ort_tensor.data}get size(){return this.ort_tensor.size}get location(){return this.ort_tensor.location}ort_tensor;constructor(...e){return og(e[0])?this.ort_tensor=e[0]:this.ort_tensor=new ew(e[0],e[1],e[2]),new Proxy(this,{get:(r,n)=>{if(typeof n=="string"){let a=Number(n);if(Number.isInteger(a))return r._getitem(a)}return r[n]},set:(r,n,a)=>r[n]=a})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){const[e,...r]=this.dims;if(r.length>0){const n=r.reduce((a,i)=>a*i);for(let a=0;a0){const a=n.reduce((i,s)=>i*s);return this._subarray(e,a,n)}else return new pe(this.type,[this.data[e]],n)}indexOf(e){const r=this.data;for(let n=0;nm)throw new Error(`Invalid slice: ${p}`);let c=[Math.max(f,0),Math.min(m,this.dims[l])];n.push(c),r.push(c[1]-c[0])}else throw new Error(`Invalid slice: ${p}`)}let a=n.map(([l,p])=>p-l),i=a.reduce((l,p)=>l*p);const s=this.data;let o=new s.constructor(i);const u=this.stride();for(let l=0;l=0;--f){const c=a[f];p+=(m%c+n[f][0])*u[f],m=Math.floor(m/c)}o[l]=s[p]}return new pe(this.type,o,r)}permute(...e){return iw(this,e)}transpose(...e){return this.permute(...e)}sum(e=null,r=!1){return this.norm(1,e,r)}norm(e="fro",r=null,n=!1){if(e==="fro")e=2;else if(typeof e=="string")throw Error(`Unsupported norm: ${e}`);const a=this.data;if(r===null){let o=a.reduce((u,l)=>u+l**e,0)**(1/e);return new pe(this.type,[o],[])}r=ur(r,this.dims.length);const i=this.dims.slice();i[r]=1;const s=new a.constructor(a.length/this.dims[r]);for(let o=0;o=0;--l){const m=this.dims[l];if(l!==r){const c=p%m;u+=c*f,f*=i[l]}p=Math.floor(p/m)}s[u]+=a[o]**e}if(e!==1)for(let o=0;o=0;--o){const p=this.dims[o];if(o!==r){const f=u%p;s+=f*l,l*=this.dims[o]}u=Math.floor(u/p)}a[i]/=n.data[s]}return this}normalize(e=2,r=1){return this.clone().normalize_(e,r)}stride(){return uw(this.dims)}squeeze(e=null){return new pe(this.type,this.data,ip(this.dims,e))}squeeze_(e=null){return this.dims=ip(this.dims,e),this}unsqueeze(e=null){return new pe(this.type,this.data,sp(this.dims,e))}unsqueeze_(e=null){return this.dims=sp(this.dims,e),this}flatten_(e=0,r=-1){r=(r+this.dims.length)%this.dims.length;let n=this.dims.slice(0,e),a=this.dims.slice(e,r+1),i=this.dims.slice(r+1);return this.dims=[...n,a.reduce((s,o)=>s*o,1),...i],this}flatten(e=0,r=-1){return this.clone().flatten_(e,r)}view(...e){let r=-1;for(let n=0;ns!==r?a*i:a,1);e[r]=this.data.length/n}return new pe(this.type,this.data,e)}neg_(){const e=this.data;for(let r=0;ri*s);if(r!==n)throw Error(`cannot reshape array of size ${r} into shape (${e})`);let a=t;for(let i=e.length-1;i>=0;i--)a=a.reduce((s,o)=>{let u=s[s.length-1];return u.lengthr!==1):typeof e=="number"?t[e]===1&&t.splice(e,1):Array.isArray(e)&&(t=t.filter((r,n)=>r!==1||!e.includes(n))),t}function sp(t,e){return e=ur(e,t.length+1),t=t.slice(),t.splice(e,0,1),t}function ur(t,e,r=null,n=!0){if(n&&(t<-e||t>=e))throw new Error(`IndexError: index ${t} is out of bounds for dimension${r===null?"":" "+r} with size ${e}`);return t<0&&(t=(t%e+e)%e),t}function dr(t,e=0){e=ur(e,t[0].dims.length);const r=t[0].dims.slice();r[e]=t.reduce((s,o)=>s+o.dims[e],0);const n=r.reduce((s,o)=>s*o,1),a=new t[0].data.constructor(n),i=t[0].type;if(e===0){let s=0;for(let o of t)a.set(o.data,s),s+=o.data.length}else{let s=0;for(let o=0;o=0;--f){const y=u.dims[f];let w=m%y;f===e&&(w+=s),p+=w*c,c*=r[f],m=Math.floor(m/y)}a[p]=u.data[l]}s+=u.dims[e]}}return new pe(i,a,r)}function wa(t,e=0){return dr(t.map(r=>r.unsqueeze(e)),e)}function lg(t,e=null,r=1,n=!1){if(e===null){const l=t.data.reduce((c,y)=>c+y,0)/t.data.length,p=Math.sqrt(t.data.reduce((c,y)=>c+(y-l)**2,0)/(t.data.length-r)),f=new pe(t.type,[l],[]);return[new pe(t.type,[p],[]),f]}e=ur(e,t.dims.length);const a=ru(t,e,n),i=t.dims.slice();i[e]=1;const s=new t.data.constructor(t.data.length/t.dims[e]);for(let u=0;u=0;--p){const c=t.dims[p];if(p!==e){const y=f%c;l+=y*m,m*=i[p]}f=Math.floor(f/c)}s[l]+=(t.data[u]-a.data[l])**2}for(let u=0;us+o,0);return new pe(t.type,[i/t.data.length],[])}e=ur(e,t.dims.length);const n=t.dims.slice();n[e]=1;const a=new t.data.constructor(t.data.length/t.dims[e]);for(let i=0;i=0;--o){const p=t.dims[o];if(o!==e){const f=u%p;s+=f*l,l*=n[o]}u=Math.floor(u/p)}a[s]+=t.data[i]}if(t.dims[e]!==1)for(let i=0;i0||o>0;)switch(u.push(s-1),l.push(o-1),i[s][o].item()){case 0:--s,--o;break;case 1:--s;break;case 2:--o;break;default:throw new Error(`Internal error in dynamic time warping. Unexpected trace[${s}, ${o}]. Please file a bug report.`)}return u.reverse(),l.reverse(),[u,l]}function uw(t){const e=new Array(t.length);for(let r=t.length-1,n=1;r>=0;--r)e[r]=n,n*=t[r];return e}function nu(t,e,r,n){const a=t.reduce((i,s)=>i*s,1);return new pe(r,new n(a).fill(e),t)}function lw(t,e){let r,n;return r="float32",n=Float32Array,nu(t,e,r,n)}function dw(t,e){return lw(t.dims,e)}function On(t){return nu(t,1n,"int64",BigInt64Array)}function cw(t){return On(t.dims)}function pw(t){return nu(t,0n,"int64",BigInt64Array)}function hw(t){return pw(t.dims)}class fw{constructor(e=(r,n)=>r>n){this._heap=[],this._comparator=e}get size(){return this._heap.length}isEmpty(){return this.size===0}peek(){return this._heap[0]}push(...e){return this.extend(e)}extend(e){for(const r of e)this._heap.push(r),this._siftUp();return this.size}pop(){const e=this.peek(),r=this.size-1;return r>0&&this._swap(0,r),this._heap.pop(),this._siftDown(),e}replace(e){const r=this.peek();return this._heap[0]=e,this._siftDown(),r}_parent(e){return(e+1>>>1)-1}_left(e){return(e<<1)+1}_right(e){return e+1<<1}_greater(e,r){return this._comparator(this._heap[e],this._heap[r])}_swap(e,r){const n=this._heap[e];this._heap[e]=this._heap[r],this._heap[r]=n}_siftUp(){let e=this.size-1;for(;e>0&&this._greater(e,this._parent(e));)this._swap(e,this._parent(e)),e=this._parent(e)}_siftDown(){let e=0;for(;this._left(e)[]),this.endNodes=Array.from({length:this.len+1},()=>[]);const a=new pa(this.bosTokenId,0,0,0,0),i=new pa(this.eosTokenId,1,this.len,0,0);this.nodes.push(a.clone()),this.nodes.push(i.clone()),this.beginNodes[this.len].push(i),this.endNodes[0].push(a)}insert(e,r,n,a){const i=this.nodes.length,s=new pa(a,i,e,r,n);this.beginNodes[e].push(s),this.endNodes[e+r].push(s),this.nodes.push(s)}viterbi(){const e=this.len;let r=0;for(;r<=e;){if(this.beginNodes[r].length==0)return[];for(let o of this.beginNodes[r]){o.prev=null;let u=0,l=null;for(let p of this.endNodes[r]){const f=p.backtraceScore+o.score;(l===null||f>u)&&(l=p.clone(),u=f)}if(l!==null)o.prev=l,o.backtraceScore=u;else return[]}++r}const n=[],i=this.beginNodes[e][0].prev;if(i===null)return[];let s=i.clone();for(;s.prev!==null;)n.push(s.clone()),s=s.clone().prev.clone();return n.reverse(),n}piece(e){return this.sentence.slice(e.pos,e.pos+e.length)}tokens(){return this.viterbi().map(r=>this.piece(r))}tokenIds(){return this.viterbi().map(r=>r.tokenId)}}class pa{constructor(e,r,n,a,i){this.tokenId=e,this.nodeId=r,this.pos=n,this.length=a,this.score=i,this.prev=null,this.backtraceScore=0}clone(){const e=new pa(this.tokenId,this.nodeId,this.pos,this.length,this.score);return e.prev=this.prev,e.backtraceScore=this.backtraceScore,e}}var W=Object.freeze({Text:"Text",NumericLiteral:"NumericLiteral",BooleanLiteral:"BooleanLiteral",StringLiteral:"StringLiteral",Identifier:"Identifier",Equals:"Equals",OpenParen:"OpenParen",CloseParen:"CloseParen",OpenStatement:"OpenStatement",CloseStatement:"CloseStatement",OpenExpression:"OpenExpression",CloseExpression:"CloseExpression",OpenSquareBracket:"OpenSquareBracket",CloseSquareBracket:"CloseSquareBracket",OpenCurlyBracket:"OpenCurlyBracket",CloseCurlyBracket:"CloseCurlyBracket",Comma:"Comma",Dot:"Dot",Colon:"Colon",Pipe:"Pipe",CallOperator:"CallOperator",AdditiveBinaryOperator:"AdditiveBinaryOperator",MultiplicativeBinaryOperator:"MultiplicativeBinaryOperator",ComparisonBinaryOperator:"ComparisonBinaryOperator",UnaryOperator:"UnaryOperator",Set:"Set",If:"If",For:"For",In:"In",Is:"Is",NotIn:"NotIn",Else:"Else",EndIf:"EndIf",ElseIf:"ElseIf",EndFor:"EndFor",And:"And",Or:"Or",Not:"UnaryOperator"}),op=Object.freeze({set:W.Set,for:W.For,in:W.In,is:W.Is,if:W.If,else:W.Else,endif:W.EndIf,elif:W.ElseIf,endfor:W.EndFor,and:W.And,or:W.Or,not:W.Not,"not in":W.NotIn,true:W.BooleanLiteral,false:W.BooleanLiteral}),Vr=class{constructor(t,e){this.value=t,this.type=e}};function up(t){return/\w/.test(t)}function ao(t){return/[0-9]/.test(t)}var _w=[["{%",W.OpenStatement],["%}",W.CloseStatement],["{{",W.OpenExpression],["}}",W.CloseExpression],["(",W.OpenParen],[")",W.CloseParen],["{",W.OpenCurlyBracket],["}",W.CloseCurlyBracket],["[",W.OpenSquareBracket],["]",W.CloseSquareBracket],[",",W.Comma],[".",W.Dot],[":",W.Colon],["|",W.Pipe],["<=",W.ComparisonBinaryOperator],[">=",W.ComparisonBinaryOperator],["==",W.ComparisonBinaryOperator],["!=",W.ComparisonBinaryOperator],["<",W.ComparisonBinaryOperator],[">",W.ComparisonBinaryOperator],["+",W.AdditiveBinaryOperator],["-",W.AdditiveBinaryOperator],["*",W.MultiplicativeBinaryOperator],["/",W.MultiplicativeBinaryOperator],["%",W.MultiplicativeBinaryOperator],["=",W.Equals]],yw=new Map([["n",` -`],["t"," "],["r","\r"],["b","\b"],["f","\f"],["v","\v"],["'","'"],['"','"'],["\\","\\"]]);function ww(t,e={}){return t.endsWith(` -`)&&(t=t.slice(0,-1)),t=t.replace(/{#.*?#}/gs,"{##}"),e.lstrip_blocks&&(t=t.replace(/^[ \t]*({[#%])/gm,"$1")),e.trim_blocks&&(t=t.replace(/([#%]})\n/g,"$1")),t.replace(/{##}/g,"").replace(/-%}\s*/g,"%}").replace(/\s*{%-/g,"{%").replace(/-}}\s*/g,"}}").replace(/\s*{{-/g,"{{")}function bw(t,e={}){const r=[],n=ww(t,e);let a=0;const i=s=>{let o="";for(;s(n[a]);){if(n[a]==="\\"){if(++a,a>=n.length)throw new SyntaxError("Unexpected end of input");const u=n[a++],l=yw.get(u);if(l===void 0)throw new SyntaxError(`Unexpected escaped character: ${u}`);o+=l;continue}if(o+=n[a++],a>=n.length)throw new SyntaxError("Unexpected end of input")}return o};e:for(;a0){r.push(new Vr(u,W.Text));continue}}i(u=>/\s/.test(u));const o=n[a];if(o==="-"||o==="+"){const u=r.at(-1)?.type;if(u===W.Text||u===void 0)throw new SyntaxError(`Unexpected character: ${o}`);switch(u){case W.Identifier:case W.NumericLiteral:case W.BooleanLiteral:case W.StringLiteral:case W.CloseParen:case W.CloseSquareBracket:break;default:{++a;const l=i(ao);r.push(new Vr(`${o}${l}`,l.length>0?W.NumericLiteral:W.UnaryOperator));continue}}}for(const[u,l]of _w)if(n.slice(a,a+u.length)===u){r.push(new Vr(u,l)),a+=u.length;continue e}if(o==="'"||o==='"'){++a;const u=i(l=>l!==o);r.push(new Vr(u,W.StringLiteral)),++a;continue}if(ao(o)){const u=i(ao);r.push(new Vr(u,W.NumericLiteral));continue}if(up(o)){const u=i(up),l=Object.hasOwn(op,u)?op[u]:W.Identifier;l===W.In&&r.at(-1)?.type===W.Not?(r.pop(),r.push(new Vr("not in",W.NotIn))):r.push(new Vr(u,l));continue}throw new SyntaxError(`Unexpected character: ${o}`)}return r}var ka=class{type="Statement"},vw=class extends ka{constructor(t){super(),this.body=t}type="Program"},lp=class extends ka{constructor(t,e,r){super(),this.test=t,this.body=e,this.alternate=r}type="If"},$w=class extends ka{constructor(t,e,r){super(),this.loopvar=t,this.iterable=e,this.body=r}type="For"},xw=class extends ka{constructor(t,e){super(),this.assignee=t,this.value=e}type="Set"},cr=class extends ka{type="Expression"},Sw=class extends cr{constructor(t,e,r){super(),this.object=t,this.property=e,this.computed=r}type="MemberExpression"},kw=class extends cr{constructor(t,e){super(),this.callee=t,this.args=e}type="CallExpression"},$n=class extends cr{constructor(t){super(),this.value=t}type="Identifier"},zn=class extends cr{constructor(t){super(),this.value=t}type="Literal"},Ew=class extends zn{type="NumericLiteral"},dp=class extends zn{type="StringLiteral"},cp=class extends zn{type="BooleanLiteral"},Cw=class extends zn{type="ArrayLiteral"},pp=class extends zn{type="TupleLiteral"},Tw=class extends zn{type="ObjectLiteral"},oa=class extends cr{constructor(t,e,r){super(),this.operator=t,this.left=e,this.right=r}type="BinaryExpression"},Iw=class extends cr{constructor(t,e){super(),this.operand=t,this.filter=e}type="FilterExpression"},Aw=class extends cr{constructor(t,e,r){super(),this.operand=t,this.negate=e,this.test=r}type="TestExpression"},Mw=class extends cr{constructor(t,e){super(),this.operator=t,this.argument=e}type="UnaryExpression"},Ow=class extends cr{constructor(t=void 0,e=void 0,r=void 0){super(),this.start=t,this.stop=e,this.step=r}type="SliceExpression"},zw=class extends cr{constructor(t,e){super(),this.key=t,this.value=e}type="KeywordArgumentExpression"};function Pw(t){const e=new vw([]);let r=0;function n(M,P){const H=t[r++];if(!H||H.type!==M)throw new Error(`Parser Error: ${P}. ${H.type} !== ${M}.`);return H}function a(){switch(t[r].type){case W.Text:return o();case W.OpenStatement:return u();case W.OpenExpression:return l();default:throw new SyntaxError(`Unexpected token type: ${t[r].type}`)}}function i(...M){return r+M.length<=t.length&&M.some((P,H)=>P!==t[r+H].type)}function s(...M){return r+M.length<=t.length&&M.every((P,H)=>P===t[r+H].type)}function o(){return new dp(n(W.Text,"Expected text token").value)}function u(){n(W.OpenStatement,"Expected opening statement token");let M;switch(t[r].type){case W.Set:++r,M=p(),n(W.CloseStatement,"Expected closing statement token");break;case W.If:++r,M=f(),n(W.OpenStatement,"Expected {% token"),n(W.EndIf,"Expected endif token"),n(W.CloseStatement,"Expected %} token");break;case W.For:++r,M=c(),n(W.OpenStatement,"Expected {% token"),n(W.EndFor,"Expected endfor token"),n(W.CloseStatement,"Expected %} token");break;default:throw new SyntaxError(`Unknown statement type: ${t[r].type}`)}return M}function l(){n(W.OpenExpression,"Expected opening expression token");const M=y();return n(W.CloseExpression,"Expected closing expression token"),M}function p(){const M=y();if(s(W.Equals)){++r;const P=p();return new xw(M,P)}return M}function f(){const M=y();n(W.CloseStatement,"Expected closing statement token");const P=[],H=[];for(;!(t[r]?.type===W.OpenStatement&&(t[r+1]?.type===W.ElseIf||t[r+1]?.type===W.Else||t[r+1]?.type===W.EndIf));)P.push(a());if(t[r]?.type===W.OpenStatement&&t[r+1]?.type!==W.EndIf)if(++r,s(W.ElseIf))n(W.ElseIf,"Expected elseif token"),H.push(f());else for(n(W.Else,"Expected else token"),n(W.CloseStatement,"Expected closing statement token");!(t[r]?.type===W.OpenStatement&&t[r+1]?.type===W.EndIf);)H.push(a());return new lp(M,P,H)}function m(M=!1){const P=M?re:y,H=[P()],le=s(W.Comma);for(;le&&(++r,H.push(P()),!!s(W.Comma)););return le?new pp(H):H[0]}function c(){const M=m(!0);if(!(M instanceof $n||M instanceof pp))throw new SyntaxError(`Expected identifier/tuple for the loop variable, got ${M.type} instead`);n(W.In,"Expected `in` keyword following loop variable");const P=y();n(W.CloseStatement,"Expected closing statement token");const H=[];for(;i(W.OpenStatement,W.EndFor);)H.push(a());return new $w(M,P,H)}function y(){return w()}function w(){const M=v();if(s(W.If)){++r;const P=v();n(W.Else,"Expected else token");const H=v();return new lp(P,[M],[H])}return M}function v(){let M=k();for(;s(W.Or);){const P=t[r];++r;const H=k();M=new oa(P,M,H)}return M}function k(){let M=$();for(;s(W.And);){const P=t[r];++r;const H=$();M=new oa(P,M,H)}return M}function $(){let M;for(;s(W.Not);){const P=t[r];++r;const H=$();M=new Mw(P,H)}return M??C()}function C(){let M=T();for(;s(W.ComparisonBinaryOperator)||s(W.In)||s(W.NotIn);){const P=t[r];++r;const H=T();M=new oa(P,M,H)}return M}function T(){let M=ie();for(;s(W.AdditiveBinaryOperator);){const P=t[r];++r;const H=ie();M=new oa(P,M,H)}return M}function A(){const M=j();return s(W.OpenParen)?B(M):M}function B(M){let P=new kw(M,R());return s(W.OpenParen)&&(P=B(P)),P}function R(){n(W.OpenParen,"Expected opening parenthesis for arguments list");const M=D();return n(W.CloseParen,"Expected closing parenthesis for arguments list"),M}function D(){const M=[];for(;!s(W.CloseParen);){let P=y();if(s(W.Equals)){if(++r,!(P instanceof $n))throw new SyntaxError("Expected identifier for keyword argument");const H=y();P=new zw(P,H)}M.push(P),s(W.Comma)&&++r}return M}function K(){const M=[];let P=!1;for(;!s(W.CloseSquareBracket);)s(W.Colon)?(M.push(void 0),++r,P=!0):(M.push(y()),s(W.Colon)&&(++r,P=!0));if(M.length===0)throw new SyntaxError("Expected at least one argument for member/slice expression");if(P){if(M.length>3)throw new SyntaxError("Expected 0-3 arguments for slice expression");return new Ow(...M)}return M[0]}function j(){let M=re();for(;s(W.Dot)||s(W.OpenSquareBracket);){const P=t[r];++r;let H;const le=P.type!==W.Dot;if(le)H=K(),n(W.CloseSquareBracket,"Expected closing square bracket");else if(H=re(),H.type!=="Identifier")throw new SyntaxError("Expected identifier following dot operator");M=new Sw(M,H,le)}return M}function ie(){let M=te();for(;s(W.MultiplicativeBinaryOperator);){const P=t[r];++r;const H=te();M=new oa(P,M,H)}return M}function te(){let M=oe();for(;s(W.Is);){++r;const P=s(W.Not);P&&++r;let H=re();if(H instanceof cp&&(H=new $n(H.value.toString())),!(H instanceof $n))throw new SyntaxError("Expected identifier for the test");M=new Aw(M,P,H)}return M}function oe(){let M=A();for(;s(W.Pipe);){++r;let P=re();if(!(P instanceof $n))throw new SyntaxError("Expected identifier for the filter");s(W.OpenParen)&&(P=B(P)),M=new Iw(M,P)}return M}function re(){const M=t[r];switch(M.type){case W.NumericLiteral:return++r,new Ew(Number(M.value));case W.StringLiteral:return++r,new dp(M.value);case W.BooleanLiteral:return++r,new cp(M.value==="true");case W.Identifier:return++r,new $n(M.value);case W.OpenParen:{++r;const P=m();if(t[r].type!==W.CloseParen)throw new SyntaxError(`Expected closing parenthesis, got ${t[r].type} instead`);return++r,P}case W.OpenSquareBracket:{++r;const P=[];for(;!s(W.CloseSquareBracket);)P.push(y()),s(W.Comma)&&++r;return++r,new Cw(P)}case W.OpenCurlyBracket:{++r;const P=new Map;for(;!s(W.CloseCurlyBracket);){const H=y();n(W.Colon,"Expected colon between key and value in object literal");const le=y();P.set(H,le),s(W.Comma)&&++r}return++r,new Tw(P)}default:throw new SyntaxError(`Unexpected token: ${M.type}`)}}for(;r=0?(e=(e??=0)<0?Math.max(t.length+e,0):Math.min(e,t.length),r=(r??=t.length)<0?Math.max(t.length+r,0):Math.min(r,t.length)):(e=(e??=t.length-1)<0?Math.max(t.length+e,-1):Math.min(e,t.length-1),r=(r??=-1)<-1?Math.max(t.length+r,-1):Math.min(r,t.length-1));const i=[];for(let s=e;a*se.toUpperCase())}var xr=class{type="RuntimeValue";value;builtins=new Map;constructor(t=void 0){this.value=t}__bool__(){return new et(!!this.value)}},He=class extends xr{type="NumericValue"},Pe=class extends xr{type="StringValue";builtins=new Map([["upper",new br(()=>new Pe(this.value.toUpperCase()))],["lower",new br(()=>new Pe(this.value.toLowerCase()))],["strip",new br(()=>new Pe(this.value.trim()))],["title",new br(()=>new Pe(dg(this.value)))],["length",new He(this.value.length)]])},et=class extends xr{type="BooleanValue"},er=class extends xr{type="ObjectValue";__bool__(){return new et(this.value.size>0)}builtins=new Map([["get",new br(([t,e])=>{if(!(t instanceof Pe))throw new Error(`Object key must be a string: got ${t.type}`);return this.value.get(t.value)??e??new ha})],["items",new br(()=>new Je(Array.from(this.value.entries()).map(([t,e])=>new Je([new Pe(t),e]))))]])},Je=class extends xr{type="ArrayValue";builtins=new Map([["length",new He(this.value.length)]]);__bool__(){return new et(this.value.length>0)}},Bw=class extends Je{type="TupleValue"},br=class extends xr{type="FunctionValue"},ha=class extends xr{type="NullValue"},Zt=class extends xr{type="UndefinedValue"},To=class{constructor(t){this.parent=t}variables=new Map([["namespace",new br(t=>{if(t.length===0)return new er(new Map);if(t.length!==1||!(t[0]instanceof er))throw new Error("`namespace` expects either zero arguments or a single object argument");return t[0]})]]);tests=new Map([["boolean",t=>t.type==="BooleanValue"],["callable",t=>t instanceof br],["odd",t=>{if(t.type!=="NumericValue")throw new Error(`Cannot apply test "odd" to type: ${t.type}`);return t.value%2!==0}],["even",t=>{if(t.type!=="NumericValue")throw new Error(`Cannot apply test "even" to type: ${t.type}`);return t.value%2===0}],["false",t=>t.type==="BooleanValue"&&!t.value],["true",t=>t.type==="BooleanValue"&&t.value],["number",t=>t.type==="NumericValue"],["integer",t=>t.type==="NumericValue"&&Number.isInteger(t.value)],["iterable",t=>t instanceof Je||t instanceof Pe],["lower",t=>{const e=t.value;return t.type==="StringValue"&&e===e.toLowerCase()}],["upper",t=>{const e=t.value;return t.type==="StringValue"&&e===e.toUpperCase()}],["none",t=>t.type==="NullValue"],["defined",t=>t.type!=="UndefinedValue"],["undefined",t=>t.type==="UndefinedValue"],["equalto",(t,e)=>t.value===e.value]]);set(t,e){return this.declareVariable(t,Mi(e))}declareVariable(t,e){if(this.variables.has(t))throw new SyntaxError(`Variable already declared: ${t}`);return this.variables.set(t,e),e}setVariable(t,e){return this.variables.set(t,e),e}resolve(t){if(this.variables.has(t))return this;if(this.parent)return this.parent.resolve(t);throw new Error(`Unknown variable: ${t}`)}lookupVariable(t){try{return this.resolve(t).variables.get(t)??new Zt}catch{return new Zt}}},Dw=class{global;constructor(t){this.global=t??new To}run(t){return this.evaluate(t,this.global)}evaluateBinaryExpression(t,e){const r=this.evaluate(t.left,e);switch(t.operator.value){case"and":return r.__bool__().value?this.evaluate(t.right,e):r;case"or":return r.__bool__().value?r:this.evaluate(t.right,e)}const n=this.evaluate(t.right,e);switch(t.operator.value){case"==":return new et(r.value==n.value);case"!=":return new et(r.value!=n.value)}if(r instanceof Zt||n instanceof Zt)throw new Error("Cannot perform operation on undefined values");if(r instanceof ha||n instanceof ha)throw new Error("Cannot perform operation on null values");if(r instanceof He&&n instanceof He)switch(t.operator.value){case"+":return new He(r.value+n.value);case"-":return new He(r.value-n.value);case"*":return new He(r.value*n.value);case"/":return new He(r.value/n.value);case"%":return new He(r.value%n.value);case"<":return new et(r.value":return new et(r.value>n.value);case">=":return new et(r.value>=n.value);case"<=":return new et(r.value<=n.value)}else if(r instanceof Je&&n instanceof Je)switch(t.operator.value){case"+":return new Je(r.value.concat(n.value))}else if(n instanceof Je){const a=n.value.find(i=>i.value===r.value)!==void 0;switch(t.operator.value){case"in":return new et(a);case"not in":return new et(!a)}}if(r instanceof Pe||n instanceof Pe)switch(t.operator.value){case"+":return new Pe(r.value.toString()+n.value.toString())}if(r instanceof Pe&&n instanceof Pe)switch(t.operator.value){case"in":return new et(n.value.includes(r.value));case"not in":return new et(!n.value.includes(r.value))}if(r instanceof Pe&&n instanceof er)switch(t.operator.value){case"in":return new et(n.value.has(r.value));case"not in":return new et(!n.value.has(r.value))}throw new SyntaxError(`Unknown operator "${t.operator.value}" between ${r.type} and ${n.type}`)}evaluateFilterExpression(t,e){const r=this.evaluate(t.operand,e);if(t.filter.type==="Identifier"){const n=t.filter;if(r instanceof Je)switch(n.value){case"list":return r;case"first":return r.value[0];case"last":return r.value[r.value.length-1];case"length":return new He(r.value.length);case"reverse":return new Je(r.value.reverse());case"sort":return new Je(r.value.sort((a,i)=>{if(a.type!==i.type)throw new Error(`Cannot compare different types: ${a.type} and ${i.type}`);switch(a.type){case"NumericValue":return a.value-i.value;case"StringValue":return a.value.localeCompare(i.value);default:throw new Error(`Cannot compare type: ${a.type}`)}}));default:throw new Error(`Unknown ArrayValue filter: ${n.value}`)}else if(r instanceof Pe)switch(n.value){case"length":return new He(r.value.length);case"upper":return new Pe(r.value.toUpperCase());case"lower":return new Pe(r.value.toLowerCase());case"title":return new Pe(dg(r.value));case"capitalize":return new Pe(r.value.charAt(0).toUpperCase()+r.value.slice(1));case"trim":return new Pe(r.value.trim());default:throw new Error(`Unknown StringValue filter: ${n.value}`)}else if(r instanceof He)switch(n.value){case"abs":return new He(Math.abs(r.value));default:throw new Error(`Unknown NumericValue filter: ${n.value}`)}else if(r instanceof er)switch(n.value){case"items":return new Je(Array.from(r.value.entries()).map(([a,i])=>new Je([new Pe(a),i])));case"length":return new He(r.value.size);default:throw new Error(`Unknown ObjectValue filter: ${n.value}`)}throw new Error(`Cannot apply filter "${n.value}" to type: ${r.type}`)}else if(t.filter.type==="CallExpression"){const n=t.filter;if(n.callee.type!=="Identifier")throw new Error(`Unknown filter: ${n.callee.type}`);const a=n.callee.value;if(r instanceof Je){switch(a){case"selectattr":{if(r.value.some(p=>!(p instanceof er)))throw new Error("`selectattr` can only be applied to array of objects");if(n.args.some(p=>p.type!=="StringLiteral"))throw new Error("arguments of `selectattr` must be strings");const[i,s,o]=n.args.map(p=>this.evaluate(p,e));let u;if(s){const p=e.tests.get(s.value);if(!p)throw new Error(`Unknown test: ${s.value}`);u=p}else u=(...p)=>p[0].__bool__().value;const l=r.value.filter(p=>{const f=p.value.get(i.value);return f?u(f,o):!1});return new Je(l)}}throw new Error(`Unknown ArrayValue filter: ${a}`)}else throw new Error(`Cannot apply filter "${a}" to type: ${r.type}`)}throw new Error(`Unknown filter: ${t.filter.type}`)}evaluateTestExpression(t,e){const r=this.evaluate(t.operand,e),n=e.tests.get(t.test.value);if(!n)throw new Error(`Unknown test: ${t.test.value}`);const a=n(r);return new et(t.negate?!a:a)}evaluateUnaryExpression(t,e){const r=this.evaluate(t.argument,e);switch(t.operator.value){case"not":return new et(!r.value);default:throw new SyntaxError(`Unknown operator: ${t.operator.value}`)}}evalProgram(t,e){return this.evaluateBlock(t.body,e)}evaluateBlock(t,e){let r="";for(const n of t){const a=this.evaluate(n,e);a.type!=="NullValue"&&a.type!=="UndefinedValue"&&(r+=a.value)}return new Pe(r)}evaluateIdentifier(t,e){return e.lookupVariable(t.value)}evaluateCallExpression(t,e){const r=[],n=new Map;for(const i of t.args)if(i.type==="KeywordArgumentExpression"){const s=i;n.set(s.key.value,this.evaluate(s.value,e))}else r.push(this.evaluate(i,e));n.size>0&&r.push(new er(n));const a=this.evaluate(t.callee,e);if(a.type!=="FunctionValue")throw new Error(`Cannot call something that is not a function: got ${a.type}`);return a.value(r,e)}evaluateSliceExpression(t,e,r){if(!(t instanceof Je||t instanceof Pe))throw new Error("Slice object must be an array or string");const n=this.evaluate(e.start,r),a=this.evaluate(e.stop,r),i=this.evaluate(e.step,r);if(!(n instanceof He||n instanceof Zt))throw new Error("Slice start must be numeric or undefined");if(!(a instanceof He||a instanceof Zt))throw new Error("Slice stop must be numeric or undefined");if(!(i instanceof He||i instanceof Zt))throw new Error("Slice step must be numeric or undefined");return t instanceof Je?new Je(hp(t.value,n.value,a.value,i.value)):new Pe(hp(Array.from(t.value),n.value,a.value,i.value).join(""))}evaluateMemberExpression(t,e){const r=this.evaluate(t.object,e);let n;if(t.computed){if(t.property.type==="SliceExpression")return this.evaluateSliceExpression(r,t.property,e);n=this.evaluate(t.property,e)}else n=new Pe(t.property.value);let a;if(r instanceof er){if(!(n instanceof Pe))throw new Error(`Cannot access property with non-string: got ${n.type}`);a=r.value.get(n.value)??r.builtins.get(n.value)}else if(r instanceof Je||r instanceof Pe)if(n instanceof He)a=r.value.at(n.value),r instanceof Pe&&(a=new Pe(r.value.at(n.value)));else if(n instanceof Pe)a=r.builtins.get(n.value);else throw new Error(`Cannot access property with non-string/non-number: got ${n.type}`);else{if(!(n instanceof Pe))throw new Error(`Cannot access property with non-string: got ${n.type}`);a=r.builtins.get(n.value)}return a instanceof xr?a:new Zt}evaluateSet(t,e){const r=this.evaluate(t.value,e);if(t.assignee.type==="Identifier"){const n=t.assignee.value;e.setVariable(n,r)}else if(t.assignee.type==="MemberExpression"){const n=t.assignee,a=this.evaluate(n.object,e);if(!(a instanceof er))throw new Error("Cannot assign to member of non-object");if(n.property.type!=="Identifier")throw new Error("Cannot assign to member with non-identifier property");a.value.set(n.property.value,r)}else throw new Error(`Invalid LHS inside assignment expression: ${JSON.stringify(t.assignee)}`);return new ha}evaluateIf(t,e){const r=this.evaluate(t.test,e);return this.evaluateBlock(r.__bool__().value?t.body:t.alternate,e)}evaluateFor(t,e){const r=new To(e),n=this.evaluate(t.iterable,r);if(!(n instanceof Je))throw new Error(`Expected iterable type in for loop: got ${n.type}`);let a="";for(let i=0;i0?n.value[i-1]:new Zt],["nextitem",ip.value.length?"few":"many"} items to unpack`);for(let f=0;fthis.evaluate(r,e)));case"TupleLiteral":return new Bw(t.value.map(r=>this.evaluate(r,e)));case"ObjectLiteral":{const r=new Map;for(const[n,a]of t.value){const i=this.evaluate(n,e);if(!(i instanceof Pe))throw new Error(`Object keys must be strings: got ${i.type}`);r.set(i.value,this.evaluate(a,e))}return new er(r)}case"Identifier":return this.evaluateIdentifier(t,e);case"CallExpression":return this.evaluateCallExpression(t,e);case"MemberExpression":return this.evaluateMemberExpression(t,e);case"UnaryExpression":return this.evaluateUnaryExpression(t,e);case"BinaryExpression":return this.evaluateBinaryExpression(t,e);case"FilterExpression":return this.evaluateFilterExpression(t,e);case"TestExpression":return this.evaluateTestExpression(t,e);default:throw new SyntaxError(`Unknown node type: ${t.type}`)}}};function Mi(t){switch(typeof t){case"number":return new He(t);case"string":return new Pe(t);case"boolean":return new et(t);case"object":return t===null?new ha:Array.isArray(t)?new Je(t.map(Mi)):new er(new Map(Object.entries(t).map(([e,r])=>[e,Mi(r)])));case"function":return new br((e,r)=>{const n=t(...e.map(a=>a.value))??null;return Mi(n)});default:throw new Error(`Cannot convert to runtime value: ${t}`)}}var Nw=class{parsed;constructor(t){const e=bw(t,{lstrip_blocks:!0,trim_blocks:!0});this.parsed=Pw(e)}render(t){const e=new To;e.set("false",!1),e.set("true",!0),e.set("raise_exception",a=>{throw new Error(a)}),e.set("range",Rw);for(const[a,i]of Object.entries(t))e.set(a,i);return new Dw(e).run(this.parsed).value}};const cg=[["en","english"],["zh","chinese"],["de","german"],["es","spanish"],["ru","russian"],["ko","korean"],["fr","french"],["ja","japanese"],["pt","portuguese"],["tr","turkish"],["pl","polish"],["ca","catalan"],["nl","dutch"],["ar","arabic"],["sv","swedish"],["it","italian"],["id","indonesian"],["hi","hindi"],["fi","finnish"],["vi","vietnamese"],["he","hebrew"],["uk","ukrainian"],["el","greek"],["ms","malay"],["cs","czech"],["ro","romanian"],["da","danish"],["hu","hungarian"],["ta","tamil"],["no","norwegian"],["th","thai"],["ur","urdu"],["hr","croatian"],["bg","bulgarian"],["lt","lithuanian"],["la","latin"],["mi","maori"],["ml","malayalam"],["cy","welsh"],["sk","slovak"],["te","telugu"],["fa","persian"],["lv","latvian"],["bn","bengali"],["sr","serbian"],["az","azerbaijani"],["sl","slovenian"],["kn","kannada"],["et","estonian"],["mk","macedonian"],["br","breton"],["eu","basque"],["is","icelandic"],["hy","armenian"],["ne","nepali"],["mn","mongolian"],["bs","bosnian"],["kk","kazakh"],["sq","albanian"],["sw","swahili"],["gl","galician"],["mr","marathi"],["pa","punjabi"],["si","sinhala"],["km","khmer"],["sn","shona"],["yo","yoruba"],["so","somali"],["af","afrikaans"],["oc","occitan"],["ka","georgian"],["be","belarusian"],["tg","tajik"],["sd","sindhi"],["gu","gujarati"],["am","amharic"],["yi","yiddish"],["lo","lao"],["uz","uzbek"],["fo","faroese"],["ht","haitian creole"],["ps","pashto"],["tk","turkmen"],["nn","nynorsk"],["mt","maltese"],["sa","sanskrit"],["lb","luxembourgish"],["my","myanmar"],["bo","tibetan"],["tl","tagalog"],["mg","malagasy"],["as","assamese"],["tt","tatar"],["haw","hawaiian"],["ln","lingala"],["ha","hausa"],["ba","bashkir"],["jw","javanese"],["su","sundanese"]],Oi=new Map(cg),Fw=new Map([...cg.map(([t,e])=>[e,t]),["burmese","my"],["valencian","ca"],["flemish","nl"],["haitian","ht"],["letzeburgesch","lb"],["pushto","ps"],["panjabi","pa"],["moldavian","ro"],["moldovan","ro"],["sinhalese","si"],["castilian","es"]]);function pg(t){t=t.toLowerCase();let e=Fw.get(t);if(e===void 0)if(Oi.has(t))e=t;else{const n=t.length===2?Oi.keys():Oi.values();throw new Error(`Language "${t}" is not supported. Must be one of: ${JSON.stringify(n)}`)}return e}const io="https://github.com/xenova/transformers.js/issues/new/choose";async function hg(t,e){const r=await Promise.all([Mr(t,"tokenizer.json",!0,e),Mr(t,"tokenizer_config.json",!0,e)]);return e.legacy!==null&&(r[1].legacy=e.legacy),r}function Lw(t,e){const r=[];let n=0;for(const a of t.matchAll(e)){const i=a[0];n0&&r.push(i),n=a.index+i.length}return n=19968&&t<=40959||t>=13312&&t<=19903||t>=131072&&t<=173791||t>=173824&&t<=177983||t>=177984&&t<=178207||t>=178208&&t<=183983||t>=63744&&t<=64255||t>=194560&&t<=195103}function Vw(t,e,r){const n=[];let a=0;for(;athis.tokens_to_ids.get(r)??this.unk_token_id)}convert_ids_to_tokens(e){return e.map(r=>this.vocab[r]??this.unk_token)}}class qw extends Ea{constructor(e){super(e),this.tokens_to_ids=au(e.vocab),this.unk_token_id=this.tokens_to_ids.get(e.unk_token),this.unk_token=e.unk_token,this.max_input_chars_per_word=e.max_input_chars_per_word??100,this.vocab=new Array(this.tokens_to_ids.size);for(const[r,n]of this.tokens_to_ids)this.vocab[n]=r}encode(e){const r=[];for(const n of e){const a=[...n];if(a.length>this.max_input_chars_per_word){r.push(this.unk_token);continue}let i=!1,s=0;const o=[];for(;s0&&(p=this.config.continuing_subword_prefix+p),this.tokens_to_ids.has(p)){l=p;break}--u}if(l===null){i=!0;break}o.push(l),s=u}i?r.push(this.unk_token):r.push(...o)}return r}}class Kw extends Ea{constructor(e,r){super(e);const n=e.vocab.length;this.vocab=new Array(n),this.scores=new Array(n);for(let a=0;a[a,i])),this.bosToken=" ",this.bosTokenId=this.tokens_to_ids.get(this.bosToken),this.eosToken=r.eos_token,this.eosTokenId=this.tokens_to_ids.get(this.eosToken),this.unkToken=this.vocab[this.unk_token_id],this.minScore=Op(this.scores)[0],this.unkScore=this.minScore-10,this.scores[this.unk_token_id]=this.unkScore,this.trie=new mw,this.trie.extend(this.vocab),this.fuse_unk=!0}populateNodes(e){const r=e.sentence,n=r.length;let a=0;for(;a{const t=[...Array.from({length:94},(a,i)=>i+33),...Array.from({length:12},(a,i)=>i+161),...Array.from({length:82},(a,i)=>i+174)],e=t.slice();let r=0;for(let a=0;a<256;++a)t.includes(a)||(t.push(a),e.push(256+r),r+=1);const n=e.map(a=>String.fromCharCode(a));return Object.fromEntries(t.map((a,i)=>[a,n[i]]))})(),Yw=d_(gg);class Xw extends Ea{constructor(e){super(e),this.BPE_SPLIT_TOKEN=" ",this.tokens_to_ids=au(e.vocab),this.unk_token_id=this.tokens_to_ids.get(e.unk_token),this.unk_token=e.unk_token,this.vocab=new Array(this.tokens_to_ids.size);for(const[r,n]of this.tokens_to_ids)this.vocab[n]=r;this.bpe_ranks=new Map(e.merges.map((r,n)=>[r,n])),this.merges=e.merges.map(r=>r.split(this.BPE_SPLIT_TOKEN)),this.end_of_word_suffix=e.end_of_word_suffix,this.continuing_subword_suffix=e.continuing_subword_suffix??null,this.byte_fallback=this.config.byte_fallback??!1,this.byte_fallback&&(this.text_encoder=new TextEncoder),this.ignore_merges=this.config.ignore_merges??!1,this.cache=new Map}bpe(e){if(e.length===0)return[];const r=this.cache.get(e);if(r!==void 0)return r;const n=Array.from(e);this.end_of_word_suffix&&(n[n.length-1]+=this.end_of_word_suffix);let a=[];if(n.length>1){const i=new fw((u,l)=>u.score`<0x${s.toString(16).toUpperCase().padStart(2,"0")}>`)):r.push(this.unk_token)}return r}}class Qw extends Ea{constructor(e,r){super(e),this.tokens_to_ids=au(r.target_lang?e.vocab[r.target_lang]:e.vocab),this.bos_token=r.bos_token,this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=r.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.pad_token=r.pad_token,this.pad_token_id=this.tokens_to_ids.get(this.pad_token),this.unk_token=r.unk_token,this.unk_token_id=this.tokens_to_ids.get(this.unk_token),this.vocab=new Array(this.tokens_to_ids.size);for(const[n,a]of this.tokens_to_ids)this.vocab[a]=n}encode(e){return e}}class Pt extends vt{constructor(e){super(),this.config=e}static fromConfig(e){if(e===null)return null;switch(e.type){case"BertNormalizer":return new ob(e);case"Precompiled":return new Eb(e);case"Sequence":return new sb(e);case"Replace":return new Jw(e);case"NFC":return new Zw(e);case"NFKC":return new eb(e);case"NFKD":return new tb(e);case"Strip":return new rb(e);case"StripAccents":return new nb(e);case"Lowercase":return new ab(e);case"Prepend":return new ib(e);default:throw new Error(`Unknown Normalizer type: ${e.type}`)}}normalize(e){throw Error("normalize should be implemented in subclass.")}_call(e){return this.normalize(e)}}class Jw extends Pt{normalize(e){const r=Qi(this.config.pattern);return r===null?e:e.replaceAll(r,this.config.content)}}class Zw extends Pt{normalize(e){return e=e.normalize("NFC"),e}}class eb extends Pt{normalize(e){return e=e.normalize("NFKC"),e}}class tb extends Pt{normalize(e){return e=e.normalize("NFKD"),e}}class rb extends Pt{normalize(e){return this.config.strip_left&&this.config.strip_right?e=e.trim():(this.config.strip_left&&(e=e.trimStart()),this.config.strip_right&&(e=e.trimEnd())),e}}class nb extends Pt{normalize(e){return e=mg(e),e}}class ab extends Pt{normalize(e){return e=e.toLowerCase(),e}}class ib extends Pt{normalize(e){return e=this.config.prepend+e,e}}class sb extends Pt{constructor(e){super(e),this.normalizers=e.normalizers.map(r=>Pt.fromConfig(r))}normalize(e){return this.normalizers.reduce((r,n)=>n.normalize(r),e)}}class ob extends Pt{_tokenize_chinese_chars(e){const r=[];for(let n=0;nthis.pre_tokenize_text(n,r)):this.pre_tokenize_text(e,r)).flat()}_call(e,r){return this.pre_tokenize(e,r)}}class ub extends Ut{constructor(e){super(),this.pattern=new RegExp(`[^\\s${ba}]+|[${ba}]`,"gu")}pre_tokenize_text(e,r){return e.trim().match(this.pattern)||[]}}class lb extends Ut{constructor(e){super(),this.config=e,this.add_prefix_space=this.config.add_prefix_space,this.trim_offsets=this.config.trim_offsets,this.use_regex=this.config.use_regex??!0,this.pattern=/'s|'t|'re|'ve|'m|'ll|'d| ?\p{L}+| ?\p{N}+| ?[^\s\p{L}\p{N}]+|\s+(?!\S)|\s+/gu,this.byte_encoder=gg,this.text_encoder=new TextEncoder}pre_tokenize_text(e,r){return this.add_prefix_space&&!e.startsWith(" ")&&(e=" "+e),(this.use_regex?e.match(this.pattern)||[]:[e]).map(a=>Array.from(this.text_encoder.encode(a),i=>this.byte_encoder[i]).join(""))}}class db extends Ut{constructor(e){super(),this.config=e,this.pattern=Qi(this.config.pattern,this.config.invert)}pre_tokenize_text(e,r){return this.pattern===null?[]:this.config.invert?e.match(this.pattern)||[]:Lw(e,this.pattern)}}class cb extends Ut{constructor(e){super(),this.config=e,this.pattern=new RegExp(`[^${ba}]+|[${ba}]+`,"gu")}pre_tokenize_text(e,r){return e.match(this.pattern)||[]}}class pb extends Ut{constructor(e){super(),this.config=e;const r=`[^\\d]+|\\d${this.config.individual_digits?"":"+"}`;this.pattern=new RegExp(r,"gu")}pre_tokenize_text(e,r){return e.match(this.pattern)||[]}}class Tn extends vt{constructor(e){super(),this.config=e}static fromConfig(e){if(e===null)return null;switch(e.type){case"TemplateProcessing":return new hb(e);case"ByteLevel":return new wg(e);case"RobertaProcessing":return new yg(e);case"BertProcessing":return new _g(e);case"Sequence":return new fb(e);default:throw new Error(`Unknown PostProcessor type: ${e.type}`)}}post_process(e,...r){throw Error("post_process should be implemented in subclass.")}_call(e,...r){return this.post_process(e,...r)}}class _g extends Tn{constructor(e){super(e),this.cls=e.cls[0],this.sep=e.sep[0]}post_process(e,r=null,{add_special_tokens:n=!0}={}){n&&(e=ct([this.cls],e,[this.sep]));let a=new Array(e.length).fill(0);if(r!==null){const i=n&&this instanceof yg?[this.sep]:[],s=n?[this.sep]:[];e=ct(e,i,r,s),a=ct(a,new Array(r.length+i.length+s.length).fill(1))}return{tokens:e,token_type_ids:a}}}class yg extends _g{}class hb extends Tn{constructor(e){super(e),this.single=e.single,this.pair=e.pair}post_process(e,r=null,{add_special_tokens:n=!0}={}){const a=r===null?this.single:this.pair;let i=[],s=[];for(const o of a)"SpecialToken"in o?n&&(i.push(o.SpecialToken.id),s.push(o.SpecialToken.type_id)):"Sequence"in o&&(o.Sequence.id==="A"?(i=ct(i,e),s=ct(s,new Array(e.length).fill(o.Sequence.type_id))):o.Sequence.id==="B"&&(i=ct(i,r),s=ct(s,new Array(r.length).fill(o.Sequence.type_id))));return{tokens:i,token_type_ids:s}}}class wg extends Tn{post_process(e,r=null){return r&&(e=ct(e,r)),{tokens:e}}}class fb extends Tn{constructor(e){super(e),this.processors=e.processors.map(r=>Tn.fromConfig(r))}post_process(e,r=null,n={}){let a;for(const i of this.processors)if(i instanceof wg)e=i.post_process(e).tokens,r&&(r=i.post_process(r).tokens);else{const s=i.post_process(e,r,n);e=s.tokens,a=s.token_type_ids}return{tokens:e,token_type_ids:a}}}class Rt extends vt{constructor(e){super(),this.config=e,this.added_tokens=[],this.end_of_word_suffix=null,this.trim_offsets=e.trim_offsets}static fromConfig(e){if(e===null)return null;switch(e.type){case"WordPiece":return new wb(e);case"Metaspace":return new kb(e);case"ByteLevel":return new bb(e);case"Replace":return new mb(e);case"ByteFallback":return new gb(e);case"Fuse":return new _b(e);case"Strip":return new yb(e);case"Sequence":return new $b(e);case"CTC":return new vb(e);case"BPEDecoder":return new xb(e);default:throw new Error(`Unknown Decoder type: ${e.type}`)}}_call(e){return this.decode(e)}decode(e){return this.decode_chain(e).join("")}decode_chain(e){throw Error("`decode_chain` should be implemented in subclass.")}}class mb extends Rt{decode_chain(e){const r=Qi(this.config.pattern);return r===null?e:e.map(n=>n.replaceAll(r,this.config.content))}}class gb extends Rt{constructor(e){super(e),this.text_decoder=new TextDecoder}decode_chain(e){const r=[];let n=[];for(const a of e){let i=null;if(a.length===6&&a.startsWith("<0x")&&a.endsWith(">")){const s=parseInt(a.slice(3,5),16);isNaN(s)||(i=s)}if(i!==null)n.push(i);else{if(n.length>0){const s=this.text_decoder.decode(Uint8Array.from(n));r.push(s),n=[]}r.push(a)}}if(n.length>0){const a=this.text_decoder.decode(Uint8Array.from(n));r.push(a),n=[]}return r}}class _b extends Rt{decode_chain(e){return[e.join("")]}}class yb extends Rt{constructor(e){super(e),this.content=this.config.content,this.start=this.config.start,this.stop=this.config.stop}decode_chain(e){return e.map(r=>{let n=0;for(let i=0;i(n!==0&&(r.startsWith(this.config.prefix)?r=r.replace(this.config.prefix,""):r=" "+r),this.cleanup&&(r=iu(r)),r))}}class bb extends Rt{constructor(e){super(e),this.byte_decoder=Yw,this.text_decoder=new TextDecoder("utf-8",{fatal:!1,ignoreBOM:!0}),this.end_of_word_suffix=null}convert_tokens_to_string(e){const r=e.join(""),n=new Uint8Array([...r].map(i=>this.byte_decoder[i]));return this.text_decoder.decode(n)}decode_chain(e){const r=[];let n=[];for(const a of e)this.added_tokens.find(i=>i.content===a)!==void 0?(n.length>0&&(r.push(this.convert_tokens_to_string(n)),n=[]),r.push(a)):n.push(a);return n.length>0&&r.push(this.convert_tokens_to_string(n)),r}}class vb extends Rt{constructor(e){super(e),this.pad_token=this.config.pad_token,this.word_delimiter_token=this.config.word_delimiter_token,this.cleanup=this.config.cleanup}convert_tokens_to_string(e){if(e.length===0)return"";const r=[e[0]];for(let i=1;ii!==this.pad_token).join("");return this.cleanup&&(a=iu(a).replaceAll(this.word_delimiter_token," ").trim()),a}decode_chain(e){return[this.convert_tokens_to_string(e)]}}class $b extends Rt{constructor(e){super(e),this.decoders=e.decoders.map(r=>Rt.fromConfig(r))}decode_chain(e){return this.decoders.reduce((r,n)=>n.decode_chain(r),e)}}class xb extends Rt{constructor(e){super(e),this.suffix=this.config.suffix}decode_chain(e){return e.map((r,n)=>r.replaceAll(this.suffix,n===e.length-1?"":" "))}}class Sb extends Rt{decode_chain(e){let r="";for(let n=1;nn.normalize("NFKC")).join("~"):e=e.normalize("NFKC"),e}}class Cb extends Ut{constructor(e){super(),this.tokenizers=e.pretokenizers.map(r=>Ut.fromConfig(r))}pre_tokenize_text(e,r){return this.tokenizers.reduce((n,a)=>a.pre_tokenize(n,r),[e])}}class Tb extends Ut{constructor(e){super()}pre_tokenize_text(e,r){return e.match(/\w+|[^\w\s]+/g)||[]}}class Ib extends Ut{constructor(e){super()}pre_tokenize_text(e,r){return Gw(e)}}class Ab extends Ut{constructor(e){super(),this.config=e,this.pattern=Qi(this.config.pattern),this.content=this.config.content}pre_tokenize_text(e,r){return this.pattern===null?[e]:[e.replaceAll(this.pattern,this.config.content)]}}const Mb=["bos_token","eos_token","unk_token","sep_token","pad_token","cls_token","mask_token"];function Ob(t,e,r,n){for(const a of Object.keys(t)){const i=e-t[a].length,s=r(a),o=new Array(i).fill(s);t[a]=n==="right"?ct(t[a],o):ct(o,t[a])}}function zb(t,e){for(const r of Object.keys(t))t[r].length=e}class Ee extends vt{return_token_type_ids=!1;_default_chat_template=`{% for message in messages %}{{'<|im_start|>' + message['role'] + ' -' + message['content'] + '<|im_end|>' + ' -'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant -' }}{% endif %}`;padding_side="right";constructor(e,r){super(),this._tokenizer_config=r,this.normalizer=Pt.fromConfig(e.normalizer),this.pre_tokenizer=Ut.fromConfig(e.pre_tokenizer),this.model=Ea.fromConfig(e.model,r),this.post_processor=Tn.fromConfig(e.post_processor),this.decoder=Rt.fromConfig(e.decoder),this.special_tokens=[],this.all_special_ids=[],this.added_tokens=[];for(const n of e.added_tokens){const a=new jw(n);this.added_tokens.push(a),this.model.tokens_to_ids.set(a.content,a.id),this.model.vocab[a.id]=a.content,a.special&&(this.special_tokens.push(a.content),this.all_special_ids.push(a.id))}if(this.additional_special_tokens=r.additional_special_tokens??[],this.special_tokens.push(...this.additional_special_tokens),this.special_tokens=[...new Set(this.special_tokens)],this.decoder&&(this.decoder.added_tokens=this.added_tokens,this.decoder.end_of_word_suffix=this.model.end_of_word_suffix),this.added_tokens_regex=this.added_tokens.length>0?new RegExp(this.added_tokens.map(n=>`${n.lstrip?"\\s*":""}(${Ap(n.content)})${n.rstrip?"\\s*":""}`).join("|")):null,this.mask_token=this.getToken("mask_token"),this.mask_token_id=this.model.tokens_to_ids.get(this.mask_token),this.pad_token=this.getToken("pad_token","eos_token"),this.pad_token_id=this.model.tokens_to_ids.get(this.pad_token),this.sep_token=this.getToken("sep_token"),this.sep_token_id=this.model.tokens_to_ids.get(this.sep_token),this.unk_token=this.getToken("unk_token"),this.unk_token_id=this.model.tokens_to_ids.get(this.unk_token),this.model_max_length=r.model_max_length,this.remove_space=r.remove_space,this.clean_up_tokenization_spaces=r.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=r.do_lowercase_and_remove_accent??!1,r.padding_side&&(this.padding_side=r.padding_side),this.legacy=!1,this.chat_template=r.chat_template??null,Array.isArray(this.chat_template)){const n=Object.create(null);for(const{name:a,template:i}of this.chat_template){if(typeof a!="string"||typeof i!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');n[a]=i}this.chat_template=n}this._compiled_template_cache=new Map}getToken(...e){for(const r of e){const n=this._tokenizer_config[r];if(n)if(typeof n=="object"){if(n.__type==="AddedToken")return n.content;throw Error(`Unknown token: ${n}`)}else return n}return null}static async from_pretrained(e,{progress_callback:r=null,config:n=null,cache_dir:a=null,local_files_only:i=!1,revision:s="main",legacy:o=null}={}){const u=await hg(e,{progress_callback:r,config:n,cache_dir:a,local_files_only:i,revision:s,legacy:o});return new this(...u)}_call(e,{text_pair:r=null,add_special_tokens:n=!0,padding:a=!1,truncation:i=null,max_length:s=null,return_tensor:o=!0,return_token_type_ids:u=null}={}){const l=Array.isArray(e);let p;if(l){if(e.length===0)throw Error("text array must be non-empty");if(r!==null){if(Array.isArray(r)){if(e.length!==r.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");p=e.map((m,c)=>this._encode_plus(m,{text_pair:r[c],add_special_tokens:n,return_token_type_ids:u}))}else p=e.map(m=>this._encode_plus(m,{add_special_tokens:n,return_token_type_ids:u}))}else{if(e==null)throw Error("text may not be null or undefined");if(Array.isArray(r))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");p=[this._encode_plus(e,{text_pair:r,add_special_tokens:n,return_token_type_ids:u})]}if(s===null?a==="max_length"?s=this.model_max_length:s=$r(p.map(m=>m.input_ids.length))[0]:i||console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation=true` to explicitly truncate examples to max length."),s=Math.min(s,this.model_max_length),a||i)for(let m=0;ms?i&&zb(p[m],s):a&&Ob(p[m],s,c=>c==="input_ids"?this.pad_token_id:0,this.padding_side));const f={};if(o){if(!(a&&i)&&p.some(c=>{for(const y of Object.keys(c))if(c[y].length!==p[0][y]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");const m=[p.length,p[0].input_ids.length];for(const c of Object.keys(p[0]))f[c]=new pe("int64",BigInt64Array.from(p.flatMap(y=>y[c]).map(BigInt)),m)}else{for(const m of Object.keys(p[0]))f[m]=p.map(c=>c[m]);if(!l)for(const m of Object.keys(f))f[m]=f[m][0]}return f}_encode_text(e){return e===null?null:(this.added_tokens_regex?e.split(this.added_tokens_regex).filter(a=>a):[e]).map((a,i)=>{if(this.added_tokens.find(o=>o.content===a)!==void 0)return a;{if(this.remove_space===!0&&(a=a.trim().split(/\s+/).join(" ")),this.do_lowercase_and_remove_accent&&(a=Uw(a)),this.normalizer!==null&&(a=this.normalizer(a)),a.length===0)return[];const o=this.pre_tokenizer!==null?this.pre_tokenizer(a,{section_index:i}):[a];return this.model(o)}}).flat()}_encode_plus(e,{text_pair:r=null,add_special_tokens:n=!0,return_token_type_ids:a=null}={}){const{tokens:i,token_type_ids:s}=this._tokenize_helper(e,{pair:r,add_special_tokens:n}),o=this.model.convert_tokens_to_ids(i),u={input_ids:o,attention_mask:new Array(o.length).fill(1)};return(a??this.return_token_type_ids)&&s&&(u.token_type_ids=s),u}_tokenize_helper(e,{pair:r=null,add_special_tokens:n=!1}={}){const a=this._encode_text(e),i=this._encode_text(r);return this.post_processor?this.post_processor(a,i,{add_special_tokens:n}):{tokens:ct(a??[],i??[])}}tokenize(e,{pair:r=null,add_special_tokens:n=!1}={}){return this._tokenize_helper(e,{pair:r,add_special_tokens:n}).tokens}encode(e,{text_pair:r=null,add_special_tokens:n=!0,return_token_type_ids:a=null}={}){return this._encode_plus(e,{text_pair:r,add_special_tokens:n,return_token_type_ids:a}).input_ids}batch_decode(e,r={}){return e instanceof pe&&(e=e.tolist()),e.map(n=>this.decode(n,r))}decode(e,r={}){if(e instanceof pe&&(e=fg(e)),!Array.isArray(e)||e.length===0||!c_(e[0]))throw Error("token_ids must be a non-empty array of integers.");return this.decode_single(e,r)}decode_single(e,{skip_special_tokens:r=!1,clean_up_tokenization_spaces:n=null}){let a=this.model.convert_ids_to_tokens(e);r&&(a=a.filter(s=>!this.special_tokens.includes(s)));let i=this.decoder?this.decoder(a):a.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(i=i.replaceAll(this.decoder.end_of_word_suffix," "),r&&(i=i.trim())),(n??this.clean_up_tokenization_spaces)&&(i=iu(i)),i}get default_chat_template(){return this._warned_about_chat_template||(console.warn("No chat template is defined for this tokenizer - using a default chat template that implements the ChatML format. If the default is not appropriate for your model, please set `tokenizer.chat_template` to an appropriate template. See https://huggingface.co/docs/transformers/main/chat_templating for more information."),this._warned_about_chat_template=!0),this._default_chat_template}apply_chat_template(e,{chat_template:r=null,add_generation_prompt:n=!1,tokenize:a=!0,padding:i=!1,truncation:s=!1,max_length:o=null,return_tensor:u=!0,return_dict:l=!1,tokenizer_kwargs:p={},...f}={}){if(this.chat_template&&typeof this.chat_template=="object"||this.chat_template===null&&this.default_chat_template&&typeof this.default_chat_template=="object"){const w=this.chat_template??this.default_chat_template;if(r!==null&&Object.hasOwn(w,r))r=w[r];else if(r===null&&"default"in w)r=w.default;else if(r===null)throw Error(`This model has multiple chat templates with no default specified! Please either pass a chat template or the name of the template you wish to use to the 'chat_template' argument. Available template names are ${Object.keys(w).sort()}.`)}else r??=this.chat_template??this.default_chat_template;if(typeof r!="string")throw Error(`chat_template must be a string, but got ${typeof r}`);let m=this._compiled_template_cache.get(r);m===void 0&&(m=new Nw(r),this._compiled_template_cache.set(r,m));const c=Object.create(null);for(const w of Mb){const v=this.getToken(w);v&&(c[w]=v)}const y=m.render({messages:e,add_generation_prompt:n,...c,...f});if(a){const w=this._call(y,{add_special_tokens:!1,padding:i,truncation:s,max_length:o,return_tensor:u,...p});return l?w:w.input_ids}return y}}class Pb extends Ee{return_token_type_ids=!0}class Rb extends Ee{return_token_type_ids=!0}class Bb extends Ee{return_token_type_ids=!0}class Db extends Ee{return_token_type_ids=!0}class Nb extends Ee{return_token_type_ids=!0}class Fb extends Ee{return_token_type_ids=!0}class Lb extends Ee{return_token_type_ids=!0}class Ub extends Ee{return_token_type_ids=!0}class Wb extends Ee{return_token_type_ids=!0}class Vb extends Ee{}class Gb extends Ee{}class Hb extends Ee{return_token_type_ids=!0;constructor(e,r){super(e,r),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}}class jb extends Ee{return_token_type_ids=!0}class qb extends Ee{}class vg extends Ee{_default_chat_template='{% for message in messages %}" "{{ message.content }}{{ eos_token }}" "{% endfor %}'}class Kb extends Ee{}class $g extends Ee{constructor(e,r){super(e,r),this.languageRegex=/^[a-z]{2}_[A-Z]{2}$/,this.language_codes=this.special_tokens.filter(n=>this.languageRegex.test(n)),this.lang_to_token=n=>n}_build_translation_inputs(e,r,n){return su(this,e,r,n)}}class Yb extends $g{}class Xb extends Ee{}class Qb extends vg{constructor(e,r){const n=".,!?…。,、।۔،",a=e.pre_tokenizer?.pretokenizers[0]?.pattern;a&&a.Regex===` ?[^(\\s|[${n}])]+`&&(a.Regex=` ?[^\\s${n}]+`),super(e,r)}}const vi="▁";class xg extends Ee{_default_chat_template=`{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% elif USE_DEFAULT_PROMPT == true and not '<>' in messages[0]['content'] %}{% set loop_messages = messages %}{% set system_message = 'DEFAULT_SYSTEM_MESSAGE' %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<> -' + system_message + ' -<> - -' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}{% elif message['role'] == 'system' %}{{ '<> -' + content.strip() + ' -<> - -' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content.strip() + ' ' + eos_token }}{% endif %}{% endfor %}`;DEFAULT_SYSTEM_PROMPT=`You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature. - -If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.`;padding_side="left";constructor(e,r){super(e,r),this.use_default_system_prompt=r.use_default_system_prompt??!1,this.legacy=r.legacy??!0,this.legacy||(this.normalizer=null,this.pre_tokenizer=new bg({replacement:vi,add_prefix_space:!0,prepend_scheme:"first"}))}_encode_text(e){if(e===null)return null;if(this.legacy||e.length===0)return super._encode_text(e);let r=super._encode_text(vi+e.replaceAll(vi," "));return r.length>1&&r[0]===vi&&this.special_tokens.includes(r[1])&&(r=r.slice(1)),r}get default_chat_template(){return super.default_chat_template.replaceAll("USE_DEFAULT_PROMPT",this.use_default_system_prompt?"true":"false").replaceAll("DEFAULT_SYSTEM_MESSAGE",this.DEFAULT_SYSTEM_PROMPT.replaceAll(` -`,"\\n").replaceAll("'","\\'"))}}class Jb extends xg{}class Zb extends Ee{}class ev extends Ee{}class tv extends Ee{}class rv extends Ee{}class nv extends Ee{}class av extends Ee{}class iv extends Ee{_default_chat_template=`{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '' + role + ' -' + message['content'] | trim + ' -' }}{% endfor %}{% if add_generation_prompt %}{{'model -'}}{% endif %}`}class sv extends Ee{}function su(t,e,r,n){if(!("language_codes"in t)||!Array.isArray(t.language_codes))throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");if(!("languageRegex"in t)||!(t.languageRegex instanceof RegExp))throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");if(!("lang_to_token"in t)||typeof t.lang_to_token!="function")throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");const a=n.src_lang,i=n.tgt_lang;if(!t.language_codes.includes(i))throw new Error(`Target language code "${i}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);if(a!==void 0){if(!t.language_codes.includes(a))throw new Error(`Source language code "${a}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);for(const s of t.post_processor.config.single)if("SpecialToken"in s&&t.languageRegex.test(s.SpecialToken.id)){s.SpecialToken.id=t.lang_to_token(a);break}}return n.forced_bos_token_id=t.model.convert_tokens_to_ids([t.lang_to_token(i)])[0],t._call(e,r)}class ov extends Ee{constructor(e,r){super(e,r),this.languageRegex=/^[a-z]{3}_[A-Z][a-z]{3}$/,this.language_codes=this.special_tokens.filter(n=>this.languageRegex.test(n)),this.lang_to_token=n=>n}_build_translation_inputs(e,r,n){return su(this,e,r,n)}}class uv extends Ee{constructor(e,r){super(e,r),this.languageRegex=/^__[a-z]{2,3}__$/,this.language_codes=this.special_tokens.filter(n=>this.languageRegex.test(n)).map(n=>n.slice(2,-2)),this.lang_to_token=n=>`__${n}__`}_build_translation_inputs(e,r,n){return su(this,e,r,n)}}class lv extends Ee{_default_chat_template='{% for message in messages %}" "{{ message.content }}{{ eos_token }}" "{% endfor %}';get timestamp_begin(){return this.model.convert_tokens_to_ids(["<|notimestamps|>"])[0]+1}_decode_asr(e,{return_timestamps:r=!1,return_language:n=!1,time_precision:a=null,force_full_sequences:i=!0}={}){if(a===null)throw Error("Must specify time_precision");let s=null;const o=r==="word";function u(){return{language:s,timestamp:[null,null],text:""}}const l=[];let p=u(),f=0;const m=this.timestamp_begin;let c=[],y=[],w=!1,v=null;const k=new Set(this.all_special_ids);for(const T of e){const A=T.tokens,B=o?T.token_timestamps:null;let R=null,D=m;if("stride"in T){const[ie,te,oe]=T.stride;if(f-=te,v=ie-oe,te&&(D=te/a+m),oe)for(let re=A.length-1;re>=0;--re){const M=Number(A[re]);if(M>=m){if(R!==null&&(M-m)*a=m){const oe=(te-m)*a+f,re=Ss(oe,2);if(R!==null&&te>=R)w=!0;else if(w||c.length>0&&te0?(c.push(K),o&&y.push(j)):c.every(ie=>ie.length===0)&&(p=u(),c=[],K=[],y=[],j=[])}if(c.length>0){if(i&&r)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");const[T,A]=this.findLongestCommonSequence(c,y),B=this.decode(T);p.text=B,o&&(p.words=this.collateWordTimestamps(T,A,s)),l.push(p)}let $=Object.create(null);const C=l.map(T=>T.text).join("");if(r||n){for(let T=0;T0;let o=s?[]:null,u=s?r[0]:null;for(let l=1;lre===ie[M]).length,oe=te/T+A;te>1&&oe>f&&(f=oe,m=[B,R,K,j])}const[y,w,v,k]=m,$=Math.floor((w+y)/2),C=Math.floor((k+v)/2);i.push(...n.slice(0,$)),n=p.slice(C),a=n.length,s&&(o.push(...u.slice(0,$)),u=r[l].slice(C))}return i.push(...n),s?(o.push(...u),[i,o]):[i,[]]}collateWordTimestamps(e,r,n){const[a,i,s]=this.combineTokensIntoWords(e,n),o=[];for(let u=0;u=a){const o=((s-a)*n).toFixed(2);i.push(`<|${o}|>`),i.push([])}else i[i.length-1].push(s);return i=i.map(s=>typeof s=="string"?s:super.decode(s,r)),i.join("")}splitTokensOnUnicode(e){const r=this.decode(e,{decode_with_timestamps:!0}),n="�",a=[],i=[],s=[];let o=[],u=[],l=0;for(let p=0;p=this.model.tokens_to_ids.get("<|endoftext|>"),y=p.startsWith(" "),w=p.trim(),v=u.test(w);if(c||y||v||i.length===0)i.push(p),s.push(f),o.push(m);else{const k=i.length-1;i[k]+=p,s[k].push(...f),o[k].push(...m)}}return[i,s,o]}mergePunctuations(e,r,n,a,i){const s=structuredClone(e),o=structuredClone(r),u=structuredClone(n);let l=s.length-2,p=s.length-1;for(;l>=0;)s[l].startsWith(" ")&&a.includes(s[l].trim())?(s[p]=s[l]+s[p],o[p]=ct(o[l],o[p]),u[p]=ct(u[l],u[p]),s[l]="",o[l]=[],u[l]=[]):p=l,--l;for(l=0,p=1;pf),o.filter(f=>f.length>0),u.filter(f=>f.length>0)]}get_decoder_prompt_ids({language:e=null,task:r=null,no_timestamps:n=!0}={}){const a=[];if(e){const i=pg(e),s=this.model.tokens_to_ids.get(`<|${i}|>`);if(s===void 0)throw new Error(`Unable to find language "${i}" in model vocabulary. Please report this issue at ${io}.`);a.push(s)}else a.push(null);if(r){if(r=r.toLowerCase(),r!=="transcribe"&&r!=="translate")throw new Error(`Task "${r}" is not supported. Must be one of: ["transcribe", "translate"]`);const i=this.model.tokens_to_ids.get(`<|${r}|>`);if(i===void 0)throw new Error(`Unable to find task "${r}" in model vocabulary. Please report this issue at ${io}.`);a.push(i)}else a.push(null);if(n){const i=this.model.tokens_to_ids.get("<|notimestamps|>");if(i===void 0)throw new Error(`Unable to find "<|notimestamps|>" in model vocabulary. Please report this issue at ${io}.`);a.push(i)}return a.map((i,s)=>[s+1,i]).filter(i=>i[1]!==null)}}class dv extends Ee{}class cv extends Ee{}class pv extends Ee{}class hv extends Ee{constructor(e,r){super(e,r),this.languageRegex=/^(>>\w+<<)\s*/g,this.supported_language_codes=this.model.vocab.filter(n=>this.languageRegex.test(n)),console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}_encode_text(e){if(e===null)return null;const[r,...n]=e.trim().split(this.languageRegex);if(n.length===0)return super._encode_text(r);if(n.length===2){const[a,i]=n;return this.supported_language_codes.includes(a)||console.warn(`Unsupported language code "${a}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`),ct([a],super._encode_text(i))}}}class fv extends Ee{}class Sg extends Ee{_default_chat_template="{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ ' ' }}{% endif %}{% endfor %}{{ eos_token }}"}class mv extends Sg{}class gv extends Ee{}class _v extends Ee{}class yv extends Ee{constructor(e,r){super(e,r),this.decoder=new Sb({})}}class wv extends Ee{}class bv{static TOKENIZER_CLASS_MAPPING={T5Tokenizer:qb,DistilBertTokenizer:Vb,CamembertTokenizer:Gb,DebertaTokenizer:Nb,DebertaV2Tokenizer:Fb,BertTokenizer:Pb,HerbertTokenizer:Lb,ConvBertTokenizer:Ub,RoFormerTokenizer:Wb,XLMTokenizer:Hb,ElectraTokenizer:jb,MobileBertTokenizer:Bb,SqueezeBertTokenizer:Db,AlbertTokenizer:Rb,GPT2Tokenizer:vg,BartTokenizer:Kb,MBartTokenizer:$g,MBart50Tokenizer:Yb,RobertaTokenizer:Xb,WhisperTokenizer:lv,CodeGenTokenizer:dv,CLIPTokenizer:cv,SiglipTokenizer:pv,MarianTokenizer:hv,BloomTokenizer:Qb,NllbTokenizer:ov,M2M100Tokenizer:uv,LlamaTokenizer:xg,CodeLlamaTokenizer:Jb,XLMRobertaTokenizer:Zb,MPNetTokenizer:ev,FalconTokenizer:tv,GPTNeoXTokenizer:rv,EsmTokenizer:nv,Wav2Vec2CTCTokenizer:fv,BlenderbotTokenizer:Sg,BlenderbotSmallTokenizer:mv,SpeechT5Tokenizer:gv,NougatTokenizer:_v,VitsTokenizer:yv,Qwen2Tokenizer:av,GemmaTokenizer:iv,Grok1Tokenizer:sv,CohereTokenizer:wv,PreTrainedTokenizer:Ee};static async from_pretrained(e,{progress_callback:r=null,config:n=null,cache_dir:a=null,local_files_only:i=!1,revision:s="main",legacy:o=null}={}){const[u,l]=await hg(e,{progress_callback:r,config:n,cache_dir:a,local_files_only:i,revision:s,legacy:o}),p=l.tokenizer_class?.replace(/Fast$/,"")??"PreTrainedTokenizer";let f=this.TOKENIZER_CLASS_MAPPING[p];return f||(console.warn(`Unknown tokenizer class "${p}", attempting to construct from base class.`),f=Ee),new f(u,l)}}async function vv(t,e){return await Mr(t,"config.json",!0,e)}function xn(t){const e={};let r={};switch(t.model_type){case"llava":case"paligemma":r=xn(t.text_config);break;case"moondream1":r=xn(t.phi_config);break;case"musicgen":r=xn(t.decoder);break;case"gpt2":case"gptj":case"codegen":case"gpt_bigcode":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="n_embd";break;case"gpt_neox":case"stablelm":case"opt":case"phi":case"phi3":case"falcon":e.num_heads="num_attention_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size";break;case"llama":case"mistral":case"starcoder2":case"qwen2":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size",e.num_attention_heads="num_attention_heads";break;case"gemma":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.dim_kv="head_dim";break;case"openelm":e.num_heads="num_kv_heads",e.num_layers="num_transformer_layers",e.dim_kv="head_dim";break;case"gpt_neo":e.num_heads="num_heads",e.num_layers="num_layers",e.hidden_size="hidden_size";break;case"bloom":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="hidden_size";break;case"mpt":e.num_heads="n_heads",e.num_layers="n_layers",e.hidden_size="d_model";break;case"t5":case"mt5":case"longt5":e.num_decoder_layers="num_decoder_layers",e.num_decoder_heads="num_heads",e.decoder_dim_kv="d_kv",e.num_encoder_layers="num_layers",e.num_encoder_heads="num_heads",e.encoder_dim_kv="d_kv";break;case"bart":case"mbart":case"marian":case"whisper":case"m2m_100":case"blenderbot":case"blenderbot-small":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="d_model",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="d_model";break;case"speecht5":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="hidden_size",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="hidden_size";break;case"trocr":e.num_encoder_layers=e.num_decoder_layers="decoder_layers",e.num_encoder_heads=e.num_decoder_heads="decoder_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="d_model";break;case"musicgen_decoder":e.num_encoder_layers=e.num_decoder_layers="num_hidden_layers",e.num_encoder_heads=e.num_decoder_heads="num_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="hidden_size";break;case"vision-encoder-decoder":const a=xn(t.encoder),i=xn(t.decoder),s="num_decoder_layers"in i,o={};return s?(o.num_decoder_layers=i.num_layers,o.num_decoder_heads=i.num_heads,o.decoder_hidden_size=i.hidden_size,o.num_encoder_layers=a.num_layers,o.num_encoder_heads=a.num_heads,o.encoder_hidden_size=a.hidden_size):(o.num_layers=i.num_layers,o.num_heads=i.num_heads,o.hidden_size=i.hidden_size),o}const n={...r,...Qr(t,["model_type","multi_query","is_encoder_decoder"])};for(const a in e)n[a]=t[e[a]];return n}function kg(t,{prefix:e="past_key_values",encoder_add_pkv:r=!0}={}){const n={},a=t.normalized_config,i=1;if(a.is_encoder_decoder&&r){const s=a.encoder_dim_kv??a.encoder_hidden_size/a.num_encoder_heads,o=a.decoder_dim_kv??a.decoder_hidden_size/a.num_decoder_heads,u=[i,a.num_encoder_heads,0,s],l=[i,a.num_decoder_heads,0,o];for(let p=0;p=1&&s[s.length-1]>=this.timestamp_begin,u=s.length<2||s[s.length-2]>=this.timestamp_begin;if(o&&(u?i.subarray(this.timestamp_begin).fill(-1/0):i.subarray(0,this.eos_token_id).fill(-1/0)),e[n].length===this.begin_index&&this.max_initial_timestamp_index!==null){const m=this.timestamp_begin+this.max_initial_timestamp_index;i.subarray(m+1).fill(-1/0)}const l=y_(i),p=Math.log(l.subarray(this.timestamp_begin).map(Math.exp).reduce((m,c)=>m+c)),f=$r(l.subarray(0,this.timestamp_begin))[0];p>f&&i.subarray(0,this.timestamp_begin).fill(-1/0)}return r}}class Tv extends pr{constructor(e){super(),this.no_repeat_ngram_size=e}getNgrams(e){const r=e.length,n=[];for(let i=0;i1 to use the classifier free guidance processor, got guidance scale ${e}.`);this.guidance_scale=e}_call(e,r){if(r.dims[0]!==2*e.length)throw new Error(`Logits should have twice the batch size of the input ids, the first half of batches corresponding to the conditional inputs, and the second half of batches corresponding to the unconditional inputs. Got batch size ${r.dims[0]} for the logits and ${e.length} for the input ids.`);const n=e.length,a=r.slice([0,n],null),i=r.slice([n,r.dims[0]],null);for(let s=0;s1)throw new Error(`\`top_p\` must be a float > 0 and < 1, but is ${e}`);if(!Number.isInteger(n)||n<1)throw new Error(`\`min_tokens_to_keep\` must be a positive integer, but is ${n}`);this.top_p=e,this.filter_value=r,this.min_tokens_to_keep=n}}class Bv extends ou{constructor(e,{filter_value:r=-1/0,min_tokens_to_keep:n=1}={}){if(super(),!Number.isInteger(e)||e<0)throw new Error(`\`top_k\` must be a positive integer, but is ${e}`);this.top_k=Math.max(e,n),this.filter_value=r}}class Cg{max_length=20;max_new_tokens=null;min_length=0;min_new_tokens=null;early_stopping=!1;max_time=null;do_sample=!1;num_beams=1;num_beam_groups=1;penalty_alpha=null;use_cache=!0;temperature=1;top_k=50;top_p=1;typical_p=1;epsilon_cutoff=0;eta_cutoff=0;diversity_penalty=0;repetition_penalty=1;encoder_repetition_penalty=1;length_penalty=1;no_repeat_ngram_size=0;bad_words_ids=null;force_words_ids=null;renormalize_logits=!1;constraints=null;forced_bos_token_id=null;forced_eos_token_id=null;remove_invalid_values=!1;exponential_decay_length_penalty=null;suppress_tokens=null;begin_suppress_tokens=null;forced_decoder_ids=null;guidance_scale=null;num_return_sequences=1;output_attentions=!1;output_hidden_states=!1;output_scores=!1;return_dict_in_generate=!1;pad_token_id=null;bos_token_id=null;eos_token_id=null;encoder_no_repeat_ngram_size=0;decoder_start_token_id=null;generation_kwargs={};constructor(e){Object.assign(this,Qr(e,Object.getOwnPropertyNames(this)))}}class uu extends vt{_call(e,r){throw Error("StoppingCriteria needs to be subclassed")}}class lu extends vt{constructor(){super(),this.criteria=[]}push(e){this.criteria.push(e)}extend(e){e instanceof lu?e=e.criteria:e instanceof uu&&(e=[e]),this.criteria.push(...e)}_call(e,r){const n=new Array(e.length).fill(!1);for(const a of this.criteria){const i=a(e,r);for(let s=0;sr.length>=this.max_length)}}class Nv extends uu{constructor(e){super(),Array.isArray(e)||(e=[e]),this.eos_token_id=e}_call(e,r){return e.map(n=>{const a=n.at(-1);return this.eos_token_id.some(i=>a==i)})}}class Ji extends vt{constructor(e){super(),this.generation_config=e}_call(e,r=-1){return this.sample(e,r)}sample(e,r){throw Error("sample should be implemented in subclasses.")}getLogits(e,r){let n=e.dims.at(-1),a=e.data;if(r===-1)a=a.slice(-n);else{let i=r*n;a=a.slice(i,i+n)}return a}randomSelect(e){let r=e.reduce((a,i)=>a+i,0),n=Math.random()*r;for(let a=0;a1)return new Uv(e);if(e.num_return_sequences>1)throw Error(`num_return_sequences has to be 1 when doing greedy search, but is ${e.num_return_sequences}.`);return new Fv(e)}}class Fv extends Ji{sample(e,r=-1){let n=this.getLogits(e,r);return[[$r(n)[1],0]]}}class Lv extends Ji{sample(e,r=-1){let n=e.dims.at(-1);this.generation_config.top_k>0&&(n=Math.min(this.generation_config.top_k,n));const a=this.getLogits(e,r),i=Mp(a,n),s=In(i.map(o=>o[1]));return Array.from({length:this.generation_config.num_beams},()=>{const o=this.randomSelect(s);return[i[o][0],Math.log(s[o])]})}}class Uv extends Ji{sample(e,r=-1){let n=e.dims.at(-1);this.generation_config.top_k>0&&(n=Math.min(this.generation_config.top_k,n));const a=this.getLogits(e,r),i=Mp(a,n),s=In(i.map(o=>o[1]));return Array.from({length:this.generation_config.num_beams},(o,u)=>[i[u][0],Math.log(s[u])])}}class Wv extends Cg{return_timestamps=null;return_token_timestamps=null;num_frames=null;alignment_heads=null;task=null;language=null;no_timestamps_token_id=null;prompt_ids=null;is_multilingual=null;lang_to_id=null;task_to_id=null;max_initial_timestamp_index=1}const ve={EncoderOnly:0,EncoderDecoder:1,Seq2Seq:2,Vision2Seq:3,DecoderOnly:4,MaskGeneration:5,ImageTextToText:6,Musicgen:7},qi=new Map,Tg=new Map,fa=new Map;async function Vv(t,e,r){let n=r.device;n&&typeof n!="string"&&(n.hasOwnProperty(e)?n=n[e]:(console.warn(`Device not specified for ${e}. Using the default device.`),n=null));const a=rw(n);let i=r.dtype;if(typeof i!="string"&&(i&&i.hasOwnProperty(e)?i=i[e]:(i=xv[a[0]],console.warn(`Dtype not specified for ${e}. Using the default dtype: ${i}.`))),fp.hasOwnProperty(i)){if(i===It.fp16&&!await $v())throw new Error("The device does not support fp16.")}else throw new Error(`Invalid dtype: ${i}. Should be one of: ${Object.keys(It).join(", ")}`);const s=fp[i],o=`${r.subfolder??""}/${e}${s}.onnx`,u={...r.session_options};u.executionProviders??=a;const l=ki(t,o,!0,r);let p=[];if(r.use_external_data_format){if(Zr.IS_NODE_ENV)throw new Error("External data format is not yet supported in Node.js");const m=`${e}${s}.onnx_data`,c=`${r.subfolder??""}/${m}`;p.push(new Promise(async(y,w)=>{const v=await ki(t,c,!0,r);y({path:m,data:v})}))}else u.externalData!==void 0&&(p=u.externalData.map(async m=>{if(typeof m.data=="string"){const c=await ki(t,m.data,!0,r);return{...m,data:c}}return m}));if(p.length>0&&(u.externalData=await Promise.all(p)),n==="webgpu"){const m=kg(r.config,{prefix:"present"});if(Object.keys(m).length>0){const c={};for(const y in m)c[y]="gpu-buffer";u.preferredOutputLocation=c}}return{buffer:await l,session_options:u}}async function Gr(t,e,r){const n=Object.keys(e),a=await Promise.all(n.map(async s=>Vv(t,e[s],r))),i={};for(let s=0;s0)throw new Error(`An error occurred during model execution: "Missing the following inputs: ${n.join(", ")}.`);const a=Object.keys(e).length,i=t.inputNames.length;if(a>i){let s=Object.keys(e).filter(o=>!t.inputNames.includes(o));console.warn(`WARNING: Too many inputs were provided (${a} > ${i}). The following inputs will be ignored: "${s.join(", ")}".`)}return r}async function zr(t,e){const r=Gv(t,e);try{const n=Object.fromEntries(Object.entries(r).map(([i,s])=>[i,s.ort_tensor]));let a=await t.run(n);return a=Ig(a),a}catch(n){throw console.error(`An error occurred during model execution: "${n}".`),console.error("Inputs given to model:",r),n}}function Ig(t){for(let e in t)og(t[e])?t[e]=new pe(t[e]):typeof t[e]=="object"&&Ig(t[e]);return t}function Ag(t){if(t instanceof pe)return t;if(t.length===0)throw Error("items must be non-empty");if(Array.isArray(t[0])){if(t.some(e=>e.length!==t[0].length))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' and/or 'truncation=True' to have batched tensors with the same length.");return new pe("int64",BigInt64Array.from(t.flat().map(e=>BigInt(e))),[t.length,t[0].length])}else return new pe("int64",BigInt64Array.from(t.map(e=>BigInt(e))),[1,t.length])}function Mg(t){return new pe("bool",[t],[1])}async function mp(t,e){let{encoder_outputs:r,past_key_values:n}=e;if(!r){const u=Qr(e,t.sessions.model.inputNames);r=(await va(t,u)).last_hidden_state}const{input_ids:a,decoder_input_ids:i,...s}=e;return s.input_ids=i,s.encoder_hidden_states=r,t.sessions.decoder_model_merged.inputNames.includes("encoder_attention_mask")&&(s.encoder_attention_mask=e.attention_mask),await du(t,s,!0)}async function va(t,e){const r=t.sessions.model,n=Object.create(null);for(const a of r.inputNames)n[a]=e[a];return r.inputNames.includes("token_type_ids")&&!n.token_type_ids&&(n.token_type_ids=new pe("int64",new BigInt64Array(n.input_ids.data.length),n.input_ids.dims)),await zr(r,n)}async function du(t,e,r=!1){const n=t.sessions[r?"decoder_model_merged":"model"],{past_key_values:a,...i}=e;n.inputNames.includes("use_cache_branch")&&(i.use_cache_branch=Mg(!!a)),n.inputNames.includes("position_ids")&&i.attention_mask&&!i.position_ids&&(i.position_ids=jv(i,a)),t.addPastKeyValues(i,a);const s=Qr(i,n.inputNames);return await zr(n,s)}async function Hv(t,{input_ids:e=null,attention_mask:r=null,pixel_values:n=null,position_ids:a=null,inputs_embeds:i=null,past_key_values:s=null,generation_config:o=null,logits_processor:u=null,...l}){if(!i){if(i=await t.encode_text({input_ids:e}),n&&e.dims[1]!==1){const f=await t.encode_image({pixel_values:n});({inputs_embeds:i,attention_mask:r}=t._merge_input_ids_with_image_features({image_features:f,inputs_embeds:i,input_ids:e,attention_mask:r}))}else if(s&&n&&e.dims[1]===1){const f=e.dims[1],m=Object.values(s)[0].dims.at(-2);r=dr([On([e.dims[0],m]),r.slice(null,[r.dims[1]-f,r.dims[1]])],1)}}return await du(t,{inputs_embeds:i,past_key_values:s,attention_mask:r,position_ids:a,generation_config:o,logits_processor:u},!0)}function jv(t,e=null){const{input_ids:r,inputs_embeds:n,attention_mask:a}=t,[i,s]=a.dims,o=new BigInt64Array(a.data.length);for(let l=0;li.dims[1])){if(ao==t.config.image_token_index)){const o=t.config.num_image_tokens;if(!o)throw new Error("`num_image_tokens` is missing in the model configuration.");const u=i.dims[1]-(a-o);r.input_ids=i.slice(null,[-u,null]),r.attention_mask=On([1,a+u])}}}return r}function qv(t,e,r,n){const{...a}=r;return r.past_key_values&&(e=e.map(s=>[s.at(-1)])),a.decoder_input_ids=Ag(e),a}class ee extends vt{main_input_name="input_ids";forward_params=["input_ids","attention_mask"];constructor(e,r){super(),this.config=e,this.sessions=r;const n=fa.get(this.constructor),a=qi.get(n);this.can_generate=!1,this._forward=null,this._prepare_inputs_for_generation=null,a===ve.DecoderOnly?(this.can_generate=!0,this._forward=du,this._prepare_inputs_for_generation=gp):a===ve.Seq2Seq||a===ve.Vision2Seq||a===ve.Musicgen?(this.can_generate=!0,this._forward=mp,this._prepare_inputs_for_generation=qv):a===ve.EncoderDecoder?this._forward=mp:a===ve.ImageTextToText?(this.can_generate=!0,this._forward=Hv,this._prepare_inputs_for_generation=gp):this._forward=va,this.can_generate&&this.forward_params.push("past_key_values"),this.custom_config=this.config["transformers.js_config"]??{}}async dispose(){const e=[];for(const r of Object.values(this.sessions))r?.handler?.dispose&&e.push(r.handler.dispose());return await Promise.all(e)}static async from_pretrained(e,{progress_callback:r=null,config:n=null,cache_dir:a=null,local_files_only:i=!1,revision:s="main",model_file_name:o=null,subfolder:u="onnx",device:l=null,dtype:p=null,use_external_data_format:f=null,session_options:m={}}={}){let c={progress_callback:r,config:n,cache_dir:a,local_files_only:i,revision:s,model_file_name:o,subfolder:u,device:l,dtype:p,use_external_data_format:f,session_options:m};const y=fa.get(this),w=qi.get(y);c.config=await Eg.from_pretrained(e,c);let v;return w===ve.DecoderOnly?v=await Promise.all([Gr(e,{model:c.model_file_name??"model"},c),Mr(e,"generation_config.json",!1,c)]):w===ve.Seq2Seq||w===ve.Vision2Seq?v=await Promise.all([Gr(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},c),Mr(e,"generation_config.json",!1,c)]):w===ve.MaskGeneration?v=await Promise.all([Gr(e,{model:"vision_encoder",prompt_encoder_mask_decoder:"prompt_encoder_mask_decoder"},c)]):w===ve.EncoderDecoder?v=await Promise.all([Gr(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},c)]):w===ve.ImageTextToText?v=await Promise.all([Gr(e,{embed_tokens:"embed_tokens",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"},c),Mr(e,"generation_config.json",!1,c)]):w===ve.Musicgen?v=await Promise.all([Gr(e,{model:"text_encoder",decoder_model_merged:"decoder_model_merged",encodec_decode:"encodec_decode"},c),Mr(e,"generation_config.json",!1,c)]):(w!==ve.EncoderOnly&&console.warn(`Model type for '${y??n?.model_type}' not found, assuming encoder-only architecture. Please report this at https://github.com/xenova/transformers.js/issues/new/choose.`),v=await Promise.all([Gr(e,{model:c.model_file_name??"model"},c)])),new this(c.config,...v)}async _call(e){return await this.forward(e)}async forward(e){return await this._forward(this,e)}_get_logits_warper(e){const r=new Io;return e.temperature!==null&&e.temperature!==1&&r.push(new Pv(e.temperature)),e.top_k!==null&&e.top_k!==0&&r.push(new Bv(e.top_k)),e.top_p!==null&&e.top_p<1&&r.push(new Rv(e.top_p)),r}_get_logits_processor(e,r,n=null){const a=new Io;if(e.repetition_penalty!==null&&e.repetition_penalty!==1&&a.push(new Iv(e.repetition_penalty)),e.no_repeat_ngram_size!==null&&e.no_repeat_ngram_size>0&&a.push(new Tv(e.no_repeat_ngram_size)),e.bad_words_ids!==null&&a.push(new Ov(e.bad_words_ids,e.eos_token_id)),e.min_length!==null&&e.eos_token_id!==null&&e.min_length>0&&a.push(new Av(e.min_length,e.eos_token_id)),e.min_new_tokens!==null&&e.eos_token_id!==null&&e.min_new_tokens>0&&a.push(new Mv(r,e.min_new_tokens,e.eos_token_id)),e.forced_bos_token_id!==null&&a.push(new Sv(e.forced_bos_token_id)),e.forced_eos_token_id!==null&&a.push(new kv(e.max_length,e.forced_eos_token_id)),e.begin_suppress_tokens!==null){const i=r>1||e.forced_bos_token_id===null?r:r+1;a.push(new Ev(e.begin_suppress_tokens,i))}return e.guidance_scale!==null&&e.guidance_scale>1&&a.push(new zv(e.guidance_scale)),n!==null&&a.extend(n),a}_prepare_generation_config(e,r,n=Cg){const a={...this.config};for(const s of["decoder","generator","text_config"])s in a&&Object.assign(a,a[s]);const i=new n(a);return"generation_config"in this&&Object.assign(i,this.generation_config),e&&Object.assign(i,e),r&&Object.assign(i,Qr(r,Object.getOwnPropertyNames(i))),i}_get_stopping_criteria(e,r=null){const n=new lu;return e.max_length!==null&&n.push(new Dv(e.max_length,this.config.max_position_embeddings??null)),e.eos_token_id!==null&&n.push(new Nv(e.eos_token_id)),r&&n.extend(r),n}_validate_model_class(){if(!this.can_generate){const e=[R0,B0,P0,z0],r=fa.get(this.constructor),n=new Set,a=this.config.model_type;for(const s of e){const o=s.get(a);o&&n.add(o[0])}let i=`The current model class (${r}) is not compatible with \`.generate()\`, as it doesn't have a language model head.`;throw n.size>0&&(i+=` Please use the following class instead: ${[...n].join(", ")}`),Error(i)}}prepare_inputs_for_generation(...e){return this._prepare_inputs_for_generation(this,...e)}_update_model_kwargs_for_generation({generated_input_ids:e,outputs:r,model_inputs:n,is_encoder_decoder:a}){return n.past_key_values=this.getPastKeyValues(r,n.past_key_values),n.input_ids=new pe("int64",e.flat(),[e.length,1]),a||(n.attention_mask=dr([n.attention_mask,On([n.attention_mask.dims[0],1])],1)),n.position_ids=null,n}_prepare_model_inputs({inputs:e,bos_token_id:r,model_kwargs:n}){const a=Qr(n,this.forward_params),i=this.main_input_name;if(i in a){if(e)throw new Error("`inputs`: {inputs}` were passed alongside {input_name} which is not allowed. Make sure to either pass {inputs} or {input_name}=...")}else a[i]=e;return{inputs_tensor:a[i],model_inputs:a,model_input_name:i}}async _prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:e,model_inputs:r,model_input_name:n,generation_config:a}){const i=Qr(r,this.sessions.model.inputNames);let{last_hidden_state:s}=await va(this,i);return a.guidance_scale!==null&&a.guidance_scale>1&&(s=dr([s,dw(s,0)],0),"attention_mask"in r&&(r.attention_mask=dr([r.attention_mask,hw(r.attention_mask)],0))),r.encoder_outputs=s,r}_prepare_decoder_input_ids_for_generation({batch_size:e,model_input_name:r,model_kwargs:n,decoder_start_token_id:a,bos_token_id:i,generation_config:s}){let{decoder_input_ids:o,...u}=n;if(!o)if(a??=i,this.config.model_type==="musicgen")o=Array.from({length:e*this.config.decoder.num_codebooks},()=>[a]);else if(Array.isArray(a)){if(a.length!==e)throw new Error(`\`decoder_start_token_id\` expcted to have length ${e} but got ${a.length}`);o=a}else o=Array.from({length:e},()=>[a]);return o=Ag(o),n.decoder_attention_mask=cw(o),{input_ids:o,model_inputs:u}}async generate({inputs:e=null,generation_config:r=null,logits_processor:n=null,stopping_criteria:a=null,streamer:i=null,...s}){this._validate_model_class(),r=this._prepare_generation_config(r,s);let{inputs_tensor:o,model_inputs:u,model_input_name:l}=this._prepare_model_inputs({inputs:e,model_kwargs:s});const p=this.config.is_encoder_decoder;p&&("encoder_outputs"in u||(u=await this._prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:o,model_inputs:u,model_input_name:l,generation_config:r})));let f;p?{input_ids:f,model_inputs:u}=this._prepare_decoder_input_ids_for_generation({batch_size:u[l].dims.at(0),model_input_name:l,model_kwargs:u,decoder_start_token_id:r.decoder_start_token_id,bos_token_id:r.bos_token_id,generation_config:r}):f=u[l];let m=f.dims.at(-1);r.max_new_tokens!==null&&(r.max_length=m+r.max_new_tokens);const c=this._get_logits_processor(r,m,n),y=this._get_stopping_criteria(r,a),w=u[l].dims.at(0),v=Ji.getSampler(r),k=new Array(w).fill(0),$=f.tolist();i&&i.put($);let C=null;for(;;){u=this.prepare_inputs_for_generation($,u,r);const A=await this.forward(u),B=A.logits.slice(null,-1,null),R=c($,B),D=[];for(let j=0;jj)){r.return_dict_in_generate&&(C=this.getPastKeyValues(A,u.past_key_values,!1));break}u=this._update_model_kwargs_for_generation({generated_input_ids:D,outputs:A,model_inputs:u,is_encoder_decoder:p})}i&&i.end();const T=new pe("int64",$.flat(),[$.length,$[0].length]);return r.return_dict_in_generate?{sequences:T,past_key_values:C}:T}addAttentionsToBeam(e,r){if(this.config.is_encoder_decoder){if(!r.cross_attentions||r.cross_attentions.length===0)throw Error("`output_attentions` is true, but the model did not produce cross-attentions. This is most likely because the model was not exported with `output_attentions=True`.");e.cross_attentions||(e.cross_attentions=[]),e.cross_attentions.push(r.cross_attentions)}if(!r.decoder_attentions||r.decoder_attentions.length===0)throw Error("`output_attentions` is true, but the model did not produce decoder-attentions. This is most likely because the model was not exported with `output_attentions=True`.");e.decoder_attentions||(e.decoder_attentions=[]),e.decoder_attentions.push(r.decoder_attentions)}groupBeams(e){const r=Object.create(null);for(const n of e)r[n.id]===void 0?r[n.id]=[n]:r[n.id].push(n);return Object.values(r)}getPastKeyValues(e,r,n=!0){const a=Object.create(null);for(const i in e)if(i.startsWith("present")){let s=i.replace("present","past_key_values");if(r&&i.includes("encoder"))a[s]=r[s];else{if(n&&r){const o=r[s];o.location==="gpu-buffer"&&o.dispose()}a[s]=e[i]}}return a}getAttentions(e){const r=Object.create(null);for(const n of["cross_attentions","decoder_attentions"]){const a=[];for(const i in e)if(i.startsWith(n)){const s=i.split(".").pop();a[s]=e[i]}r[n]=a}return r}addPastKeyValues(e,r){if(r)Object.assign(e,r);else{const n=this.custom_config.kv_cache_dtype??"float32",a=n==="float16"?new Uint16Array:[],i=kg(this.config);for(const s in i)e[s]=new pe(n,a,i[s])}}}class Wt{}class Ca extends ee{}class Kv extends Ca{}class Yv extends Ca{async _call(e){return new gt(await super._call(e))}}class Xv extends Ca{async _call(e){return new Me(await super._call(e))}}class Qv extends Ca{async _call(e){return new mt(await super._call(e))}}class Jv extends Ca{async _call(e){return new $t(await super._call(e))}}class Zv extends ee{}class e2 extends Zv{}class Ta extends ee{}class t2 extends Ta{}class r2 extends Ta{async _call(e){return new gt(await super._call(e))}}class n2 extends Ta{async _call(e){return new Me(await super._call(e))}}class a2 extends Ta{async _call(e){return new mt(await super._call(e))}}class i2 extends Ta{async _call(e){return new $t(await super._call(e))}}class Ia extends ee{}class s2 extends Ia{}class o2 extends Ia{async _call(e){return new gt(await super._call(e))}}class u2 extends Ia{async _call(e){return new Me(await super._call(e))}}class l2 extends Ia{async _call(e){return new mt(await super._call(e))}}class d2 extends Ia{async _call(e){return new $t(await super._call(e))}}class Aa extends ee{}class c2 extends Aa{}class p2 extends Aa{async _call(e){return new gt(await super._call(e))}}class h2 extends Aa{async _call(e){return new Me(await super._call(e))}}class f2 extends Aa{async _call(e){return new mt(await super._call(e))}}class m2 extends Aa{async _call(e){return new $t(await super._call(e))}}class Ma extends ee{}class g2 extends Ma{}class _2 extends Ma{async _call(e){return new gt(await super._call(e))}}class y2 extends Ma{async _call(e){return new Me(await super._call(e))}}class w2 extends Ma{async _call(e){return new mt(await super._call(e))}}class b2 extends Ma{async _call(e){return new $t(await super._call(e))}}class Oa extends ee{}class v2 extends Oa{}class $2 extends Oa{async _call(e){return new gt(await super._call(e))}}class x2 extends Oa{async _call(e){return new Me(await super._call(e))}}class S2 extends Oa{async _call(e){return new mt(await super._call(e))}}class k2 extends Oa{async _call(e){return new $t(await super._call(e))}}class za extends ee{}class E2 extends za{}class C2 extends za{async _call(e){return new gt(await super._call(e))}}class T2 extends za{async _call(e){return new Me(await super._call(e))}}class I2 extends za{async _call(e){return new mt(await super._call(e))}}class A2 extends za{async _call(e){return new $t(await super._call(e))}}class Pa extends ee{}class M2 extends Pa{}class O2 extends Pa{async _call(e){return new Me(await super._call(e))}}class z2 extends Pa{async _call(e){return new mt(await super._call(e))}}class P2 extends Pa{async _call(e){return new $t(await super._call(e))}}class R2 extends Pa{async _call(e){return new gt(await super._call(e))}}class Zi extends ee{}class B2 extends Zi{}class D2 extends Zi{async _call(e){return new gt(await super._call(e))}}class N2 extends Zi{async _call(e){return new Me(await super._call(e))}}class F2 extends Zi{async _call(e){return new mt(await super._call(e))}}class es extends ee{}class L2 extends es{}class U2 extends es{async _call(e){return new gt(await super._call(e))}}class W2 extends es{async _call(e){return new Me(await super._call(e))}}class V2 extends es{async _call(e){return new $t(await super._call(e))}}class Ra extends ee{}class G2 extends Ra{}class H2 extends Ra{async _call(e){return new gt(await super._call(e))}}class j2 extends Ra{async _call(e){return new Me(await super._call(e))}}class q2 extends Ra{async _call(e){return new mt(await super._call(e))}}class K2 extends Ra{async _call(e){return new $t(await super._call(e))}}class ts extends ee{}class Y2 extends ts{}class X2 extends ts{async _call(e){return new gt(await super._call(e))}}class Q2 extends ts{async _call(e){return new Me(await super._call(e))}}class J2 extends ts{async _call(e){return new $t(await super._call(e))}}class rs extends ee{}class Z2 extends rs{}class e1 extends rs{async _call(e){return new Me(await super._call(e))}}class t1 extends rs{async _call(e){return new $t(await super._call(e))}}class r1 extends rs{async _call(e){return new gt(await super._call(e))}}class Og extends ee{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];constructor(e,r,n){super(e,r),this.generation_config=n}}class n1 extends Og{}class a1 extends Og{}class zg extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class i1 extends zg{}class s1 extends zg{}class Pg extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class o1 extends Pg{}class u1 extends Pg{}class cu extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class l1 extends cu{}class d1 extends cu{}class c1 extends cu{async _call(e){return new Me(await super._call(e))}}class ns extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class p1 extends ns{}class h1 extends ns{}class f1 extends ns{async _call(e){return new Me(await super._call(e))}}class m1 extends ns{}class Rg extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class g1 extends Rg{}class _1 extends Rg{}class Bg extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class y1 extends Bg{}class w1 extends Bg{}class Ba extends ee{}class b1 extends Ba{}class v1 extends Ba{async _call(e){return new gt(await super._call(e))}}class $1 extends Ba{async _call(e){return new Me(await super._call(e))}}class x1 extends Ba{async _call(e){return new mt(await super._call(e))}}class S1 extends Ba{async _call(e){return new $t(await super._call(e))}}class Da extends ee{}class k1 extends Da{}class E1 extends Da{async _call(e){return new gt(await super._call(e))}}class C1 extends Da{async _call(e){return new Me(await super._call(e))}}class T1 extends Da{async _call(e){return new mt(await super._call(e))}}class I1 extends Da{async _call(e){return new $t(await super._call(e))}}class Na extends ee{}class A1 extends Na{}class M1 extends Na{async _call(e){return new gt(await super._call(e))}}class O1 extends Na{async _call(e){return new Me(await super._call(e))}}class z1 extends Na{async _call(e){return new mt(await super._call(e))}}class P1 extends Na{async _call(e){return new $t(await super._call(e))}}class Dg extends ee{}class R1 extends Dg{}class B1 extends Dg{}class Ng extends ee{requires_attention_mask=!1;main_input_name="input_features";forward_params=["input_features","attention_mask","decoder_input_ids","decoder_attention_mask","past_key_values"];constructor(e,r,n){super(e,r),this.generation_config=n}}class D1 extends Ng{}class N1 extends Ng{_prepare_generation_config(e,r){return super._prepare_generation_config(e,r,Wv)}_retrieve_init_tokens(e){const r=[e.decoder_start_token_id];let n=e.language;const a=e.task;if(e.is_multilingual){n||(console.warn("No language specified - defaulting to English (en)."),n="en");const s=`<|${pg(n)}|>`;r.push(e.lang_to_id[s]),r.push(e.task_to_id[a??"transcribe"])}else if(n||a)throw new Error("Cannot specify `task` or `language` for an English-only model. If the model is intended to be multilingual, pass `is_multilingual=true` to generate, or update the generation config.");return!e.return_timestamps&&e.no_timestamps_token_id&&r.at(-1)!==e.no_timestamps_token_id?r.push(e.no_timestamps_token_id):e.return_timestamps&&r.at(-1)===e.no_timestamps_token_id&&(console.warn("<|notimestamps|> prompt token is removed from generation_config since `return_timestamps` is set to `true`."),r.pop()),r.filter(i=>i!=null)}async generate({inputs:e=null,generation_config:r=null,logits_processor:n=null,stopping_criteria:a=null,...i}){r=this._prepare_generation_config(r,i);const s=this._retrieve_init_tokens(r);return r.return_timestamps&&(n??=new Io,n.push(new Cv(r,s))),await super.generate({inputs:e,generation_config:r,logits_processor:n,decoder_input_ids:s,...i})}_extract_token_timestamps(e,r,n=null,a=.02){if(!e.cross_attentions)throw new Error("Model outputs must contain cross attentions to extract timestamps. This is most likely because the model was not exported with `output_attentions=True`.");let i=this.config.median_filter_width;i===void 0&&(console.warn("Model config has no `median_filter_width`, using default value of 7."),i=7);const s=e.cross_attentions.map(l=>{let p=Array.from({length:this.config.decoder_layers},(v,k)=>dr(l.map($=>$[k]),2)),f=wa(r.map(([v,k])=>n?p[v].slice(null,k,null,[0,n]):p[v].slice(null,k)));f=f.transpose(1,0,2,3);let[m,c]=lg(f,-2,0,!0),y=f.clone();for(let v=0;vf[k+1]-f[k]),y=ct([1],c).map(v=>!!v),w=[];for(let v=0;vm.findIndex(c=>c==i)),u=o.every(m=>m===-1),l=o.every(m=>m!==-1);if(!u&&!l)throw new Error("Every input should contain either 0 or 1 image token.");if(u)return{inputs_embeds:e,attention_mask:a};const p=[],f=[];for(let m=0;mi*s,1);e.input_labels=new pe("int64",new BigInt64Array(a).fill(1n),n)}const r={image_embeddings:e.image_embeddings,image_positional_embeddings:e.image_positional_embeddings};return e.input_points&&(r.input_points=e.input_points),e.input_labels&&(r.input_labels=e.input_labels),e.input_boxes&&(r.input_boxes=e.input_boxes),await zr(this.sessions.prompt_encoder_mask_decoder,r)}async _call(e){return new Sx(await super._call(e))}}class Sx extends Wt{constructor({iou_scores:e,pred_masks:r}){super(),this.iou_scores=e,this.pred_masks=r}}class $0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class kx extends $0{}class Ex extends $0{}class x0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class Cx extends x0{}class Tx extends x0{}class sn extends ee{}class Ix extends sn{}class Ax extends sn{async _call(e){return new Pn(await super._call(e))}}class Mx extends sn{async _call(e){return new Me(await super._call(e))}}class Ox extends sn{async _call(e){return new mt(await super._call(e))}}class hu extends ee{}class zx extends hu{}class Px extends hu{async _call(e){return new Pn(await super._call(e))}}class Rx extends hu{async _call(e){return new Me(await super._call(e))}}class is extends ee{}class Bx extends is{}class Dx extends is{async _call(e){return new Pn(await super._call(e))}}class Nx extends is{async _call(e){return new Me(await super._call(e))}}class Fx extends is{async _call(e){return new mt(await super._call(e))}}class fu extends ee{}class Lx extends fu{}class Ux extends fu{async _call(e){return new Pn(await super._call(e))}}class Wx extends fu{async _call(e){return new Me(await super._call(e))}}class Vx extends sn{}class Gx extends sn{async _call(e){return new Pn(await super._call(e))}}class Hx extends sn{async _call(e){return new Me(await super._call(e))}}class Fa extends ee{}class jx extends Fa{}class qx extends Fa{async _call(e){return new Pn(await super._call(e))}}class Kx extends Fa{async _call(e){return new Me(await super._call(e))}}class Yx extends Fa{async _call(e){return new GS(await super._call(e))}}class Xx extends Fa{async _call(e){return new mt(await super._call(e))}}class S0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class Qx extends S0{}class Jx extends S0{async generate_speech(e,r,{threshold:n=.5,minlenratio:a=0,maxlenratio:i=20,vocoder:s=null}={}){const o={input_ids:e},{encoder_outputs:u,encoder_attention_mask:l}=await va(this,o),p=u.dims[1]/this.config.reduction_factor,f=Math.floor(p*i),m=Math.floor(p*a),c=this.config.num_mel_bins;let y=[],w=null,v=null,k=0;for(;;){++k;const T=Mg(!!v);let A;v?A=v.output_sequence_out:A=new pe("float32",new Float32Array(c),[1,1,c]);let B={use_cache_branch:T,output_sequence:A,encoder_attention_mask:l,speaker_embeddings:r,encoder_hidden_states:u};this.addPastKeyValues(B,w),v=await zr(this.sessions.decoder_model_merged,B),w=this.getPastKeyValues(v,w);const{prob:R,spectrum:D}=v;if(y.push(D),k>=m&&(Array.from(R.data).filter(K=>K>=n).length>0||k>=f))break}const $=dr(y),{waveform:C}=await zr(s.sessions.model,{spectrogram:$});return{spectrogram:$,waveform:C}}}class Zx extends ee{main_input_name="spectrogram"}class eS extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class tS extends eS{}class k0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class rS extends k0{}class nS extends k0{}class E0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class aS extends E0{}class iS extends E0{}class C0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class sS extends C0{}class oS extends C0{}class mu extends ee{}class uS extends mu{}class lS extends mu{static async from_pretrained(e,r={}){return r.model_file_name??="text_model",super.from_pretrained(e,r)}}class dS extends mu{static async from_pretrained(e,r={}){return r.model_file_name??="audio_model",super.from_pretrained(e,r)}}class cS extends ee{}class T0 extends cS{async _call(e){return new jS(await super._call(e))}}class I0 extends ee{}class pS extends I0{}class hS extends I0{}class A0 extends ee{constructor(e,r,n){super(e,r),this.generation_config=n}}class fS extends A0{}class mS extends A0{}class M0 extends ee{}class gS extends M0{}class _S extends M0{async _call(e){return new Me(await super._call(e))}}class O0 extends ee{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];constructor(e,r,n){super(e,r),this.generation_config=n}_apply_and_filter_by_delay_pattern_mask(e){const[r,n]=e.dims,a=this.config.decoder.num_codebooks,i=n-a;let s=0;for(let l=0;l0&&m<=i&&(e.data[s++]=e.data[l])}const o=Math.floor(r/a),u=s/(o*a);return new pe(e.type,e.data.slice(0,s),[o,a,u])}prepare_inputs_for_generation(e,r,n){let a=structuredClone(e);for(let s=0;s=o&&(a[s][o]=BigInt(this.config.decoder.pad_token_id));return n.guidance_scale!==null&&n.guidance_scale>1&&(a=a.concat(a)),super.prepare_inputs_for_generation(a,r,n)}async generate(e){const r=await super.generate(e),n=this._apply_and_filter_by_delay_pattern_mask(r).unsqueeze_(0),{audio_values:a}=await zr(this.sessions.encodec_decode,{audio_codes:n});return a}}class yS{static MODEL_CLASS_MAPPINGS=null;static BASE_IF_FAIL=!1;static async from_pretrained(e,{progress_callback:r=null,config:n=null,cache_dir:a=null,local_files_only:i=!1,revision:s="main",model_file_name:o=null,subfolder:u="onnx",device:l=null,dtype:p=null,use_external_data_format:f=null,session_options:m={}}={}){let c={progress_callback:r,config:n,cache_dir:a,local_files_only:i,revision:s,model_file_name:o,subfolder:u,device:l,dtype:p,use_external_data_format:f,session_options:m};if(c.config=await Eg.from_pretrained(e,c),!this.MODEL_CLASS_MAPPINGS)throw new Error("`MODEL_CLASS_MAPPINGS` not implemented for this type of `AutoClass`: "+this.name);for(let y of this.MODEL_CLASS_MAPPINGS){const w=y.get(c.config.model_type);if(w)return await w[1].from_pretrained(e,c)}if(this.BASE_IF_FAIL)return console.warn(`Unknown model class "${c.config.model_type}", attempting to construct from base class.`),await ee.from_pretrained(e,c);throw Error(`Unsupported model type: ${c.config.model_type}`)}}const wS=new Map([["bert",["BertModel",Kv]],["nomic_bert",["NomicBertModel",e2]],["roformer",["RoFormerModel",t2]],["electra",["ElectraModel",c2]],["esm",["EsmModel",B2]],["convbert",["ConvBertModel",s2]],["camembert",["CamembertModel",g2]],["deberta",["DebertaModel",v2]],["deberta-v2",["DebertaV2Model",E2]],["mpnet",["MPNetModel",G2]],["albert",["AlbertModel",Z2]],["distilbert",["DistilBertModel",M2]],["roberta",["RobertaModel",b1]],["xlm",["XLMModel",k1]],["xlm-roberta",["XLMRobertaModel",A1]],["clap",["ClapModel",uS]],["clip",["CLIPModel",W1]],["clipseg",["CLIPSegModel",X1]],["chinese_clip",["ChineseCLIPModel",Y1]],["siglip",["SiglipModel",H1]],["mobilebert",["MobileBertModel",L2]],["squeezebert",["SqueezeBertModel",Y2]],["wav2vec2",["Wav2Vec2Model",Ix]],["wav2vec2-bert",["Wav2Vec2BertModel",Lx]],["unispeech",["UniSpeechModel",zx]],["unispeech-sat",["UniSpeechSatModel",Bx]],["hubert",["HubertModel",Vx]],["wavlm",["WavLMModel",jx]],["audio-spectrogram-transformer",["ASTModel",R1]],["vits",["VitsModel",T0]],["detr",["DetrModel",G$]],["table-transformer",["TableTransformerModel",K$]],["vit",["ViTModel",T$]],["fastvit",["FastViTModel",A$]],["mobilevit",["MobileViTModel",P$]],["mobilevitv2",["MobileViTV2Model",B$]],["owlvit",["OwlViTModel",N$]],["owlv2",["Owlv2Model",L$]],["beit",["BeitModel",W$]],["deit",["DeiTModel",Q$]],["convnext",["ConvNextModel",hx]],["convnextv2",["ConvNextV2Model",mx]],["dinov2",["Dinov2Model",_x]],["resnet",["ResNetModel",Z$]],["swin",["SwinModel",tx]],["swin2sr",["Swin2SRModel",nx]],["donut-swin",["DonutSwinModel",px]],["yolos",["YolosModel",wx]],["dpt",["DPTModel",ix]],["glpn",["GLPNModel",lx]],["hifigan",["SpeechT5HifiGan",Zx]],["efficientnet",["EfficientNetModel",gS]]]),bS=new Map([["t5",["T5Model",n1]],["longt5",["LongT5Model",i1]],["mt5",["MT5Model",o1]],["bart",["BartModel",l1]],["mbart",["MBartModel",p1]],["marian",["MarianModel",kx]],["whisper",["WhisperModel",D1]],["m2m_100",["M2M100Model",Cx]],["blenderbot",["BlenderbotModel",g1]],["blenderbot-small",["BlenderbotSmallModel",y1]]]),vS=new Map([["bloom",["BloomModel",$$]],["gpt2",["GPT2Model",J1]],["gptj",["GPTJModel",a$]],["gpt_bigcode",["GPTBigCodeModel",s$]],["gpt_neo",["GPTNeoModel",e$]],["gpt_neox",["GPTNeoXModel",r$]],["codegen",["CodeGenModel",u$]],["llama",["LlamaModel",d$]],["gemma",["GemmaModel",p$]],["openelm",["OpenELMModel",f$]],["qwen2",["Qwen2Model",g$]],["phi",["PhiModel",y$]],["phi3",["Phi3Model",b$]],["mpt",["MptModel",S$]],["opt",["OPTModel",E$]],["mistral",["MistralModel",rS]],["starcoder2",["Starcoder2Model",aS]],["falcon",["FalconModel",sS]],["stablelm",["StableLmModel",fS]]]),z0=new Map([["speecht5",["SpeechT5ForSpeechToText",Qx]],["whisper",["WhisperForConditionalGeneration",N1]]]),$S=new Map([["speecht5",["SpeechT5ForTextToSpeech",Jx]]]),xS=new Map([["vits",["VitsModel",T0]],["musicgen",["MusicgenForConditionalGeneration",O0]]]),SS=new Map([["bert",["BertForSequenceClassification",Xv]],["roformer",["RoFormerForSequenceClassification",n2]],["electra",["ElectraForSequenceClassification",h2]],["esm",["EsmForSequenceClassification",N2]],["convbert",["ConvBertForSequenceClassification",u2]],["camembert",["CamembertForSequenceClassification",y2]],["deberta",["DebertaForSequenceClassification",x2]],["deberta-v2",["DebertaV2ForSequenceClassification",T2]],["mpnet",["MPNetForSequenceClassification",j2]],["albert",["AlbertForSequenceClassification",e1]],["distilbert",["DistilBertForSequenceClassification",O2]],["roberta",["RobertaForSequenceClassification",$1]],["xlm",["XLMForSequenceClassification",C1]],["xlm-roberta",["XLMRobertaForSequenceClassification",O1]],["bart",["BartForSequenceClassification",c1]],["mbart",["MBartForSequenceClassification",f1]],["mobilebert",["MobileBertForSequenceClassification",W2]],["squeezebert",["SqueezeBertForSequenceClassification",Q2]]]),kS=new Map([["bert",["BertForTokenClassification",Qv]],["roformer",["RoFormerForTokenClassification",a2]],["electra",["ElectraForTokenClassification",f2]],["esm",["EsmForTokenClassification",F2]],["convbert",["ConvBertForTokenClassification",l2]],["camembert",["CamembertForTokenClassification",w2]],["deberta",["DebertaForTokenClassification",S2]],["deberta-v2",["DebertaV2ForTokenClassification",I2]],["mpnet",["MPNetForTokenClassification",q2]],["distilbert",["DistilBertForTokenClassification",z2]],["roberta",["RobertaForTokenClassification",x1]],["xlm",["XLMForTokenClassification",T1]],["xlm-roberta",["XLMRobertaForTokenClassification",z1]]]),P0=new Map([["t5",["T5ForConditionalGeneration",a1]],["longt5",["LongT5ForConditionalGeneration",s1]],["mt5",["MT5ForConditionalGeneration",u1]],["bart",["BartForConditionalGeneration",d1]],["mbart",["MBartForConditionalGeneration",h1]],["marian",["MarianMTModel",Ex]],["m2m_100",["M2M100ForConditionalGeneration",Tx]],["blenderbot",["BlenderbotForConditionalGeneration",_1]],["blenderbot-small",["BlenderbotSmallForConditionalGeneration",w1]]]),R0=new Map([["bloom",["BloomForCausalLM",x$]],["gpt2",["GPT2LMHeadModel",Z1]],["gptj",["GPTJForCausalLM",i$]],["gpt_bigcode",["GPTBigCodeForCausalLM",o$]],["gpt_neo",["GPTNeoForCausalLM",t$]],["gpt_neox",["GPTNeoXForCausalLM",n$]],["codegen",["CodeGenForCausalLM",l$]],["llama",["LlamaForCausalLM",c$]],["gemma",["GemmaForCausalLM",h$]],["openelm",["OpenELMForCausalLM",m$]],["qwen2",["Qwen2ForCausalLM",_$]],["phi",["PhiForCausalLM",w$]],["phi3",["Phi3ForCausalLM",v$]],["mpt",["MptForCausalLM",k$]],["opt",["OPTForCausalLM",C$]],["mbart",["MBartForCausalLM",m1]],["mistral",["MistralForCausalLM",nS]],["starcoder2",["Starcoder2ForCausalLM",iS]],["falcon",["FalconForCausalLM",oS]],["trocr",["TrOCRForCausalLM",tS]],["stablelm",["StableLmForCausalLM",mS]]]),ES=new Map([["bert",["BertForMaskedLM",Yv]],["roformer",["RoFormerForMaskedLM",r2]],["electra",["ElectraForMaskedLM",p2]],["esm",["EsmForMaskedLM",D2]],["convbert",["ConvBertForMaskedLM",o2]],["camembert",["CamembertForMaskedLM",_2]],["deberta",["DebertaForMaskedLM",$2]],["deberta-v2",["DebertaV2ForMaskedLM",C2]],["mpnet",["MPNetForMaskedLM",H2]],["albert",["AlbertForMaskedLM",r1]],["distilbert",["DistilBertForMaskedLM",R2]],["roberta",["RobertaForMaskedLM",v1]],["xlm",["XLMWithLMHeadModel",E1]],["xlm-roberta",["XLMRobertaForMaskedLM",M1]],["mobilebert",["MobileBertForMaskedLM",U2]],["squeezebert",["SqueezeBertForMaskedLM",X2]]]),CS=new Map([["bert",["BertForQuestionAnswering",Jv]],["roformer",["RoFormerForQuestionAnswering",i2]],["electra",["ElectraForQuestionAnswering",m2]],["convbert",["ConvBertForQuestionAnswering",d2]],["camembert",["CamembertForQuestionAnswering",b2]],["deberta",["DebertaForQuestionAnswering",k2]],["deberta-v2",["DebertaV2ForQuestionAnswering",A2]],["mpnet",["MPNetForQuestionAnswering",K2]],["albert",["AlbertForQuestionAnswering",t1]],["distilbert",["DistilBertForQuestionAnswering",P2]],["roberta",["RobertaForQuestionAnswering",S1]],["xlm",["XLMForQuestionAnswering",I1]],["xlm-roberta",["XLMRobertaForQuestionAnswering",P1]],["mobilebert",["MobileBertForQuestionAnswering",V2]],["squeezebert",["SqueezeBertForQuestionAnswering",J2]]]),B0=new Map([["vision-encoder-decoder",["VisionEncoderDecoderModel",F1]]]),TS=new Map([["llava",["LlavaForConditionalGeneration",Fg]],["moondream1",["Moondream1ForConditionalGeneration",U1]]]),IS=new Map([["vit",["ViTForImageClassification",I$]],["fastvit",["FastViTForImageClassification",M$]],["mobilevit",["MobileViTForImageClassification",R$]],["mobilevitv2",["MobileViTV2ForImageClassification",D$]],["beit",["BeitForImageClassification",V$]],["deit",["DeiTForImageClassification",J$]],["convnext",["ConvNextForImageClassification",fx]],["convnextv2",["ConvNextV2ForImageClassification",gx]],["dinov2",["Dinov2ForImageClassification",yx]],["resnet",["ResNetForImageClassification",ex]],["swin",["SwinForImageClassification",rx]],["segformer",["SegformerForImageClassification",pS]],["efficientnet",["EfficientNetForImageClassification",_S]]]),AS=new Map([["detr",["DetrForObjectDetection",H$]],["table-transformer",["TableTransformerForObjectDetection",Y$]],["yolos",["YolosForObjectDetection",bx]]]),MS=new Map([["owlvit",["OwlViTForObjectDetection",F$]],["owlv2",["Owlv2ForObjectDetection",U$]]]),OS=new Map([["detr",["DetrForSegmentation",j$]],["clipseg",["CLIPSegForImageSegmentation",Q1]]]),zS=new Map([["segformer",["SegformerForSemanticSegmentation",hS]]]),PS=new Map([["sam",["SamModel",xx]]]),RS=new Map([["wav2vec2",["Wav2Vec2ForCTC",Ax]],["wav2vec2-bert",["Wav2Vec2BertForCTC",Ux]],["unispeech",["UniSpeechForCTC",Px]],["unispeech-sat",["UniSpeechSatForCTC",Dx]],["wavlm",["WavLMForCTC",qx]],["hubert",["HubertForCTC",Gx]]]),BS=new Map([["wav2vec2",["Wav2Vec2ForSequenceClassification",Mx]],["wav2vec2-bert",["Wav2Vec2BertForSequenceClassification",Wx]],["unispeech",["UniSpeechForSequenceClassification",Rx]],["unispeech-sat",["UniSpeechSatForSequenceClassification",Nx]],["wavlm",["WavLMForSequenceClassification",Kx]],["hubert",["HubertForSequenceClassification",Hx]],["audio-spectrogram-transformer",["ASTForAudioClassification",B1]]]),DS=new Map([["wavlm",["WavLMForXVector",Yx]]]),NS=new Map([["unispeech-sat",["UniSpeechSatForAudioFrameClassification",Fx]],["wavlm",["WavLMForAudioFrameClassification",Xx]],["wav2vec2",["Wav2Vec2ForAudioFrameClassification",Ox]]]),FS=new Map([["vitmatte",["VitMatteForImageMatting",z$]]]),LS=new Map([["swin2sr",["Swin2SRForImageSuperResolution",ax]]]),US=new Map([["dpt",["DPTForDepthEstimation",sx]],["depth_anything",["DepthAnythingForDepthEstimation",ux]],["glpn",["GLPNForDepthEstimation",dx]]]),WS=new Map([["clip",["CLIPVisionModelWithProjection",G1]],["siglip",["SiglipVisionModel",q1]]]),D0=[[wS,ve.EncoderOnly],[bS,ve.EncoderDecoder],[vS,ve.DecoderOnly],[SS,ve.EncoderOnly],[kS,ve.EncoderOnly],[P0,ve.Seq2Seq],[z0,ve.Seq2Seq],[R0,ve.DecoderOnly],[ES,ve.EncoderOnly],[CS,ve.EncoderOnly],[B0,ve.Vision2Seq],[TS,ve.ImageTextToText],[IS,ve.EncoderOnly],[OS,ve.EncoderOnly],[zS,ve.EncoderOnly],[FS,ve.EncoderOnly],[LS,ve.EncoderOnly],[US,ve.EncoderOnly],[AS,ve.EncoderOnly],[MS,ve.EncoderOnly],[PS,ve.MaskGeneration],[RS,ve.EncoderOnly],[BS,ve.EncoderOnly],[$S,ve.Seq2Seq],[xS,ve.EncoderOnly],[DS,ve.EncoderOnly],[NS,ve.EncoderOnly],[WS,ve.EncoderOnly]];for(const[t,e]of D0)for(const[r,n]of t.values())qi.set(r,e),fa.set(n,r),Tg.set(r,n);const VS=[["MusicgenForConditionalGeneration",O0,ve.Musicgen],["CLIPTextModelWithProjection",V1,ve.EncoderOnly],["SiglipTextModel",j1,ve.EncoderOnly],["ClapTextModelWithProjection",lS,ve.EncoderOnly],["ClapAudioModelWithProjection",dS,ve.EncoderOnly]];for(const[t,e,r]of VS)qi.set(t,r),fa.set(e,t),Tg.set(t,e);class _p extends yS{static MODEL_CLASS_MAPPINGS=D0.map(e=>e[0]);static BASE_IF_FAIL=!0}class Me extends Wt{constructor({logits:e}){super(),this.logits=e}}class GS extends Wt{constructor({logits:e,embeddings:r}){super(),this.logits=e,this.embeddings=r}}class mt extends Wt{constructor({logits:e}){super(),this.logits=e}}class gt extends Wt{constructor({logits:e}){super(),this.logits=e}}class $t extends Wt{constructor({start_logits:e,end_logits:r}){super(),this.start_logits=e,this.end_logits=r}}class Pn extends Wt{constructor({logits:e}){super(),this.logits=e}}class HS extends Wt{constructor({alphas:e}){super(),this.alphas=e}}class jS extends Wt{constructor({waveform:e,spectrogram:r}){super(),this.waveform=e,this.spectrogram=r}}const Nt=typeof self<"u",qS=Nt&&self.constructor.name==="DedicatedWorkerGlobalScope";let Hr,N0,Ar;if(Nt)Hr=(t,e)=>{if(!self.OffscreenCanvas)throw new Error("OffscreenCanvas not supported by this browser.");return new self.OffscreenCanvas(t,e)},Ar=self.createImageBitmap,N0=self.ImageData;else if(Ze)Ar=async t=>{const r=(await t.metadata()).channels,{data:n,info:a}=await t.rotate().raw().toBuffer({resolveWithObject:!0}),i=new tr(new Uint8ClampedArray(n),a.width,a.height,a.channels);return r!==void 0&&r!==a.channels&&i.convert(r),i};else throw new Error("Unable to load image processing library.");const KS={0:"nearest",1:"lanczos",2:"bilinear",3:"bicubic",4:"box",5:"hamming"},YS=new Map([["png","image/png"],["jpg","image/jpeg"],["jpeg","image/jpeg"],["gif","image/gif"]]);class tr{constructor(e,r,n,a){this.data=e,this.width=r,this.height=n,this.channels=a}get size(){return[this.width,this.height]}static async read(e){if(e instanceof tr)return e;if(typeof e=="string"||e instanceof URL)return await this.fromURL(e);throw new Error(`Unsupported input type: ${typeof e}`)}static fromCanvas(e){if(!Nt)throw new Error("fromCanvas() is only supported in browser environments.");const n=e.getContext("2d").getImageData(0,0,e.width,e.height).data;return new tr(n,e.width,e.height,4)}static async fromURL(e){const r=await ho(e);if(r.status!==200)throw new Error(`Unable to read image from "${e}" (${r.status} ${r.statusText})`);const n=await r.blob();return this.fromBlob(n)}static async fromBlob(e){if(Nt){const r=await Ar(e),n=Hr(r.width,r.height).getContext("2d");return n.drawImage(r,0,0),new this(n.getImageData(0,0,r.width,r.height).data,r.width,r.height,4)}else{const r=Ze(await e.arrayBuffer());return await Ar(r)}}static fromTensor(e,r="CHW"){if(e.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${e.dims.length} dimensions.`);if(r==="CHW")e=e.transpose(1,2,0);else if(r!=="HWC")throw new Error(`Unsupported channel format: ${r}`);if(!(e.data instanceof Uint8ClampedArray||e.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${e.type}`);switch(e.dims[2]){case 1:case 2:case 3:case 4:return new tr(e.data,e.dims[1],e.dims[0],e.dims[2]);default:throw new Error(`Unsupported number of channels: ${e.dims[2]}`)}}grayscale(){if(this.channels===1)return this;const e=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let r=0,n=0;r=0?u=n:p=-n,a>=0?l=a:f=-a,o.drawImage(s,u,l,e,r,p,f,e,r),new tr(o.getImageData(0,0,e,r).data,e,r,4).convert(i)}else{let i=this.toSharp();if(n>=0&&a>=0)i=i.extract({left:Math.floor(n),top:Math.floor(a),width:e,height:r});else if(n<=0&&a<=0){const s=Math.floor(-a),o=Math.floor(-n);i=i.extend({top:s,left:o,right:e-this.width-o,bottom:r-this.height-s})}else{let s=[0,0],o=0;a<0?(s[0]=Math.floor(-a),s[1]=r-this.height-s[0]):o=Math.floor(a);let u=[0,0],l=0;n<0?(u[0]=Math.floor(-n),u[1]=e-this.width-u[0]):l=Math.floor(n),i=i.extend({top:s[0],bottom:s[1],left:u[0],right:u[1]}).extract({left:l,top:o,width:e,height:r})}return await Ar(i)}}async toBlob(e="image/png",r=1){if(!Nt)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:e,quality:r})}toTensor(e="CHW"){let r=new pe("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(e!=="HWC")if(e==="CHW")r=r.permute(2,0,1);else throw new Error(`Unsupported channel format: ${e}`);return r}toCanvas(){if(!Nt)throw new Error("toCanvas() is only supported in browser environments.");const e=this.clone().rgba(),r=Hr(e.width,e.height),n=new N0(e.data,e.width,e.height);return r.getContext("2d").putImageData(n,0,0),r}_update(e,r,n,a=null){return this.data=e,this.width=r,this.height=n,a!==null&&(this.channels=a),this}clone(){return new tr(this.data.slice(),this.width,this.height,this.channels)}convert(e){if(this.channels===e)return this;switch(e){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(e){if(Nt){if(qS)throw new Error("Unable to save an image from a Web Worker.");const r=e.split(".").pop().toLowerCase(),n=YS.get(r)??"image/png",a=await this.toBlob(n),i=URL.createObjectURL(a),s=document.createElement("a");s.href=i,s.download=e,s.click(),s.remove()}else{if(Ct.useFS)return await this.toSharp().toFile(e);throw new Error("Unable to save the image because filesystem is disabled in this environment.")}}toSharp(){if(Nt)throw new Error("toSharp() is only supported in server-side environments.");return Ze(this.data,{raw:{width:this.width,height:this.height,channels:this.channels}})}}function yp(t){if(t<1)return new Float64Array;if(t===1)return new Float64Array([1]);const e=t-1,r=Math.PI/e,n=new Float64Array(t);for(let a=0;a2595*Math.log10(1+t/700),kaldi:t=>1127*Math.log(1+t/700),slaney:(t,e=1e3,r=15,n=27/Math.log(6.4))=>t>=e?r+Math.log(t/e)*n:3*t/200};function so(t,e="htk"){const r=XS[e];if(!r)throw new Error('mel_scale should be one of "htk", "slaney" or "kaldi".');return typeof t=="number"?r(t):t.map(n=>r(n))}const QS={htk:t=>700*(10**(t/2595)-1),kaldi:t=>700*(Math.exp(t/1127)-1),slaney:(t,e=1e3,r=15,n=Math.log(6.4)/27)=>t>=r?e*Math.exp(n*(t-r)):200*t/3};function JS(t,e="htk"){const r=QS[e];if(!r)throw new Error('mel_scale should be one of "htk", "slaney" or "kaldi".');return typeof t=="number"?r(t):t.map(n=>r(n))}function ZS(t,e){const r=Float64Array.from({length:e.length-1},(s,o)=>e[o+1]-e[o]),n=Array.from({length:t.length},()=>new Array(e.length));for(let s=0;snew Array(t.length));for(let s=0;st+n*i)}function $a(t,e,r,n,a,i=null,s="htk",o=!1){if(i!==null&&i!=="slaney")throw new Error('norm must be one of null or "slaney"');const u=so(r,s),l=so(n,s),p=wp(u,l,e+2);let f=JS(p,s),m;if(o){const y=a/(t*2);m=so(Float64Array.from({length:t},(w,v)=>v*y),s),f=p}else m=wp(0,Math.floor(a/2),t);const c=ZS(m,f);if(i!==null&&i==="slaney")for(let y=0;ya)throw Error(`frame_length (${r}) may not be larger than fft_length (${a})`);if(T!==r)throw new Error(`Length of the window (${T}) must equal frame_length (${r})`);if(n<=0)throw new Error("hop_length must be greater than zero");if(i===null&&p!==null)throw new Error("You have provided `mel_filters` but `power` is `None`. Mel spectrogram computation is not yet supported for complex-valued spectrogram. Specify `power` to fix this issue.");if(s){if(o!=="reflect")throw new Error(`pad_mode="${o}" not implemented yet.`);const P=Math.floor((a-1)/2)+1;t=e3(t,P,P)}const A=Math.floor(1+Math.floor((t.length-r)/n)),B=u?Math.floor(a/2)+1:a;let R=A,D=A;k!==null&&(k>A?$&&(D=k):D=R=k);const K=new v_(a),j=new Float64Array(a),ie=new Float64Array(K.outputBufferSize),te=new Array(R);for(let P=0;P=1;--G)j[G]-=l*j[G-1];j[0]*=1-l}for(let G=0;GMath.pow(o,.85));break;default:throw new Error(`Unknown window type ${e}.`)}if(r&&(s=s.subarray(0,t)),n===null)return s;if(t>n)throw new Error(`Length of the window (${t}) may not be larger than frame_length (${n})`);return s}function n3([t,e,r,n]){return[t-r/2,e-n/2,t+r/2,e+n/2]}function gu(t,e=.5,r=null,n=!1){const a=t.logits,i=t.pred_boxes,[s,o,u]=a.dims;if(r!==null&&r.length!==s)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let l=[];for(let p=0;pe&&k.push(C)}else{let C=$r(v.data)[1];if(C===u-1||($=In(v.data),$[C]A*f[(B+1)%2])),m.boxes.push(T),m.classes.push(C),m.scores.push($[C])}}l.push(m)}return l}function La(t,e){if(!(t instanceof Float32Array||t instanceof Float64Array))throw new Error(`${e} expects input to be a Float32Array or a Float64Array, but got ${t?.constructor?.name??typeof t} instead. If using the feature extractor directly, remember to use \`read_audio(url, sampling_rate)\` to obtain the raw audio data of the file/url.`)}function bp(t,e,r=0,n=null){const a=t/e;let i=x_(a)*e;return n!==null&&i>n&&(i=Math.floor(a)*e),ii?l=Math.floor(i*u/a):i>a&&(u=Math.floor(a*l/i)),await e.resize(l,u,{resample:n}))}async crop_margin(e,r=200){const n=e.clone().grayscale(),a=Op(n.data)[0],s=$r(n.data)[0]-a;if(s===0)return e;const o=r/255;let u=n.width,l=n.height,p=0,f=0;const m=n.data;for(let c=0;cthis.preprocess(i)));return{pixel_values:wa(n.map(i=>i.pixel_values),0),original_sizes:n.map(i=>i.original_size),reshaped_input_sizes:n.map(i=>i.reshaped_input_size)}}}class a3 extends Xe{post_process_semantic_segmentation(e,r=null){const n=e.logits,a=n.dims[0];if(r!==null&&r.length!==a)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");const i=[];for(let s=0;sm[C]&&(m[C]=$[C],c[C]=k)}const y=new Array(u.dims[0]),w=f.data;for(let k=0;kk!==void 0);i.push({segmentation:f,labels:v})}return i}}class L0 extends Xe{}class i3 extends L0{}class s3 extends Xe{}class o3 extends Xe{}class U0 extends Xe{}class u3 extends U0{}class l3 extends Xe{}class d3 extends Xe{}class W0 extends Xe{constructor(e){super(e),this.crop_pct=this.config.crop_pct??224/256}async resize(e){const r=this.size?.shortest_edge;if(r===void 0)throw new Error("Size dictionary must contain 'shortest_edge' key.");if(r<384){const n=Math.floor(r/this.crop_pct),[a,i]=this.get_resize_output_image_size(e,{shortest_edge:n});e=await e.resize(a,i,{resample:this.resample}),e=await e.center_crop(r,r)}else e=await e.resize(r,r,{resample:this.resample});return e}}class c3 extends W0{}class p3 extends Xe{}class h3 extends Xe{}class f3 extends Xe{constructor(e){super(e),this.include_top=this.config.include_top??!0,this.include_top&&(this.image_std=this.image_std.map(r=>r*r))}}class V0 extends Xe{}class m3 extends V0{}class G0 extends Xe{post_process_object_detection(...e){return gu(...e)}}class g3 extends G0{}class _3 extends Xe{}class y3 extends Xe{}class H0 extends Xe{pad_image(e,r,n,a={}){const[i,s,o]=r;let u=this.image_mean;Array.isArray(this.image_mean)||(u=new Array(o).fill(u));let l=this.image_std;Array.isArray(l)||(l=new Array(o).fill(u));const p=u.map((f,m)=>-f/l[m]);return super.pad_image(e,r,n,{center:!0,constant_values:p,...a})}}class w3 extends H0{}class b3 extends Xe{async _call(e){const r=await super._call(e),n=[r.pixel_values.dims[0],64,64],a=new pe("int64",new BigInt64Array(n.reduce((i,s)=>i*s)).fill(1n),n);return{...r,pixel_mask:a}}post_process_object_detection(...e){return gu(...e)}remove_low_and_no_objects(e,r,n,a){let i=[],s=[],o=[];for(let u=0;un&&(i.push(p),s.push(c),o.push(f))}return[i,s,o]}check_segment_validity(e,r,n,a=.5,i=.8){let s=[],o=0,u=0;const l=r[n].data;for(let f=0;f=a&&++u;let p=o>0&&u>0;return p&&(p=o/u>i),[p,s]}compute_segments(e,r,n,a,i,s=null,o=null){let[u,l]=o??e[0].dims,p=new pe("int32",new Int32Array(u*l),[u,l]),f=[];if(o!==null)for(let v=0;vc[C]&&(m[C]=v,c[C]=$[C])}let y=0;const w=p.data;for(let v=0;va!==r.dims[i]))throw Error(`The first ${n.length} dimensions of 'input_points' and 'input_labels' must be the same.`);return new pe("int64",e.flat(1/0).map(BigInt),n)}async _call(e,{input_points:r=null,input_labels:n=null,input_boxes:a=null}={}){const i=await super._call(e);if(r&&(i.input_points=this.reshape_input_points(r,i.original_sizes,i.reshaped_input_sizes)),n){if(!i.input_points)throw Error("`input_points` must be provided if `input_labels` are provided.");i.input_labels=this.add_input_labels(n,i.input_points)}return a&&(i.input_boxes=this.reshape_input_points(a,i.original_sizes,i.reshaped_input_sizes,!0)),i}async post_process_masks(e,r,n,{mask_threshold:a=0,binarize:i=!0,pad_size:s=null}={}){const o=[];s=s??this.pad_size;const u=[s.height,s.width];for(let l=0;la&&(y[w]=1);m=new pe("bool",y,m.dims)}o.push(m)}return o}generate_crop_boxes(e,r,{crop_n_layers:n=0,overlap_ratio:a=512/1500,points_per_crop:i=32,crop_n_points_downscale_factor:s=1}={}){}}class x3 extends Xe{pad_image(e,r,n,a={}){const[i,s,o]=r;return super.pad_image(e,r,{width:s+(n-s%n)%n,height:i+(n-i%n)%n},{mode:"symmetric",center:!1,constant_values:-1,...a})}}class S3 extends Xe{async _call(e,r){Array.isArray(e)||(e=[e]),Array.isArray(r)||(r=[r]);const n=await Promise.all(e.map(s=>this.preprocess(s))),a=await Promise.all(r.map(s=>this.preprocess(s,{do_normalize:!1,do_convert_rgb:!1,do_convert_grayscale:!0})));return{pixel_values:wa(n.map((s,o)=>dr([s.pixel_values,a[o].pixel_values],0)),0),original_sizes:n.map(s=>s.original_size),reshaped_input_sizes:n.map(s=>s.reshaped_input_size)}}}class k3 extends on{constructor(e){super(e),this.config.mel_filters??=$a(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,8e3,this.config.sampling_rate,"slaney","slaney"),this.window=os(this.config.n_fft,"hann")}_extract_fbank_features(e){const{data:r,dims:n}=ss(e,this.window,this.config.n_fft,this.config.hop_length,{power:2,mel_filters:this.config.mel_filters,log_mel:"log10",max_num_frames:this.config.nb_max_frames}),a=$r(r)[0];for(let i=0;ithis.config.n_samples?(console.warn("Attempting to extract features for audio longer than 30 seconds. If using a pipeline to extract transcript from a long audio clip, remember to specify `chunk_length_s` and/or `stride_length_s`."),r=e.slice(0,this.config.n_samples)):(r=new Float32Array(this.config.n_samples),r.set(e));const{data:n,dims:a}=this._extract_fbank_features(r);return{input_features:new pe("float32",n,[1,...a])}}}class E3 extends on{_zero_mean_unit_var_norm(e){const n=e.reduce((i,s)=>i+s,0)/e.length,a=e.reduce((i,s)=>i+(s-n)**2,0)/e.length;return e.map(i=>(i-n)/Math.sqrt(a+1e-7))}async _call(e){La(e,"Wav2Vec2FeatureExtractor"),e instanceof Float64Array&&(e=new Float32Array(e));let r=e;this.config.do_normalize&&(r=this._zero_mean_unit_var_norm(r));const n=[1,r.length];return{input_values:new pe("float32",r,n),attention_mask:new pe("int64",new BigInt64Array(r.length).fill(1n),n)}}}class C3 extends on{constructor(e){super(e);const r=this.config.sampling_rate,n=$a(256,this.config.num_mel_bins,20,Math.floor(r/2),r,null,"kaldi",!0);for(let a=0;an*32768),ss(e,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,max_num_frames:r,transpose:!0})}async _call(e,{padding:r=!0,pad_to_multiple_of:n=2,do_normalize_per_mel_bins:a=!0,return_attention_mask:i=!0}={}){La(e,"SeamlessM4TFeatureExtractor");let{data:s,dims:o}=this._extract_fbank_features(e,this.config.max_length);if(a){const[w,v]=o;for(let k=0;k0){const $=new Float32Array(v*(w+k));$.set(s),$.fill(this.config.padding_value,s.length);const C=w+k;s=$,o=[C,v],i&&(u=new pe("int64",new BigInt64Array(C),[1,C]),u.data.fill(1n,0,w))}}const[l,p]=o,f=this.config.stride;if(l%f!==0)throw new Error(`The number of frames (${l}) must be a multiple of the stride (${f}).`);const c=new pe("float32",s,o).view(1,Math.floor(l/f),p*f),y={input_features:c};if(i){const w=c.dims[1],v=new BigInt64Array(w);if(u){const k=u.data;for(let $=1,C=0;$0)if(n==="rand_trunc"){s=!0;const u=Math.floor(Math.random()*(o+1));e=e.subarray(u,u+r),i=this._extract_fbank_features(e,this.mel_filters_slaney,this.config.nb_max_samples),i.dims=[1,...i.dims]}else throw new Error(`Truncation strategy "${n}" not implemented`);else{if(o<0){let u=new Float64Array(r);if(u.set(e),a==="repeat")for(let l=e.length;lt),Si.length>0){const t=Si.map(n=>zi.value.replaceAll("{}",n)),e=j0(t,{padding:!0,truncation:!0}),{last_hidden_state:r}=await q0(e);yr=ap(r,e.attention_mask),yr=sw(yr,[yr.dims[1]]),yr=yr.normalize(2,-1).tolist()}else xi.innerHTML="";if(yr){$p.drawImage(da,0,0,jr,jr);const t=$p.getImageData(0,0,jr,jr).data,e=new tr(t,jr,jr,4),r=await K0(e),{last_hidden_state:n}=await Y0(r);Sp??=On(n.dims.slice(0,2));let a=ap(n,Sp);a=a.normalize(2,-1).tolist()[0];const i=yr.map(o=>w_(o,a)*N3),s=In(i).map((o,u)=>[o,u]).sort((o,u)=>u[0]-o[0]);xi.innerHTML="";for(const[o,u]of s)xi.appendChild(document.createTextNode(`${Si[u]}: ${o.toFixed(2)}`)),xi.appendChild(document.createElement("br"))}if(lo!==void 0){const t=1e3/(performance.now()-lo);us.textContent=`FPS: ${t.toFixed(2)}`}lo=performance.now(),uo=!1}()),window.requestAnimationFrame(X0)}navigator.mediaDevices.getUserMedia({video:!0}).then(t=>{da.srcObject=t,da.play();const e=t.getVideoTracks()[0],{width:r,height:n}=e.getSettings();da.width=r,da.height=n;const a=r/n,[i,s]=a>720/405?[720,720/a]:[405*a,405];vp.style.width=`${i}px`,vp.style.height=`${s}px`,window.requestAnimationFrame(X0)}).catch(t=>{alert(t)}); diff --git a/assets/index-DDYN1ddX.css b/assets/index-DwBfK3bE.css similarity index 85% rename from assets/index-DDYN1ddX.css rename to assets/index-DwBfK3bE.css index eb4d9ba2a8177b48689c1d98854e8aa6e91cc749..fea15f28c37ee7127b9c9c35811746f891ef5c5e 100644 --- a/assets/index-DDYN1ddX.css +++ b/assets/index-DwBfK3bE.css @@ -1 +1 @@ -*{box-sizing:border-box;padding:0;margin:0;font-family:sans-serif}html,body{height:100%}body{padding:16px 32px}body,#container{display:flex;flex-direction:column;justify-content:center;align-items:center}#controls{display:flex;padding:1rem;gap:1rem}#controls>div{text-align:center}h1,h3{text-align:center}h3{margin-top:.5rem}#container{position:relative;width:720px;height:405px;max-width:100%;max-height:100%;border:2px dashed #D1D5DB;border-radius:.75rem;overflow:hidden;margin-top:1rem;background-size:100% 100%;background-position:center;background-repeat:no-repeat}#status{min-height:16px;margin:8px 0}video{width:100%;height:100%}input[type=text]{padding:.25rem .5rem;border:1px solid #D1D5DB;border-radius:.25rem;margin-top:2px}input[type=range]{margin-top:6px}#overlay{position:absolute;top:0;left:0;background-color:#ffffffe6;font-size:1.25rem;border-radius:2px}#overlay:not(:empty){padding:.5rem} +*{box-sizing:border-box;padding:0;margin:0;font-family:sans-serif}html,body{height:100%}body{padding:16px 32px}body,#container{display:flex;flex-direction:column;justify-content:center;align-items:center}#controls{display:flex;padding:1rem;gap:1rem}#controls>div{text-align:center}h1,h3{text-align:center}h3{margin-top:.5rem}#container{position:relative;width:720px;height:405px;max-width:100%;max-height:100%;border:2px dashed #d1d5db;border-radius:.75rem;overflow:hidden;margin-top:1rem;background-size:100% 100%;background-position:center;background-repeat:no-repeat}#status{min-height:16px;margin:8px 0}video{width:100%;height:100%}input[type=text]{padding:.25rem .5rem;border:1px solid #d1d5db;border-radius:.25rem;margin-top:2px}input[type=range]{margin-top:6px}#overlay{position:absolute;top:0;left:0;background-color:#ffffffe6;font-size:1.25rem;border-radius:2px}#overlay:not(:empty){padding:.5rem} diff --git a/index.html b/index.html index adef0070b7024b28414482a6eb1ea2699b4ebb34..86684eaa90a6f00283720b97baf3f55c9aefbf16 100644 --- a/index.html +++ b/index.html @@ -1,40 +1,41 @@ - - - - - - - Transformers.js | real-time Nomic-Embed-v1.5 - - - - - -

- Real-time zero-shot image classification (WebGPU) -

-

- Runs Nomic-Embed-v1.5 locally in your browser w/ - 🤗 Transformers.js -

-
- -
-
-
-
- -
- -
-
- -
- -
-
- - - - - \ No newline at end of file + + + + + + Transformers.js | real-time CLIP + + + + + +

Real-time zero-shot image classification (WebGPU)

+

+ Runs locally in your browser w/ + 🤗 Transformers.js +

+
+ +
+
+
+
+ +
+ +
+
+ +
+ +
+
+ + + +