onnxruntime-web

// Copyright (c) Microsoft Corporation. All rights reserved. // Licensed under the MIT License. import { AttributeWithCacheKey, createAttributeWithCacheKey } from '../../../attribute-with-cache-key'; import { Graph } from '../../../graph'; import { OperatorImplementation, OperatorInitialization } from '../../../operators'; import { Tensor } from '../../../tensor'; import { GemmUtil } from '../../../util'; import { WebGLInferenceHandler } from '../inference-handler'; import { ProgramInfo, ProgramInfoLoader, ProgramMetadata, TextureType } from '../types'; export interface GemmAttributes extends AttributeWithCacheKey { transA: boolean; transB: boolean; alpha: number; beta: number; isOptionalC: boolean; // in opset 11, C becomes optional } export const gemm: OperatorImplementation<GemmAttributes> = ( inferenceHandler: WebGLInferenceHandler, inputs: Tensor[], attributes: GemmAttributes, ): Tensor[] => { validateInputs(inputs, attributes); const output = inferenceHandler.run(createGemmProgramInfoLoader(inputs, attributes), inputs); return [output]; }; const parseGemmAttributes = (node: Graph.Node, isOptionalC: boolean): GemmAttributes => { const transA = node.attributes.getInt('transA', 0) !== 0; const transB = node.attributes.getInt('transB', 0) !== 0; const alpha = node.attributes.getFloat('alpha', 1.0); const beta = node.attributes.getFloat('beta', 1.0); return createAttributeWithCacheKey({ transA, transB, alpha, beta, isOptionalC }); }; export const parseGemmAttributesV7: OperatorInitialization<GemmAttributes> = (node: Graph.Node): GemmAttributes => parseGemmAttributes(node, false); export const parseGemmAttributesV11: OperatorInitialization<GemmAttributes> = (node: Graph.Node): GemmAttributes => parseGemmAttributes(node, true); const createGemmProgramInfoLoader = (inputs: Tensor[], attributes: GemmAttributes): ProgramInfoLoader => { const metadata = { name: 'Gemm', inputNames: inputs.length === 3 ? ['A', 'B', 'C'] : ['A', 'B'], inputTypes: inputs.length === 3 ? [TextureType.unpacked, TextureType.unpacked, TextureType.unpacked] : [TextureType.unpacked, TextureType.unpacked], key: attributes.cacheKey, }; return { ...metadata, get: () => createGemmProgramInfo(metadata, inputs, attributes) }; }; const createGemmProgramInfo = ( metadata: ProgramMetadata, inputs: Tensor[], attributes: GemmAttributes, ): ProgramInfo => { const aShape = inputs[0].dims.slice(); const bShape = inputs[1].dims.slice(); const [M, N] = GemmUtil.getShapeOfGemmResult( aShape, attributes.transA, bShape, attributes.transB, inputs.length === 3 ? inputs[2].dims : undefined, ); const outputShape = [M, N]; if (!outputShape) { throw new Error("Can't use gemm on the given tensors"); } let sharedDim = aShape[aShape.length - 1]; let line = ''; if (attributes.transA) { sharedDim = aShape[0]; } if (attributes.transA && attributes.transB) { line = 'value += _A_T(a) * _B_T(b);'; } else if (attributes.transA && !attributes.transB) { line = 'value += _A_T(a) * _B(b);'; } else if (!attributes.transA && attributes.transB) { line = 'value += _A(a) * _B_T(b);'; } else if (!attributes.transA && !attributes.transB) { line = 'value += _A(a) * _B(b);'; } const rank = outputShape.length; const declareC = inputs.length === 3 ? `int c[${inputs[2].dims.length}];` : ''; const broadcastC = inputs.length === 3 ? 'bcastIndices_C(indices, c);' : ''; const calculateC = inputs.length === 3 ? 'value += beta * _C(c);' : ''; const shaderSource = ` float process(int indices[${rank}]) { int a[${rank}]; int b[${rank}]; ${declareC} copyVec(indices, a); copyVec(indices, b); ${broadcastC} float value = 0.0; for (int k=0; k<${sharedDim}; ++k) { a[${rank - 1}] = k; b[${rank - 2}] = k; ${line} } value = value * alpha; ${calculateC} return value; }`; return { ...metadata, output: { dims: outputShape, type: inputs[0].type, textureType: TextureType.unpacked }, variables: [ { name: 'alpha', type: 'float', data: attributes.alpha }, { name: 'beta', type: 'float', data: attributes.beta }, ], shaderSource, }; }; const validateInputs = (inputs: Tensor[], attributes: GemmAttributes): void => { if (!inputs) { throw new Error('Input is missing'); } if (attributes.isOptionalC && (inputs.length < 2 || inputs.length > 3)) { throw new Error('Invaid input shape.'); } if (!attributes.isOptionalC && inputs.length !== 3) { throw new Error('Gemm requires 3 inputs'); } // 'C' can be of dimensionality 1 or 2 only if (inputs.length === 3 && inputs[2].dims.length !== 1 && inputs[2].dims.length !== 2) { throw new Error('Invalid input shape of C'); } if ( (inputs[0].type !== 'float32' && inputs[0].type !== 'float64') || (inputs[1].type !== 'float32' && inputs[1].type !== 'float64') || (inputs.length === 3 && inputs[2].type !== 'float32' && inputs[2].type !== 'float64') ) { throw new Error('Invalid input type.'); } if (inputs[0].type !== inputs[1].type || (inputs.length === 3 && inputs[0].type !== inputs[2].type)) { throw new Error('Input types are mismatched'); } };