UNPKG

onnxruntime-web

Version:

A Javascript library for running ONNX models on browsers

97 lines (84 loc) 3.85 kB
// Copyright (c) Microsoft Corporation. All rights reserved. // Licensed under the MIT License. import { Backend, env, InferenceSession, InferenceSessionHandler } from 'onnxruntime-common'; import { initializeOrtEp, initializeWebAssemblyAndOrtRuntime } from './wasm/proxy-wrapper'; import { OnnxruntimeWebAssemblySessionHandler } from './wasm/session-handler-inference'; /** * This function initializes all flags for WebAssembly. * * Those flags are accessible from `ort.env.wasm`. Users are allow to set those flags before the first inference session * being created, to override default value. */ export const initializeFlags = (): void => { if (typeof env.wasm.initTimeout !== 'number' || env.wasm.initTimeout < 0) { env.wasm.initTimeout = 0; } const simd = env.wasm.simd; if (typeof simd !== 'boolean' && simd !== undefined && simd !== 'fixed' && simd !== 'relaxed') { // eslint-disable-next-line no-console console.warn( `Property "env.wasm.simd" is set to unknown value "${simd}". Reset it to \`false\` and ignore SIMD feature checking.`, ); env.wasm.simd = false; } if (typeof env.wasm.proxy !== 'boolean') { env.wasm.proxy = false; } if (typeof env.wasm.trace !== 'boolean') { env.wasm.trace = false; } if (typeof env.wasm.numThreads !== 'number' || !Number.isInteger(env.wasm.numThreads) || env.wasm.numThreads <= 0) { // The following logic only applies when `ort.env.wasm.numThreads` is not set by user. We will always honor user's // setting if it is provided. // Browser: when crossOriginIsolated is false, SharedArrayBuffer is not available so WebAssembly threads will not // work. In this case, we will set numThreads to 1. // // There is an exception: when the browser is configured to force-enable SharedArrayBuffer (e.g. Chromuim with // --enable-features=SharedArrayBuffer), it is possible that `self.crossOriginIsolated` is false and // SharedArrayBuffer is available at the same time. This is usually for testing. In this case, we will still set // numThreads to 1 here. If we want to enable multi-threading in test, we should set `ort.env.wasm.numThreads` to a // value greater than 1. if (typeof self !== 'undefined' && !self.crossOriginIsolated) { env.wasm.numThreads = 1; } else { const numCpuLogicalCores = typeof navigator === 'undefined' ? require('node:os').cpus().length : navigator.hardwareConcurrency; env.wasm.numThreads = Math.min(4, Math.ceil((numCpuLogicalCores || 1) / 2)); } } }; export class OnnxruntimeWebAssemblyBackend implements Backend { /** * This function initializes the WebAssembly backend. * * This function will be called only once for each backend name. It will be called the first time when * `ort.InferenceSession.create()` is called with a registered backend name. * * @param backendName - the registered backend name. */ async init(backendName: string): Promise<void> { // populate wasm flags initializeFlags(); // init wasm await initializeWebAssemblyAndOrtRuntime(); // performe EP specific initialization await initializeOrtEp(backendName); } createInferenceSessionHandler( path: string, options?: InferenceSession.SessionOptions, ): Promise<InferenceSessionHandler>; createInferenceSessionHandler( buffer: Uint8Array, options?: InferenceSession.SessionOptions, ): Promise<InferenceSessionHandler>; async createInferenceSessionHandler( pathOrBuffer: string | Uint8Array, options?: InferenceSession.SessionOptions, ): Promise<InferenceSessionHandler> { const handler = new OnnxruntimeWebAssemblySessionHandler(); await handler.loadModel(pathOrBuffer, options); return handler; } } export const wasmBackend = new OnnxruntimeWebAssemblyBackend();