react-native-executorch

import { BaseModule } from '../BaseModule'; import { RnExecutorchErrorCode } from '../../errors/ErrorCodes'; import { RnExecutorchError } from '../../errors/errorUtils'; import { Frame, PixelData, ScalarType } from '../../types/common'; export function isPixelData(input: unknown): input is PixelData { return ( typeof input === 'object' && input !== null && 'dataPtr' in input && input.dataPtr instanceof Uint8Array && 'sizes' in input && Array.isArray(input.sizes) && input.sizes.length === 3 && 'scalarType' in input && input.scalarType === ScalarType.BYTE ); } /** * Base class for computer vision models that support multiple input types. * * VisionModule extends BaseModule with: * - Unified `forward()` API accepting string paths or raw pixel data * - `runOnFrame` getter for real-time VisionCamera frame processing * - Shared frame processor creation logic * * Subclasses implement model-specific loading logic and may override `forward` for typed signatures. * @category Typescript API */ export abstract class VisionModule<TOutput> extends BaseModule { /** * Synchronous worklet function for real-time VisionCamera frame processing. * * Only available after the model is loaded. * * **Use this for VisionCamera frame processing in worklets.** * For async processing, use `forward()` instead. * @example * ```typescript * const model = new ClassificationModule(); * await model.load({ modelSource: MODEL }); * * // Use the functional form of setState to store the worklet — passing it * // directly would cause React to invoke it immediately as an updater fn. * const [runOnFrame, setRunOnFrame] = useState(null); * setRunOnFrame(() => model.runOnFrame); * * const frameOutput = useFrameOutput({ * onFrame(frame) { * 'worklet'; * if (!runOnFrame) return; * const result = runOnFrame(frame, isFrontCamera); * frame.dispose(); * } * }); * ``` * @returns A worklet function for frame processing. * @throws {RnExecutorchError} If the model is not loaded. */ get runOnFrame(): (frame: Frame, ...args: any[]) => TOutput { if (!this.nativeModule) { throw new RnExecutorchError( RnExecutorchErrorCode.ModuleNotLoaded, 'The model is currently not loaded. Please load the model before calling runOnFrame().' ); } // Extract pure JSI function reference (runs on JS thread) const nativeGenerateFromFrame = this.nativeModule.generateFromFrame; // Return worklet that captures ONLY the JSI function return (frame: Frame, isFrontCamera: boolean, ...args: any[]): TOutput => { 'worklet'; let nativeBuffer: { pointer: bigint; release(): void } | null = null; try { nativeBuffer = frame.getNativeBuffer(); /** Currently isMirrored is never set to true in VisionCamera. That's why we need to use our own property to determine if we need to mirror the results */ const frameData = { nativeBuffer: nativeBuffer.pointer, orientation: frame.orientation, isMirrored: isFrontCamera, }; return nativeGenerateFromFrame(frameData, ...args); } finally { if (nativeBuffer?.release) { nativeBuffer.release(); } } }; } /** * Executes the model's forward pass with automatic input type detection. * * Supports two input types: * 1. **String path/URI**: File path, URL, or Base64-encoded string * 2. **PixelData**: Raw pixel data from image libraries (e.g., NitroImage) * * **Note**: For VisionCamera frame processing, use `runOnFrame` instead. * This method is async and cannot be called in worklet context. * @param input - Image source (string path or PixelData object) * @param args - Additional model-specific arguments * @returns A Promise that resolves to the model output. * @example * ```typescript * // String path (async) * const result1 = await model.forward('file:///path/to/image.jpg'); * * // Pixel data (async) * const result2 = await model.forward({ * dataPtr: new Uint8Array(pixelBuffer), * sizes: [480, 640, 3], * scalarType: ScalarType.BYTE * }); * * // For VisionCamera frames, use runOnFrame in worklet: * const frameOutput = useFrameOutput({ * onFrame(frame) { * 'worklet'; * if (!model.runOnFrame) return; * const result = model.runOnFrame(frame); * } * }); * ``` */ async forward(input: string | PixelData, ...args: any[]): Promise<TOutput> { if (this.nativeModule == null) throw new RnExecutorchError( RnExecutorchErrorCode.ModuleNotLoaded, 'The model is currently not loaded. Please load the model before calling forward().' ); // Type detection and routing if (typeof input === 'string') { return await this.nativeModule.generateFromString(input, ...args); } else if (isPixelData(input)) { return await this.nativeModule.generateFromPixels(input, ...args); } else { throw new RnExecutorchError( RnExecutorchErrorCode.InvalidArgument, 'Invalid input: expected string path or PixelData object. For VisionCamera frames, use runOnFrame instead.' ); } } }