node-llama-cpp
Run AI models locally on your machine with Node.js bindings for llama.cpp. Enforce a JSON schema on the model output at the generation level.
import retry from "async-retry";
import { ModelFileAccessTokens } from "../utils/modelFileAccesTokens.js";
import { GgufFileInfo } from "./types/GgufFileInfoTypes.js";
/**
* Read a GGUF file and return its metadata and tensor info (unless `readTensorInfo` is set to `false`).
* Only the parts of the file required for the metadata and tensor info are read.
 * @param pathOrUri - a local filesystem path or a network URL of a GGUF file
* @param options
*/
export declare function readGgufFileInfo(pathOrUri: string, { readTensorInfo, sourceType, ignoreKeys, logWarnings, fetchRetryOptions, fetchHeaders, spliceSplitFiles, signal, tokens }?: {
/**
* Whether to read the tensor info from the file's header.
*
* Defaults to `true`.
*/
readTensorInfo?: boolean;
/**
 * Set to a specific value to force using only that source type.
* By default, it detects whether the path is a network URL or a filesystem path and uses the appropriate reader accordingly.
*/
sourceType?: "network" | "filesystem";
/**
* Metadata keys to ignore when parsing the metadata.
* For example, `["tokenizer.ggml.tokens"]`
*/
ignoreKeys?: string[];
/**
 * Whether to log warnings.
*
* Defaults to `true`.
*/
logWarnings?: boolean;
/** Relevant only when fetching from a network */
fetchRetryOptions?: retry.Options;
/** Relevant only when fetching from a network */
fetchHeaders?: Record<string, string>;
/**
* When split files are detected, read the metadata of the first file and splice the tensor info from all the parts.
*
* Defaults to `true`.
*/
spliceSplitFiles?: boolean;
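/** An `AbortSignal` that can be used to abort reading the file */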
signal?: AbortSignal;
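/** Access tokens for model files that require authentication; relevant only when fetching from a network */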
tokens?: ModelFileAccessTokens;
}): Promise<GgufFileInfo>;
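Example usage (a minimal sketch, not part of the declaration file above): it assumes `readGgufFileInfo` is re-exported from the package's main entry point and that the local path and URL below are placeholders for a GGUF file you actually have access to; the exact shape of the returned object is described by `GgufFileInfo` in `GgufFileInfoTypes.js`.

import {readGgufFileInfo} from "node-llama-cpp";

// Read metadata and tensor info from a local GGUF file
// (the source type is detected automatically from the path)
const localInfo = await readGgufFileInfo("./models/my-model.gguf");
console.log(localInfo);

// Read only the metadata of a remote GGUF file, skipping the large tokenizer
// token list and allowing the network request to be aborted
const abortController = new AbortController();
const remoteInfo = await readGgufFileInfo("https://example.com/my-model.gguf", {
    readTensorInfo: false,
    sourceType: "network",
    ignoreKeys: ["tokenizer.ggml.tokens"],
    signal: abortController.signal
});
console.log(remoteInfo);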