@papra/lecture
Version:
A simple library to extract text from files
39 lines (34 loc) • 1.05 kB
TypeScript
import { DeepPartial } from '@corentinth/chisels';
/**
 * Fully-specified configuration shape for text extraction.
 *
 * The only section declared here is `tesseract`.
 * NOTE(review): presumably these are settings for the Tesseract OCR engine —
 * confirm against the implementation.
 */
type ExtractorConfig = {
tesseract: {
// NOTE(review): presumably the language identifiers handed to OCR; the set of
// accepted values is not visible in this declaration file — confirm.
languages: string[];
};
};
/**
 * Configuration type accepted by the extraction functions: either `undefined`
 * or `ExtractorConfig` wrapped in `DeepPartial` from `@corentinth/chisels`.
 *
 * NOTE(review): presumably `DeepPartial` makes every nested field optional and
 * omitted fields fall back to defaults — neither is visible here; confirm.
 */
type PartialExtractorConfig = undefined | DeepPartial<ExtractorConfig>;
/**
 * String array exported by the package under the name `ocrLanguages`.
 *
 * NOTE(review): presumably the language identifiers usable in
 * `tesseract.languages`; the actual contents are not visible in this
 * declaration file — confirm.
 */
declare const ocrLanguages: string[];
/**
 * Extracts text from a file supplied as raw bytes plus its MIME type.
 *
 * Takes a single options object:
 * - `arrayBuffer`: the file content.
 * - `mimeType`: the content's MIME type.
 *   NOTE(review): presumably used to choose which extractor runs — confirm.
 * - `config`: optional, possibly partial, extractor configuration.
 *
 * @returns A promise resolving to an object with `extractorName` and
 * `textContent` (each may be `undefined`) and an optional `error`.
 * NOTE(review): the optional `error` field suggests failures are reported in
 * the result rather than thrown, and `undefined` values presumably mean no
 * extractor matched or no text was produced — confirm against the implementation.
 */
declare function extractText({ arrayBuffer, mimeType, config: rawConfig }: {
arrayBuffer: ArrayBuffer;
mimeType: string;
config?: PartialExtractorConfig;
}): Promise<{
extractorName: string | undefined;
textContent: string | undefined;
error?: Error;
}>;
/**
 * Extracts text from a `Blob`.
 *
 * Takes a single options object:
 * - `blob`: the content to extract text from.
 *   NOTE(review): presumably the blob's bytes and `type` are used as the
 *   content and MIME type — not visible here; confirm.
 * - `config`: optional, possibly partial, extractor configuration.
 *
 * @returns A promise resolving to an object with `extractorName` and
 * `textContent` (each may be `undefined`) and an optional `error`.
 * NOTE(review): the optional `error` field suggests failures are reported in
 * the result rather than thrown — confirm against the implementation.
 */
declare function extractTextFromBlob({ blob, config }: {
blob: Blob;
config?: PartialExtractorConfig;
}): Promise<{
extractorName: string | undefined;
textContent: string | undefined;
error?: Error;
}>;
/**
 * Extracts text from a `File`.
 *
 * Takes a single options object:
 * - `file`: the file to extract text from.
 *   NOTE(review): presumably the file's bytes and `type` are used as the
 *   content and MIME type — not visible here; confirm.
 * - `config`: optional, possibly partial, extractor configuration.
 *
 * @returns A promise resolving to an object with `extractorName` and
 * `textContent` (each may be `undefined`) and an optional `error`.
 * NOTE(review): the optional `error` field suggests failures are reported in
 * the result rather than thrown — confirm against the implementation.
 */
declare function extractTextFromFile({ file, config }: {
file: File;
config?: PartialExtractorConfig;
}): Promise<{
extractorName: string | undefined;
textContent: string | undefined;
error?: Error;
}>;
// Public API: the three extraction functions and the `ocrLanguages` array.
// The `ExtractorConfig` and `PartialExtractorConfig` types are not part of this export list.
export { extractText, extractTextFromBlob, extractTextFromFile, ocrLanguages };