@thecodingwhale/cv-processor

Version:

CV Processor to extract structured data from PDF resumes using TypeScript

16 lines (15 loc) • 462 B

TypeScript

/**
 * Pulls the textual content out of PDF documents.
 */
export declare class TextExtractor {
  /**
   * Reads text from a PDF file, falling back to OCR if needed.
   *
   * @param pdfPath - Path of the PDF file to read.
   * @returns A promise that resolves to the extracted text.
   */
  extractTextFromPDF(pdfPath: string): Promise<string>;

  /**
   * OCR-based text extraction using Tesseract.js.
   *
   * Note: the implementation is intentionally simplified, because converting
   * PDF pages to images is more complex in Node.js than in Python.
   */
  private extractTextWithOCR;
}