file2md

Version:

A TypeScript library for converting various document types (PDF, DOCX, XLSX, PPTX, HWP, HWPX) into Markdown with image and layout preservation

github.com/ricky-clevi/file2md

ricky-clevi/file2md

50 lines • 1.59 kB

TypeScript

View Raw

import type JSZip from 'jszip'; import type { Buffer } from 'node:buffer'; import type { ImageData } from '../types/interfaces.js'; export declare class ImageExtractor { private readonly outputDir; private imageCounter; private readonly extractedImages; constructor(outputDir?: string); /** * Extract images from a ZIP archive (DOCX, XLSX, PPTX) */ extractImagesFromZip(zip: JSZip, basePath?: string): Promise<readonly ImageData[]>; /** * Save an image buffer to disk */ saveImage(buffer: Buffer, originalPath: string, basePath?: string): Promise<string | null>; /** * Check if a file path represents an image */ isImageFile(filePath: string): boolean; /** * Get image format from file extension */ private getImageFormat; /** * Get markdown reference for an image by its original path */ getImageReference(originalPath: string, basePath?: string): string | null; /** * Create markdown image reference using HTML img tag for better compatibility */ getImageMarkdown(description?: string, imagePath?: string): string; /** * Reset the image counter and clear extracted images map */ reset(): void; /** * Get the output directory for images */ get imageDirectory(): string; /** * Get the current image counter */ get currentImageCount(): number; /** * Get all extracted image mappings */ get extractedImageMappings(): ReadonlyMap<string, string>; } //# sourceMappingURL=image-extractor.d.ts.map