zon-format
Version:
ZON: The most token-efficient serialization format for LLMs - beats CSV, TOON, JSON, and all competitors
26 lines (25 loc) • 626 B
TypeScript
/**
 * Configuration object accepted by the `ZonSplitter` constructor.
 *
 * Only `maxTokens` is mandatory; the other two members may be omitted.
 */
export interface SplitOptions {
  /**
   * Required token limit.
   * NOTE(review): presumably the budget applied to each chunk — confirm
   * against the implementation, which is not part of this declaration.
   */
  maxTokens: number;

  /**
   * Optional overlap setting.
   * NOTE(review): unit (items, tokens, characters) and default value are not
   * visible in this declaration — confirm before relying on either.
   */
  overlap?: number;

  /**
   * Optional token ratio.
   * NOTE(review): presumably the factor used to convert between tokens and
   * characters (the splitter keeps a private `maxChars` field) — confirm the
   * direction of the ratio and its default against the implementation.
   */
  tokenRatio?: number;
}
/**
 * Value returned by `ZonSplitter.split`: the encoded chunk strings plus a
 * metadata record describing them.
 */
export interface ChunkResult {
  /** The encoded chunks, one string per chunk. */
  chunks: string[];

  /** Summary figures reported alongside the chunks. */
  metadata: {
    /**
     * Count of chunks.
     * NOTE(review): presumably equal to `chunks.length` — confirm.
     */
    totalChunks: number;

    /**
     * Token total across the result.
     * NOTE(review): whether this is measured or estimated is not visible
     * in this declaration — confirm against the implementation.
     */
    totalTokens: number;

    /**
     * One size figure per chunk.
     * NOTE(review): the unit (tokens vs. characters) and ordering relative
     * to `chunks` are not visible here — confirm before use.
     */
    chunkSizes: number[];
  };
}
/**
 * Ambient declaration of the splitter that breaks an array of data into
 * ZON-encoded chunks. Only the public surface is described here; the
 * implementation lives in the compiled module.
 */
export declare class ZonSplitter {
  /*
   * Private state. Types of private members are elided in declaration
   * output, so nothing about their representation can be read from here.
   * NOTE(review): `maxChars` presumably holds a character budget derived
   * from `SplitOptions` — confirm against the implementation.
   */
  private maxChars;
  private overlap;

  /**
   * Creates a splitter from the supplied options.
   *
   * @param options - Splitting configuration; `maxTokens` is required.
   */
  constructor(options: SplitOptions);

  /**
   * Encodes a large array of data as a series of ZON chunks.
   *
   * @param data - Array of objects to split
   * @returns The encoded chunk strings together with their metadata
   */
  split(data: any[]): ChunkResult;
}