UNPKG

gpt-tokenizer

Version:

A pure JavaScript implementation of a BPE tokenizer (Encoder/Decoder) for GPT-2 / GPT-3 / GPT-4 and other OpenAI models

23 lines 1.01 kB
import { Cl100KBase } from './encodingParams/cl100k_base.js'; import { O200KBase } from './encodingParams/o200k_base.js'; import { P50KBase } from './encodingParams/p50k_base.js'; import { P50KEdit } from './encodingParams/p50k_edit.js'; import { R50KBase } from './encodingParams/r50k_base.js'; export function getEncodingParams(encodingName, getMergeableRanks) { const mergeableBytePairRanks = getMergeableRanks(encodingName); switch (encodingName.toLowerCase()) { case 'r50k_base': return R50KBase(mergeableBytePairRanks); case 'p50k_base': return P50KBase(mergeableBytePairRanks); case 'p50k_edit': return P50KEdit(mergeableBytePairRanks); case 'cl100k_base': return Cl100KBase(mergeableBytePairRanks); case 'o200k_base': return O200KBase(mergeableBytePairRanks); default: throw new Error(`Unknown encoding name: ${encodingName}`); } } //# sourceMappingURL=modelParams.js.map