UNPKG

tokenx

Version:

GPT token estimation and context size utilities without a full tokenizer

31 lines (28 loc) 2.39 kB
/**
 * Tokenizer encoding families used by OpenAI models.
 * NOTE(review): which encoding maps to which model is resolved elsewhere —
 * this alias only enumerates the known encoding names.
 */
type EncodingType = 'gpt2' | 'r50k_base' | 'p50k_base' | 'p50k_edit' | 'cl100k_base' | 'o200k_base';

/**
 * Canonical OpenAI model identifiers recognized by this library.
 * Includes legacy completion/edit/embedding/search models as well as
 * chat models (gpt-3.5-turbo, gpt-4, gpt-4o families).
 */
type ModelName = 'davinci-002' | 'babbage-002' | 'text-davinci-003' | 'text-davinci-002' | 'text-davinci-001' | 'text-curie-001' | 'text-babbage-001' | 'text-ada-001' | 'davinci' | 'curie' | 'babbage' | 'ada' | 'code-davinci-002' | 'code-davinci-001' | 'code-cushman-002' | 'code-cushman-001' | 'davinci-codex' | 'cushman-codex' | 'text-davinci-edit-001' | 'code-davinci-edit-001' | 'text-embedding-ada-002' | 'text-similarity-davinci-001' | 'text-similarity-curie-001' | 'text-similarity-babbage-001' | 'text-similarity-ada-001' | 'text-search-davinci-doc-001' | 'text-search-curie-doc-001' | 'text-search-babbage-doc-001' | 'text-search-ada-doc-001' | 'code-search-babbage-code-001' | 'code-search-ada-code-001' | 'gpt2' | 'gpt-3.5-turbo' | 'gpt-35-turbo' | 'gpt-3.5-turbo-0301' | 'gpt-3.5-turbo-0613' | 'gpt-3.5-turbo-1106' | 'gpt-3.5-turbo-0125' | 'gpt-3.5-turbo-16k' | 'gpt-3.5-turbo-16k-0613' | 'gpt-3.5-turbo-instruct' | 'gpt-3.5-turbo-instruct-0914' | 'gpt-4' | 'gpt-4-0314' | 'gpt-4-0613' | 'gpt-4-32k' | 'gpt-4-32k-0314' | 'gpt-4-32k-0613' | 'gpt-4-turbo' | 'gpt-4-turbo-2024-04-09' | 'gpt-4-turbo-preview' | 'gpt-4-1106-preview' | 'gpt-4-0125-preview' | 'gpt-4-vision-preview' | 'gpt-4o' | 'gpt-4o-2024-05-13';

/**
 * Resolve a model name to a canonical {@link ModelName}.
 *
 * Accepts arbitrary strings (the parameter is deliberately `string`, not
 * `ModelName`), so callers can pass aliases or unknown names.
 * NOTE(review): behavior for unrecognized names (throw vs. fallback) is not
 * visible from this declaration — check the implementation before relying on it.
 */
declare function resolveModelName(modelName: string): ModelName;

/**
 * Returns the context window size of the model, in tokens — i.e. the total
 * budget shared by the prompt and the response.
 */
declare function getModelContextSize(modelName: string): number;

/**
 * Estimate the number of tokens in a string without running a real tokenizer
 * (see the package description). The input is optional; presumably a missing
 * or empty input yields 0 — confirm against the implementation.
 */
declare function approximateTokenSize(input?: string): number;

/**
 * Returns the maximum number of tokens available for the model's response,
 * given the prompt: the model's context size minus the estimated prompt size
 * and the reserved `maxTokensInResponse`.
 */
declare function approximateMaxTokenSize({ prompt, modelName, maxTokensInResponse, }: {
    prompt: string;
    modelName: ModelName;
    /** The maximum number of tokens to generate in the reply.
     * 1000 tokens are roughly 750 English words. */
    maxTokensInResponse?: number;
}): number;

/**
 * Checks whether the estimated token count of `input` is within `tokenLimit`.
 * Returns `true` if it fits, `false` otherwise — this is a pure check; it does
 * not truncate or otherwise modify the input.
 */
declare function isWithinTokenLimit(input: string, tokenLimit: number): boolean;

export { type EncodingType, type ModelName, approximateMaxTokenSize, approximateTokenSize, getModelContextSize, isWithinTokenLimit, resolveModelName };