// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
import { APIResource } from '../../../resource';
import { isRequestOptions } from '../../../core';
import { APIPromise } from '../../../core';
import * as Core from '../../../core';
import * as CompletionsCompletionsAPI from './completions';
import * as CompletionsAPI from '../../completions';
import * as Shared from '../../shared';
import * as MessagesAPI from './messages';
import { MessageListParams, Messages } from './messages';
import { CursorPage, type CursorPageParams } from '../../../pagination';
import { Stream } from '../../../streaming';
export class Completions extends APIResource {
messages: MessagesAPI.Messages = new MessagesAPI.Messages(this._client);
/**
* **Starting a new project?** We recommend trying
* [Responses](https://platform.openai.com/docs/api-reference/responses) to take
* advantage of the latest OpenAI platform features. Compare
* [Chat Completions with Responses](https://platform.openai.com/docs/guides/responses-vs-chat-completions?api-mode=responses).
*
* ---
*
* Creates a model response for the given chat conversation. Learn more in the
* [text generation](https://platform.openai.com/docs/guides/text-generation),
* [vision](https://platform.openai.com/docs/guides/vision), and
* [audio](https://platform.openai.com/docs/guides/audio) guides.
*
* Parameter support can differ depending on the model used to generate the
* response, particularly for newer reasoning models. Parameters that are only
* supported for reasoning models are noted below. For the current state of
* unsupported parameters in reasoning models,
* [refer to the reasoning guide](https://platform.openai.com/docs/guides/reasoning).
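 *
 * @example
 * A minimal sketch of a non-streaming call; the model name and prompt are
 * illustrative placeholders:
 *
 * ```ts
 * import OpenAI from 'openai';
 *
 * const client = new OpenAI();
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: 'Say hello.' }],
 * });
 * console.log(completion.choices[0].message.content);
 * ```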
*/
create(
body: ChatCompletionCreateParamsNonStreaming,
options?: Core.RequestOptions,
): APIPromise<ChatCompletion>;
create(
body: ChatCompletionCreateParamsStreaming,
options?: Core.RequestOptions,
): APIPromise<Stream<ChatCompletionChunk>>;
create(
body: ChatCompletionCreateParamsBase,
options?: Core.RequestOptions,
): APIPromise<Stream<ChatCompletionChunk> | ChatCompletion>;
create(
body: ChatCompletionCreateParams,
options?: Core.RequestOptions,
): APIPromise<ChatCompletion> | APIPromise<Stream<ChatCompletionChunk>> {
return this._client.post('/chat/completions', { body, ...options, stream: body.stream ?? false }) as
| APIPromise<ChatCompletion>
| APIPromise<Stream<ChatCompletionChunk>>;
}
/**
* Get a stored chat completion. Only Chat Completions that have been created with
* the `store` parameter set to `true` will be returned.
*/
retrieve(completionId: string, options?: Core.RequestOptions): Core.APIPromise<ChatCompletion> {
return this._client.get(`/chat/completions/${completionId}`, options);
}
/**
* Modify a stored chat completion. Only Chat Completions that have been created
* with the `store` parameter set to `true` can be modified. Currently, the only
* supported modification is to update the `metadata` field.
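 *
 * @example
 * A minimal sketch; the completion ID and metadata values are placeholders, and
 * `client` is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const updated = await client.chat.completions.update('chatcmpl-123', {
 *   metadata: { topic: 'demo' },
 * });
 * ```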
*/
update(
completionId: string,
body: ChatCompletionUpdateParams,
options?: Core.RequestOptions,
): Core.APIPromise<ChatCompletion> {
return this._client.post(`/chat/completions/${completionId}`, { body, ...options });
}
/**
* List stored Chat Completions. Only Chat Completions that have been stored with
* the `store` parameter set to `true` will be returned.
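 *
 * @example
 * A minimal sketch using the page's async iterator to walk all stored
 * completions; `client` is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * for await (const completion of client.chat.completions.list({ limit: 20 })) {
 *   console.log(completion.id);
 * }
 * ```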
*/
list(
query?: ChatCompletionListParams,
options?: Core.RequestOptions,
): Core.PagePromise<ChatCompletionsPage, ChatCompletion>;
list(options?: Core.RequestOptions): Core.PagePromise<ChatCompletionsPage, ChatCompletion>;
list(
query: ChatCompletionListParams | Core.RequestOptions = {},
options?: Core.RequestOptions,
): Core.PagePromise<ChatCompletionsPage, ChatCompletion> {
if (isRequestOptions(query)) {
return this.list({}, query);
}
return this._client.getAPIList('/chat/completions', ChatCompletionsPage, { query, ...options });
}
/**
* Delete a stored chat completion. Only Chat Completions that have been created
* with the `store` parameter set to `true` can be deleted.
*/
del(completionId: string, options?: Core.RequestOptions): Core.APIPromise<ChatCompletionDeleted> {
return this._client.delete(`/chat/completions/${completionId}`, options);
}
}
export class ChatCompletionsPage extends CursorPage<ChatCompletion> {}
export class ChatCompletionStoreMessagesPage extends CursorPage<ChatCompletionStoreMessage> {}
/**
 * Represents a chat completion response returned by the model, based on the provided
* input.
*/
export interface ChatCompletion {
/**
* A unique identifier for the chat completion.
*/
id: string;
/**
* A list of chat completion choices. Can be more than one if `n` is greater
* than 1.
*/
choices: Array<ChatCompletion.Choice>;
/**
* The Unix timestamp (in seconds) of when the chat completion was created.
*/
created: number;
/**
* The model used for the chat completion.
*/
model: string;
/**
* The object type, which is always `chat.completion`.
*/
object: 'chat.completion';
/**
* Specifies the latency tier to use for processing the request. This parameter is
* relevant for customers subscribed to the scale tier service:
*
* - If set to 'auto', and the Project is Scale tier enabled, the system will
* utilize scale tier credits until they are exhausted.
* - If set to 'auto', and the Project is not Scale tier enabled, the request will
* be processed using the default service tier with a lower uptime SLA and no
 *   latency guarantee.
 * - If set to 'default', the request will be processed using the default service
 *   tier with a lower uptime SLA and no latency guarantee.
* - If set to 'flex', the request will be processed with the Flex Processing
* service tier.
* [Learn more](https://platform.openai.com/docs/guides/flex-processing).
* - When not set, the default behavior is 'auto'.
*
* When this parameter is set, the response body will include the `service_tier`
* utilized.
*/
service_tier?: 'auto' | 'default' | 'flex' | null;
/**
* This fingerprint represents the backend configuration that the model runs with.
*
* Can be used in conjunction with the `seed` request parameter to understand when
* backend changes have been made that might impact determinism.
*/
system_fingerprint?: string;
/**
* Usage statistics for the completion request.
*/
usage?: CompletionsAPI.CompletionUsage;
}
export namespace ChatCompletion {
export interface Choice {
/**
* The reason the model stopped generating tokens. This will be `stop` if the model
* hit a natural stop point or a provided stop sequence, `length` if the maximum
* number of tokens specified in the request was reached, `content_filter` if
* content was omitted due to a flag from our content filters, `tool_calls` if the
* model called a tool, or `function_call` (deprecated) if the model called a
* function.
*/
finish_reason: 'stop' | 'length' | 'tool_calls' | 'content_filter' | 'function_call';
/**
* The index of the choice in the list of choices.
*/
index: number;
/**
* Log probability information for the choice.
*/
logprobs: Choice.Logprobs | null;
/**
* A chat completion message generated by the model.
*/
message: CompletionsCompletionsAPI.ChatCompletionMessage;
}
export namespace Choice {
/**
* Log probability information for the choice.
*/
export interface Logprobs {
/**
* A list of message content tokens with log probability information.
*/
content: Array<CompletionsCompletionsAPI.ChatCompletionTokenLogprob> | null;
/**
* A list of message refusal tokens with log probability information.
*/
refusal: Array<CompletionsCompletionsAPI.ChatCompletionTokenLogprob> | null;
}
}
}
/**
* Messages sent by the model in response to user messages.
*/
export interface ChatCompletionAssistantMessageParam {
/**
* The role of the messages author, in this case `assistant`.
*/
role: 'assistant';
/**
* Data about a previous audio response from the model.
* [Learn more](https://platform.openai.com/docs/guides/audio).
*/
audio?: ChatCompletionAssistantMessageParam.Audio | null;
/**
* The contents of the assistant message. Required unless `tool_calls` or
* `function_call` is specified.
*/
content?: string | Array<ChatCompletionContentPartText | ChatCompletionContentPartRefusal> | null;
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
function_call?: ChatCompletionAssistantMessageParam.FunctionCall | null;
/**
* An optional name for the participant. Provides the model information to
* differentiate between participants of the same role.
*/
name?: string;
/**
* The refusal message by the assistant.
*/
refusal?: string | null;
/**
* The tool calls generated by the model, such as function calls.
*/
tool_calls?: Array<ChatCompletionMessageToolCall>;
}
export namespace ChatCompletionAssistantMessageParam {
/**
* Data about a previous audio response from the model.
* [Learn more](https://platform.openai.com/docs/guides/audio).
*/
export interface Audio {
/**
* Unique identifier for a previous audio response from the model.
*/
id: string;
}
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
export interface FunctionCall {
/**
* The arguments to call the function with, as generated by the model in JSON
* format. Note that the model does not always generate valid JSON, and may
* hallucinate parameters not defined by your function schema. Validate the
* arguments in your code before calling your function.
*/
arguments: string;
/**
* The name of the function to call.
*/
name: string;
}
}
/**
* If the audio output modality is requested, this object contains data about the
* audio response from the model.
* [Learn more](https://platform.openai.com/docs/guides/audio).
*/
export interface ChatCompletionAudio {
/**
* Unique identifier for this audio response.
*/
id: string;
/**
* Base64 encoded audio bytes generated by the model, in the format specified in
* the request.
*/
data: string;
/**
* The Unix timestamp (in seconds) for when this audio response will no longer be
* accessible on the server for use in multi-turn conversations.
*/
expires_at: number;
/**
* Transcript of the audio generated by the model.
*/
transcript: string;
}
/**
* Parameters for audio output. Required when audio output is requested with
* `modalities: ["audio"]`.
* [Learn more](https://platform.openai.com/docs/guides/audio).
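 *
 * @example
 * A minimal sketch of requesting audio output; the model name is illustrative
 * and `client` is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o-audio-preview',
 *   modalities: ['text', 'audio'],
 *   audio: { voice: 'alloy', format: 'wav' },
 *   messages: [{ role: 'user', content: 'Say hello.' }],
 * });
 * // Base64-encoded audio bytes, per ChatCompletionAudio above.
 * const audioData = completion.choices[0].message.audio?.data;
 * ```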
*/
export interface ChatCompletionAudioParam {
/**
 * Specifies the output audio format. Must be one of `wav`, `aac`, `mp3`, `flac`,
 * `opus`, or `pcm16`.
*/
format: 'wav' | 'aac' | 'mp3' | 'flac' | 'opus' | 'pcm16';
/**
 * The voice the model uses to respond. Supported voices are `alloy`, `ash`,
 * `ballad`, `coral`, `echo`, `fable`, `nova`, `onyx`, `sage`, `shimmer`, and
 * `verse`.
*/
voice:
| (string & {})
| 'alloy'
| 'ash'
| 'ballad'
| 'coral'
| 'echo'
| 'fable'
| 'onyx'
| 'nova'
| 'sage'
| 'shimmer'
| 'verse';
}
/**
* Represents a streamed chunk of a chat completion response returned by the model,
* based on the provided input.
* [Learn more](https://platform.openai.com/docs/guides/streaming-responses).
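 *
 * @example
 * A minimal sketch of consuming chunks from a streaming request; `client` is
 * assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const stream = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: 'Tell me a short story.' }],
 *   stream: true,
 * });
 * for await (const chunk of stream) {
 *   process.stdout.write(chunk.choices[0]?.delta?.content ?? '');
 * }
 * ```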
*/
export interface ChatCompletionChunk {
/**
* A unique identifier for the chat completion. Each chunk has the same ID.
*/
id: string;
/**
 * A list of chat completion choices. Can contain more than one element if `n` is
* greater than 1. Can also be empty for the last chunk if you set
* `stream_options: {"include_usage": true}`.
*/
choices: Array<ChatCompletionChunk.Choice>;
/**
* The Unix timestamp (in seconds) of when the chat completion was created. Each
* chunk has the same timestamp.
*/
created: number;
/**
 * The model used to generate the completion.
*/
model: string;
/**
* The object type, which is always `chat.completion.chunk`.
*/
object: 'chat.completion.chunk';
/**
* Specifies the latency tier to use for processing the request. This parameter is
* relevant for customers subscribed to the scale tier service:
*
* - If set to 'auto', and the Project is Scale tier enabled, the system will
* utilize scale tier credits until they are exhausted.
* - If set to 'auto', and the Project is not Scale tier enabled, the request will
* be processed using the default service tier with a lower uptime SLA and no
 *   latency guarantee.
 * - If set to 'default', the request will be processed using the default service
 *   tier with a lower uptime SLA and no latency guarantee.
* - If set to 'flex', the request will be processed with the Flex Processing
* service tier.
* [Learn more](https://platform.openai.com/docs/guides/flex-processing).
* - When not set, the default behavior is 'auto'.
*
* When this parameter is set, the response body will include the `service_tier`
* utilized.
*/
service_tier?: 'auto' | 'default' | 'flex' | null;
/**
* This fingerprint represents the backend configuration that the model runs with.
* Can be used in conjunction with the `seed` request parameter to understand when
* backend changes have been made that might impact determinism.
*/
system_fingerprint?: string;
/**
* An optional field that will only be present when you set
* `stream_options: {"include_usage": true}` in your request. When present, it
* contains a null value **except for the last chunk** which contains the token
* usage statistics for the entire request.
*
* **NOTE:** If the stream is interrupted or cancelled, you may not receive the
* final usage chunk which contains the total token usage for the request.
*/
usage?: CompletionsAPI.CompletionUsage | null;
}
export namespace ChatCompletionChunk {
export interface Choice {
/**
* A chat completion delta generated by streamed model responses.
*/
delta: Choice.Delta;
/**
* The reason the model stopped generating tokens. This will be `stop` if the model
* hit a natural stop point or a provided stop sequence, `length` if the maximum
* number of tokens specified in the request was reached, `content_filter` if
* content was omitted due to a flag from our content filters, `tool_calls` if the
* model called a tool, or `function_call` (deprecated) if the model called a
* function.
*/
finish_reason: 'stop' | 'length' | 'tool_calls' | 'content_filter' | 'function_call' | null;
/**
* The index of the choice in the list of choices.
*/
index: number;
/**
* Log probability information for the choice.
*/
logprobs?: Choice.Logprobs | null;
}
export namespace Choice {
/**
* A chat completion delta generated by streamed model responses.
*/
export interface Delta {
/**
* The contents of the chunk message.
*/
content?: string | null;
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
function_call?: Delta.FunctionCall;
/**
* The refusal message generated by the model.
*/
refusal?: string | null;
/**
* The role of the author of this message.
*/
role?: 'developer' | 'system' | 'user' | 'assistant' | 'tool';
tool_calls?: Array<Delta.ToolCall>;
}
export namespace Delta {
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
export interface FunctionCall {
/**
* The arguments to call the function with, as generated by the model in JSON
* format. Note that the model does not always generate valid JSON, and may
* hallucinate parameters not defined by your function schema. Validate the
* arguments in your code before calling your function.
*/
arguments?: string;
/**
* The name of the function to call.
*/
name?: string;
}
export interface ToolCall {
index: number;
/**
* The ID of the tool call.
*/
id?: string;
function?: ToolCall.Function;
/**
* The type of the tool. Currently, only `function` is supported.
*/
type?: 'function';
}
export namespace ToolCall {
export interface Function {
/**
* The arguments to call the function with, as generated by the model in JSON
* format. Note that the model does not always generate valid JSON, and may
* hallucinate parameters not defined by your function schema. Validate the
* arguments in your code before calling your function.
*/
arguments?: string;
/**
* The name of the function to call.
*/
name?: string;
}
}
}
/**
* Log probability information for the choice.
*/
export interface Logprobs {
/**
* A list of message content tokens with log probability information.
*/
content: Array<CompletionsCompletionsAPI.ChatCompletionTokenLogprob> | null;
/**
* A list of message refusal tokens with log probability information.
*/
refusal: Array<CompletionsCompletionsAPI.ChatCompletionTokenLogprob> | null;
}
}
}
/**
* Learn about
* [text inputs](https://platform.openai.com/docs/guides/text-generation).
*/
export type ChatCompletionContentPart =
| ChatCompletionContentPartText
| ChatCompletionContentPartImage
| ChatCompletionContentPartInputAudio
| ChatCompletionContentPart.File;
export namespace ChatCompletionContentPart {
/**
* Learn about [file inputs](https://platform.openai.com/docs/guides/text) for text
* generation.
*/
export interface File {
file: File.File;
/**
* The type of the content part. Always `file`.
*/
type: 'file';
}
export namespace File {
export interface File {
/**
* The base64 encoded file data, used when passing the file to the model as a
* string.
*/
file_data?: string;
/**
* The ID of an uploaded file to use as input.
*/
file_id?: string;
/**
* The name of the file, used when passing the file to the model as a string.
*/
filename?: string;
}
}
}
/**
* Learn about [image inputs](https://platform.openai.com/docs/guides/vision).
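 *
 * @example
 * A minimal sketch of passing an image content part in a user message; the URL
 * is a placeholder and `client` is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [
 *     {
 *       role: 'user',
 *       content: [
 *         { type: 'text', text: 'What is in this image?' },
 *         { type: 'image_url', image_url: { url: 'https://example.com/photo.jpg', detail: 'auto' } },
 *       ],
 *     },
 *   ],
 * });
 * ```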
*/
export interface ChatCompletionContentPartImage {
image_url: ChatCompletionContentPartImage.ImageURL;
/**
* The type of the content part.
*/
type: 'image_url';
}
export namespace ChatCompletionContentPartImage {
export interface ImageURL {
/**
* Either a URL of the image or the base64 encoded image data.
*/
url: string;
/**
* Specifies the detail level of the image. Learn more in the
* [Vision guide](https://platform.openai.com/docs/guides/vision#low-or-high-fidelity-image-understanding).
*/
detail?: 'auto' | 'low' | 'high';
}
}
/**
* Learn about [audio inputs](https://platform.openai.com/docs/guides/audio).
*/
export interface ChatCompletionContentPartInputAudio {
input_audio: ChatCompletionContentPartInputAudio.InputAudio;
/**
* The type of the content part. Always `input_audio`.
*/
type: 'input_audio';
}
export namespace ChatCompletionContentPartInputAudio {
export interface InputAudio {
/**
* Base64 encoded audio data.
*/
data: string;
/**
* The format of the encoded audio data. Currently supports "wav" and "mp3".
*/
format: 'wav' | 'mp3';
}
}
export interface ChatCompletionContentPartRefusal {
/**
* The refusal message generated by the model.
*/
refusal: string;
/**
* The type of the content part.
*/
type: 'refusal';
}
/**
* Learn about
* [text inputs](https://platform.openai.com/docs/guides/text-generation).
*/
export interface ChatCompletionContentPartText {
/**
* The text content.
*/
text: string;
/**
* The type of the content part.
*/
type: 'text';
}
export interface ChatCompletionDeleted {
/**
* The ID of the chat completion that was deleted.
*/
id: string;
/**
* Whether the chat completion was deleted.
*/
deleted: boolean;
/**
* The type of object being deleted.
*/
object: 'chat.completion.deleted';
}
/**
* Developer-provided instructions that the model should follow, regardless of
* messages sent by the user. With o1 models and newer, `developer` messages
* replace the previous `system` messages.
*/
export interface ChatCompletionDeveloperMessageParam {
/**
* The contents of the developer message.
*/
content: string | Array<ChatCompletionContentPartText>;
/**
* The role of the messages author, in this case `developer`.
*/
role: 'developer';
/**
* An optional name for the participant. Provides the model information to
* differentiate between participants of the same role.
*/
name?: string;
}
/**
* Specifying a particular function via `{"name": "my_function"}` forces the model
* to call that function.
*/
export interface ChatCompletionFunctionCallOption {
/**
* The name of the function to call.
*/
name: string;
}
/**
* @deprecated
*/
export interface ChatCompletionFunctionMessageParam {
/**
* The contents of the function message.
*/
content: string | null;
/**
* The name of the function to call.
*/
name: string;
/**
* The role of the messages author, in this case `function`.
*/
role: 'function';
}
/**
* A chat completion message generated by the model.
*/
export interface ChatCompletionMessage {
/**
* The contents of the message.
*/
content: string | null;
/**
* The refusal message generated by the model.
*/
refusal: string | null;
/**
* The role of the author of this message.
*/
role: 'assistant';
/**
* Annotations for the message, when applicable, as when using the
* [web search tool](https://platform.openai.com/docs/guides/tools-web-search?api-mode=chat).
*/
annotations?: Array<ChatCompletionMessage.Annotation>;
/**
* If the audio output modality is requested, this object contains data about the
* audio response from the model.
* [Learn more](https://platform.openai.com/docs/guides/audio).
*/
audio?: ChatCompletionAudio | null;
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
function_call?: ChatCompletionMessage.FunctionCall | null;
/**
* The tool calls generated by the model, such as function calls.
*/
tool_calls?: Array<ChatCompletionMessageToolCall>;
}
export namespace ChatCompletionMessage {
/**
* A URL citation when using web search.
*/
export interface Annotation {
/**
* The type of the URL citation. Always `url_citation`.
*/
type: 'url_citation';
/**
* A URL citation when using web search.
*/
url_citation: Annotation.URLCitation;
}
export namespace Annotation {
/**
* A URL citation when using web search.
*/
export interface URLCitation {
/**
* The index of the last character of the URL citation in the message.
*/
end_index: number;
/**
* The index of the first character of the URL citation in the message.
*/
start_index: number;
/**
* The title of the web resource.
*/
title: string;
/**
* The URL of the web resource.
*/
url: string;
}
}
/**
* @deprecated Deprecated and replaced by `tool_calls`. The name and arguments of a
* function that should be called, as generated by the model.
*/
export interface FunctionCall {
/**
* The arguments to call the function with, as generated by the model in JSON
* format. Note that the model does not always generate valid JSON, and may
* hallucinate parameters not defined by your function schema. Validate the
* arguments in your code before calling your function.
*/
arguments: string;
/**
* The name of the function to call.
*/
name: string;
}
}
/**
* Developer-provided instructions that the model should follow, regardless of
* messages sent by the user. With o1 models and newer, `developer` messages
* replace the previous `system` messages.
*/
export type ChatCompletionMessageParam =
| ChatCompletionDeveloperMessageParam
| ChatCompletionSystemMessageParam
| ChatCompletionUserMessageParam
| ChatCompletionAssistantMessageParam
| ChatCompletionToolMessageParam
| ChatCompletionFunctionMessageParam;
export interface ChatCompletionMessageToolCall {
/**
* The ID of the tool call.
*/
id: string;
/**
* The function that the model called.
*/
function: ChatCompletionMessageToolCall.Function;
/**
* The type of the tool. Currently, only `function` is supported.
*/
type: 'function';
}
export namespace ChatCompletionMessageToolCall {
/**
* The function that the model called.
*/
export interface Function {
/**
* The arguments to call the function with, as generated by the model in JSON
* format. Note that the model does not always generate valid JSON, and may
* hallucinate parameters not defined by your function schema. Validate the
* arguments in your code before calling your function.
*/
arguments: string;
/**
* The name of the function to call.
*/
name: string;
}
}
export type ChatCompletionModality = 'text' | 'audio';
/**
* Specifies a tool the model should use. Use to force the model to call a specific
* function.
*/
export interface ChatCompletionNamedToolChoice {
function: ChatCompletionNamedToolChoice.Function;
/**
* The type of the tool. Currently, only `function` is supported.
*/
type: 'function';
}
export namespace ChatCompletionNamedToolChoice {
export interface Function {
/**
* The name of the function to call.
*/
name: string;
}
}
/**
* Static predicted output content, such as the content of a text file that is
* being regenerated.
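 *
 * @example
 * A minimal sketch of passing predicted output; `existingCode` is a hypothetical
 * placeholder for the file being regenerated, and `client` is assumed to be a
 * configured `OpenAI` instance:
 *
 * ```ts
 * const existingCode = 'function add(a, b) { return a + b; }'; // placeholder
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: 'Rename the function to addNumbers.' }],
 *   prediction: { type: 'content', content: existingCode },
 * });
 * ```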
*/
export interface ChatCompletionPredictionContent {
/**
* The content that should be matched when generating a model response. If
* generated tokens would match this content, the entire model response can be
* returned much more quickly.
*/
content: string | Array<ChatCompletionContentPartText>;
/**
* The type of the predicted content you want to provide. This type is currently
* always `content`.
*/
type: 'content';
}
/**
 * The role of the author of a message.
*/
export type ChatCompletionRole = 'developer' | 'system' | 'user' | 'assistant' | 'tool' | 'function';
/**
* A chat completion message generated by the model.
*/
export interface ChatCompletionStoreMessage extends ChatCompletionMessage {
/**
* The identifier of the chat message.
*/
id: string;
}
/**
* Options for streaming response. Only set this when you set `stream: true`.
*/
export interface ChatCompletionStreamOptions {
/**
* If set, an additional chunk will be streamed before the `data: [DONE]` message.
* The `usage` field on this chunk shows the token usage statistics for the entire
* request, and the `choices` field will always be an empty array.
*
* All other chunks will also include a `usage` field, but with a null value.
* **NOTE:** If the stream is interrupted, you may not receive the final usage
* chunk which contains the total token usage for the request.
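 *
 * @example
 * A minimal sketch of reading the final usage chunk; `client` is assumed to be
 * a configured `OpenAI` instance:
 *
 * ```ts
 * const stream = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: 'Hi' }],
 *   stream: true,
 *   stream_options: { include_usage: true },
 * });
 * for await (const chunk of stream) {
 *   if (chunk.usage) console.log('total tokens:', chunk.usage.total_tokens);
 * }
 * ```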
*/
include_usage?: boolean;
}
/**
* Developer-provided instructions that the model should follow, regardless of
* messages sent by the user. With o1 models and newer, use `developer` messages
* for this purpose instead.
*/
export interface ChatCompletionSystemMessageParam {
/**
* The contents of the system message.
*/
content: string | Array<ChatCompletionContentPartText>;
/**
* The role of the messages author, in this case `system`.
*/
role: 'system';
/**
* An optional name for the participant. Provides the model information to
* differentiate between participants of the same role.
*/
name?: string;
}
export interface ChatCompletionTokenLogprob {
/**
* The token.
*/
token: string;
/**
* A list of integers representing the UTF-8 bytes representation of the token.
* Useful in instances where characters are represented by multiple tokens and
* their byte representations must be combined to generate the correct text
* representation. Can be `null` if there is no bytes representation for the token.
*/
bytes: Array<number> | null;
/**
* The log probability of this token, if it is within the top 20 most likely
* tokens. Otherwise, the value `-9999.0` is used to signify that the token is very
* unlikely.
*/
logprob: number;
/**
* List of the most likely tokens and their log probability, at this token
* position. In rare cases, there may be fewer than the number of requested
* `top_logprobs` returned.
*/
top_logprobs: Array<ChatCompletionTokenLogprob.TopLogprob>;
}
export namespace ChatCompletionTokenLogprob {
export interface TopLogprob {
/**
* The token.
*/
token: string;
/**
* A list of integers representing the UTF-8 bytes representation of the token.
* Useful in instances where characters are represented by multiple tokens and
* their byte representations must be combined to generate the correct text
* representation. Can be `null` if there is no bytes representation for the token.
*/
bytes: Array<number> | null;
/**
* The log probability of this token, if it is within the top 20 most likely
* tokens. Otherwise, the value `-9999.0` is used to signify that the token is very
* unlikely.
*/
logprob: number;
}
}
export interface ChatCompletionTool {
function: Shared.FunctionDefinition;
/**
* The type of the tool. Currently, only `function` is supported.
*/
type: 'function';
}
/**
* Controls which (if any) tool is called by the model. `none` means the model will
* not call any tool and instead generates a message. `auto` means the model can
* pick between generating a message or calling one or more tools. `required` means
* the model must call one or more tools. Specifying a particular tool via
* `{"type": "function", "function": {"name": "my_function"}}` forces the model to
* call that tool.
*
* `none` is the default when no tools are present. `auto` is the default if tools
* are present.
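 *
 * @example
 * A minimal sketch of forcing a specific tool; the function definition is
 * illustrative and `client` is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: "What's the weather in Paris?" }],
 *   tools: [
 *     {
 *       type: 'function',
 *       function: {
 *         name: 'get_weather',
 *         description: 'Get the current weather for a location.',
 *         parameters: {
 *           type: 'object',
 *           properties: { location: { type: 'string' } },
 *           required: ['location'],
 *         },
 *       },
 *     },
 *   ],
 *   tool_choice: { type: 'function', function: { name: 'get_weather' } },
 * });
 * const toolCall = completion.choices[0].message.tool_calls?.[0];
 * ```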
*/
export type ChatCompletionToolChoiceOption = 'none' | 'auto' | 'required' | ChatCompletionNamedToolChoice;
export interface ChatCompletionToolMessageParam {
/**
* The contents of the tool message.
*/
content: string | Array<ChatCompletionContentPartText>;
/**
* The role of the messages author, in this case `tool`.
*/
role: 'tool';
/**
* Tool call that this message is responding to.
*/
tool_call_id: string;
}
/**
* Messages sent by an end user, containing prompts or additional context
* information.
*/
export interface ChatCompletionUserMessageParam {
/**
* The contents of the user message.
*/
content: string | Array<ChatCompletionContentPart>;
/**
* The role of the messages author, in this case `user`.
*/
role: 'user';
/**
* An optional name for the participant. Provides the model information to
* differentiate between participants of the same role.
*/
name?: string;
}
/**
* @deprecated ChatCompletionMessageParam should be used instead
*/
export type CreateChatCompletionRequestMessage = ChatCompletionMessageParam;
export type ChatCompletionReasoningEffort = Shared.ReasoningEffort | null;
export type ChatCompletionCreateParams =
| ChatCompletionCreateParamsNonStreaming
| ChatCompletionCreateParamsStreaming;
export interface ChatCompletionCreateParamsBase {
/**
* A list of messages comprising the conversation so far. Depending on the
* [model](https://platform.openai.com/docs/models) you use, different message
* types (modalities) are supported, like
* [text](https://platform.openai.com/docs/guides/text-generation),
* [images](https://platform.openai.com/docs/guides/vision), and
* [audio](https://platform.openai.com/docs/guides/audio).
*/
messages: Array<ChatCompletionMessageParam>;
/**
* Model ID used to generate the response, like `gpt-4o` or `o3`. OpenAI offers a
* wide range of models with different capabilities, performance characteristics,
* and price points. Refer to the
* [model guide](https://platform.openai.com/docs/models) to browse and compare
* available models.
*/
model: (string & {}) | Shared.ChatModel;
/**
* Parameters for audio output. Required when audio output is requested with
* `modalities: ["audio"]`.
* [Learn more](https://platform.openai.com/docs/guides/audio).
*/
audio?: ChatCompletionAudioParam | null;
/**
* Number between -2.0 and 2.0. Positive values penalize new tokens based on their
* existing frequency in the text so far, decreasing the model's likelihood to
* repeat the same line verbatim.
*/
frequency_penalty?: number | null;
/**
* Deprecated in favor of `tool_choice`.
*
* Controls which (if any) function is called by the model.
*
* `none` means the model will not call a function and instead generates a message.
*
* `auto` means the model can pick between generating a message or calling a
* function.
*
* Specifying a particular function via `{"name": "my_function"}` forces the model
* to call that function.
*
* `none` is the default when no functions are present. `auto` is the default if
* functions are present.
*/
function_call?: 'none' | 'auto' | ChatCompletionFunctionCallOption;
/**
* Deprecated in favor of `tools`.
*
* A list of functions the model may generate JSON inputs for.
*/
functions?: Array<ChatCompletionCreateParams.Function>;
/**
* Modify the likelihood of specified tokens appearing in the completion.
*
* Accepts a JSON object that maps tokens (specified by their token ID in the
* tokenizer) to an associated bias value from -100 to 100. Mathematically, the
* bias is added to the logits generated by the model prior to sampling. The exact
* effect will vary per model, but values between -1 and 1 should decrease or
* increase likelihood of selection; values like -100 or 100 should result in a ban
* or exclusive selection of the relevant token.
*/
logit_bias?: Record<string, number> | null;
/**
* Whether to return log probabilities of the output tokens or not. If true,
* returns the log probabilities of each output token returned in the `content` of
* `message`.
*/
logprobs?: boolean | null;
/**
* An upper bound for the number of tokens that can be generated for a completion,
* including visible output tokens and
* [reasoning tokens](https://platform.openai.com/docs/guides/reasoning).
*/
max_completion_tokens?: number | null;
/**
* The maximum number of [tokens](/tokenizer) that can be generated in the chat
* completion. This value can be used to control
* [costs](https://openai.com/api/pricing/) for text generated via API.
*
* This value is now deprecated in favor of `max_completion_tokens`, and is not
* compatible with
* [o-series models](https://platform.openai.com/docs/guides/reasoning).
*/
max_tokens?: number | null;
/**
* Set of 16 key-value pairs that can be attached to an object. This can be useful
* for storing additional information about the object in a structured format, and
* querying for objects via API or the dashboard.
*
* Keys are strings with a maximum length of 64 characters. Values are strings with
* a maximum length of 512 characters.
*/
metadata?: Shared.Metadata | null;
/**
* Output types that you would like the model to generate. Most models are capable
* of generating text, which is the default:
*
* `["text"]`
*
* The `gpt-4o-audio-preview` model can also be used to
* [generate audio](https://platform.openai.com/docs/guides/audio). To request that
* this model generate both text and audio responses, you can use:
*
* `["text", "audio"]`
*/
modalities?: Array<'text' | 'audio'> | null;
/**
* How many chat completion choices to generate for each input message. Note that
* you will be charged based on the number of generated tokens across all of the
* choices. Keep `n` as `1` to minimize costs.
*/
n?: number | null;
/**
* Whether to enable
* [parallel function calling](https://platform.openai.com/docs/guides/function-calling#configuring-parallel-function-calling)
* during tool use.
*/
parallel_tool_calls?: boolean;
/**
* Static predicted output content, such as the content of a text file that is
* being regenerated.
*/
prediction?: ChatCompletionPredictionContent | null;
/**
* Number between -2.0 and 2.0. Positive values penalize new tokens based on
* whether they appear in the text so far, increasing the model's likelihood to
* talk about new topics.
*/
presence_penalty?: number | null;
/**
* **o-series models only**
*
* Constrains effort on reasoning for
* [reasoning models](https://platform.openai.com/docs/guides/reasoning). Currently
* supported values are `low`, `medium`, and `high`. Reducing reasoning effort can
* result in faster responses and fewer tokens used on reasoning in a response.
*/
reasoning_effort?: Shared.ReasoningEffort | null;
/**
* An object specifying the format that the model must output.
*
* Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
* Outputs which ensures the model will match your supplied JSON schema. Learn more
* in the
* [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
*
* Setting to `{ "type": "json_object" }` enables the older JSON mode, which
* ensures the message the model generates is valid JSON. Using `json_schema` is
* preferred for models that support it.
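 *
 * @example
 * A minimal Structured Outputs sketch; the schema is illustrative and `client`
 * is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o',
 *   messages: [{ role: 'user', content: 'Extract the name and age: "Ann is 28."' }],
 *   response_format: {
 *     type: 'json_schema',
 *     json_schema: {
 *       name: 'person',
 *       strict: true,
 *       schema: {
 *         type: 'object',
 *         properties: { name: { type: 'string' }, age: { type: 'number' } },
 *         required: ['name', 'age'],
 *         additionalProperties: false,
 *       },
 *     },
 *   },
 * });
 * ```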
*/
response_format?:
| Shared.ResponseFormatText
| Shared.ResponseFormatJSONSchema
| Shared.ResponseFormatJSONObject;
/**
* This feature is in Beta. If specified, our system will make a best effort to
* sample deterministically, such that repeated requests with the same `seed` and
* parameters should return the same result. Determinism is not guaranteed, and you
* should refer to the `system_fingerprint` response parameter to monitor changes
* in the backend.
*/
seed?: number | null;
/**
* Specifies the latency tier to use for processing the request. This parameter is
* relevant for customers subscribed to the scale tier service:
*
* - If set to 'auto', and the Project is Scale tier enabled, the system will
* utilize scale tier credits until they are exhausted.
* - If set to 'auto', and the Project is not Scale tier enabled, the request will
* be processed using the default service tier with a lower uptime SLA and no
 *   latency guarantee.
 * - If set to 'default', the request will be processed using the default service
 *   tier with a lower uptime SLA and no latency guarantee.
* - If set to 'flex', the request will be processed with the Flex Processing
* service tier.
* [Learn more](https://platform.openai.com/docs/guides/flex-processing).
* - When not set, the default behavior is 'auto'.
*
* When this parameter is set, the response body will include the `service_tier`
* utilized.
*/
service_tier?: 'auto' | 'default' | 'flex' | null;
/**
* Not supported with latest reasoning models `o3` and `o4-mini`.
*
* Up to 4 sequences where the API will stop generating further tokens. The
* returned text will not contain the stop sequence.
*/
stop?: string | null | Array<string>;
/**
* Whether or not to store the output of this chat completion request for use in
* our [model distillation](https://platform.openai.com/docs/guides/distillation)
* or [evals](https://platform.openai.com/docs/guides/evals) products.
*/
store?: boolean | null;
/**
* If set to true, the model response data will be streamed to the client as it is
* generated using
* [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format).
* See the
* [Streaming section below](https://platform.openai.com/docs/api-reference/chat/streaming)
* for more information, along with the
* [streaming responses](https://platform.openai.com/docs/guides/streaming-responses)
* guide for more information on how to handle the streaming events.
*/
stream?: boolean | null;
/**
* Options for streaming response. Only set this when you set `stream: true`.
*/
stream_options?: ChatCompletionStreamOptions | null;
/**
* What sampling temperature to use, between 0 and 2. Higher values like 0.8 will
* make the output more random, while lower values like 0.2 will make it more
* focused and deterministic. We generally recommend altering this or `top_p` but
* not both.
*/
temperature?: number | null;
/**
* Controls which (if any) tool is called by the model. `none` means the model will
* not call any tool and instead generates a message. `auto` means the model can
* pick between generating a message or calling one or more tools. `required` means
* the model must call one or more tools. Specifying a particular tool via
* `{"type": "function", "function": {"name": "my_function"}}` forces the model to
* call that tool.
*
* `none` is the default when no tools are present. `auto` is the default if tools
* are present.
*/
tool_choice?: ChatCompletionToolChoiceOption;
/**
* A list of tools the model may call. Currently, only functions are supported as a
* tool. Use this to provide a list of functions the model may generate JSON inputs
 * for. A maximum of 128 functions is supported.
*/
tools?: Array<ChatCompletionTool>;
/**
* An integer between 0 and 20 specifying the number of most likely tokens to
* return at each token position, each with an associated log probability.
* `logprobs` must be set to `true` if this parameter is used.
*/
top_logprobs?: number | null;
/**
* An alternative to sampling with temperature, called nucleus sampling, where the
* model considers the results of the tokens with top_p probability mass. So 0.1
* means only the tokens comprising the top 10% probability mass are considered.
*
* We generally recommend altering this or `temperature` but not both.
*/
top_p?: number | null;
/**
* A unique identifier representing your end-user, which can help OpenAI to monitor
* and detect abuse.
* [Learn more](https://platform.openai.com/docs/guides/safety-best-practices#end-user-ids).
*/
user?: string;
/**
* This tool searches the web for relevant results to use in a response. Learn more
* about the
* [web search tool](https://platform.openai.com/docs/guides/tools-web-search?api-mode=chat).
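 *
 * @example
 * A minimal sketch; the search-enabled model name is an assumption and `client`
 * is assumed to be a configured `OpenAI` instance:
 *
 * ```ts
 * const completion = await client.chat.completions.create({
 *   model: 'gpt-4o-search-preview',
 *   messages: [{ role: 'user', content: 'What happened in tech news today?' }],
 *   web_search_options: { search_context_size: 'medium' },
 * });
 * ```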
*/
web_search_options?: ChatCompletionCreateParams.WebSearchOptions;
}
export namespace ChatCompletionCreateParams {
/**
* @deprecated
*/
export interface Function {
/**
* The name of the function to be called. Must be a-z, A-Z, 0-9, or contain
* underscores and dashes, with a maximum length of 64.
*/
name: string;
/**
* A description of what the function does, used by the model to choose when and
* how to call the function.
*/
description?: string;
/**
 * The parameters the function accepts, described as a JSON Schema object. See the
* [guide](https://platform.openai.com/docs/guides/function-calling) for examples,
* and the
* [JSON Schema reference](https://json-schema.org/understanding-json-schema/) for
* documentation about the format.
*
* Omitting `parameters` defines a function with an empty parameter list.
*/
parameters?: Shared.FunctionParameters;
}
/**
* This tool searches the web for relevant results to use in a response. Learn more
* about the
* [web search tool](https://platform.openai.com/docs/guides/tools-web-search?api-mode=chat).
*/
export interface WebSearchOptions {
/**
* High level guidance for the amount of context window space to use for the
* search. One of `low`, `medium`, or `high`. `medium` is the default.
*/
search_context_size?: 'low' | 'medium' | 'high';
/**
* Approximate location parameters for the search.
*/
user_location?: WebSearchOptions.UserLocation | null;
}
export namespace WebSearchOptions {
/**
* Approximate location parameters for the search.
*/
export interface UserLocation {
/**
* Approximate location parameters for the search.
*/
approximate: UserLocation.Approximate;
/**
* The type of location approximation. Always `approximate`.
*/
type: 'approximate';
}
export namespace UserLocation {
/**
* Approximate location parameters for the search.
*/
export interface Approximate {
/**
* Free text input for the city of the user, e.g. `San Francisco`.
*/
city?: string;
/**
* The two-letter [ISO country code](https://en.wikipedia.org/wiki/ISO_3166-1) of
* the user, e.g. `US`.
*/
country?: string;
/**
* Free text input for the region of the user, e.g. `California`.
*/
region?: string;
/**
* The [IANA timezone](https://timeapi.io/documentation/iana-timezones) of the
* user, e.g. `America/Los_Angeles`.
*/
timezone?: string;
}
}
}
export type ChatCompletionCreateParamsNonStreaming =
CompletionsCompletionsAPI.ChatCompletionCreateParamsNonStreaming;
export type ChatCompletionCreateParamsStreaming =
CompletionsCompletionsAPI.ChatCompletionCreateParamsStreaming;
}
/**
* @deprecated Use ChatCompletionCreateParams instead
*/
export type CompletionCreateParams = ChatCompletionCreateParams;
export interface ChatCompletionCreateParamsNonStreaming extends ChatCompletionCreateParamsBase {
/**
* If set to true, the model response data will be streamed to the client as it is
* generated using
* [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format).
* See the
* [Streaming section below](https://platform.openai.com/docs/api-reference/chat/streaming)
* for more information, along with the
* [streaming responses](https://platform.openai.com/docs/guides/streaming-responses)
* guide for more information on how to handle the streaming events.
*/
stream?: false | null;
}
/**
* @deprecated Use ChatCompletionCreateParamsNonStreaming instead
*/
export type CompletionCreateParamsNonStreaming = ChatCompletionCreateParamsNonStreaming;
export interface ChatCompletionCreateParamsStreaming extends ChatCompletionCreateParamsBase {
/**
* If set to true, the model response data will be streamed to the client as it is
* generated using
* [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format).
* See the
* [Streaming section below](https://platform.openai.com/docs/api-reference/chat/streaming)
* for more information, along with the
* [streaming responses](https://platform.openai.com/docs/guides/streaming-responses)
* guide for more information on how to handle the streaming events.
*/
stream: true;
}
/**
* @deprecated Use ChatCompletionCreateParamsStreaming instead
*/
export type CompletionCreateParamsStreaming = ChatCompletionCreateParamsStreaming;
export interface ChatCompletionUpdateParams {
/**
* Set of 16 key-value pairs that can be attached to an object. This can be useful
* for storing additional information about the object in a structured format, and
* querying for objects via API or the dashboard.
*
* Keys are strings with a maximum length of 64 characters. Values are strings with
* a maximum length of 512 characters.
*/
metadata: Shared.Metadata | null;
}
/**
* @deprecated Use ChatCompletionUpdateParams instead
*/
export type CompletionUpdateParams = ChatCompletionUpdateParams;
export interface ChatCompletionListParams extends CursorPageParams {
  /**
   * A list of metadata keys to filter the Chat Completions by. Example:
   *
   * `metadata[key1]=value1&metadata[key2]=value2`
   */
  metadata?: Shared.Metadata | null;
  /**
   * The model used to generate the Chat Completions.
   */
  model?: string;
  /**
   * Sort order for Chat Completions by timestamp. Use `asc` for ascending order or
   * `desc` for descending order. Defaults to `asc`.
   */
  order?: 'asc' | 'desc';
}