resources/chat/completions.ts (405 lines of code) (raw):
// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
import { APIResource } from "../../resource.ts";
import { APIPromise } from "../../core.ts";
import * as Core from "../../core.ts";
import * as ChatCompletionsAPI from "./completions.ts";
import * as CompletionsAPI from "../completions.ts";
import * as Shared from "../shared.ts";
import * as ChatAPI from "./chat.ts";
import { Stream } from "../../streaming.ts";
export class Completions extends APIResource {
  /**
   * Creates a model response for the given chat conversation. Learn more in the
   * [text generation](https://platform.openai.com/docs/guides/text-generation),
   * [vision](https://platform.openai.com/docs/guides/vision), and
   * [audio](https://platform.openai.com/docs/guides/audio) guides.
   *
   * The overloads tie the return type to the request shape: non-streaming
   * parameters yield a `ChatCompletion`, streaming parameters yield a
   * `Stream<ChatCompletionChunk>`, and the base parameters yield either.
   */
  create(
    body: ChatCompletionCreateParamsNonStreaming,
    options?: Core.RequestOptions,
  ): APIPromise<ChatCompletion>;
  create(
    body: ChatCompletionCreateParamsStreaming,
    options?: Core.RequestOptions,
  ): APIPromise<Stream<ChatCompletionChunk>>;
  create(
    body: ChatCompletionCreateParamsBase,
    options?: Core.RequestOptions,
  ): APIPromise<Stream<ChatCompletionChunk> | ChatCompletion>;
  create(
    body: ChatCompletionCreateParams,
    options?: Core.RequestOptions,
  ): APIPromise<ChatCompletion> | APIPromise<Stream<ChatCompletionChunk>> {
    // An omitted or `null` stream flag is sent as a plain non-streaming request.
    const stream = body.stream ?? false;

    // `stream` comes after the spread so it wins over any `stream` key that
    // may be present in `options`.
    return this._client.post("/chat/completions", {
      body,
      ...options,
      stream,
    }) as
      | APIPromise<ChatCompletion>
      | APIPromise<Stream<ChatCompletionChunk>>;
  }
}
/**
 * A chat completion response returned by the model, based on the provided
 * input.
 */
export interface ChatCompletion {
  /**
   * Unique identifier of the chat completion.
   */
  id: string;

  /**
   * The chat completion choices. Holds more than one entry when `n` is greater
   * than 1.
   */
  choices: ChatCompletion.Choice[];

  /**
   * Unix timestamp (in seconds) of when the chat completion was created.
   */
  created: number;

  /**
   * The model used for the chat completion.
   */
  model: string;

  /**
   * The object type; always `chat.completion`.
   */
  object: "chat.completion";

  /**
   * The service tier used to process the request. Only included when the
   * `service_tier` parameter was specified in the request.
   */
  service_tier?: "scale" | "default" | null;

  /**
   * Fingerprint of the backend configuration the model runs with.
   *
   * Can be combined with the `seed` request parameter to detect backend changes
   * that might impact determinism.
   */
  system_fingerprint?: string;

  /**
   * Usage statistics for the completion request.
   */
  usage?: CompletionsAPI.CompletionUsage;
}

export namespace ChatCompletion {
  export interface Choice {
    /**
     * Why the model stopped generating tokens: `stop` for a natural stop point
     * or a provided stop sequence, `length` when the maximum number of tokens
     * specified in the request was reached, `content_filter` when content was
     * omitted due to a flag from the content filters, `tool_calls` when the
     * model called a tool, or `function_call` (deprecated) when the model called
     * a function.
     */
    finish_reason:
      | "stop"
      | "length"
      | "tool_calls"
      | "content_filter"
      | "function_call";

    /**
     * Index of this choice in the list of choices.
     */
    index: number;

    /**
     * Log probability information for the choice.
     */
    logprobs: Choice.Logprobs | null;

    /**
     * The chat completion message generated by the model.
     */
    message: ChatCompletionsAPI.ChatCompletionMessage;
  }

  export namespace Choice {
    /**
     * Log probability information for the choice.
     */
    export interface Logprobs {
      /**
       * Message content tokens with log probability information.
       */
      content: ChatCompletionsAPI.ChatCompletionTokenLogprob[] | null;

      /**
       * Message refusal tokens with log probability information.
       */
      refusal: ChatCompletionsAPI.ChatCompletionTokenLogprob[] | null;
    }
  }
}
/**
 * A conversation message authored by the `assistant` role.
 */
export interface ChatCompletionAssistantMessageParam {
  /**
   * The role of the message's author, in this case `assistant`.
   */
  role: "assistant";

  /**
   * Data about a previous audio response from the model.
   * [Learn more](https://platform.openai.com/docs/guides/audio).
   */
  audio?: ChatCompletionAssistantMessageParam.Audio | null;

  /**
   * The contents of the assistant message. Required unless `tool_calls` or
   * `function_call` is specified.
   */
  content?:
    | string
    | (ChatCompletionContentPartText | ChatCompletionContentPartRefusal)[]
    | null;

  /**
   * @deprecated Replaced by `tool_calls`. The name and arguments of a function
   * that should be called, as generated by the model.
   */
  function_call?: ChatCompletionAssistantMessageParam.FunctionCall | null;

  /**
   * Optional name for the participant. Gives the model information to
   * differentiate between participants of the same role.
   */
  name?: string;

  /**
   * The refusal message by the assistant.
   */
  refusal?: string | null;

  /**
   * The tool calls generated by the model, such as function calls.
   */
  tool_calls?: ChatCompletionMessageToolCall[];
}

export namespace ChatCompletionAssistantMessageParam {
  /**
   * Data about a previous audio response from the model.
   * [Learn more](https://platform.openai.com/docs/guides/audio).
   */
  export interface Audio {
    /**
     * Unique identifier for a previous audio response from the model.
     */
    id: string;
  }

  /**
   * @deprecated Replaced by `tool_calls`. The name and arguments of a function
   * that should be called, as generated by the model.
   */
  export interface FunctionCall {
    /**
     * The arguments to call the function with, as generated by the model in
     * JSON format. The model does not always generate valid JSON and may
     * hallucinate parameters not defined by your function schema, so validate
     * the arguments in your code before calling your function.
     */
    arguments: string;

    /**
     * The name of the function to call.
     */
    name: string;
  }
}
/**
 * Data about the audio response from the model, present when the audio output
 * modality is requested.
 * [Learn more](https://platform.openai.com/docs/guides/audio).
 */
export interface ChatCompletionAudio {
  /**
   * Unique identifier for this audio response.
   */
  id: string;

  /**
   * Base64-encoded audio bytes generated by the model, in the format specified
   * in the request.
   */
  data: string;

  /**
   * Unix timestamp (in seconds) after which this audio response is no longer
   * accessible on the server for use in multi-turn conversations.
   */
  expires_at: number;

  /**
   * Transcript of the audio generated by the model.
   */
  transcript: string;
}
/**
 * Parameters for audio output. Required when audio output is requested with
 * `modalities: ["audio"]`.
 * [Learn more](https://platform.openai.com/docs/guides/audio).
 */
export interface ChatCompletionAudioParam {
  /**
   * The output audio format. Must be one of `wav`, `mp3`, `flac`, `opus`, or
   * `pcm16`.
   */
  format: "wav" | "mp3" | "flac" | "opus" | "pcm16";

  /**
   * The voice the model uses to respond. Supported voices are `alloy`, `ash`,
   * `ballad`, `coral`, `echo`, `sage`, `shimmer`, and `verse`.
   */
  voice:
    | "alloy"
    | "ash"
    | "ballad"
    | "coral"
    | "echo"
    | "sage"
    | "shimmer"
    | "verse";
}
/**
 * A streamed chunk of a chat completion response returned by the model, based
 * on the provided input.
 */
export interface ChatCompletionChunk {
  /**
   * Unique identifier of the chat completion. Every chunk has the same ID.
   */
  id: string;

  /**
   * The chat completion choices. Can contain more than one element if `n` is
   * greater than 1. Can also be empty for the last chunk if you set
   * `stream_options: {"include_usage": true}`.
   */
  choices: ChatCompletionChunk.Choice[];

  /**
   * Unix timestamp (in seconds) of when the chat completion was created. Every
   * chunk has the same timestamp.
   */
  created: number;

  /**
   * The model to generate the completion.
   */
  model: string;

  /**
   * The object type; always `chat.completion.chunk`.
   */
  object: "chat.completion.chunk";

  /**
   * The service tier used to process the request. Only included when the
   * `service_tier` parameter was specified in the request.
   */
  service_tier?: "scale" | "default" | null;

  /**
   * Fingerprint of the backend configuration the model runs with. Can be
   * combined with the `seed` request parameter to detect backend changes that
   * might impact determinism.
   */
  system_fingerprint?: string;

  /**
   * Only present when you set `stream_options: {"include_usage": true}` in your
   * request. When present, it is null on every chunk except the last, which
   * contains the token usage statistics for the entire request.
   */
  usage?: CompletionsAPI.CompletionUsage | null;
}

export namespace ChatCompletionChunk {
  export interface Choice {
    /**
     * A chat completion delta generated by streamed model responses.
     */
    delta: Choice.Delta;

    /**
     * Why the model stopped generating tokens: `stop` for a natural stop point
     * or a provided stop sequence, `length` when the maximum number of tokens
     * specified in the request was reached, `content_filter` when content was
     * omitted due to a flag from the content filters, `tool_calls` when the
     * model called a tool, or `function_call` (deprecated) when the model called
     * a function.
     */
    finish_reason:
      | "stop"
      | "length"
      | "tool_calls"
      | "content_filter"
      | "function_call"
      | null;

    /**
     * Index of this choice in the list of choices.
     */
    index: number;

    /**
     * Log probability information for the choice.
     */
    logprobs?: Choice.Logprobs | null;
  }

  export namespace Choice {
    /**
     * A chat completion delta generated by streamed model responses.
     */
    export interface Delta {
      /**
       * The contents of the chunk message.
       */
      content?: string | null;

      /**
       * @deprecated Replaced by `tool_calls`. The name and arguments of a
       * function that should be called, as generated by the model.
       */
      function_call?: Delta.FunctionCall;

      /**
       * The refusal message generated by the model.
       */
      refusal?: string | null;

      /**
       * The role of the author of this message.
       */
      role?: "system" | "user" | "assistant" | "tool";

      /**
       * Tool calls carried by this delta.
       */
      tool_calls?: Delta.ToolCall[];
    }

    export namespace Delta {
      /**
       * @deprecated Replaced by `tool_calls`. The name and arguments of a
       * function that should be called, as generated by the model.
       */
      export interface FunctionCall {
        /**
         * The arguments to call the function with, as generated by the model in
         * JSON format. The model does not always generate valid JSON and may
         * hallucinate parameters not defined by your function schema, so
         * validate the arguments in your code before calling your function.
         */
        arguments?: string;

        /**
         * The name of the function to call.
         */
        name?: string;
      }

      export interface ToolCall {
        index: number;

        /**
         * The ID of the tool call.
         */
        id?: string;

        /**
         * Name and arguments of the function for this tool call; both fields
         * are optional on a delta.
         */
        function?: ToolCall.Function;

        /**
         * The type of the tool. Currently, only `function` is supported.
         */
        type?: "function";
      }

      export namespace ToolCall {
        export interface Function {
          /**
           * The arguments to call the function with, as generated by the model
           * in JSON format. The model does not always generate valid JSON and
           * may hallucinate parameters not defined by your function schema, so
           * validate the arguments in your code before calling your function.
           */
          arguments?: string;

          /**
           * The name of the function to call.
           */
          name?: string;
        }
      }
    }

    /**
     * Log probability information for the choice.
     */
    export interface Logprobs {
      /**
       * Message content tokens with log probability information.
       */
      content: ChatCompletionsAPI.ChatCompletionTokenLogprob[] | null;

      /**
       * Message refusal tokens with log probability information.
       */
      refusal: ChatCompletionsAPI.ChatCompletionTokenLogprob[] | null;
    }
  }
}
/**
 * A single part of a multi-part message content: text, image, or input audio.
 * Learn about
 * [text inputs](https://platform.openai.com/docs/guides/text-generation).
 */
export type ChatCompletionContentPart =
  | ChatCompletionContentPartText
  | ChatCompletionContentPartImage
  | ChatCompletionContentPartInputAudio;
/**
 * An image content part.
 * Learn about [image inputs](https://platform.openai.com/docs/guides/vision).
 */
export interface ChatCompletionContentPartImage {
  /**
   * The image, given as a URL or base64 encoded data, with an optional detail
   * level.
   */
  image_url: ChatCompletionContentPartImage.ImageURL;

  /**
   * The type of the content part.
   */
  type: "image_url";
}

export namespace ChatCompletionContentPartImage {
  export interface ImageURL {
    /**
     * Either a URL of the image or the base64 encoded image data.
     */
    url: string;

    /**
     * The detail level of the image. Learn more in the
     * [Vision guide](https://platform.openai.com/docs/guides/vision/low-or-high-fidelity-image-understanding).
     */
    detail?: "auto" | "low" | "high";
  }
}
/**
 * An input audio content part.
 * Learn about [audio inputs](https://platform.openai.com/docs/guides/audio).
 */
export interface ChatCompletionContentPartInputAudio {
  /**
   * The base64 encoded audio data together with its format.
   */
  input_audio: ChatCompletionContentPartInputAudio.InputAudio;

  /**
   * The type of the content part. Always `input_audio`.
   */
  type: "input_audio";
}

export namespace ChatCompletionContentPartInputAudio {
  export interface InputAudio {
    /**
     * Base64 encoded audio data.
     */
    data: string;

    /**
     * The format of the encoded audio data. Currently supports "wav" and "mp3".
     */
    format: "wav" | "mp3";
  }
}
/**
 * A content part carrying a refusal message generated by the model.
 */
export interface ChatCompletionContentPartRefusal {
  /**
   * The refusal message generated by the model.
   */
  refusal: string;

  /**
   * The type of the content part.
   */
  type: "refusal";
}
/**
 * A text content part.
 * Learn about
 * [text inputs](https://platform.openai.com/docs/guides/text-generation).
 */
export interface ChatCompletionContentPartText {
  /**
   * The text content.
   */
  text: string;

  /**
   * The type of the content part.
   */
  type: "text";
}
/**
 * Forces the model to call a particular function, identified via
 * `{"name": "my_function"}`.
 */
export interface ChatCompletionFunctionCallOption {
  /**
   * The name of the function to call.
   */
  name: string;
}
/**
 * A conversation message authored by the `function` role.
 *
 * @deprecated
 */
export interface ChatCompletionFunctionMessageParam {
  /**
   * The contents of the function message.
   */
  content: string | null;

  /**
   * The name of the function to call.
   */
  name: string;

  /**
   * The role of the message's author, in this case `function`.
   */
  role: "function";
}
/**
 * A chat completion message generated by the model.
 */
export interface ChatCompletionMessage {
  /**
   * The contents of the message.
   */
  content: string | null;

  /**
   * The refusal message generated by the model.
   */
  refusal: string | null;

  /**
   * The role of the author of this message.
   */
  role: "assistant";

  /**
   * Data about the audio response from the model, present when the audio output
   * modality is requested.
   * [Learn more](https://platform.openai.com/docs/guides/audio).
   */
  audio?: ChatCompletionAudio | null;

  /**
   * @deprecated Replaced by `tool_calls`. The name and arguments of a function
   * that should be called, as generated by the model.
   */
  function_call?: ChatCompletionMessage.FunctionCall | null;

  /**
   * The tool calls generated by the model, such as function calls.
   */
  tool_calls?: ChatCompletionMessageToolCall[];
}

export namespace ChatCompletionMessage {
  /**
   * @deprecated Replaced by `tool_calls`. The name and arguments of a function
   * that should be called, as generated by the model.
   */
  export interface FunctionCall {
    /**
     * The arguments to call the function with, as generated by the model in
     * JSON format. The model does not always generate valid JSON and may
     * hallucinate parameters not defined by your function schema, so validate
     * the arguments in your code before calling your function.
     */
    arguments: string;

    /**
     * The name of the function to call.
     */
    name: string;
  }
}
/**
 * Any message accepted in a request's `messages` list: a system, user,
 * assistant, tool, or (deprecated) function message.
 */
export type ChatCompletionMessageParam =
  | ChatCompletionSystemMessageParam
  | ChatCompletionUserMessageParam
  | ChatCompletionAssistantMessageParam
  | ChatCompletionToolMessageParam
  | ChatCompletionFunctionMessageParam;
/**
 * A tool call generated by the model.
 */
export interface ChatCompletionMessageToolCall {
  /**
   * The ID of the tool call.
   */
  id: string;

  /**
   * The function that the model called.
   */
  function: ChatCompletionMessageToolCall.Function;

  /**
   * The type of the tool. Currently, only `function` is supported.
   */
  type: "function";
}

export namespace ChatCompletionMessageToolCall {
  /**
   * The function that the model called.
   */
  export interface Function {
    /**
     * The arguments to call the function with, as generated by the model in
     * JSON format. The model does not always generate valid JSON and may
     * hallucinate parameters not defined by your function schema, so validate
     * the arguments in your code before calling your function.
     */
    arguments: string;

    /**
     * The name of the function to call.
     */
    name: string;
  }
}
/**
 * An output type the model can be asked to generate; the element type of the
 * `modalities` request parameter.
 */
export type ChatCompletionModality =
  | "text"
  | "audio";
/**
 * Names a tool the model should use. Use it to force the model to call a
 * specific function.
 */
export interface ChatCompletionNamedToolChoice {
  /**
   * Identifies, by name, the function the model should call.
   */
  function: ChatCompletionNamedToolChoice.Function;

  /**
   * The type of the tool. Currently, only `function` is supported.
   */
  type: "function";
}

export namespace ChatCompletionNamedToolChoice {
  export interface Function {
    /**
     * The name of the function to call.
     */
    name: string;
  }
}
/**
 * The role of the author of a message.
 */
export type ChatCompletionRole = "system" | "user" | "assistant" | "tool" | "function";
/**
 * Options for a streaming response. Only set this when you set `stream: true`.
 */
export interface ChatCompletionStreamOptions {
  /**
   * If set, an additional chunk is streamed before the `data: [DONE]` message.
   * The `usage` field on that chunk shows the token usage statistics for the
   * entire request, and its `choices` field is always an empty array. All other
   * chunks also include a `usage` field, but with a null value.
   */
  include_usage?: boolean;
}
/**
 * A conversation message authored by the `system` role.
 */
export interface ChatCompletionSystemMessageParam {
  /**
   * The contents of the system message.
   */
  content: string | ChatCompletionContentPartText[];

  /**
   * The role of the message's author, in this case `system`.
   */
  role: "system";

  /**
   * Optional name for the participant. Gives the model information to
   * differentiate between participants of the same role.
   */
  name?: string;
}
/**
 * Log probability information for a single token.
 */
export interface ChatCompletionTokenLogprob {
  /**
   * The token.
   */
  token: string;

  /**
   * The UTF-8 bytes of the token, as a list of integers. Useful when characters
   * are represented by multiple tokens and their byte representations must be
   * combined to generate the correct text representation. Can be `null` if
   * there is no bytes representation for the token.
   */
  bytes: number[] | null;

  /**
   * The log probability of this token, if it is within the top 20 most likely
   * tokens. Otherwise, the value `-9999.0` signifies that the token is very
   * unlikely.
   */
  logprob: number;

  /**
   * The most likely tokens and their log probability at this token position.
   * In rare cases, fewer than the requested number of `top_logprobs` may be
   * returned.
   */
  top_logprobs: ChatCompletionTokenLogprob.TopLogprob[];
}

export namespace ChatCompletionTokenLogprob {
  export interface TopLogprob {
    /**
     * The token.
     */
    token: string;

    /**
     * The UTF-8 bytes of the token, as a list of integers. Useful when
     * characters are represented by multiple tokens and their byte
     * representations must be combined to generate the correct text
     * representation. Can be `null` if there is no bytes representation for the
     * token.
     */
    bytes: number[] | null;

    /**
     * The log probability of this token, if it is within the top 20 most likely
     * tokens. Otherwise, the value `-9999.0` signifies that the token is very
     * unlikely.
     */
    logprob: number;
  }
}
/**
 * A tool the model may call. Currently, only functions are supported as tools.
 */
export interface ChatCompletionTool {
  /**
   * Definition of the function exposed as a tool.
   */
  function: Shared.FunctionDefinition;

  /**
   * The type of the tool. Currently, only `function` is supported.
   */
  type: "function";
}
/**
 * Controls which (if any) tool is called by the model.
 *
 * - `none`: the model will not call any tool and instead generates a message.
 * - `auto`: the model can pick between generating a message or calling one or
 *   more tools.
 * - `required`: the model must call one or more tools.
 * - A particular tool, specified via
 *   `{"type": "function", "function": {"name": "my_function"}}`, forces the
 *   model to call that tool.
 *
 * `none` is the default when no tools are present. `auto` is the default if
 * tools are present.
 */
export type ChatCompletionToolChoiceOption =
  | "none"
  | "auto"
  | "required"
  | ChatCompletionNamedToolChoice;
/**
 * A conversation message authored by the `tool` role, responding to a tool
 * call.
 */
export interface ChatCompletionToolMessageParam {
  /**
   * The contents of the tool message.
   */
  content: string | ChatCompletionContentPartText[];

  /**
   * The role of the message's author, in this case `tool`.
   */
  role: "tool";

  /**
   * Tool call that this message is responding to.
   */
  tool_call_id: string;
}
/**
 * A conversation message authored by the `user` role.
 */
export interface ChatCompletionUserMessageParam {
  /**
   * The contents of the user message.
   */
  content: string | ChatCompletionContentPart[];

  /**
   * The role of the message's author, in this case `user`.
   */
  role: "user";

  /**
   * Optional name for the participant. Gives the model information to
   * differentiate between participants of the same role.
   */
  name?: string;
}
/**
 * Legacy alias of `ChatCompletionMessageParam`.
 *
 * @deprecated ChatCompletionMessageParam should be used instead
 */
export type CreateChatCompletionRequestMessage =
  ChatCompletionMessageParam;
/**
 * Request body for creating a chat completion: either the non-streaming or the
 * streaming variant.
 */
export type ChatCompletionCreateParams =
  | ChatCompletionCreateParamsNonStreaming
  | ChatCompletionCreateParamsStreaming;
/**
 * Request parameters shared by the streaming and non-streaming variants of a
 * chat completion request.
 */
export interface ChatCompletionCreateParamsBase {
  /**
   * The messages comprising the conversation so far. Depending on the
   * [model](https://platform.openai.com/docs/models) you use, different message
   * types (modalities) are supported, like
   * [text](https://platform.openai.com/docs/guides/text-generation),
   * [images](https://platform.openai.com/docs/guides/vision), and
   * [audio](https://platform.openai.com/docs/guides/audio).
   */
  messages: ChatCompletionMessageParam[];

  /**
   * ID of the model to use. See the
   * [model endpoint compatibility](https://platform.openai.com/docs/models/model-endpoint-compatibility)
   * table for details on which models work with the Chat API.
   */
  model: (string & {}) | ChatAPI.ChatModel;

  /**
   * Parameters for audio output. Required when audio output is requested with
   * `modalities: ["audio"]`.
   * [Learn more](https://platform.openai.com/docs/guides/audio).
   */
  audio?: ChatCompletionAudioParam | null;

  /**
   * Number between -2.0 and 2.0. Positive values penalize new tokens based on
   * their existing frequency in the text so far, decreasing the model's
   * likelihood to repeat the same line verbatim.
   *
   * [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation/parameter-details)
   */
  frequency_penalty?: number | null;

  /**
   * Deprecated in favor of `tool_choice`.
   *
   * Controls which (if any) function is called by the model. `none` means the
   * model will not call a function and instead generates a message. `auto`
   * means the model can pick between generating a message or calling a
   * function. Specifying a particular function via `{"name": "my_function"}`
   * forces the model to call that function.
   *
   * `none` is the default when no functions are present. `auto` is the default
   * if functions are present.
   */
  function_call?: "none" | "auto" | ChatCompletionFunctionCallOption;

  /**
   * Deprecated in favor of `tools`.
   *
   * A list of functions the model may generate JSON inputs for.
   */
  functions?: ChatCompletionCreateParams.Function[];

  /**
   * Modify the likelihood of specified tokens appearing in the completion.
   *
   * Accepts a JSON object that maps tokens (specified by their token ID in the
   * tokenizer) to an associated bias value from -100 to 100. Mathematically,
   * the bias is added to the logits generated by the model prior to sampling.
   * The exact effect will vary per model, but values between -1 and 1 should
   * decrease or increase likelihood of selection; values like -100 or 100
   * should result in a ban or exclusive selection of the relevant token.
   */
  logit_bias?: Record<string, number> | null;

  /**
   * Whether to return log probabilities of the output tokens or not. If true,
   * returns the log probabilities of each output token returned in the
   * `content` of `message`.
   */
  logprobs?: boolean | null;

  /**
   * An upper bound for the number of tokens that can be generated for a
   * completion, including visible output tokens and
   * [reasoning tokens](https://platform.openai.com/docs/guides/reasoning).
   */
  max_completion_tokens?: number | null;

  /**
   * The maximum number of [tokens](/tokenizer) that can be generated in the
   * chat completion. This value can be used to control
   * [costs](https://openai.com/api/pricing/) for text generated via API.
   *
   * This value is now deprecated in favor of `max_completion_tokens`, and is
   * not compatible with
   * [o1 series models](https://platform.openai.com/docs/guides/reasoning).
   */
  max_tokens?: number | null;

  /**
   * Developer-defined tags and values used for filtering completions in the
   * [dashboard](https://platform.openai.com/chat-completions).
   */
  metadata?: Record<string, string> | null;

  /**
   * Output types that you would like the model to generate for this request.
   * Most models are capable of generating text, which is the default:
   *
   * `["text"]`
   *
   * The `gpt-4o-audio-preview` model can also be used to
   * [generate audio](https://platform.openai.com/docs/guides/audio). To request
   * that this model generate both text and audio responses, you can use:
   *
   * `["text", "audio"]`
   */
  modalities?: ChatCompletionModality[] | null;

  /**
   * How many chat completion choices to generate for each input message. Note
   * that you will be charged based on the number of generated tokens across all
   * of the choices. Keep `n` as `1` to minimize costs.
   */
  n?: number | null;

  /**
   * Whether to enable
   * [parallel function calling](https://platform.openai.com/docs/guides/function-calling/parallel-function-calling)
   * during tool use.
   */
  parallel_tool_calls?: boolean;

  /**
   * Number between -2.0 and 2.0. Positive values penalize new tokens based on
   * whether they appear in the text so far, increasing the model's likelihood
   * to talk about new topics.
   *
   * [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation/parameter-details)
   */
  presence_penalty?: number | null;

  /**
   * An object specifying the format that the model must output. Compatible with
   * [GPT-4o](https://platform.openai.com/docs/models/gpt-4o),
   * [GPT-4o mini](https://platform.openai.com/docs/models/gpt-4o-mini),
   * [GPT-4 Turbo](https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo)
   * and all GPT-3.5 Turbo models newer than `gpt-3.5-turbo-1106`.
   *
   * Setting to `{ "type": "json_schema", "json_schema": {...} }` enables
   * Structured Outputs which ensures the model will match your supplied JSON
   * schema. Learn more in the
   * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
   *
   * Setting to `{ "type": "json_object" }` enables JSON mode, which ensures the
   * message the model generates is valid JSON.
   *
   * **Important:** when using JSON mode, you **must** also instruct the model
   * to produce JSON yourself via a system or user message. Without this, the
   * model may generate an unending stream of whitespace until the generation
   * reaches the token limit, resulting in a long-running and seemingly "stuck"
   * request. Also note that the message content may be partially cut off if
   * `finish_reason="length"`, which indicates the generation exceeded
   * `max_tokens` or the conversation exceeded the max context length.
   */
  response_format?:
    | Shared.ResponseFormatText
    | Shared.ResponseFormatJSONObject
    | Shared.ResponseFormatJSONSchema;

  /**
   * This feature is in Beta. If specified, our system will make a best effort
   * to sample deterministically, such that repeated requests with the same
   * `seed` and parameters should return the same result. Determinism is not
   * guaranteed, and you should refer to the `system_fingerprint` response
   * parameter to monitor changes in the backend.
   */
  seed?: number | null;

  /**
   * Specifies the latency tier to use for processing the request. This
   * parameter is relevant for customers subscribed to the scale tier service:
   *
   * - If set to 'auto', and the Project is Scale tier enabled, the system will
   *   utilize scale tier credits until they are exhausted.
   * - If set to 'auto', and the Project is not Scale tier enabled, the request
   *   will be processed using the default service tier with a lower uptime SLA
   *   and no latency guarantee.
   * - If set to 'default', the request will be processed using the default
   *   service tier with a lower uptime SLA and no latency guarantee.
   * - When not set, the default behavior is 'auto'.
   *
   * When this parameter is set, the response body will include the
   * `service_tier` utilized.
   */
  service_tier?: "auto" | "default" | null;

  /**
   * Up to 4 sequences where the API will stop generating further tokens.
   */
  stop?: string | null | string[];

  /**
   * Whether or not to store the output of this chat completion request for use
   * in our
   * [model distillation](https://platform.openai.com/docs/guides/distillation)
   * or [evals](https://platform.openai.com/docs/guides/evals) products.
   */
  store?: boolean | null;

  /**
   * If set, partial message deltas will be sent, like in ChatGPT. Tokens will
   * be sent as data-only
   * [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format)
   * as they become available, with the stream terminated by a `data: [DONE]`
   * message.
   * [Example Python code](https://cookbook.openai.com/examples/how_to_stream_completions).
   */
  stream?: boolean | null;

  /**
   * Options for a streaming response. Only set this when you set
   * `stream: true`.
   */
  stream_options?: ChatCompletionStreamOptions | null;

  /**
   * What sampling temperature to use, between 0 and 2. Higher values like 0.8
   * will make the output more random, while lower values like 0.2 will make it
   * more focused and deterministic.
   *
   * We generally recommend altering this or `top_p` but not both.
   */
  temperature?: number | null;

  /**
   * Controls which (if any) tool is called by the model. `none` means the model
   * will not call any tool and instead generates a message. `auto` means the
   * model can pick between generating a message or calling one or more tools.
   * `required` means the model must call one or more tools. Specifying a
   * particular tool via
   * `{"type": "function", "function": {"name": "my_function"}}` forces the
   * model to call that tool.
   *
   * `none` is the default when no tools are present. `auto` is the default if
   * tools are present.
   */
  tool_choice?: ChatCompletionToolChoiceOption;

  /**
   * A list of tools the model may call. Currently, only functions are supported
   * as a tool. Use this to provide a list of functions the model may generate
   * JSON inputs for. A max of 128 functions are supported.
   */
  tools?: ChatCompletionTool[];

  /**
   * An integer between 0 and 20 specifying the number of most likely tokens to
   * return at each token position, each with an associated log probability.
   * `logprobs` must be set to `true` if this parameter is used.
   */
  top_logprobs?: number | null;

  /**
   * An alternative to sampling with temperature, called nucleus sampling, where
   * the model considers the results of the tokens with top_p probability mass.
   * So 0.1 means only the tokens comprising the top 10% probability mass are
   * considered.
   *
   * We generally recommend altering this or `temperature` but not both.
   */
  top_p?: number | null;

  /**
   * A unique identifier representing your end-user, which can help OpenAI to
   * monitor and detect abuse.
   * [Learn more](https://platform.openai.com/docs/guides/safety-best-practices/end-user-ids).
   */
  user?: string;
}
export namespace ChatCompletionCreateParams {
  /**
   * A function the model may generate JSON inputs for; the element type of the
   * `functions` request parameter.
   *
   * @deprecated
   */
  export interface Function {
    /**
     * The name of the function to be called. Must be a-z, A-Z, 0-9, or contain
     * underscores and dashes, with a maximum length of 64.
     */
    name: string;

    /**
     * A description of what the function does, used by the model to choose when
     * and how to call the function.
     */
    description?: string;

    /**
     * The parameters the function accepts, described as a JSON Schema object.
     * See the [guide](https://platform.openai.com/docs/guides/function-calling)
     * for examples, and the
     * [JSON Schema reference](https://json-schema.org/understanding-json-schema/)
     * for documentation about the format.
     *
     * Omitting `parameters` defines a function with an empty parameter list.
     */
    parameters?: Shared.FunctionParameters;
  }

  // Namespaced aliases of the module-level streaming / non-streaming variants.
  export type ChatCompletionCreateParamsNonStreaming =
    ChatCompletionsAPI.ChatCompletionCreateParamsNonStreaming;

  export type ChatCompletionCreateParamsStreaming =
    ChatCompletionsAPI.ChatCompletionCreateParamsStreaming;
}
/**
* Alias for `ChatCompletionCreateParams`; both names refer to the same type.
*
* @deprecated Use ChatCompletionCreateParams instead
*/
export type CompletionCreateParams = ChatCompletionCreateParams;
/**
* Request parameters for a non-streaming chat completion: every field of
* `ChatCompletionCreateParamsBase`, with `stream` narrowed to `false`, `null`, or
* omitted. Passing this variant to `Completions.create` selects the overload
* typed as `APIPromise<ChatCompletion>`.
*/
export interface ChatCompletionCreateParamsNonStreaming
extends ChatCompletionCreateParamsBase {
/**
* In this variant the field may only be `false`, `null`, or omitted;
* `Completions.create` sends `false` when it is missing or `null`.
*
* If set, partial message deltas will be sent, like in ChatGPT. Tokens will be
* sent as data-only
* [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format)
* as they become available, with the stream terminated by a `data: [DONE]`
* message.
* [Example Python code](https://cookbook.openai.com/examples/how_to_stream_completions).
*/
stream?: false | null;
}
/**
* Alias for `ChatCompletionCreateParamsNonStreaming`; both names refer to the
* same type.
*
* @deprecated Use ChatCompletionCreateParamsNonStreaming instead
*/
export type CompletionCreateParamsNonStreaming =
ChatCompletionCreateParamsNonStreaming;
/**
* Request parameters for a streaming chat completion: every field of
* `ChatCompletionCreateParamsBase`, with `stream` required and fixed to `true`.
* Passing this variant to `Completions.create` selects the overload typed as
* `APIPromise<Stream<ChatCompletionChunk>>`.
*/
export interface ChatCompletionCreateParamsStreaming
extends ChatCompletionCreateParamsBase {
/**
* Required and always `true` in this variant.
*
* If set, partial message deltas will be sent, like in ChatGPT. Tokens will be
* sent as data-only
* [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format)
* as they become available, with the stream terminated by a `data: [DONE]`
* message.
* [Example Python code](https://cookbook.openai.com/examples/how_to_stream_completions).
*/
stream: true;
}
/**
* Alias for `ChatCompletionCreateParamsStreaming`; both names refer to the same
* type.
*
* @deprecated Use ChatCompletionCreateParamsStreaming instead
*/
export type CompletionCreateParamsStreaming =
ChatCompletionCreateParamsStreaming;
/**
* Type-only namespace that merges with the `Completions` resource class, so each
* chat-completion type declared in this module can also be referenced as
* `Completions.X`. Every member is a plain alias resolved through the module's
* self-import `ChatCompletionsAPI`; nothing here exists at runtime.
*/
export namespace Completions {
export type ChatCompletion = ChatCompletionsAPI.ChatCompletion;
export type ChatCompletionAssistantMessageParam =
ChatCompletionsAPI.ChatCompletionAssistantMessageParam;
export type ChatCompletionAudio = ChatCompletionsAPI.ChatCompletionAudio;
export type ChatCompletionAudioParam =
ChatCompletionsAPI.ChatCompletionAudioParam;
export type ChatCompletionChunk = ChatCompletionsAPI.ChatCompletionChunk;
export type ChatCompletionContentPart =
ChatCompletionsAPI.ChatCompletionContentPart;
export type ChatCompletionContentPartImage =
ChatCompletionsAPI.ChatCompletionContentPartImage;
export type ChatCompletionContentPartInputAudio =
ChatCompletionsAPI.ChatCompletionContentPartInputAudio;
export type ChatCompletionContentPartRefusal =
ChatCompletionsAPI.ChatCompletionContentPartRefusal;
export type ChatCompletionContentPartText =
ChatCompletionsAPI.ChatCompletionContentPartText;
export type ChatCompletionFunctionCallOption =
ChatCompletionsAPI.ChatCompletionFunctionCallOption;
export type ChatCompletionFunctionMessageParam =
ChatCompletionsAPI.ChatCompletionFunctionMessageParam;
export type ChatCompletionMessage = ChatCompletionsAPI.ChatCompletionMessage;
export type ChatCompletionMessageParam =
ChatCompletionsAPI.ChatCompletionMessageParam;
export type ChatCompletionMessageToolCall =
ChatCompletionsAPI.ChatCompletionMessageToolCall;
export type ChatCompletionModality =
ChatCompletionsAPI.ChatCompletionModality;
export type ChatCompletionNamedToolChoice =
ChatCompletionsAPI.ChatCompletionNamedToolChoice;
export type ChatCompletionRole = ChatCompletionsAPI.ChatCompletionRole;
export type ChatCompletionStreamOptions =
ChatCompletionsAPI.ChatCompletionStreamOptions;
export type ChatCompletionSystemMessageParam =
ChatCompletionsAPI.ChatCompletionSystemMessageParam;
export type ChatCompletionTokenLogprob =
ChatCompletionsAPI.ChatCompletionTokenLogprob;
export type ChatCompletionTool = ChatCompletionsAPI.ChatCompletionTool;
export type ChatCompletionToolChoiceOption =
ChatCompletionsAPI.ChatCompletionToolChoiceOption;
export type ChatCompletionToolMessageParam =
ChatCompletionsAPI.ChatCompletionToolMessageParam;
export type ChatCompletionUserMessageParam =
ChatCompletionsAPI.ChatCompletionUserMessageParam;
export type CreateChatCompletionRequestMessage =
ChatCompletionsAPI.CreateChatCompletionRequestMessage;
// Request-parameter types. Each `Completion*` name below (without the `Chat`
// prefix) aliases a module-level type that is marked `@deprecated` in favour of
// its `ChatCompletion*` counterpart.
export type ChatCompletionCreateParams =
ChatCompletionsAPI.ChatCompletionCreateParams;
export type CompletionCreateParams =
ChatCompletionsAPI.CompletionCreateParams;
export type ChatCompletionCreateParamsNonStreaming =
ChatCompletionsAPI.ChatCompletionCreateParamsNonStreaming;
export type CompletionCreateParamsNonStreaming =
ChatCompletionsAPI.CompletionCreateParamsNonStreaming;
export type ChatCompletionCreateParamsStreaming =
ChatCompletionsAPI.ChatCompletionCreateParamsStreaming;
export type CompletionCreateParamsStreaming =
ChatCompletionsAPI.CompletionCreateParamsStreaming;
}