specification/cognitiveservices/data-plane/AzureOpenAI/authoring/preview/2025-02-01-preview/azureopenai.yaml

# OpenAPI 2.0 (Swagger) definition of the Azure OpenAI authoring API, version 2025-02-01-preview.
# Covers batches, stored completions, files, fine-tuning jobs, ingestion jobs, models and uploads.
swagger: "2.0"
info:
  title: Azure OpenAI API version 2025-02-01-preview
  description: APIs for fine-tuning and managing deployments of OpenAI models.
  version: 2025-02-01-preview
paths:
  /batches:
    get:
      tags:
        - "Batch:"
      summary: Gets a list of all batches owned by the Azure OpenAI resource.
      operationId: Batch_List
      produces:
        - application/json
      parameters:
        - in: query
          name: after
          description: Identifier for the last batch from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of batches to retrieve. Defaults to 20.
          type: integer
          format: int32
          default: 20
        - in: query
          name: $filter
          description: The OData expression to describe the filtering conditions.
          type: string
        - in: query
          name: $orderby
          description: The OData expression to describe the sorting order.
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/BatchesList"
          headers:
            deployment-enqueued-tokens:
              description: Sum of enqueued tokens of all jobs that target to the deployment.
              type: integer
              format: int64
            deployment-maximum-enqueued-tokens:
              description: Maximum enqueued tokens of the deployment.
              type: integer
              format: int64
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting all batches owned by this account.:
          $ref: ./examples/get_batches.json
    post:
      tags:
        - "Batch:"
      summary: "Creates and executes a batch from an uploaded file of requests.\r\nResponse includes details of the enqueued job including job status.\r\nThe ID of the result file is added to the response once complete."
      operationId: Batch_Create
      consumes:
        - application/json
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: createBatchRequest
          description: The specification of the batch to create and execute.
          required: true
          schema:
            $ref: "#/definitions/BatchCreateRequest"
      responses:
        "201":
          description: The batch has been successfully created.
          schema:
            $ref: "#/definitions/Batch"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Creating a batch.:
          $ref: ./examples/post_batch.json
  /batches/{batch-id}:
    get:
      tags:
        - "Batch:"
      summary: Gets details for a single batch specified by the given batch-id.
      operationId: Batch_Get
      produces:
        - application/json
      parameters:
        - in: path
          name: batch-id
          description: The identifier of the batch.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/Batch"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting a batch.:
          $ref: ./examples/get_batch.json
  /batches/{batch-id}/cancel:
    post:
      tags:
        - "Batch:"
      summary: Cancels the processing of the batch specified by the given batch-id.
      operationId: Batch_Cancel
      produces:
        - application/json
      parameters:
        - in: path
          name: batch-id
          description: The identifier of the batch.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: The batch has been successfully canceled.
          schema:
            $ref: "#/definitions/Batch"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Canceling a batch.:
          $ref: ./examples/cancel_batch.json
  /chat/completions/{stored-completion-id}:
    get:
      tags:
        - "StoredCompletion:"
      summary: Gets stored completion by the given stored completion id.
      operationId: StoredCompletion_Get
      produces:
        - application/json
      parameters:
        - in: path
          name: stored-completion-id
          description: The identifier of the stored completion.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/StoredCompletionResponse"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Gets stored completion by the given stored completion id.:
          $ref: ./examples/get_stored_completion.yaml
    post:
      tags:
        - "StoredCompletion:"
      summary: Update stored completion by the given stored completion id.
      operationId: StoredCompletion_Update
      consumes:
        - application/json
      produces:
        - application/json
      parameters:
        - in: path
          name: stored-completion-id
          description: The identifier of the stored completion.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: updateStoredCompletionRequest
          description: Arbitrary key-value pairs for additional information.
          required: true
          schema:
            $ref: "#/definitions/UpdateStoredCompletionRequest"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/StoredCompletion"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Update stored completion by the given stored completion id.:
          $ref: ./examples/update_stored_completion.yaml
    delete:
      tags:
        - "StoredCompletion:"
      summary: Delete stored completion by the given stored completion id.
      operationId: StoredCompletion_Delete
      produces:
        - application/json
      parameters:
        - in: path
          name: stored-completion-id
          description: The identifier of the stored completion.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: The stored completion was successfully deleted.
          schema:
            $ref: "#/definitions/StoredCompletionDelete"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Delete stored completion by the given stored completion id.:
          $ref: ./examples/delete_stored_completion.yaml
  /chat/completions/{stored-completion-id}/messages:
    get:
      tags:
        - "StoredCompletion:"
      summary: Gets stored completion messages by the given stored completion id.
      operationId: StoredCompletion_GetMessages
      produces:
        - application/json
      parameters:
        - in: path
          name: stored-completion-id
          description: The identifier of the stored completion.
          required: true
          type: string
        - in: query
          name: after
          description: Identifier for the last stored completion message from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of stored completion messages to retrieve. Defaults to 20.
          type: integer
          format: int32
          default: 20
        - in: query
          name: order
          description: Order of the results by message index (ascending or descending). Default to asc.
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/StoredCompletionMessages"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Gets stored completion messages by the given stored completion id.:
          $ref: ./examples/get_stored_completion_messages.yaml
  /chat/completions:
    get:
      tags:
        - "StoredCompletion:"
      summary: Gets list of stored completions.
      operationId: StoredCompletion_List
      produces:
        - application/json
      parameters:
        - in: query
          name: metadata
          description: "Filter by the (key, value) pair in stored completion."
          type: string
        - in: query
          name: model
          description: Filter by model name.
          type: string
        - in: query
          name: after
          description: Identifier for the last stored completion from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of stored completions to retrieve. Defaults to 20.
          type: integer
          format: int32
          default: 20
        - in: query
          name: order
          description: Order of the results by created time (ascending or descending). Default to desc.
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/StoredCompletionList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Gets list of stored completions.:
          $ref: ./examples/get_stored_completion_list.yaml
  /files:
    get:
      tags:
        - "Files:"
      summary: "Gets a list of all files owned by the Azure OpenAI resource.\r\nThese include user uploaded content like files with purpose \"fine-tune\" for training or validation of fine-tuned models\r\nas well as files that are generated by the service such as \"fine-tune-results\" which contains various metrics for the corresponding fine-tune job."
      operationId: Files_List
      produces:
        - application/json
      parameters:
        - in: query
          name: purpose
          description: Only return files with the given purpose.
          type: string
          enum:
            - fine-tune
            - fine-tune-results
            - assistants
            - assistants_output
            - batch
            - batch_output
          x-ms-enum:
            name: Purpose
            modelAsString: true
            values:
              - value: fine-tune
                description: This file contains training data for a fine tune job.
              - value: fine-tune-results
                description: This file contains the results of a fine tune job.
              - value: assistants
                description: This file contains data to be used in assistants.
              - value: assistants_output
                description: This file contains the results of an assistant.
              - value: batch
                description: This file contains the input data for a batch.
              - value: batch_output
                description: This file contains the results of a batch.
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/FileList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting all files owned by this account.:
          $ref: ./examples/get_files.yaml
    post:
      tags:
        - "Files:"
      summary: Creates a new file entity by uploading data from a local machine. Uploaded files can, for example, be used for training or evaluating fine-tuned models.
      operationId: Files_Upload
      consumes:
        - multipart/form-data
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: formData
          name: purpose
          description: The intended purpose of the uploaded documents. Use "fine-tune" for fine-tuning. This allows us to validate the format of the uploaded file.
          required: true
          type: string
          enum:
            - fine-tune
            - fine-tune-results
            - assistants
            - assistants_output
            - batch
          x-ms-enum:
            name: Purpose
            modelAsString: true
            values:
              - value: fine-tune
                description: This file contains training data for a fine tune job.
              - value: fine-tune-results
                description: This file contains the results of a fine tune job.
              - value: assistants
                description: This file contains data to be used in assistants.
              - value: assistants_output
                description: This file contains the results of an assistant.
              - value: batch
                description: This file contains the input data for a batch.
        - in: formData
          name: file
          description: Gets or sets the file to upload into Azure OpenAI.
          required: true
          type: file
      responses:
        "201":
          description: The file has been successfully created.
          schema:
            $ref: "#/definitions/File"
          headers:
            Location:
              description: The location of the newly created item.
              type: string
              format: url
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Upload a file.:
          $ref: ./examples/upload_file.yaml
  /files/import:
    post:
      tags:
        - "Files:"
      summary: Creates a new file entity by importing data from a provided url. Uploaded files can, for example, be used for training or evaluating fine-tuned models.
      operationId: Files_Import
      consumes:
        - application/json
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: fileImport
          description: The definition of the file to create including its purpose, the file name and the url of the file location.
          required: true
          schema:
            $ref: "#/definitions/FileImport"
      responses:
        "201":
          description: The file has been successfully created.
          schema:
            $ref: "#/definitions/File"
          headers:
            Location:
              description: The location of the newly created item.
              type: string
              format: url
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Importing a file with a blob url as source.:
          $ref: ./examples/import_file.yaml
  /files/{file-id}:
    get:
      tags:
        - "Files:"
      summary: Gets details for a single file specified by the given file-id including status, size, purpose, etc.
      operationId: Files_Get
      produces:
        - application/json
      parameters:
        - in: path
          name: file-id
          description: The identifier of the file.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/File"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting a file.:
          $ref: ./examples/get_file.yaml
    delete:
      tags:
        - "Files:"
      summary: "Deletes the file with the given file-id.\r\nDeletion is also allowed if a file was used, e.g., as training file in a fine-tune job."
      operationId: Files_Delete
      produces:
        - application/json
      parameters:
        - in: path
          name: file-id
          description: The identifier of the file.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: The file was successfully deleted.
          schema:
            $ref: "#/definitions/FileDelete"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Deleting a file.:
          $ref: ./examples/delete_file.yaml
  /files/{file-id}/content:
    get:
      tags:
        - "Files:"
      summary: "Gets the content of the file specified by the given file-id.\r\nFiles can be user uploaded content or generated by the service like result metrics of a fine-tune job."
      operationId: Files_GetContent
      produces:
        - application/octet-stream
        - application/json
      parameters:
        - in: path
          name: file-id
          description: The identifier of the file.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            type: file
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting the file content.:
          $ref: ./examples/get_file_content.yaml
  /fine_tuning/jobs:
    get:
      tags:
        - "Fine-tuning:"
      summary: "Gets a list of all fine-tune jobs owned by the Azure OpenAI resource.\r\nThe details that are returned for each fine-tune job contain besides its identifier\r\nthe base model, training and validation files, hyper parameters, time stamps, status and events.\r\nEvents are created when the job status changes, e.g. running or complete, and when results are uploaded."
      operationId: FineTuning_List
      produces:
        - application/json
      parameters:
        - in: query
          name: after
          description: Identifier for the last job from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of jobs to retrieve. Defaults to 20.
          type: integer
          format: int32
          default: 20
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/FineTuningJobList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting all fine tuning jobs owned by this account.:
          $ref: ./examples/get_finetuning_jobs.yaml
    post:
      tags:
        - "Fine-tuning:"
      summary: "Creates a job that fine-tunes a specified model from a given training file.\r\nResponse includes details of the enqueued job including job status and hyper parameters.\r\nThe name of the fine-tuned model is added to the response once complete."
      operationId: FineTuning_Create
      consumes:
        - application/json
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: fineTuningJob
          description: "The specification of the fine-tuned model to create.\r\nRequired parameters are the base model and the training file to use.\r\nOptionally a validation file can be specified to compute validation metrics during training.\r\nHyper parameters will be set to default values or can be optionally specified.\r\nThese include batch size, learning rate multiplier, number of epochs and others."
          required: true
          schema:
            $ref: "#/definitions/FineTuningJobCreation"
      responses:
        "201":
          description: The fine tune has been successfully created.
          schema:
            $ref: "#/definitions/FineTuningJob"
          headers:
            Location:
              description: The location of the newly created item.
              type: string
              format: url
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Creating a fine tuning job.:
          $ref: ./examples/post_finetuning_job.yaml
  /fine_tuning/jobs/{fine-tuning-job-id}:
    get:
      tags:
        - "Fine-tuning:"
      summary: "Gets details for a single fine-tune job specified by the given fine-tune-id.\r\nThe details contain the base model, training and validation files, hyper parameters, time stamps, status and events.\r\nEvents are created when the job status changes, e.g. running or complete, and when results are uploaded."
      operationId: FineTuning_Get
      produces:
        - application/json
      parameters:
        - in: path
          name: fine-tuning-job-id
          description: The identifier of the fine-tune job.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/FineTuningJob"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting a fine tuning job.:
          $ref: ./examples/get_finetuning_job.yaml
    delete:
      tags:
        - "Fine-tuning:"
      summary: Deletes the fine-tune job specified by the given fine-tune-id.
      operationId: FineTuning_Delete
      produces:
        - application/json
      parameters:
        - in: path
          name: fine-tuning-job-id
          description: The identifier of the fine-tune job.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "204":
          description: The fine tune was successfully deleted.
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Deleting a fine tuning job.:
          $ref: ./examples/delete_finetuning_job.yaml
  /fine_tuning/jobs/{fine-tuning-job-id}/cancel:
    post:
      tags:
        - "Fine-tuning:"
      summary: Cancels the processing of the fine-tune job specified by the given fine-tune-id.
      operationId: FineTuning_Cancel
      produces:
        - application/json
      parameters:
        - in: path
          name: fine-tuning-job-id
          description: The identifier of the fine-tune job.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: The fine tune has been successfully canceled.
          schema:
            $ref: "#/definitions/FineTuningJob"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Canceling a fine tuning job.:
          $ref: ./examples/cancel_finetuning_job.yaml
  /fine_tuning/jobs/{fine-tuning-job-id}/checkpoints:
    get:
      tags:
        - "Fine-tuning:"
      summary: "Gets the checkpoints for the fine-tune job specified by the given fine-tune-id.\r\nCheckpoints are created at the end of successful epochs during training."
      operationId: FineTuning_GetCheckpoints
      produces:
        - application/json
      parameters:
        - in: path
          name: fine-tuning-job-id
          description: The identifier of the fine-tune job.
          required: true
          type: string
        - in: query
          name: after
          description: Identifier for the last checkpoint ID from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of checkpoints to retrieve. Defaults to 10.
          type: integer
          format: int32
          default: 10
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/FineTuningJobCheckpointList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting checkpoints of a fine tuning job.:
          $ref: ./examples/get_finetuning_job_checkpoints.yaml
  /fine_tuning/jobs/{fine-tuning-job-id}/events:
    get:
      tags:
        - "Fine-tuning:"
      summary: "Gets the events for the fine-tune job specified by the given fine-tune-id.\r\nEvents are created when the job status changes, e.g. running or complete, and when results are uploaded."
      operationId: FineTuning_GetEvents
      produces:
        - application/json
      parameters:
        - in: path
          name: fine-tuning-job-id
          description: The identifier of the fine-tune job.
          required: true
          type: string
        - in: query
          name: after
          description: Identifier for the last event from the previous pagination request.
          type: string
        - in: query
          name: limit
          description: Number of events to retrieve. Defaults to 20.
          type: integer
          format: int32
          default: 20
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/FineTuningJobEventList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting events of a fine tuning job.:
          $ref: ./examples/get_finetuning_job_events.yaml
  /ingestion/jobs:
    get:
      tags:
        - "Ingestion:"
      summary: Lists the ingestion jobs.
      operationId: IngestionJobs_List
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: header
          name: mgmt-user-token
          type: string
          description: The token used to access the workspace (needed only for user compute jobs).
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/IngestionJobList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        List all ingestion jobs:
          $ref: ./examples/list_ingestion_jobs.json
  /ingestion/jobs/{job-id}:
    put:
      tags:
        - "Ingestion:"
      summary: Creates an ingestion job with the specified job id.
      operationId: IngestionJobs_Create
      consumes:
        - application/json
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: path
          name: job-id
          required: true
          type: string
          description: The id of the job that will be created.
        - in: header
          name: mgmt-user-token
          type: string
          description: The token used to access the workspace (needed only for user compute jobs).
        - in: header
          name: aml-user-token
          type: string
          description: The token used to access the resources within the job in the workspace (needed only for user compute jobs).
        - in: body
          name: ingestionJob
          description: The definition of the ingestion job to create.
          schema:
            $ref: "#/definitions/IngestionJob"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/IngestionJob"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Create a system-compute ingestion job:
          $ref: ./examples/put_ingestion_job_sc.json
        Create a user-compute ingestion job:
          $ref: ./examples/put_ingestion_job_uc.json
    get:
      tags:
        - "Ingestion:"
      summary: Gets the details of the specified job id.
      operationId: IngestionJobs_Get
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: path
          name: job-id
          required: true
          description: The id of the job.
          type: string
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/IngestionJob"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Get ingestion job:
          $ref: ./examples/get_ingestion_job.json
  /ingestion/jobs/{job-id}/runs:
    get:
      tags:
        - "Ingestion:"
      summary: Lists the runs of the specified job id.
      operationId: IngestionJobRuns_List
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: path
          name: job-id
          required: true
          description: The id of the job.
          type: string
        - in: header
          name: mgmt-user-token
          type: string
          description: The token used to access the workspace (needed only for user compute jobs).
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/IngestionJobRunList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        List ingestion job runs:
          $ref: ./examples/list_ingestion_job_runs.json
  /ingestion/jobs/{job-id}/runs/{run-id}:
    get:
      tags:
        - "Ingestion:"
      summary: Gets the details of the specified run id as part of the specified job id.
      operationId: IngestionJobRuns_Get
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: path
          name: job-id
          required: true
          description: The id of the job.
          type: string
        - in: path
          name: run-id
          required: true
          description: The id of the run.
          type: string
        - in: header
          name: mgmt-user-token
          type: string
          description: The token used to access the workspace (needed only for user compute jobs).
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/IngestionJobRun"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Get ingestion job runs:
          $ref: ./examples/get_ingestion_job_run.json
  /models:
    get:
      tags:
        - "Models:"
      summary: "Gets a list of all models that are accessible by the Azure OpenAI resource.\r\nThese include base models as well as all successfully completed fine-tuned models owned by the Azure OpenAI resource."
      operationId: Models_List
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/ModelList"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting all models owned by account.:
          $ref: ./examples/get_models.yaml
  /models/{model-id}:
    get:
      tags:
        - "Models:"
      summary: Gets details for the model specified by the given modelId.
      operationId: Models_Get
      produces:
        - application/json
      parameters:
        - in: path
          name: model-id
          description: The identifier of the model.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/Model"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Getting a base model.:
          $ref: ./examples/get_model_base.yaml
        Getting a fine-tuned model.:
          $ref: ./examples/get_model_finetune.yaml
  /uploads:
    post:
      tags:
        - "UploadFile:"
      summary: "An intermediate Upload object is created, allowing you to add Parts to it. Currently, an Upload size can be a maximum of 9 GB in total and will expire two hours after being created.\r\nAfter the Upload is completed a File object will be generated, containing all the uploaded parts. This File object can then be used across our platform just like any other file."
      operationId: UploadFile_Start
      consumes:
        - application/json
        - text/json
        - application/*+json
      produces:
        - application/json
      parameters:
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: requestBody
          description: The definition of the file to create including its purpose and the location on the local machine.
          required: true
          schema:
            $ref: "#/definitions/UploadFileStartBody"
      responses:
        "200":
          description: The upload has been successfully created.
          schema:
            $ref: "#/definitions/UploadResource"
          headers:
            Location:
              description: The location of the newly created item.
              type: string
              format: url
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Start a large file upload operation.:
          $ref: ./examples/upload_file_start.yaml
  /uploads/{upload-id}/cancel:
    post:
      tags:
        - "UploadFile:"
      summary: "Cancels the Upload, and will lead to all uploaded parts to be deleted asynchronously.\r\nNo Parts may be added after an Upload is cancelled."
      operationId: UploadFile_Cancel
      produces:
        - application/json
      parameters:
        - in: path
          name: upload-id
          description: The identifier of the upload.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/UploadResource"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Cancel a large file upload operation.:
          $ref: ./examples/upload_file_cancel.yaml
  /uploads/{upload-id}/complete:
    post:
      tags:
        - "UploadFile:"
      summary: "This completes the Upload, and the returned Upload object contains a nested File object that is ready for use across the platform.\r\nYou can define the order of the Parts by providing an ordered list of Part IDs.\r\nThe total number of bytes uploaded must match the size originally specified when creating the Upload object.\r\nAfter this operation no additional Parts can be added once the Upload is completed."
      operationId: UploadFile_Complete
      consumes:
        - application/json
        - text/json
        - application/*+json
      produces:
        - application/json
      parameters:
        - in: path
          name: upload-id
          description: The identifier of the upload.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: body
          name: requestBody
          description: The definition of how to complete the upload, including the ordered list of Part IDs.
          required: true
          schema:
            $ref: "#/definitions/UploadFileCompleteBody"
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/UploadResource"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Complete and validate a large file upload operation.:
          $ref: ./examples/upload_file_complete.yaml
  /uploads/{upload-id}/parts:
    post:
      tags:
        - "UploadFile:"
      summary: "Adds a Part to an Upload object, where each Part represents a segment of the file you are uploading.\r\nEach Part can be up to the standard size limit for file upload, based on the File Purpose. You can continue adding Parts until reaching the Upload size limit of 9 GB."
      operationId: UploadFile_Part
      consumes:
        - multipart/form-data
      produces:
        - application/json
      parameters:
        - in: path
          name: upload-id
          description: The identifier of the upload.
          required: true
          type: string
        - $ref: "#/parameters/apiVersionQueryParameter"
        - in: formData
          name: data
          description: The file Part to add to the Upload.
          required: true
          type: file
      responses:
        "200":
          description: Success
          schema:
            $ref: "#/definitions/UploadPartResource"
        default:
          description: An error occurred.
          schema:
            $ref: "#/definitions/ErrorResponse"
      x-ms-examples:
        Upload a part of large file upload operation.:
          $ref: ./examples/upload_file_part.yaml
definitions:
  AzureAISearchIndex:
    description: Azure AI Search Index.
    required:
      - connectionId
    allOf:
      - $ref: "#/definitions/TargetIndex"
      - type: object
        properties:
          connectionId:
            type: string
            description: The id of the connection pointing to the Azure AI Search Index.
    x-ms-discriminator-value: AzureAISearch
  BaseConnection:
    title: BaseConnection
    description: A connection to a resource.
    type: object
    required:
      - kind
    properties:
      kind:
        $ref: "#/definitions/ConnectionType"
    discriminator: kind
  Batch:
    title: Batch
    description: Defines the values of a batch.
    required:
      - id
      - input_file_id
    type: object
    properties:
      id:
        description: The identity of this item.
        type: string
      object:
        $ref: "#/definitions/TypeDiscriminator"
      endpoint:
        description: The API endpoint used by the batch.
        type: string
        readOnly: true
      errors:
        $ref: "#/definitions/BatchErrors"
      input_file_id:
        description: The ID of the input file for the batch.
        minLength: 1
        type: string
      completion_window:
        description: The time frame within which the batch should be processed.
        type: string
      status:
        $ref: "#/definitions/BatchStatus"
      output_file_id:
        description: The ID of the file containing outputs of successfully executed requests.
        type: string
      error_file_id:
        description: The ID of the file containing outputs of requests with errors.
        type: string
      created_at:
        format: unixtime
        description: A timestamp when this batch was created (in unix epochs).
        type: integer
        readOnly: true
      in_progress_at:
        format: unixtime
        description: A timestamp when this batch started progressing (in unix epochs).
        type: integer
        readOnly: true
      expires_at:
        format: unixtime
        description: A timestamp when this batch will expire (in unix epochs).
        type: integer
        readOnly: true
      finalizing_at:
        format: unixtime
        description: A timestamp when this batch started finalizing (in unix epochs).
        type: integer
        readOnly: true
      completed_at:
        format: unixtime
        description: A timestamp when this batch was completed (in unix epochs).
        type: integer
        readOnly: true
      failed_at:
        format: unixtime
        description: A timestamp when this batch failed (in unix epochs).
        type: integer
        readOnly: true
      expired_at:
        format: unixtime
        description: A timestamp when this batch expired (in unix epochs).
        type: integer
        readOnly: true
      cancelling_at:
        format: unixtime
        description: A timestamp when this batch started cancelling (in unix epochs).
        type: integer
        readOnly: true
      cancelled_at:
        format: unixtime
        description: A timestamp when this batch was cancelled (in unix epochs).
        type: integer
        readOnly: true
      request_counts:
        $ref: "#/definitions/BatchRequestCounts"
      metadata:
        description: A set of key-value pairs that can be attached to the batch. This can be useful for storing additional information about the batch in a structured format.
        type: object
        additionalProperties:
          type: string
  BatchCreateRequest:
    title: BatchCreateRequest
    description: Defines the request to create a batch.
    required:
      - input_file_id
      - endpoint
      - completion_window
    type: object
    properties:
      input_file_id:
        description: The ID of the input file for the batch.
        minLength: 1
        type: string
      endpoint:
        description: The API endpoint used by the batch.
        type: string
      completion_window:
        description: The time frame within which the batch should be processed.
        type: string
      metadata:
        description: A set of key-value pairs that can be attached to the batch. This can be useful for storing additional information about the batch in a structured format.
        type: object
        additionalProperties:
          type: string
  BatchErrorData:
    title: BatchErrorData
    description: Error information for a failure in batch.
    type: object
    properties:
      code:
        description: An error code identifying the error type.
        type: string
      message:
        description: A human-readable message providing more details about the error.
        type: string
      param:
        description: The name of the parameter that caused the error, if applicable (can be null).
        type: string
      line:
        description: The line number of the input file where the error occurred, if applicable (can be null).
        type: string
  BatchErrors:
    title: BatchErrors
    description: For batches that have failed, this will contain more information on the cause of the failures.
    type: object
    properties:
      object:
        description: The type of the errors object. This is always 'list'.
        type: string
      # NOTE(review): `object` is documented as always 'list', yet `data` references a single
      # BatchErrorData rather than an array of them - confirm against the service response
      # before changing, since the type is part of the wire contract.
      data:
        $ref: "#/definitions/BatchErrorData"
  BatchRequestCounts:
    title: BatchRequestCounts
    description: The request counts for different statuses within the batch.
    type: object
    properties:
      total:
        description: The total number of requests in the batch.
        type: integer
      completed:
        description: The number of requests in the batch that have been completed successfully.
        type: integer
      failed:
        description: The number of requests in the batch that have failed.
        type: integer
  BatchStatus:
    title: BatchStatus
    description: The status of a batch.
    enum:
      - validating
      - failed
      - in_progress
      - finalizing
      - completed
      - expired
      - cancelling
      - cancelled
    type: string
    readOnly: true
    x-ms-enum:
      name: BatchStatus
      modelAsString: true
      values:
        - value: validating
          description: The input file is being validated before the batch can begin.
        - value: failed
          description: The input file has failed the validation process.
        - value: in_progress
          description: The input file was successfully validated and the batch is currently being executed.
        - value: finalizing
          description: The batch has completed and the results are being prepared.
        - value: completed
          description: The batch has been completed and the results are ready.
        - value: expired
          description: The batch was not able to complete within the 24-hour time window.
        - value: cancelling
          description: Cancellation of the batch has been initiated.
        - value: cancelled
          description: The batch was cancelled.
  BatchesList:
    title: BatchList
    description: Represents a list of batches.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/Batch"
      first_id:
        description: The id of the first batch in the list of batches returned.
        type: string
      last_id:
        description: The id of the last batch in the list of batches returned.
        type: string
      has_more:
        description: A value indicating whether the list contains more elements than returned.
        type: boolean
  Capabilities:
    title: Capabilities
    description: The capabilities of a base or fine tune model.
    required:
      - chat_completion
      - completion
      - embeddings
      - fine_tune
      - inference
    type: object
    properties:
      fine_tune:
        description: A value indicating whether a model can be used for fine tuning.
        type: boolean
      inference:
        description: A value indicating whether a model can be deployed.
        type: boolean
      completion:
        description: A value indicating whether a model supports completion.
        type: boolean
      chat_completion:
        description: A value indicating whether a model supports chat completion.
type: boolean embeddings: description: A value indicating whether a model supports embeddings. type: boolean Choice: title: Choice type: object properties: index: format: int32 description: The index of the choice in the list of choices. type: integer message: $ref: '#/definitions/ChoiceMessage' finish_reason: description: The reason the model stopped generating tokens. type: string logprobs: title: Dictionary`2 description: Log probability information for the choice. type: object additionalProperties: $ref: '#/definitions/Logprob' ChoiceMessage: title: ChoiceMessage type: object properties: content: description: The contents of the message. type: string role: description: The role of the entity that is creating the message. type: string tool_calls: description: A list of the relevant tool calls. type: array items: $ref: '#/definitions/ToolCall' ChunkingSettings: type: object title: ChunkingSettings description: Chunking settings properties: maxChunkSizeInTokens: type: integer CompletionAction: type: string description: The completion action. enum: - cleanUpTempAssets - keepAllAssets x-ms-enum: name: IngestionJobCompletionAction modelAsString: true values: - name: keepAllAssets value: keepAllAssets description: Will not clean up any of the intermediate assets created during the ingestion process. - name: cleanUpTempAssets value: cleanUpTempAssets description: Will clean up intermediate assets created during the ingestion process. ComputeType: type: string description: The compute type. enum: - ServerlessCompute - CustomCompute x-ms-enum: name: ComputeType modelAsString: true values: - name: ServerlessCompute value: ServerlessCompute description: Serverless user compute. - name: CustomCompute value: CustomCompute description: Custom user compute. ConnectionStringConnection: description: Connection string connection. 
required: - connectionString allOf: - $ref: "#/definitions/BaseConnection" - type: object properties: connectionString: type: string description: Connection string x-ms-discriminator-value: ConnectionString ConnectionType: type: string description: The connection type. enum: - EndpointWithKey - ConnectionString - EndpointWithManagedIdentity - WorkspaceConnection - RelativeConnection x-ms-enum: name: ConnectionType modelAsString: true values: - name: EndpointWithKey value: EndpointWithKey description: Endpoint and key connection. - name: ConnectionString value: ConnectionString description: Connection string. - name: EndpointWithManagedIdentity value: EndpointWithManagedIdentity description: Endpoint and managed identity. - name: WorkspaceConnection value: WorkspaceConnection description: AML Workspace connection. - name: RelativeConnection value: RelativeConnection description: Relative deployment CosmosDBIndex: description: CosmosDB Index. required: - connectionId allOf: - $ref: "#/definitions/TargetIndex" - type: object properties: connectionId: type: string description: The id of the connection pointing to the cosmos DB. collectionName: type: string description: The name of the cosmos DB collection. databaseName: type: string description: The name of the cosmos DB database. x-ms-discriminator-value: CosmosDB CrawlingSettings: type: object title: CrawlingSettings description: Crawling settings properties: maxCrawlDepth: type: integer maxCrawlTimeInMins: type: integer maxDownloadTimeInMins: type: integer maxFileSize: type: integer maxRedirects: type: integer maxFiles: type: integer CustomCompute: description: Custom compute. required: - computeId allOf: - $ref: "#/definitions/JobCompute" - type: object properties: computeId: type: string description: Id of the custom compute x-ms-discriminator-value: CustomCompute DeploymentConnection: description: Relative deployment connection. 
allOf: - $ref: "#/definitions/BaseConnection" x-ms-discriminator-value: RelativeConnection Deprecation: title: Deprecation description: "Defines the dates of deprecation for the different use cases of a model.\r\nUsually base models support 1 year of fine tuning after creation. Inference is typically supported 2 years after creation of base or\r\nfine tuned models. The exact dates are specified in the properties." required: - inference type: object properties: fine_tune: format: unixtime description: The end date of fine tune support of this model. Will be `null` for fine tune models. type: integer inference: format: unixtime description: The end date of inference support of this model. type: integer DpoHyperparamsRequest: title: DpoHyperparamsRequest type: object properties: n_epochs: type: integer description: The number of epochs to train the model for. An epoch refers to one full cycle through the training dataset. format: int32 batch_size: type: integer description: "The batch size to use for training. The batch size is the number of training examples used to train a single forward and backward pass.\r\nIn general, we've found that larger batch sizes tend to work better for larger datasets.\r\nThe default value as well as the maximum value for this property are specific to a base model." format: int32 learning_rate_multiplier: type: number description: "The learning rate multiplier to use for training. The fine-tuning learning rate is the original learning rate used for pre-training multiplied by this value.\r\nLarger learning rates tend to perform better with larger batch sizes.\r\nWe recommend experimenting with values in the range 0.02 to 0.2 to see what produces the best results." format: double beta: type: number description: Dpo beta value. 
format: double l2_multiplier: type: number description: L2 regularization multiplier format: double description: Hyperparameters for DPO method of finetuning DpoMethod: title: DpoMethod required: - dpo - type type: object allOf: - $ref: '#/definitions/FineTuneMethod' properties: type: $ref: '#/definitions/FineTuningMethodType' dpo: $ref: '#/definitions/DpoMethodConfigRequest' description: Request for DPO method finetuning DpoMethodConfigRequest: title: DpoMethodConfigRequest type: object properties: hyperparameters: $ref: '#/definitions/DpoHyperparamsRequest' description: Configuration for dpo finetuning method. Includes DPO specific hyperparameters DpoMethodRequest: title: DpoMethodRequest required: - dpo - type type: object allOf: - $ref: '#/definitions/FineTuneMethodRequest' properties: type: $ref: '#/definitions/FineTuningMethodType' dpo: $ref: '#/definitions/DpoMethodConfigRequest' description: Request for DPO method finetuning EndpointKeyConnection: description: Endpoint key connection. required: - endpoint - key allOf: - $ref: "#/definitions/BaseConnection" - type: object properties: endpoint: type: string description: Endpoint key: type: string description: Key x-ms-discriminator-value: EndpointWithKey EndpointMIConnection: description: Endpoint Managed Identity connection. required: - endpoint allOf: - $ref: "#/definitions/BaseConnection" - type: object properties: endpoint: type: string description: Endpoint resourceId: type: string description: Resource Id x-ms-discriminator-value: EndpointWithManagedIdentity Error: title: Error description: "Error content as defined in the Microsoft REST guidelines\r\n(https://github.com/microsoft/api-guidelines/blob/vNext/Guidelines.md#7102-error-condition-responses)." required: - code - message type: object properties: code: $ref: "#/definitions/ErrorCode" message: description: The message of this error. minLength: 1 type: string target: description: The location where the error happened if available. 
type: string details: description: The error details if available. type: array items: $ref: "#/definitions/Error" innererror: $ref: "#/definitions/InnerError" ErrorCode: title: ErrorCode description: "Error codes as defined in the Microsoft REST guidelines\r\n(https://github.com/microsoft/api-guidelines/blob/vNext/Guidelines.md#7102-error-condition-responses)." enum: - conflict - invalidPayload - forbidden - notFound - unexpectedEntityState - itemDoesAlreadyExist - serviceUnavailable - internalFailure - quotaExceeded - jsonlValidationFailed - fileImportFailed - tooManyRequests - unauthorized - contentFilter type: string x-ms-enum: name: ErrorCode modelAsString: true values: - value: conflict description: The requested operation conflicts with the current resource state. - value: invalidPayload description: The request data is invalid for this operation. - value: forbidden description: The operation is forbidden for the current user/api key. - value: notFound description: The resource is not found. - value: unexpectedEntityState description: The operation cannot be executed in the current resource's state. - value: itemDoesAlreadyExist description: The item does already exist. - value: serviceUnavailable description: The service is currently not available. - value: internalFailure description: Internal error. Please retry. - value: quotaExceeded description: Quota exceeded. - value: jsonlValidationFailed description: Validation of jsonl data failed. - value: fileImportFailed description: Import of file failed. - value: tooManyRequests description: Too many requests. Please retry later. - value: unauthorized description: The current user/api key is not authorized for the operation. - value: contentFilter description: Image generation failed as a result of our safety system. 
# definitions (continued): error envelope, event type, files, fine-tuning job.
  ErrorResponse:
    title: ErrorResponse
    description: "Error response as defined in the Microsoft REST guidelines\r\n(https://github.com/microsoft/api-guidelines/blob/vNext/Guidelines.md#7102-error-condition-responses)."
    required:
      - error
    type: object
    properties:
      error:
        $ref: "#/definitions/Error"
  EventType:
    title: EventType
    description: Defines the type of an event.
    enum:
      - message
      - metrics
    type: string
    x-ms-enum:
      name: EventType
      modelAsString: true
      values:
        - value: message
          description: Event only contains human readable messages.
        - value: metrics
          description: Event contains metrics.
  File:
    title: File
    description: A file is a document usable for training and validation. It can also be a service generated document with result details.
    required:
      - filename
      - purpose
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      created_at:
        format: unixtime
        description: A timestamp when this job or item was created (in unix epochs).
        type: integer
        readOnly: true
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      status:
        $ref: "#/definitions/FileState"
      bytes:
        format: int64
        description: "The size of this file when available (can be null). File sizes larger than 2^53-1 are not supported to ensure compatibility\r\nwith JavaScript integers."
        type: integer
        readOnly: true
      purpose:
        $ref: "#/definitions/Purpose"
      filename:
        description: The name of the file.
        minLength: 1
        type: string
      status_details:
        description: The error message with details in case processing of this file failed.
        type: string
        readOnly: true
    readOnly: true
  FileCreate:
    title: FileCreate
    description: Defines a document to import from an external content url to be usable with Azure OpenAI.
    required:
      - content_url
      - purpose
    type: object
    properties:
      purpose:
        $ref: "#/definitions/Purpose"
      content_url:
        format: url
        description: The url to download the document from (can be SAS url of a blob or any other external url accessible with a GET request).
        type: string
  FileDetails:
    title: FileDetails
    description: A file detail is a document used by batch service to fetch file blob details.
    required:
      - filename
      - purpose
    type: object
    properties:
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      filename:
        description: The name of the file.
        minLength: 1
        type: string
      path:
        description: The relative path to the file within the container.
        type: string
        readOnly: true
      storage_account_uri:
        format: url
        description: The storage account url of this file.
        type: string
        readOnly: true
      storage_container_name:
        description: The Storage Container Name of this file blob.
        type: string
        readOnly: true
      purpose:
        $ref: "#/definitions/Purpose"
  FileDelete:
    title: FileDelete
    required:
      - deleted
      - id
      - object
    type: object
    properties:
      object:
        minLength: 1
        type: string
        description: The file object.
      deleted:
        type: boolean
        description: A value indicating whether the file was deleted.
      id:
        minLength: 1
        type: string
        description: The file-id that was deleted.
    description: Defines the response for File Delete.
  FileImport:
    title: FileImport
    description: Defines a document to import from an external content url to be usable with Azure OpenAI.
    required:
      - content_url
      - filename
      - purpose
    type: object
    properties:
      purpose:
        $ref: "#/definitions/Purpose"
      filename:
        description: "The name of the [JSON Lines](https://jsonlines.readthedocs.io/en/latest/) file to be uploaded.\r\nIf the `purpose` is set to \"fine-tune\", each line is a JSON record with \"prompt\" and \"completion\" fields representing your training examples."
        minLength: 1
        type: string
      content_url:
        format: url
        description: The url to download the document from (can be SAS url of a blob or any other external url accessible with a GET request).
        type: string
  FileList:
    title: FileList
    description: Represents a list of files.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/File"
  FileState:
    title: FileState
    description: The state of a file.
    enum:
      - uploaded
      - pending
      - running
      - processed
      - error
      - deleting
      - deleted
    type: string
    readOnly: true
    x-ms-enum:
      name: FileState
      modelAsString: true
      values:
        - value: uploaded
          description: >-
            The file has been uploaded but it's not yet processed. This state
            is not returned by Azure OpenAI and exposed only for
            compatibility. It can be categorized as an inactive state.
        - value: pending
          description: >-
            The operation was created and is not queued to be processed in
            the future. It can be categorized as an inactive state.
        - value: running
          description: >-
            The operation has started to be processed. It can be categorized
            as an active state.
        - value: processed
          description: >-
            The operation has successfully been processed and is ready for
            consumption. It can be categorized as a terminal state.
        - value: error
          description: >-
            The operation has completed processing with a failure and cannot
            be further consumed. It can be categorized as a terminal state.
        - value: deleting
          description: >-
            The entity is in the process of being deleted. This state is not
            returned by Azure OpenAI and exposed only for compatibility. It
            can be categorized as an active state.
        - value: deleted
          description: >-
            The entity has been deleted but may still be referenced by other
            entities predating the deletion. It can be categorized as a
            terminal state.
  # Polymorphic base for fine-tuning methods; `kind` is the discriminator.
  FineTuneMethod:
    title: FineTuneMethod
    required:
      - kind
    type: object
    properties:
      kind:
        $ref: "#/definitions/FineTuningMethodType"
    discriminator: kind
  FineTuneMethodRequest:
    title: FineTuneMethodRequest
    required:
      - kind
    type: object
    properties:
      kind:
        $ref: "#/definitions/FineTuningMethodType"
    discriminator: kind
  FineTuningHyperParameters:
    title: FineTuningHyperParameters
    description: The hyper parameter settings used in a fine tune job.
    type: object
    properties:
      n_epochs:
        format: int32
        description: The number of epochs to train the model for. An epoch refers to one full cycle through the training dataset.
        type: integer
      batch_size:
        format: int32
        description: "The batch size to use for training. The batch size is the number of training examples used to train a single forward and backward pass.\r\nIn general, we've found that larger batch sizes tend to work better for larger datasets.\r\nThe default value as well as the maximum value for this property are specific to a base model."
        type: integer
      learning_rate_multiplier:
        format: double
        description: "The learning rate multiplier to use for training. The fine-tuning learning rate is the original learning rate used for pre-training multiplied by this value.\r\nLarger learning rates tend to perform better with larger batch sizes.\r\nWe recommend experimenting with values in the range 0.02 to 0.2 to see what produces the best results."
        type: number
  FineTuningJob:
    title: FineTuningJob
    description: Defines the values of a fine tune job.
    required:
      - model
      - training_file
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      created_at:
        format: unixtime
        description: A timestamp when this job or item was created (in unix epochs).
        type: integer
        readOnly: true
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      status:
        $ref: "#/definitions/FineTuningState"
      model:
        description: The identifier (model-id) of the base model used for the fine-tune.
        minLength: 1
        type: string
      fine_tuned_model:
        description: "The identifier (model-id) of the resulting fine tuned model. This property is only populated for successfully completed fine-tune runs.\r\nUse this identifier to create a deployment for inferencing."
        type: string
      training_file:
        description: The file which is used for training.
        minLength: 1
        type: string
      validation_file:
        description: The file which is used to evaluate the fine tuned model during training.
        type: string
      result_files:
        description: "The result file identities (file-id) containing training and evaluation metrics in csv format.\r\nThe file is only available for successfully completed fine-tune runs."
        type: array
        items:
          type: string
      # NOTE(review): this timestamp uses `int32` while `created_at` uses
      # `unixtime`; confirm whether the difference is intentional.
      finished_at:
        format: int32
        description: A timestamp when this job or item has finished successfully (in unix epochs).
        type: integer
      organisation_id:
        description: The organisation id of this fine tune job. Unused on Azure OpenAI; compatibility for OpenAI only.
        type: string
      trained_tokens:
        format: int32
        description: The total number of billable tokens processed by this fine tuning job.
        type: integer
        readOnly: true
      error:
        $ref: "#/definitions/FineTuningJobError"
      # NOTE(review): same `int32` vs `unixtime` question as `finished_at`.
      estimated_finish:
        format: int32
        description: The Unix timestamp (in seconds) for when the fine-tuning job is estimated to finish. The value will be null if the fine-tuning job is not running.
        type: integer
      hyperparameters:
        $ref: "#/definitions/FineTuningHyperParameters"
      suffix:
        description: The suffix used to identify the fine-tuned model. The suffix can contain up to 40 characters (a-z, A-Z, 0-9,- and _) that will be added to your fine-tuned model name.
        type: string
      seed:
        format: int32
        description: The seed used for the finetuning job.
        type: integer
      integrations:
        type: array
        items:
          $ref: "#/definitions/WandBIntegrationRequestWrapper"
        description: "A list of configurations for integrations supporting the fine-tuning job.\r\nThere are many integrations planned, so make sure to check and act on the integration type."
      # NOTE(review): `enum` entries here are `$ref` objects, apparently
      # standing in for a "one of" choice that Swagger 2.0 cannot express;
      # confirm how the consuming tooling interprets this.
      method:
        title: FineTuneMethod
        enum:
          - $ref: "#/definitions/SupervisedMethod"
          - $ref: "#/definitions/DpoMethod"
        description: A configuration for finetuning method for the finetuning job. Currently 'dpo' and 'supervised' methods are supported.
# definitions (continued): fine-tuning checkpoints/events/lists, function
# metadata, and ingestion jobs.
  FineTuningJobCheckpoint:
    title: FineTuningJobCheckpoint
    required:
      - created_at
      - fine_tuned_model_checkpoint
      - fine_tuning_job_id
      - metrics
      - step_number
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      id:
        type: string
        description: The identity of this checkpoint.
        readOnly: true
      created_at:
        type: integer
        description: The Unix timestamp (in seconds) for when the checkpoint was created.
        format: unixtime
      fine_tuned_model_checkpoint:
        minLength: 1
        type: string
        description: The name of the fine-tuned checkpoint model that is created.
      step_number:
        type: integer
        description: The step number that the checkpoint was created at.
        format: int32
      metrics:
        title: Dictionary`2
        type: object
        additionalProperties:
          type: number
          format: double
        description: The metrics at the step number during the fine-tuning job.
      fine_tuning_job_id:
        minLength: 1
        type: string
        description: The name of the fine-tuning job that this checkpoint was created from.
  FineTuningJobCheckpointList:
    title: FineTuningJobCheckpointList
    description: Represents a list of checkpoints.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/FineTuningJobCheckpoint"
      has_more:
        description: A value indicating whether the list contains more elements than returned.
        type: boolean
  FineTuningJobCreation:
    title: FineTuningJobCreation
    description: Defines the values of a fine tune job.
    required:
      - model
      - training_file
    type: object
    properties:
      model:
        description: The identifier (model-id) of the base model used for this fine-tune.
        minLength: 1
        type: string
      training_file:
        description: The file identity (file-id) that is used for training this fine tuned model.
        minLength: 1
        type: string
      validation_file:
        description: The file identity (file-id) that is used to evaluate the fine tuned model during training.
        type: string
      hyperparameters:
        $ref: "#/definitions/FineTuningHyperParameters"
      suffix:
        description: The suffix used to identify the fine-tuned model. The suffix can contain up to 40 characters (a-z, A-Z, 0-9,- and _) that will be added to your fine-tuned model name.
        type: string
      seed:
        format: int32
        description: The seed used for the finetuning job. Passing in the same seed and job parameters should produce the same results, but may differ in rare cases. If a seed is not specified, one will be generated for you.
        type: integer
      integrations:
        type: array
        items:
          $ref: "#/definitions/WandBIntegrationRequestWrapper"
        description: "A list of configurations for integrations supporting the fine-tuning job.\r\nThere are many integrations planned, so make sure to check and act on the integration type."
      # NOTE(review): `enum` entries here are `$ref` objects, apparently
      # standing in for a "one of" choice that Swagger 2.0 cannot express;
      # confirm how the consuming tooling interprets this.
      method:
        title: FineTuneMethodRequest
        enum:
          - $ref: "#/definitions/SupervisedMethodRequest"
          - $ref: "#/definitions/DpoMethodRequest"
        description: A configuration for finetuning method for the finetuning job. Currently 'dpo' and 'supervised' methods are supported.
  FineTuningJobError:
    title: FineTuningJobError
    description: For fine-tuning jobs that have failed, this will contain more information on the cause of the failure.
    type: object
    properties:
      code:
        description: The machine-readable error code.
        type: string
      message:
        description: The human-readable error message.
        type: string
      param:
        description: The parameter that was invalid, usually training_file or validation_file. This field will be null if the failure was not parameter-specific.
        type: string
  FineTuningJobEvent:
    title: FineTuningJobEvent
    required:
      - created_at
      - level
      - message
      - type
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      id:
        description: The identity of this event.
        type: string
        readOnly: true
      created_at:
        format: unixtime
        description: A timestamp when this event was created (in unix epochs).
        type: integer
      level:
        $ref: "#/definitions/LogLevel"
      message:
        description: The message describing the event. This can be a change of state, e.g., enqueued, started, failed or completed, or other events like uploaded results.
        minLength: 1
        type: string
      type:
        $ref: "#/definitions/EventType"
      # No `type` is declared for `data`, so the schema places no constraint
      # on its shape.
      data:
        description: Machine readable data of this event.
  FineTuningJobEventList:
    title: FineTuningJobEventList
    description: Represents a list of events.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/FineTuningJobEvent"
      has_more:
        description: A value indicating whether the list contains more elements than returned.
        type: boolean
  FineTuningJobList:
    title: FineTuningJobList
    description: Represents a list of fine tunes.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/FineTuningJob"
      has_more:
        description: A value indicating whether the list contains more elements than returned.
        type: boolean
  FineTuningState:
    title: FineTuningState
    description: The state of a finetunes object or fine tuning job.
    enum:
      - created
      - pending
      - running
      - succeeded
      - cancelled
      - failed
    type: string
    readOnly: true
    x-ms-enum:
      name: FineTuningState
      modelAsString: true
      values:
        - value: created
          description: The operation was created. This state is not returned by Azure OpenAI and exposed only for compatibility. It can be categorized as an inactive state.
        - value: pending
          description: The operation is not yet queued to be processed in the future. It can be categorized as an inactive state.
        - value: running
          description: The operation has started to be processed. It can be categorized as an active state.
        - value: succeeded
          description: The operation has successfully been processed and is ready for consumption. It can be categorized as a terminal state.
        - value: cancelled
          description: The operation has been cancelled and is incomplete. It can be categorized as a terminal state.
        - value: failed
          description: The operation has completed processing with a failure and cannot be further consumed. It can be categorized as a terminal state.
  FineTuningMethodType:
    title: FineTuningMethodType
    enum:
      - dpo
      - supervised
    type: string
    x-ms-enum:
      name: FineTuningMethodType
      modelAsString: true
      values:
        - value: dpo
          description: Finetunes using Dpo algorithm
        - value: supervised
          description: Finetunes using Supervised algorithm
  FunctionCallFunction:
    title: FunctionCallFunction
    type: object
    properties:
      name:
        description: The name of the function.
        type: string
      arguments:
        description: The arguments that the model expects you to pass to the function.
        type: string
  FunctionDefinition:
    title: FunctionDefinition
    type: object
    properties:
      parameters:
        description: 'The parameters the functions accepts, described as a JSON Schema object.'
      # A property literally named `description`; the nested `description`
      # key below is its documentation.
      description:
        description: "A description of what the function does, used by the model to\r\nchoose when and how to call the function."
        type: string
      name:
        description: The name of the function to be called.
        type: string
  # NOTE(review): the title ("ConnectionEmbeddingSettings") differs from the
  # definition name; left unchanged because generators may depend on it.
  GenericEmbeddingSettings:
    title: ConnectionEmbeddingSettings
    description: Connection Embedding Settings
    type: object
    properties:
      connection:
        $ref: "#/definitions/BaseConnection"
      deploymentName:
        type: string
      modelName:
        type: string
  IngestionError:
    title: IngestionError
    description: The details of the ingestion error
    type: object
    properties:
      message:
        type: string
      innerErrors:
        type: array
        items:
          type: string
  # Polymorphic base for ingestion jobs; `kind` is the discriminator.
  IngestionJob:
    title: IngestionJob
    description: Represents the details of a job.
    type: object
    required:
      - kind
    discriminator: kind
    properties:
      kind:
        $ref: "#/definitions/IngestionJobType"
      jobId:
        type: string
  IngestionJobList:
    title: IngestionJobList
    description: Represents a list of ingestion jobs.
    type: object
    properties:
      nextLink:
        description: The link to the next page.
        type: string
      value:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/IngestionJob"
  IngestionJobProgress:
    title: IngestionJobProgress
    type: object
    required:
      - stageProgress
    properties:
      stageProgress:
        type: array
        items:
          $ref: "#/definitions/IngestionJobStageProgress"
  IngestionJobRun:
    title: IngestionJobRun
    description: The details of a job run
    type: object
    properties:
      jobId:
        type: string
      runId:
        type: string
      status:
        $ref: "#/definitions/OperationState"
      error:
        $ref: "#/definitions/IngestionError"
      warnings:
        type: array
        items:
          type: string
      progress:
        $ref: "#/definitions/IngestionJobProgress"
  IngestionJobRunList:
    title: IngestionJobRunList
    description: Represents a list of ingestion job runs.
    type: object
    properties:
      nextLink:
        description: The link to the next page.
        type: string
      value:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/IngestionJobRun"
  # Recursive: each stage may carry nested sub-stage progress entries.
  IngestionJobStageProgress:
    title: IngestionJobStageProgress
    type: object
    properties:
      name:
        type: string
      totalItems:
        type: integer
        format: int32
      processedItems:
        type: integer
        format: int32
      state:
        $ref: "#/definitions/OperationState"
      subStageProgress:
        type: array
        items:
          $ref: "#/definitions/IngestionJobStageProgress"
  IngestionJobSystemCompute:
    type: object
    allOf:
      - $ref: "#/definitions/IngestionJob"
      - type: object
        properties:
          searchServiceConnection:
            $ref: "#/definitions/BaseConnection"
          datasource:
            $ref: "#/definitions/SystemComputeDatasource"
          completionAction:
            $ref: "#/definitions/CompletionAction"
          dataRefreshIntervalInHours:
            type: integer
    x-ms-discriminator-value: SystemCompute
  IngestionJobType:
    title: IngestionJobType
    type: string
    description: The job type.
    enum:
      - SystemCompute
      - UserCompute
    x-ms-enum:
      name: IngestionJobType
      modelAsString: true
      values:
        - name: SystemCompute
          value: SystemCompute
          description: Jobs that run on service owned resources.
        - name: UserCompute
          value: UserCompute
          description: Jobs that run on user owned workspace.
# Schema entries of the document's `definitions` mapping (every `$ref` in this
# file addresses them as "#/definitions/<name>"), hence the one-level indent.
# Multi-line descriptions keep their escaped CRLF (\r\n) sequences inside
# double quotes so the string values stay exactly as published.

  # Variant of IngestionJob; `x-ms-discriminator-value` is the `kind` value
  # that selects this schema.
  IngestionJobUserCompute:
    type: object
    required:
      - workspaceId
    allOf:
      - $ref: "#/definitions/IngestionJob"
      - type: object
        properties:
          workspaceId:
            type: string
          compute:
            $ref: "#/definitions/JobCompute"
          target:
            $ref: "#/definitions/TargetIndex"
          datasource:
            $ref: "#/definitions/UserComputeDatasource"
          dataRefreshIntervalInHours:
            type: integer
    x-ms-discriminator-value: UserCompute

  # Self-referential: `innererror` nests another InnerError.
  InnerError:
    title: InnerError
    description: "Inner error as defined in the Microsoft REST guidelines\r\n(https://github.com/microsoft/api-guidelines/blob/vNext/Guidelines.md#7102-error-condition-responses)."
    type: object
    properties:
      code:
        $ref: "#/definitions/InnerErrorCode"
      innererror:
        $ref: "#/definitions/InnerError"

  InnerErrorCode:
    title: InnerErrorCode
    description: "Inner error codes as defined in the Microsoft REST guidelines\r\n(https://github.com/microsoft/api-guidelines/blob/vNext/Guidelines.md#7102-error-condition-responses)."
    enum:
      - invalidPayload
    type: string
    x-ms-enum:
      name: InnerErrorCode
      modelAsString: true
      values:
        - value: invalidPayload
          description: The request data is invalid for this operation.

  InputMessage:
    title: InputMessage
    type: object
    properties:
      id:
        description: The identity of message.
        type: string
      role:
        description: The role of the entity that is creating the message.
        type: string
      content:
        description: The contents of the message.
        type: string
      name:
        description: "An optional name for the participant.\r\nProvides the model information to differentiate between participants of the same role."
        type: string

  IntegrationTypes:
    title: IntegrationTypes
    enum:
      - wandb
    type: string
    description: List of Fine Tune integrations available.

  # Polymorphic base: concrete compute schemas are selected by `kind`.
  JobCompute:
    title: JobCompute
    description: The compute settings of the job.
    type: object
    discriminator: kind
    required:
      - kind
    properties:
      kind:
        $ref: "#/definitions/ComputeType"

  LifeCycleStatus:
    title: LifeCycleStatus
    description: "The life cycle status of a model.\r\nNote: A model can be promoted from \"preview\" to \"generally-available\", but never from \"generally-available\" to \"preview\"."
    enum:
      - preview
      - generally-available
    type: string
    x-ms-enum:
      name: LifeCycleStatus
      modelAsString: true
      values:
        - value: preview
          description: Model is in preview and covered by the service preview terms.
        - value: generally-available
          description: Model is generally available.

  LogLevel:
    title: LogLevel
    description: The verbosity level of an event.
    enum:
      - info
      - warning
      - error
    type: string
    x-ms-enum:
      name: LogLevel
      modelAsString: true
      values:
        - value: info
          description: This event is for information only.
        - value: warning
          description: This event represents a mitigated issue.
        - value: error
          description: This message represents a non recoverable issue.

  Logprob:
    title: Logprob
    type: object
    properties:
      token:
        description: The token.
        type: string
      logprob:
        format: float
        description: "The log probability of this token, if it is within the top 20 most likely tokens.\r\nOtherwise, the value `-9999.0` is used to signify that the token is very unlikely."
        type: number

  Model:
    title: Model
    description: A model is either a base model or the result of a successful fine tune job.
    required:
      - capabilities
      - deprecation
      - lifecycle_status
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      created_at:
        format: unixtime
        description: A timestamp when this job or item was created (in unix epochs).
        type: integer
        readOnly: true
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      status:
        $ref: "#/definitions/FineTuningState"
      model:
        description: The base model identity (model-id) if this is a fine tune model; otherwise `null`.
        type: string
      fine_tune:
        description: The fine tune job identity (fine-tune-id) if this is a fine tune model; otherwise `null`.
        type: string
      capabilities:
        $ref: "#/definitions/Capabilities"
      lifecycle_status:
        $ref: "#/definitions/LifeCycleStatus"
      deprecation:
        $ref: "#/definitions/Deprecation"

  ModelList:
    title: ModelList
    description: Represents a list of models.
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      data:
        description: The list of items.
        type: array
        items:
          $ref: "#/definitions/Model"

  OperationState:
    title: OperationState
    description: The state of a job or item.
    enum:
      - notRunning
      - running
      - succeeded
      - failed
    type: string
    readOnly: true
    x-ms-enum:
      name: OperationState
      modelAsString: true
      values:
        - value: notRunning
          description: The operation is not yet queued to be processed in the future.
        - value: running
          description: The operation has started to be processed.
        - value: succeeded
          description: The operation has successfully been processed and is ready for consumption.
        - value: failed
          description: The operation has completed processing with a failure and cannot be further consumed.

  # Variant of TargetIndex selected by the `Pinecone` discriminator value.
  PineconeIndex:
    description: Pinecone Index.
    required:
      - connectionId
    allOf:
      - $ref: "#/definitions/TargetIndex"
      - type: object
        properties:
          connectionId:
            type: string
            description: The id of the connection pointing to the pinecone.
    x-ms-discriminator-value: Pinecone

  Purpose:
    title: Purpose
    description: 'The intended purpose of the uploaded documents. Use "fine-tune" for fine-tuning. This allows us to validate the format of the uploaded file.'
    enum:
      - fine-tune
      - fine-tune-results
      - assistants
      - assistants_output
      - batch
      - batch_output
    type: string
    readOnly: true
    x-ms-enum:
      name: Purpose
      modelAsString: true
      values:
        - value: fine-tune
          description: This file contains training data for a fine tune job.
        - value: fine-tune-results
          description: This file contains the results of a fine tune job.
        - value: assistants
          description: This file contains data to be used in assistants.
        - value: assistants_output
          description: This file contains the results of an assistant.
        - value: batch
          description: This file contains the input data for a batch.
        - value: batch_output
          description: This file contains the results of a batch.

  # Variant of JobCompute selected by the `ServerlessCompute` discriminator value.
  ServerlessCompute:
    description: Serverless compute.
    allOf:
      - $ref: "#/definitions/JobCompute"
      - type: object
        properties:
          sku:
            type: string
            description: SKU Level
          instanceCount:
            type: integer
            description: The count of instances to run the job on.
    x-ms-discriminator-value: ServerlessCompute

  StoredCompletion:
    title: StoredCompletion
    type: object
    properties:
      id:
        description: The identity of stored completion.
        type: string
      model:
        description: ID of the model to use.
        type: string
      created:
        format: int64
        description: The Unix timestamp (in seconds) of when the chat completion was created.
        type: integer
      request_id:
        description: A unique identifier for the OpenAI API request. Please include this request ID when contacting support.
        type: string
      tool_choice:
        description: Controls which (if any) tool is called by the model.
        type: string
      usage:
        $ref: "#/definitions/Usage"
      seed:
        format: int64
        description: "If specified, our system will make a best effort to sample\r\ndeterministically, such that repeated requests with the same `seed`\r\nand parameters should return the same result.\r\n \r\nDeterminism is not guaranteed, and you should refer to the\r\n`system_fingerprint` response parameter to monitor changes in the\r\nbackend."
        type: integer
      top_p:
        format: float
        description: "An alternative to sampling with temperature, called nucleus sampling,\r\nwhere the model considers the results of the tokens with top_p probability mass.\r\nSo 0.1 means only the tokens comprising the top 10% probability mass are considered.\r\n \r\nWe generally recommend altering this or `temperature` but not both."
        type: number
      temperature:
        format: float
        description: "What sampling temperature to use, between 0 and 2. Higher values\r\nlike 0.8 will make the output more random, while lower values like\r\n0.2 will make it more focused and deterministic.\r\n \r\nWe generally recommend altering this or `top_p` but not both."
        type: number
      presence_penalty:
        format: float
        description: "Number between -2.0 and 2.0. Positive values penalize new tokens based on\r\nwhether they appear in the text so far, increasing the model's likelihood to talk about new topics."
        type: number
      frequency_penalty:
        format: float
        description: "Number between -2.0 and 2.0. Positive values penalize new tokens based on\r\ntheir existing frequency in the text so far, decreasing the model's\r\nlikelihood to repeat the same line verbatim."
        type: number
      system_fingerprint:
        description: "This fingerprint represents the backend configuration that the model runs with.\r\n \r\nCan be used in conjunction with the `seed` request parameter to\r\nunderstand when backend changes have been made that might impact determinism."
        type: string
      input_user:
        description: The input user for this request.
        type: string
      service_tier:
        description: Specifies the latency tier to use for processing the request.
        type: string
      tools:
        description: "A list of tools the model may call. Currently, only functions are\r\nsupported as a tool. Use this to provide a list of functions the\r\nmodel may generate JSON inputs for. A max of 128 functions are supported."
        type: array
        items:
          $ref: "#/definitions/Tool"
      metadata:
        title: Dictionary`2
        description: Arbitrary key-value pairs for additional information.
        type: object
        additionalProperties:
          type: string
      choices:
        description: A list of chat completion choices. Can be more than one if `n` is greater than 1.
        type: array
        items:
          $ref: "#/definitions/Choice"

  StoredCompletionDelete:
    title: StoredCompletionDelete
    required:
      - object
    type: object
    properties:
      object:
        # NOTE(review): this text reads like it belongs to `deleted`; confirm
        # the intended description for the `object` field.
        description: If the stored completion was deleted.
        minLength: 1
        type: string
      id:
        description: The stored completion id that was deleted.
        type: string
      deleted:
        description: A value indicating whether the stored completion was deleted.
        type: boolean

  StoredCompletionList:
    title: StoredCompletionList
    type: object
    properties:
      object:
        description: 'The object type, which is always `list`'
        type: string
      data:
        description: The list of retrieved objects.
        type: array
        items:
          $ref: "#/definitions/StoredCompletion"
      total:
        format: int64
        description: Total number of items.
        type: integer
      first_id:
        description: The first id in the retrieved `list`
        type: string
      last_id:
        description: The last id in the retrieved `list`
        type: string
      has_more:
        description: The `has_more` property is used for pagination to indicate there are additional results.
        type: boolean

  # Same paging envelope as StoredCompletionList, with InputMessage items.
  StoredCompletionMessages:
    title: StoredCompletionMessages
    type: object
    properties:
      object:
        description: 'The object type, which is always `list`'
        type: string
      data:
        description: The list of retrieved objects.
        type: array
        items:
          $ref: "#/definitions/InputMessage"
      total:
        format: int64
        description: Total number of items.
        type: integer
      first_id:
        description: The first id in the retrieved `list`
        type: string
      last_id:
        description: The last id in the retrieved `list`
        type: string
      has_more:
        description: The `has_more` property is used for pagination to indicate there are additional results.
        type: boolean

  # Same property set as StoredCompletion plus a read-only `object` field.
  StoredCompletionResponse:
    title: StoredCompletionResponse
    type: object
    properties:
      id:
        description: The identity of stored completion.
        type: string
      model:
        description: ID of the model to use.
        type: string
      created:
        format: int64
        description: The Unix timestamp (in seconds) of when the chat completion was created.
        type: integer
      request_id:
        description: A unique identifier for the OpenAI API request. Please include this request ID when contacting support.
        type: string
      tool_choice:
        description: Controls which (if any) tool is called by the model.
        type: string
      usage:
        $ref: "#/definitions/Usage"
      seed:
        format: int64
        description: "If specified, our system will make a best effort to sample\r\ndeterministically, such that repeated requests with the same `seed`\r\nand parameters should return the same result.\r\n \r\nDeterminism is not guaranteed, and you should refer to the\r\n`system_fingerprint` response parameter to monitor changes in the\r\nbackend."
        type: integer
      top_p:
        format: float
        description: "An alternative to sampling with temperature, called nucleus sampling,\r\nwhere the model considers the results of the tokens with top_p probability mass.\r\nSo 0.1 means only the tokens comprising the top 10% probability mass are considered.\r\n \r\nWe generally recommend altering this or `temperature` but not both."
        type: number
      temperature:
        format: float
        description: "What sampling temperature to use, between 0 and 2. Higher values\r\nlike 0.8 will make the output more random, while lower values like\r\n0.2 will make it more focused and deterministic.\r\n \r\nWe generally recommend altering this or `top_p` but not both."
        type: number
      presence_penalty:
        format: float
        description: "Number between -2.0 and 2.0. Positive values penalize new tokens based on\r\nwhether they appear in the text so far, increasing the model's likelihood to talk about new topics."
        type: number
      frequency_penalty:
        format: float
        description: "Number between -2.0 and 2.0. Positive values penalize new tokens based on\r\ntheir existing frequency in the text so far, decreasing the model's\r\nlikelihood to repeat the same line verbatim."
        type: number
      system_fingerprint:
        description: "This fingerprint represents the backend configuration that the model runs with.\r\n \r\nCan be used in conjunction with the `seed` request parameter to\r\nunderstand when backend changes have been made that might impact determinism."
        type: string
      input_user:
        description: The input user for this request.
        type: string
      service_tier:
        description: Specifies the latency tier to use for processing the request.
        type: string
      tools:
        description: "A list of tools the model may call. Currently, only functions are\r\nsupported as a tool. Use this to provide a list of functions the\r\nmodel may generate JSON inputs for. A max of 128 functions are supported."
        type: array
        items:
          $ref: "#/definitions/Tool"
      metadata:
        title: Dictionary`2
        description: Arbitrary key-value pairs for additional information.
        type: object
        additionalProperties:
          type: string
      choices:
        description: A list of chat completion choices. Can be more than one if `n` is greater than 1.
        type: array
        items:
          $ref: "#/definitions/Choice"
      object:
        description: The type of this object.
        type: string
        readOnly: true

  # Polymorphic base: concrete datasource schemas are selected by `kind`.
  SystemComputeDatasource:
    title: SystemComputeDatasource
    type: object
    required:
      - kind
    properties:
      kind:
        $ref: "#/definitions/SystemComputeDatasourceType"
    discriminator: kind

  SystemComputeDatasourceType:
    type: string
    description: The datasource type.
    enum:
      - Storage
      - Urls
    x-ms-enum:
      name: SystemComputeDatasourceType
      modelAsString: true
      values:
        - name: Storage
          value: Storage
          description: Azure Storage Account.
        - name: Urls
          value: Urls
          description: URLs.
# Remaining schema entries of the document's `definitions` mapping (addressed
# throughout the file as "#/definitions/<name>"), hence the one-level indent.
# The root-level keys that close the document follow at column 0.

  # Variant of SystemComputeDatasource selected by the `Storage` value.
  SystemComputeStorage:
    title: SystemComputeStorage
    description: Storage account
    required:
      - connection
      - containerName
      - embeddings
    x-ms-discriminator-value: Storage
    allOf:
      - $ref: "#/definitions/SystemComputeDatasource"
      - type: object
        properties:
          connection:
            $ref: "#/definitions/BaseConnection"
          containerName:
            type: string
            description: container name
          chunking:
            $ref: "#/definitions/ChunkingSettings"
          embeddings:
            type: array
            items:
              $ref: "#/definitions/GenericEmbeddingSettings"

  # Variant of SystemComputeDatasource selected by the `Urls` value.
  SystemComputeUrl:
    title: SystemComputeUrl
    description: Urls
    required:
      - urls
      - connection
      - containerName
      - embeddings
    x-ms-discriminator-value: Urls
    allOf:
      - $ref: "#/definitions/SystemComputeDatasource"
      - type: object
        properties:
          urls:
            type: array
            items:
              type: string
          connection:
            $ref: "#/definitions/BaseConnection"
          containerName:
            type: string
            description: container name
          crawling:
            $ref: "#/definitions/CrawlingSettings"
          chunking:
            $ref: "#/definitions/ChunkingSettings"
          embeddings:
            type: array
            items:
              $ref: "#/definitions/GenericEmbeddingSettings"

  SupervisedMethod:
    title: SupervisedMethod
    required:
      - type
    type: object
    allOf:
      - $ref: "#/definitions/FineTuneMethod"
    properties:
      type:
        $ref: "#/definitions/FineTuningMethodType"
    # NOTE(review): the flattened source does not show whether this description
    # sits on the schema or beside the `type` property's $ref; schema level is
    # assumed here — confirm against the published spec.
    description: Method used for supervised finetuning

  SupervisedMethodRequest:
    title: SupervisedMethodRequest
    required:
      - type
    type: object
    allOf:
      - $ref: "#/definitions/FineTuneMethodRequest"
    properties:
      type:
        $ref: "#/definitions/FineTuningMethodType"
    # NOTE(review): schema-level placement assumed, as for SupervisedMethod.
    description: Method used for supervised finetuning

  # Polymorphic base: concrete index schemas are selected by `kind`.
  TargetIndex:
    title: TargetIndex
    description: Information about the index to be created.
    type: object
    discriminator: kind
    required:
      - kind
    properties:
      kind:
        $ref: "#/definitions/TargetType"

  TargetType:
    type: string
    description: The target type.
    enum:
      - AzureAISearch
      - CosmosDB
      - Pinecone
    x-ms-enum:
      name: TargetType
      modelAsString: true
      values:
        - name: AzureAISearch
          value: AzureAISearch
          description: Azure AI Search Index.
        - name: CosmosDB
          value: CosmosDB
          description: CosmosDB Index.
        - name: Pinecone
          value: Pinecone
          description: Pinecone Index.

  Tool:
    title: Tool
    type: object
    properties:
      type:
        description: The type of tool call. This is always going to be `function` for this type of tool call.
        type: string
      function:
        $ref: "#/definitions/FunctionDefinition"

  ToolCall:
    title: ToolCall
    type: object
    properties:
      type:
        description: 'The type of tool call the output is required for. For now, this is always `function`.'
        type: string
      function:
        $ref: "#/definitions/FunctionCallFunction"
      id:
        description: The ID of the tool call.
        type: string

  TypeDiscriminator:
    title: TypeDiscriminator
    description: Defines the type of an object.
    enum:
      - list
      - fine_tuning.job
      - file
      - fine_tuning.job.event
      - fine_tuning.job.checkpoint
      - model
      - upload
      - upload.part
      - batch
    type: string
    readOnly: true
    x-ms-enum:
      name: TypeDiscriminator
      modelAsString: true
      values:
        - value: list
          description: This object represents a list of other objects.
        - value: fine_tuning.job
          description: This object represents a fine tune job.
        - value: file
          description: This object represents a file.
        - value: fine_tuning.job.event
          description: This object represents an event of a fine tuning job.
        - value: fine_tuning.job.checkpoint
          description: This object represents a checkpoint of a fine tuning job.
        - value: model
          description: This object represents a model (can be a base model or fine tune job result).
        - value: upload
          description: This object represents a file upload.
        - value: upload.part
          description: This object represents part of a file upload.
        - value: batch
          description: This object represents a batch.

  UpdateStoredCompletionRequest:
    title: UpdateStoredCompletionRequest
    type: object
    properties:
      metadata:
        title: Dictionary`2
        description: Arbitrary key-value pairs for additional information.
        type: object
        additionalProperties:
          type: string

  UploadFileCompleteBody:
    title: UploadFileCompleteBody
    required:
      - part_ids
    type: object
    properties:
      part_ids:
        title: IList`1
        type: array
        items:
          type: string
      md5:
        type: string

  UploadFileStartBody:
    title: UploadFileStartBody
    required:
      - bytes
      - filename
      - mime_type
      - purpose
    type: object
    properties:
      purpose:
        $ref: "#/definitions/Purpose"
      filename:
        minLength: 1
        type: string
      bytes:
        format: int64
        type: integer
      mime_type:
        minLength: 1
        type: string

  UploadPartResource:
    title: UploadPartResource
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      created_at:
        format: unixtime
        description: A timestamp when this job or item was created (in unix epochs).
        type: integer
        readOnly: true
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      upload_id:
        type: string
        readOnly: true
      azure_block_id:
        type: string
        readOnly: true

  UploadResource:
    title: UploadResource
    type: object
    properties:
      object:
        $ref: "#/definitions/TypeDiscriminator"
      created_at:
        format: unixtime
        description: A timestamp when this job or item was created (in unix epochs).
        type: integer
        readOnly: true
      id:
        description: The identity of this item.
        type: string
        readOnly: true
      bytes:
        format: int64
        type: integer
        readOnly: true
      filename:
        type: string
        readOnly: true
      purpose:
        $ref: "#/definitions/Purpose"
      status:
        $ref: "#/definitions/UploadStatus"
      expires_at:
        format: unixtime
        type: integer
        readOnly: true
      file:
        $ref: "#/definitions/File"

  UploadStatus:
    title: UploadStatus
    enum:
      - pending
      - expired
      - completed
      - cancelled
    type: string
    readOnly: true

  Usage:
    title: Usage
    type: object
    properties:
      total_tokens:
        format: int32
        description: Total number of tokens used in the request (prompt + completion).
        type: integer
      completion_tokens:
        format: int32
        description: Number of tokens in the generated completion.
        type: integer
      prompt_tokens:
        format: int32
        description: Number of tokens in the prompt.
        type: integer

  # Variant of UserComputeDatasource selected by the `Dataset` value. Title and
  # description follow the definition name and the wording used for `Dataset`
  # in UserComputeDatasourceType.
  UserComputeDataset:
    type: object
    title: UserComputeDataset
    description: Workspace dataset
    required:
      - datasetId
      - datasetType
    x-ms-discriminator-value: Dataset
    allOf:
      - $ref: "#/definitions/UserComputeDatasource"
      - type: object
        properties:
          datasetId:
            type: string
          datasetType:
            type: string
          chunking:
            $ref: "#/definitions/ChunkingSettings"
          embeddings:
            type: array
            items:
              $ref: "#/definitions/WorkspaceConnectionEmbeddingSettings"

  # Polymorphic base: concrete datasource schemas are selected by `kind`.
  UserComputeDatasource:
    title: UserComputeDatasource
    type: object
    discriminator: kind
    required:
      - kind
    properties:
      kind:
        $ref: "#/definitions/UserComputeDatasourceType"

  UserComputeDatasourceType:
    type: string
    description: The datasource type.
    enum:
      - Dataset
      - Urls
    x-ms-enum:
      name: UserComputeDatasourceType
      modelAsString: true
      values:
        - name: Dataset
          value: Dataset
          description: Workspace Dataset.
        - name: Urls
          value: Urls
          description: URLs.

  # Variant of UserComputeDatasource selected by the `Urls` value.
  UserComputeUrl:
    type: object
    title: UserComputeUrl
    description: Urls
    required:
      - urls
      - embeddings
    x-ms-discriminator-value: Urls
    allOf:
      - $ref: "#/definitions/UserComputeDatasource"
      - type: object
        properties:
          urls:
            type: array
            items:
              type: string
          crawling:
            $ref: "#/definitions/CrawlingSettings"
          chunking:
            $ref: "#/definitions/ChunkingSettings"
          embeddings:
            type: array
            items:
              $ref: "#/definitions/WorkspaceConnectionEmbeddingSettings"

  WandBIntegrationRequest:
    title: WandBIntegrationRequest
    required:
      - project
    type: object
    properties:
      project:
        minLength: 1
        type: string
      name:
        type: string
        readOnly: true
      entity:
        type: string
        readOnly: true
      tags:
        type: array
        items:
          type: string
        # NOTE(review): `readOnly` is placed on the property, matching `name`
        # and `entity`; the flattened source would also allow it on `items`.
        readOnly: true

  WandBIntegrationRequestWrapper:
    title: WandBIntegrationRequestWrapper
    required:
      - type
      - wandb
    type: object
    properties:
      type:
        $ref: "#/definitions/IntegrationTypes"
      wandb:
        $ref: "#/definitions/WandBIntegrationRequest"

  # Variant of BaseConnection selected by the `WorkspaceConnection` value.
  WorkspaceConnection:
    description: AML Workspace connection.
    required:
      - connectionId
    allOf:
      - $ref: "#/definitions/BaseConnection"
      - type: object
        properties:
          connectionId:
            type: string
            description: ConnectionId
    x-ms-discriminator-value: WorkspaceConnection

  WorkspaceConnectionEmbeddingSettings:
    title: WorkspaceConnectionEmbeddingSettings
    description: Connection id to the embedding model
    type: object
    properties:
      connectionId:
        type: string
      deploymentName:
        type: string
      modelName:
        type: string

# Reusable parameters, referenced elsewhere as "#/parameters/<name>".
parameters:
  # Substituted into the `{endpoint}` placeholder of the host template below.
  endpoint:
    in: path
    name: endpoint
    description: 'Supported Cognitive Services endpoints (protocol and hostname, for example: https://aoairesource.openai.azure.com. Replace "aoairesource" with your Azure OpenAI account name).'
    required: true
    type: string
    format: url
    x-ms-skip-url-encoding: true
    x-ms-parameter-location: client
  apiVersionQueryParameter:
    in: query
    name: api-version
    description: The requested API version.
    required: true
    type: string
    # Quoted so the date-like value is always read as a string.
    x-ms-client-default: "2025-02-01-preview"
    x-ms-parameter-location: client

# Either scheme may be used; each entry names a key of securityDefinitions.
security:
  - ApiKeyAuth: []
  - OAuth2Auth:
      - https://cognitiveservices.azure.com/.default

securityDefinitions:
  ApiKeyAuth:
    description: API key authentication
    type: apiKey
    name: api-key
    in: header
  OAuth2Auth:
    description: OAuth2 authentication
    type: oauth2
    flow: implicit
    authorizationUrl: https://login.microsoftonline.com/common/oauth2/v2.0/authorize
    scopes:
      https://cognitiveservices.azure.com/.default: ""

schemes:
  - https

x-ms-parameterized-host:
  hostTemplate: "{endpoint}/openai"
  useSchemePrefix: false
  parameters:
    - $ref: "#/parameters/endpoint"

# specification/cognitiveservices/data-plane/AzureOpenAI/authoring/preview/2025-02-01-preview/azureopenai.yaml (3,303 lines of code) (raw):