# assets/models/system/Mistral-7B-Instruct-v0-1/spec.yaml (33 lines of code) (raw)
# Azure ML model asset spec for mistralai-Mistral-7B-Instruct-v01.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been flattened; the grouping of keys under `properties`
# and `tags` should be confirmed against the referenced model schema.
$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
name: mistralai-Mistral-7B-Instruct-v01
path: ./

properties:
  # Real boolean here; the same key under `tags` is an empty-string marker.
  SharedComputeCapacityEnabled: true
  SHA: b70aa86578567ba3301b21c8a27bea4e8f6d6d61
  # Pipe-separated spec; presumably cores|GPUs|memory|storage - TODO confirm.
  inference-min-sku-spec: 12|1|220|64
  # Comma-separated string (not a YAML list); mirrors the SKU names in
  # tags.inference_compute_allow_list below, so keep the two in sync.
  inference-recommended-sku: Standard_NC12s_v3, Standard_NC24s_v3, Standard_ND40rs_v2, Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4, Standard_ND96asr_v4
  languages: EN

tags:
  # Empty-string values: presumably presence-only flags - verify with consumer.
  Featured: ""
  SharedComputeCapacityEnabled: ""
  # Quoted on purpose so the value stays the string "true", not a boolean.
  disable-batch: "true"
  hiddenlayerscanned: ""
  inference_compute_allow_list:
    - Standard_NC12s_v3
    - Standard_NC24s_v3
    - Standard_ND40rs_v2
    - Standard_NC24ads_A100_v4
    - Standard_NC48ads_A100_v4
    - Standard_NC96ads_A100_v4
    - Standard_ND96amsr_A100_v4
    - Standard_ND96asr_v4
  inference_supported_envs:
    - vllm
    - ds_mii
  license: apache-2.0
  task: chat-completion
  author: "Mistral AI"
  benchmark: "quality"

version: 11