6.Compute.Cluster/config.auto.tfvars (913 lines of code) (raw):

resourceGroupName = "ArtistAnywhere.Cluster" ###################################################################################################### # Virtual Machine Scale Sets (https://learn.microsoft.com/azure/virtual-machine-scale-sets/overview) # ###################################################################################################### virtualMachineScaleSets = [ { enable = false name = "LnxClusterCPU-A" machine = { namePrefix = "" size = "Standard_HX176rs" count = 3 image = { versionId = "2.0.0" galleryName = "xstudio" definitionName = "Linux" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Linux" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = true # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.sh" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 111 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = true } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "LnxClusterCPU-I" machine = { namePrefix = "" size = "Standard_FX96ms_v2" count = 3 image = { versionId = "2.1.0" galleryName = "xstudio" definitionName = "Linux" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Linux" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = true # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.sh" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 111 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = true } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "LnxClusterGPU-N" machine = { namePrefix = "" size = "Standard_NC40ads_H100_v5" count = 3 image = { versionId = "2.2.0" galleryName = "xstudio" definitionName = "Linux" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Linux" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "CacheDisk" } } spot = { enable = false # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.sh" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 111 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = true } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "LnxClusterGPU-A" machine = { namePrefix = "" size = "Standard_ND96isr_MI300X_v5" count = 3 image = { versionId = "2.3.0" galleryName = "xstudio" definitionName = "Linux" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Linux" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = false # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.sh" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 111 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = true } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "WinClusterCPU-A" machine = { namePrefix = "" size = "Standard_HX176rs" count = 3 image = { versionId = "2.0.0" galleryName = "xstudio" definitionName = "WinCluster" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Windows" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = true # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.ps1" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 445 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = false } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "WinClusterCPU-I" machine = { namePrefix = "" size = "Standard_FX96ms_v2" count = 3 image = { versionId = "2.1.0" galleryName = "xstudio" definitionName = "WinCluster" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Windows" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = true # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.ps1" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 445 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = false } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "WinClusterGPU-N" machine = { namePrefix = "" size = "Standard_NC40ads_H100_v5" count = 3 image = { versionId = "2.2.0" galleryName = "xstudio" definitionName = "WinCluster" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Windows" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "CacheDisk" } } spot = { enable = false # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.ps1" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 445 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = false } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } }, { enable = false name = "WinClusterGPU-A" machine = { namePrefix = "" size = "Standard_ND96isr_MI300X_v5" count = 3 image = { versionId = "2.3.0" galleryName = "xstudio" definitionName = "WinCluster" resourceGroupName = "ArtistAnywhere.Image" } bootDiagnostics = { enable = true } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } osDisk = { type = "Windows" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } spot = { enable = false # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot evictionPolicy = "Delete" # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#eviction-policy tryRestore = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/use-spot#try--restore enable = false timeout = "PT1H" } } extension = { custom = { enable = true name = "Custom" fileName = "cse.ps1" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 445 requestPath = "" } } monitor = { enable = true metric = { category = "AllMetrics" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" passwordAuth = { disable = false } } availabilityZones = { enable = false evenDistribution = { enable = true } } flexMode = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-orchestration-modes enable = false } } ] ################################################################################## # Compute Fleet (https://learn.microsoft.com/azure/azure-compute-fleet/overview) # ################################################################################## computeFleets = [ { enable = false name = "LnxClusterCPU-A" machine = { namePrefix = "" sizes = [ { name = "Standard_HX176rs" }, { name = "Standard_HX176-144rs" }, { name = "Standard_HX176-96rs" } ] image = { versionId = "2.0.0" galleryName = "xstudio" definitionName = "Linux" resourceGroupName = "ArtistAnywhere.Image" } osDisk = { type = "Linux" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } priority = { standard = { allocationStrategy = "LowestPrice" capacityTarget = 2 capacityMinimum = 1 } spot = { allocationStrategy = "PriceCapacityOptimized" evictionPolicy = "Delete" capacityTarget = 0 capacityMinimum = 0 capacityMaintain = { enable = true } } } extension = { custom = { enable = true name = "Custom" fileName = "cse.sh" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 111 requestPath = "" } monitor = { enable = false name = "Monitor" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } }, { enable = false name = "WinClusterCPU-A" machine = { namePrefix = "" sizes = [ { name = "Standard_HX176rs" }, { name = "Standard_HX176-144rs" }, { name = "Standard_HX176-96rs" } ] image = { versionId = "2.0.0" galleryName = "xstudio" definitionName = "WinCluster" resourceGroupName = "ArtistAnywhere.Image" } osDisk = { type = "Windows" storageType = "Premium_LRS" cachingMode = "ReadOnly" sizeGB = 0 ephemeral = { # https://learn.microsoft.com/azure/virtual-machines/ephemeral-os-disks enable = true placement = "ResourceDisk" } } priority = { standard = { allocationStrategy = "LowestPrice" capacityTarget = 2 capacityMinimum = 1 } spot = { allocationStrategy = "PriceCapacityOptimized" evictionPolicy = "Delete" capacityTarget = 0 capacityMinimum = 0 capacityMaintain = { enable = true } } } extension = { custom = { enable = true name = "Custom" fileName = "cse.ps1" parameters = { terminateNotification = { # https://learn.microsoft.com/azure/virtual-machine-scale-sets/virtual-machine-scale-sets-terminate-notification enable = false delayTimeout = "PT5M" } } } health = { enable = true name = "Health" protocol = "tcp" port = 445 requestPath = "" } monitor = { enable = false name = "Monitor" } } adminLogin = { userName = "" userPassword = "" sshKeyPublic = "" } } network = { acceleration = { # https://learn.microsoft.com/azure/virtual-network/accelerated-networking-overview enable = true } locationExtended = { enable = false } } } ] ######################## # Brownfield Resources # ######################## virtualNetwork = { name = "Studio" subnetName = "Cluster" resourceGroupName = "ArtistAnywhere.Network.SouthCentralUS" } virtualNetworkExtended = { enable = true name = "Studio" subnetName = "Cluster" resourceGroupName = "ArtistAnywhere.Network.WestUS.LosAngeles" } activeDirectory = { enable = false domain = { name = "azure.studio" } machine = { name = "WinADController" adminLogin = { userName = "" userPassword = "" } } } containerRegistry = { enable = true name = "xstudio" resourceGroupName = "ArtistAnywhere.Image.Registry" }