@@ -1662,7 +1662,7 @@ func Test_Ubuntu2404ARM(t *testing.T) {
1662
1662
})
1663
1663
}
1664
1664
1665
- func Test_Ubuntu2404Gen2Containerd_AMDGPU_MI300 (t * testing.T ) {
1665
+ func Test_Ubuntu2204Gen2Containerd_AMDGPU_MI300 (t * testing.T ) {
1666
1666
t .Skip ("Provisioning of Standard_ND96isr_MI300X_v5 isn't reliable yet" )
1667
1667
//E2E_LOCATION=eastus2euap
1668
1668
//SUBSCRIPTION_ID=4f3dc0e4-0c77-40ff-bf9a-6ade1e3048ef
@@ -1673,12 +1673,10 @@ func Test_Ubuntu2404Gen2Containerd_AMDGPU_MI300(t *testing.T) {
1673
1673
},
1674
1674
Config : Config {
1675
1675
Cluster : ClusterKubenet ,
1676
- VHD : config .VHDUbuntu2404Gen2Containerd , //TODO: add support for older
1676
+ VHD : config .VHDUbuntu2204Gen2Containerd ,
1677
1677
BootstrapConfigMutator : func (nbc * datamodel.NodeBootstrappingConfiguration ) {
1678
1678
nbc .ContainerService .Properties .AgentPoolProfiles [0 ].VMSize = "Standard_ND96isr_MI300X_v5"
1679
- nbc .ContainerService .Properties .AgentPoolProfiles [0 ].Distro = "aks-cblmariner-v2-gen2"
1680
1679
nbc .AgentPoolProfile .VMSize = "Standard_ND96isr_MI300X_v5"
1681
- nbc .AgentPoolProfile .Distro = "aks-cblmariner-v2-gen2"
1682
1680
nbc .EnableAMDGPU = true
1683
1681
nbc .ConfigGPUDriverIfNeeded = true
1684
1682
},
@@ -1709,9 +1707,7 @@ func Test_Ubuntu2204Gen2Containerd_AMDGPU_V710(t *testing.T) {
1709
1707
VHD : config .VHDUbuntu2204Gen2Containerd ,
1710
1708
BootstrapConfigMutator : func (nbc * datamodel.NodeBootstrappingConfiguration ) {
1711
1709
nbc .ContainerService .Properties .AgentPoolProfiles [0 ].VMSize = "Standard_NV4ads_V710_v5"
1712
- nbc .ContainerService .Properties .AgentPoolProfiles [0 ].Distro = "aks-cblmariner-v2-gen2"
1713
1710
nbc .AgentPoolProfile .VMSize = "Standard_NV4ads_V710_v5"
1714
- nbc .AgentPoolProfile .Distro = "aks-cblmariner-v2-gen2"
1715
1711
nbc .EnableAMDGPU = true
1716
1712
nbc .ConfigGPUDriverIfNeeded = true
1717
1713
@@ -1722,6 +1718,43 @@ func Test_Ubuntu2204Gen2Containerd_AMDGPU_V710(t *testing.T) {
1722
1718
vmss .Properties .VirtualMachineProfile .StorageProfile .OSDisk .DiskSizeGB = to.Ptr [int32 ](128 )
1723
1719
},
1724
1720
Validator : func (ctx context.Context , s * Scenario ) {
1721
+ res := execScriptOnVMForScenario (ctx , s , "df" )
1722
+ t .Log (res .String ())
1723
+ ValidateAMDGPU (ctx , s )
1724
+ },
1725
+ },
1726
+ })
1727
+ }
1728
+
1729
+ func Test_Ubuntu2404Gen2_AMDGPU_V710 (t * testing.T ) {
1730
+ // the SKU isn't available in the subscription/region where we run tests
1731
+ // TODO: enable once the SKU is available
1732
+ t .Skip ("Provisioning of NV4ads_V710_v5 isn't reliable yet" )
1733
+ //E2E_LOCATION=southcentralus
1734
+ //SUBSCRIPTION_ID=4f3dc0e4-0c77-40ff-bf9a-6ade1e3048ef
1735
+ RunScenario (t , & Scenario {
1736
+ Description : "Tests that a GPU-enabled node using a MarinerV2 VHD can be properly bootstrapped" ,
1737
+ Tags : Tags {
1738
+ GPU : true ,
1739
+ },
1740
+ Config : Config {
1741
+ Cluster : ClusterKubenet ,
1742
+ VHD : config .VHDUbuntu2404Gen2Containerd ,
1743
+ BootstrapConfigMutator : func (nbc * datamodel.NodeBootstrappingConfiguration ) {
1744
+ nbc .ContainerService .Properties .AgentPoolProfiles [0 ].VMSize = "Standard_NV4ads_V710_v5"
1745
+ nbc .AgentPoolProfile .VMSize = "Standard_NV4ads_V710_v5"
1746
+ nbc .EnableAMDGPU = true
1747
+ nbc .ConfigGPUDriverIfNeeded = true
1748
+
1749
+ },
1750
+ VMConfigMutator : func (vmss * armcompute.VirtualMachineScaleSet ) {
1751
+ vmss .SKU .Name = to .Ptr ("Standard_NV4ads_V710_v5" )
1752
+ // ROCm images are huge; reserve some extra disk space for manual testing
1753
+ vmss .Properties .VirtualMachineProfile .StorageProfile .OSDisk .DiskSizeGB = to.Ptr [int32 ](128 )
1754
+ //vmss.Properties.VirtualMachineProfile.ExtensionProfile.Extensions[0].Properties.ProtectedSettings[]
1755
+ },
1756
+ Validator : func (ctx context.Context , s * Scenario ) {
1757
+ execScriptOnVMForScenario (ctx , s , "df" )
1725
1758
ValidateAMDGPU (ctx , s )
1726
1759
},
1727
1760
},
0 commit comments