@@ -1991,8 +1991,8 @@ def launchTestJobs(pipeline, testFilter, dockerNode=null)
1991
1991
x86SlurmTestConfigs = [
1992
1992
" DGX_B200-4_GPUs-PyTorch-1" : [" b200-x4" , " l0_dgx_b200" , 1 , 2 , 4 ],
1993
1993
" DGX_B200-4_GPUs-PyTorch-2" : [" b200-x4" , " l0_dgx_b200" , 2 , 2 , 4 ],
1994
- " DGX_B200-4_GPUs -PyTorch-Post-Merge- 1" : [" b200-x4 " , " l0_dgx_b200" , 1 , 2 , 4 ],
1995
- " DGX_B200-4_GPUs-PyTorch-Post-Merge-2 " : [" b200-x4" , " l0_dgx_b200" , 2 , 2 , 4 ],
1994
+ " DGX_B200-8_GPUs -PyTorch-1" : [" b200-x8 " , " l0_dgx_b200" , 1 , 1 , 8 ],
1995
+ " DGX_B200-4_GPUs-PyTorch-Post-Merge-1 " : [" b200-x4" , " l0_dgx_b200" , 1 , 1 , 4 ],
1996
1996
]
1997
1997
fullSet + = x86SlurmTestConfigs. keySet()
1998
1998
@@ -2012,8 +2012,7 @@ def launchTestJobs(pipeline, testFilter, dockerNode=null)
2012
2012
// Try to match what is being tested on x86 H100_PCIe.
2013
2013
// The total machine time is scaled proportionally according to the number of each GPU.
2014
2014
SBSATestConfigs = [
2015
- " GH200-TensorRT-Post-Merge-1" : [" gh200" , " l0_gh200" , 1 , 2 ],
2016
- " GH200-TensorRT-Post-Merge-2" : [" gh200" , " l0_gh200" , 2 , 2 ],
2015
+ " GH200-TensorRT-Post-Merge-1" : [" gh200" , " l0_gh200" , 1 , 1 ],
2017
2016
]
2018
2017
fullSet + = SBSATestConfigs . keySet()
2019
2018
@@ -2026,12 +2025,15 @@ def launchTestJobs(pipeline, testFilter, dockerNode=null)
2026
2025
2027
2026
multiNodesSBSAConfigs = [
2028
2027
// Each stage runs 1 test case with 8 GPUs and 2 nodes.
2029
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-1" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 1 , 7 , 8 , 2 ],
2030
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-2" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 2 , 7 , 8 , 2 ],
2031
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-3" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 3 , 7 , 8 , 2 ],
2032
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-4" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 4 , 7 , 8 , 2 ],
2033
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-5" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 5 , 7 , 8 , 2 ],
2034
- " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-6" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 6 , 7 , 8 , 2 ],
2028
+ " GB200-8_GPUs-2_Nodes-PyTorch-1" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 1 , 4 , 8 , 2 ],
2029
+ " GB200-8_GPUs-2_Nodes-PyTorch-2" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 2 , 4 , 8 , 2 ],
2030
+ " GB200-8_GPUs-2_Nodes-PyTorch-3" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 3 , 4 , 8 , 2 ],
2031
+ " GB200-8_GPUs-2_Nodes-PyTorch-4" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 4 , 4 , 8 , 2 ],
2032
+ " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-1" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 1 , 5 , 8 , 2 ],
2033
+ " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-2" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 2 , 5 , 8 , 2 ],
2034
+ " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-3" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 3 , 5 , 8 , 2 ],
2035
+ " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-4" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 4 , 5 , 8 , 2 ],
2036
+ " GB200-8_GPUs-2_Nodes-PyTorch-Post-Merge-5" : [" gb200-multi-node" , " l0_gb200_multi_nodes" , 5 , 5 , 8 , 2 ],
2035
2037
]
2036
2038
fullSet + = multiNodesSBSAConfigs. keySet()
2037
2039
0 commit comments