Set parallel count to avoid OOM in training GPU packaging pipeline (#20255)

### Description
Make the compilation work on the Azure CPU agent by reducing the parallel
count.



### Motivation and Context
The OOM issue mentioned in #20244 was caused by too little memory per
parallel build job (a low memory/parallel_count ratio).
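
For background (not part of this commit): the usual way to avoid this class of OOM is to cap build parallelism by available RAM rather than CPU count alone. A minimal Python sketch of that idea follows; the `safe_parallel_count` helper and the 4 GB-per-job figure are illustrative assumptions, not values taken from this pipeline.

```python
import os

def safe_parallel_count(mem_per_job_gb: float = 4.0) -> int:
    """Illustrative: cap build parallelism by available RAM, not just CPUs."""
    cpus = os.cpu_count() or 1
    try:
        # Total physical memory via POSIX sysconf (works on Linux agents).
        total_gb = os.sysconf("SC_PAGE_SIZE") * os.sysconf("SC_PHYS_PAGES") / 1024**3
    except (AttributeError, ValueError, OSError):
        return cpus  # non-POSIX platform: fall back to the CPU count
    return max(1, min(cpus, int(total_gb // mem_per_job_gb)))

# e.g. a 32 GB agent at 4 GB per job yields 8, matching --parallel 8 below
print(safe_parallel_count())
```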
mszhanyi authored Apr 10, 2024
1 parent 280b263 commit 0acde11
Showing 1 changed file with 3 additions and 2 deletions.
```diff
@@ -11,7 +11,8 @@ resources:
 stages:
 - template: templates/py-packaging-training-cuda-stage.yml
   parameters:
-    build_py_parameters: --enable_training --update --build
+    # cap the parallel count to limit peak memory use across build threads and avoid OOM
+    build_py_parameters: --enable_training --update --build --parallel 8
     torch_version: '2.1.0'
     opset_version: '17'
     cuda_version: '12.2'
@@ -20,4 +21,4 @@ stages:
     agent_pool: Onnxruntime-Linux-GPU
     upload_wheel: 'yes'
     debug_build: false
-    build_pool_name: 'onnxruntime-Linux-GPU'
+    build_pool_name: 'onnxruntime-Ubuntu2204-AMD-CPU'
```
