From cbede2969ba9878796b7e9b6723e823f68a3125f Mon Sep 17 00:00:00 2001 From: Jitesh Gupta Date: Mon, 28 Jul 2025 04:32:25 -0700 Subject: [PATCH] Add self-hosted runner scale set workflow for mi325 CI (#39651) --- .../self-scheduled-amd-mi325-caller.yml | 63 +++++++++++++++++++ 1 file changed, 63 insertions(+) create mode 100644 .github/workflows/self-scheduled-amd-mi325-caller.yml diff --git a/.github/workflows/self-scheduled-amd-mi325-caller.yml b/.github/workflows/self-scheduled-amd-mi325-caller.yml new file mode 100644 index 0000000000..bc0dfe0e57 --- /dev/null +++ b/.github/workflows/self-scheduled-amd-mi325-caller.yml @@ -0,0 +1,63 @@ +name: Self-hosted runner scale set (AMD mi325 scheduled CI caller) + +# Note: For every job in this workflow, the name of the runner scale set is finalized in the runner yaml i.e. huggingface/hf-workflows/.github/workflows/transformers_amd_ci_scheduled_arc_scale_set.yaml +# For example, 1gpu scale set: amd-mi325-ci-1gpu +# 2gpu scale set: amd-mi325-ci-2gpu + +on: + workflow_run: + workflows: ["Self-hosted runner (AMD scheduled CI caller)"] + branches: ["main"] + types: [completed] + push: + branches: + - run_amd_scheduled_ci_caller* + +jobs: + model-ci: + name: Model CI + uses: huggingface/hf-workflows/.github/workflows/transformers_amd_ci_scheduled_arc_scale_set.yaml@main + with: + job: run_models_gpu + slack_report_channel: "#amd-hf-ci" + runner_scale_set: amd-mi325-ci + docker: huggingface/transformers-pytorch-amd-gpu + ci_event: Scheduled CI (AMD) - mi325 + report_repo_id: optimum-amd/transformers_daily_ci + secrets: inherit + + torch-pipeline: + name: Torch pipeline CI + uses: huggingface/hf-workflows/.github/workflows/transformers_amd_ci_scheduled_arc_scale_set.yaml@main + with: + job: run_pipelines_torch_gpu + slack_report_channel: "#amd-hf-ci" + runner_scale_set: amd-mi325-ci + docker: huggingface/transformers-pytorch-amd-gpu + ci_event: Scheduled CI (AMD) - mi325 + report_repo_id: optimum-amd/transformers_daily_ci + secrets: inherit + + example-ci: + name: Example CI + uses: huggingface/hf-workflows/.github/workflows/transformers_amd_ci_scheduled_arc_scale_set.yaml@main + with: + job: run_examples_gpu + slack_report_channel: "#amd-hf-ci" + runner_scale_set: amd-mi325-ci + docker: huggingface/transformers-pytorch-amd-gpu + ci_event: Scheduled CI (AMD) - mi325 + report_repo_id: optimum-amd/transformers_daily_ci + secrets: inherit + + deepspeed-ci: + name: DeepSpeed CI + uses: huggingface/hf-workflows/.github/workflows/transformers_amd_ci_scheduled_arc_scale_set.yaml@main + with: + job: run_torch_cuda_extensions_gpu + slack_report_channel: "#amd-hf-ci" + runner_scale_set: amd-mi325-ci + docker: huggingface/transformers-pytorch-deepspeed-amd-gpu + ci_event: Scheduled CI (AMD) - mi325 + report_repo_id: optimum-amd/transformers_daily_ci + secrets: inherit