From b50075343aeb519d135e00c44ff3577eaa25c61b Mon Sep 17 00:00:00 2001 From: fduwjj Date: Wed, 25 Jun 2025 14:28:24 -0700 Subject: [PATCH] [distributed] Enable H100 test for all distributed related changes (#156721) We want to run H100 CI for distributed-related changes. PRs that touch distributed-related code are already labeled "oncall: distributed" by the labeler config: https://github.com/pytorch/pytorch/blob/4491326fb0c0e67eca1598ae33c41cdfced2cd33/.github/labeler.yml#L94. This change leverages that label (and the distributed release-notes labels) to add "ciflow/h100-distributed", and also runs the H100 distributed workflow on a nightly schedule. Pull Request resolved: https://github.com/pytorch/pytorch/pull/156721 Approved by: https://github.com/huydhn --- .github/label_to_label.yml | 9 +++++++++ .github/workflows/h100-distributed.yml | 2 ++ 2 files changed, 11 insertions(+) diff --git a/.github/label_to_label.yml b/.github/label_to_label.yml index 28bad93f808d..0cd56143535f 100644 --- a/.github/label_to_label.yml +++ b/.github/label_to_label.yml @@ -48,3 +48,12 @@ - "module: dynamic shapes" then: - "oncall: pt2" +- any: + - "release notes: distributed (c10d)" + - "release notes: distributed (symm_mem)" + - "release notes: distributed (pipeline)" + - "release notes: distributed (fsdp)" + - "release notes: distributed (dtensor)" + - "oncall: distributed" + then: + - "ciflow/h100-distributed" diff --git a/.github/workflows/h100-distributed.yml b/.github/workflows/h100-distributed.yml index 6a8c76a8ec78..45579672f232 100644 --- a/.github/workflows/h100-distributed.yml +++ b/.github/workflows/h100-distributed.yml @@ -8,6 +8,8 @@ on: push: tags: - ciflow/h100-distributed/* + schedule: + - cron: 46 8 * * * # about 1:46am PDT concurrency: group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.sha }}-${{ github.event_name == 'workflow_dispatch' }}-${{ github.event_name == 'schedule' }}