diff --git a/.github/pytorch-probot.yml b/.github/pytorch-probot.yml
index 9eae404af4..d46cd75c84 100644
--- a/.github/pytorch-probot.yml
+++ b/.github/pytorch-probot.yml
@@ -1,3 +1,4 @@
 ciflow_push_tags:
   - ciflow/8gpu
+  - ciflow/h100.8
 labeler_config: labeler.yml
diff --git a/.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml b/.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml
index 701b840ab6..01723af4ec 100644
--- a/.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml
+++ b/.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml
@@ -7,7 +7,7 @@ on:
       - 'torchtitan/experiments/graph_trainer/**'
       - '.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml'
   pull_request:
-    types: [opened, synchronize, reopened, ready_for_review]
+    types: [labeled, synchronize]
     paths:
       - 'torchtitan/experiments/graph_trainer/**'
       - '.github/workflows/integration_test_8gpu_graph_trainer_h100.yaml'
@@ -29,7 +29,7 @@ permissions:
 
 jobs:
   build-test:
-    if: github.event_name != 'pull_request' || github.event.pull_request.draft == false
+    if: github.event_name != 'pull_request' || contains(github.event.pull_request.labels.*.name, 'ciflow/h100.8')
     uses: pytorch/test-infra/.github/workflows/linux_job_v2.yml@main
     with:
       runner: linux.aws.h100.8
diff --git a/.github/workflows/integration_test_8gpu_h100.yaml b/.github/workflows/integration_test_8gpu_h100.yaml
index fc884482cb..debfa87587 100644
--- a/.github/workflows/integration_test_8gpu_h100.yaml
+++ b/.github/workflows/integration_test_8gpu_h100.yaml
@@ -3,12 +3,10 @@ name: 8 GPU Integration Test on H100
 on:
   push:
     branches: [ main ]
-    tags:
-      - ciflow/8gpu/*
     paths-ignore:
       - 'torchtitan/experiments/**'
   pull_request:
-    types: [opened, synchronize, reopened, ready_for_review]
+    types: [labeled, synchronize]
     branches: [ main ]
     paths-ignore:
       - 'torchtitan/experiments/**'
@@ -31,6 +29,7 @@ permissions:
 jobs:
   # Step 1: Dynamically compute the matrix based on conditions
   set-matrix:
+    if: github.event_name != 'pull_request' || contains(github.event.pull_request.labels.*.name, 'ciflow/h100.8')
     uses: ./.github/workflows/set-matrix.yaml
     with:
       runner-rocm: linux.rocm.gpu.gfx942.8