From fa7f674253f1ad56612f282e7baaa269511d4955 Mon Sep 17 00:00:00 2001 From: drisspg Date: Wed, 30 Jul 2025 10:58:56 -0700 Subject: [PATCH 1/4] Update [ghstack-poisoned] --- .github/workflows/test-b200.yml | 59 +++++++++++++++++++++++++++++++++ 1 file changed, 59 insertions(+) create mode 100644 .github/workflows/test-b200.yml diff --git a/.github/workflows/test-b200.yml b/.github/workflows/test-b200.yml new file mode 100644 index 000000000000..63e29a82e891 --- /dev/null +++ b/.github/workflows/test-b200.yml @@ -0,0 +1,59 @@ +name: Limited CI on B200 + +on: + pull_request: + paths: + - .github/workflows/test-b200.yml + workflow_dispatch: + schedule: + - cron: 0 4,10,16,22 * * * # every 6 hours + push: + tags: + - ciflow/b200/* + +concurrency: + group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.sha }}-${{ github.event_name == 'workflow_dispatch' }}-${{ github.event_name == 'schedule' }} + cancel-in-progress: true + +permissions: + id-token: write + contents: read + +jobs: + + get-label-type: + if: github.repository_owner == 'pytorch' + name: get-label-type + uses: pytorch/pytorch/.github/workflows/_runner-determinator.yml@main + with: + triggering_actor: ${{ github.triggering_actor }} + issue_owner: ${{ github.event.pull_request.user.login || github.event.issue.user.login }} + curr_branch: ${{ github.head_ref || github.ref_name }} + curr_ref_type: ${{ github.ref_type }} + + linux-jammy-cuda12_8-py3_10-gcc11-sm100-build: + name: linux-jammy-cuda12.8-py3.10-gcc11-sm100 + uses: ./.github/workflows/_linux-build.yml + needs: get-label-type + with: + runner_prefix: "${{ needs.get-label-type.outputs.label-type }}" + runner: linux.12xlarge.memory + build-environment: linux-jammy-cuda12.8-py3.10-gcc11-sm100 + docker-image-name: ci-image:pytorch-linux-jammy-cuda12.8-cudnn9-py3-gcc11 + cuda-arch-list: '10.0' + test-matrix: | + { include: [ + { config: "smoke", shard: 1, num_shards: 1, runner: "linux.dgx.b200" }, + ]} + secrets: inherit + + linux-jammy-cuda12_8-py3_10-gcc11-sm100-test: + name: linux-jammy-cuda12.8-py3.10-gcc11-sm100 + uses: ./.github/workflows/_linux-test.yml + needs: + - linux-jammy-cuda12_8-py3_10-gcc11-sm100-build + with: + build-environment: linux-jammy-cuda12.8-py3.10-gcc11-sm100 + docker-image: ${{ needs.linux-jammy-cuda12_8-py3_10-gcc11-sm100-build.outputs.docker-image }} + test-matrix: ${{ needs.linux-jammy-cuda12_8-py3_10-gcc11-sm100-build.outputs.test-matrix }} + secrets: inherit \ No newline at end of file From 6ea0a7e9238c8c4f4e041444d418f3e9368d9445 Mon Sep 17 00:00:00 2001 From: drisspg Date: Wed, 30 Jul 2025 11:30:14 -0700 Subject: [PATCH 2/4] Update [ghstack-poisoned] --- .ci/pytorch/test.sh | 2 +- .github/workflows/test-b200.yml | 18 +++++++++++++++++- 2 files changed, 18 insertions(+), 2 deletions(-) diff --git a/.ci/pytorch/test.sh b/.ci/pytorch/test.sh index 35c828042ac8..2966eee0047f 100755 --- a/.ci/pytorch/test.sh +++ b/.ci/pytorch/test.sh @@ -323,7 +323,7 @@ test_python() { } test_python_smoke() { - # Smoke tests for H100 + # Smoke tests for H100/B200 time python test/run_test.py --include test_matmul_cuda inductor/test_fp8 inductor/test_max_autotune $PYTHON_TEST_EXTRA_OPTION --upload-artifacts-while-running assert_git_not_dirty } diff --git a/.github/workflows/test-b200.yml b/.github/workflows/test-b200.yml index 63e29a82e891..5712bd13b9cc 100644 --- a/.github/workflows/test-b200.yml +++ b/.github/workflows/test-b200.yml @@ -1,4 +1,19 @@ -name: Limited CI on B200 +# B200 Smoke Tests CI Workflow +# +# This workflow runs smoke tests on B200 hardware +# +# Flow: +# 1. Builds PyTorch with CUDA 12.8+ and sm100 architecture for B200 +# 2. Runs smoke tests on linux.dgx.b200 runner +# 3. Tests executed are defined in .ci/pytorch/test.sh -> test_python_smoke() function +# +# Triggered by: +# - Pull requests modifying this workflow file +# - Manual dispatch +# - Schedule (every 6 hours) +# - Adding ciflow/b200 label to a PR (creates ciflow/b200/* tag) + +name: B200 Smoke Tests on: pull_request: @@ -45,6 +60,7 @@ jobs: { include: [ { config: "smoke", shard: 1, num_shards: 1, runner: "linux.dgx.b200" }, ]} + # config: "smoke" maps to test_python_smoke() in .ci/pytorch/test.sh secrets: inherit linux-jammy-cuda12_8-py3_10-gcc11-sm100-test: From 301220775928533d1f1f3975694c09ac393cf662 Mon Sep 17 00:00:00 2001 From: drisspg Date: Mon, 4 Aug 2025 12:28:51 -0700 Subject: [PATCH 3/4] Update [ghstack-poisoned] --- .github/workflows/test-b200.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/test-b200.yml b/.github/workflows/test-b200.yml index 5712bd13b9cc..ac42234e3773 100644 --- a/.github/workflows/test-b200.yml +++ b/.github/workflows/test-b200.yml @@ -72,4 +72,5 @@ jobs: build-environment: linux-jammy-cuda12.8-py3.10-gcc11-sm100 docker-image: ${{ needs.linux-jammy-cuda12_8-py3_10-gcc11-sm100-build.outputs.docker-image }} test-matrix: ${{ needs.linux-jammy-cuda12_8-py3_10-gcc11-sm100-build.outputs.test-matrix }} + aws-role-to-assume: arn:aws:iam::308535385114:role/gha_workflow_s3_and_ecr_read_only secrets: inherit \ No newline at end of file From 876f42d844a9725e0eb35ac0623ab47536c54535 Mon Sep 17 00:00:00 2001 From: drisspg Date: Mon, 4 Aug 2025 14:59:56 -0700 Subject: [PATCH 4/4] Update [ghstack-poisoned] --- .github/pytorch-probot.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/pytorch-probot.yml b/.github/pytorch-probot.yml index a5982b63b70f..fce51aba06cb 100644 --- a/.github/pytorch-probot.yml +++ b/.github/pytorch-probot.yml @@ -34,6 +34,7 @@ ciflow_push_tags: - ciflow/win-arm64 - ciflow/h100-symm-mem - ciflow/h100-cutlass-backend +- ciflow/b200 retryable_workflows: - pull - trunk