-
Notifications
You must be signed in to change notification settings - Fork 488
113 lines (102 loc) · 3.5 KB
/
build_and_test.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
# Workflow display name.
name: Build and test

# Triggers:
#   * pull requests targeting, and pushes to, `master` or any branch whose
#     name matches r<digits>.<digits> (presumably release branches);
#   * manual runs via workflow_dispatch.
# Changes that only touch experimental/torch_xla2/** do not start a run.
on:
  pull_request:
    branches:
      - master
      - 'r[0-9]+.[0-9]+'
    paths-ignore:
      - "experimental/torch_xla2/**"
  push:
    branches:
      - master
      - 'r[0-9]+.[0-9]+'
    paths-ignore:
      - "experimental/torch_xla2/**"
  workflow_dispatch:

# Runs are grouped by workflow name, then PR number (falling back to the
# commit SHA when there is no PR), then two event-type flags. A newer run in
# the same group cancels the one still in progress.
# NOTE(review): no `schedule` trigger is declared in the `on:` section above,
# so the last component looks like it is always `false` — confirm before
# relying on it.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.sha }}-${{ github.event_name == 'workflow_dispatch' }}-${{ github.event_name == 'schedule' }}
  cancel-in-progress: true
# Every job delegates to a reusable workflow under ./.github/workflows/.
# Keys inside each job are listed in a fixed order:
#   name, needs, if, uses, with, secrets.
jobs:
  # Old CI workflow

  # Produces the `docker-image` output consumed by the C++ test jobs and the
  # docs job below.
  build:
    name: 'Build PyTorch/XLA (GPU)'
    uses: ./.github/workflows/_build.yml
    with:
      ecr-docker-image-base: 308535385114.dkr.ecr.us-east-1.amazonaws.com/pytorch/xla_base
      gcr-docker-image: gcr.io/tpu-pytorch/xla_base:dev-3.8_cuda_12.1
      cuda: 1
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # C++ tests against the image built by `build`; no `runner` input is passed,
  # so the called workflow's default applies.
  test-cpp-cpu:
    name: 'CPU C++ tests'
    needs: build
    uses: ./.github/workflows/_test_cpp.yml
    with:
      docker-image: ${{ needs.build.outputs.docker-image }}
      timeout-minutes: 120
      collect-coverage: false  # TODO(yeounoh) separate from CPU coverage metrics
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # Same reusable workflow as test-cpp-cpu, pinned to a GPU runner and given a
  # longer timeout.
  test-cpp-cuda:
    name: 'GPU C++ tests'
    needs: build
    uses: ./.github/workflows/_test_cpp.yml
    with:
      docker-image: ${{ needs.build.outputs.docker-image }}
      runner: linux.8xlarge.nvidia.gpu
      timeout-minutes: 300
      collect-coverage: false  # TODO(yeounoh) separate from CPU coverage metrics
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # Docs are only built and published for push events, never for pull requests.
  # NOTE(review): `on.push` in this workflow filters on `branches` only, so the
  # `refs/tags/r` clause below may never match — confirm whether tag pushes
  # are expected to reach this job.
  push-docs:
    name: 'Build & publish docs'
    needs: build
    if: github.event_name == 'push' && (github.event.ref == 'refs/heads/master' || startsWith(github.event.ref, 'refs/tags/r'))
    uses: ./.github/workflows/_docs.yml
    with:
      docker-image: ${{ needs.build.outputs.docker-image }}
    secrets:
      torchxla-bot-token: ${{ secrets.TORCH_XLA_BOT_TOKEN }}

  # New CI workflow

  # Build inside the 3.10_tpuvm development image.
  build-torch-xla:
    name: 'Build PyTorch/XLA (TPU)'
    uses: ./.github/workflows/_build_torch_xla.yml
    with:
      dev-image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/development:3.10_tpuvm
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # Build inside the 3.10_cuda_12.1 development image.
  build-cuda-plugin:
    name: 'Build XLA CUDA plugin'
    uses: ./.github/workflows/_build_plugin.yml
    with:
      dev-image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/development:3.10_cuda_12.1
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # Python tests in the same development image that build-torch-xla uses.
  test-python-cpu:
    name: 'CPU Python tests'
    needs: build-torch-xla
    uses: ./.github/workflows/_test_python.yml
    with:
      dev-image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/development:3.10_tpuvm
      timeout-minutes: 120
      collect-coverage: false
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  # Python tests on a GPU runner; waits for both the main build and the CUDA
  # plugin build, and asks the called workflow to install the plugin.
  test-python-cuda:
    name: 'GPU Python tests'
    needs:
      - build-torch-xla
      - build-cuda-plugin
    uses: ./.github/workflows/_test_python.yml
    with:
      dev-image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/development:3.10_cuda_12.1
      runner: linux.8xlarge.nvidia.gpu
      timeout-minutes: 300
      collect-coverage: false
      install-cuda-plugin: true
    secrets:
      gcloud-service-key: ${{ secrets.GCLOUD_SERVICE_KEY }}

  test-tpu:
    name: 'TPU tests'
    needs: build-torch-xla
    # Only run this for HEAD and releases
    if: github.event_name == 'push'
    uses: ./.github/workflows/_tpu_ci.yml