forked from aws/aws-ofi-nccl
-
Notifications
You must be signed in to change notification settings - Fork 0
77 lines (71 loc) · 2.16 KB
/
distcheck.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
# Workflow header: display name, triggering events, and shared environment.
name: PR CI

# Run on every push and on every pull request event.
on:
  - push
  - pull_request

env:
  # Space-separated list of Ubuntu packages needed to build libfabric and the
  # plugin. The folded scalar (>-) joins the lines below with single spaces
  # and drops the trailing newline, so the value can be passed straight to
  # `apt-get install`.
  APT_PACKAGES: >-
    build-essential
    clang
    gcc
    git
    libhwloc-dev
    make
jobs:
  # Builds libfabric from source, then builds the plugin against it and runs
  # `make check` and `make distcheck`, once per compiler/SDK combination.
  distcheck:
    runs-on: ubuntu-22.04
    strategy:
      matrix:
        cc:
          - gcc
          - clang
        sdk:
          - cuda
          - neuron
      # Keep the remaining matrix legs running when one of them fails.
      fail-fast: false
    steps:
      - name: Install Dependencies
        run: |
          sudo apt-get update -y
          sudo apt-get install -y ${{ env.APT_PACKAGES }}

      - name: Install CUDA SDK
        if: matrix.sdk == 'cuda'
        run: |
          sudo apt-get install -y nvidia-cuda-toolkit

      - name: Install Neuron SDK
        if: matrix.sdk == 'neuron'
        run: |
          # Configure Linux for Neuron repository updates
          . /etc/os-release
          sudo tee /etc/apt/sources.list.d/neuron.list > /dev/null << EOC
          deb https://apt.repos.neuron.amazonaws.com ${VERSION_CODENAME} main
          EOC
          wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add -
          # Refresh the package index: the earlier update ran before the
          # Neuron repository was added, so apt does not know its packages yet.
          sudo apt-get update -y
          # Install Neuron Runtime
          sudo apt-get install aws-neuronx-runtime-lib -y

      - uses: actions/checkout@v4

      # NOTE(review): this is the only build step and it is gated on the CUDA
      # SDK, so the neuron matrix legs install the runtime and check out the
      # source but never build anything. Confirm whether a Neuron build step
      # is intended.
      - name: Build and Distribution Checks (CUDA)
        if: matrix.sdk == 'cuda'
        run: |
          set -x
          # We're just doing distchecks, so it is fine if we
          # just grab the latest master.
          git clone --depth 1 https://github.com/ofiwg/libfabric.git
          pushd libfabric
          ./autogen.sh
          ./configure --prefix=$PWD/install CC=${{ matrix.cc }}
          make -j $(nproc)
          make install
          popd
          # actions/checkout@v4 would drop the plugin source in $PWD,
          # so go ahead and build it
          ./autogen.sh
          ./configure --with-libfabric=$PWD/libfabric/install --with-cuda=/usr/local/cuda/ CC=${{ matrix.cc }}
          make -j $(nproc)
          # Run Unit tests
          make check
          # Run dist tarball checks
          make distcheck

      - name: Upload build logs
        if: failure()
        uses: actions/upload-artifact@v4
        with:
          # Include both matrix dimensions: upload-artifact@v4 rejects a second
          # upload to an existing artifact name within the same run, and legs
          # that share a compiler would otherwise collide.
          name: ${{ matrix.cc }}-${{ matrix.sdk }}-config.log
          path: config.log