Skip to content

Workflow file for this run

# Workflow: runs the Rust GPU test job defined under `jobs` on every push.
name: Rust GPU Tests

on: push

# Runs sharing the same group key are serialized. The key is the workflow name
# plus the first non-empty value among the pull-request head label, the head
# ref, and the pushed ref. A newer run cancels an in-flight run of the same
# group.
concurrency:
  cancel-in-progress: true
  group: '${{ github.workflow }} @ ${{ github.event.pull_request.head.label || github.head_ref || github.ref }}'
jobs:
  # End-to-end test job. Runs on the runner labelled `gpu`, installs the
  # NVIDIA driver / CUDA 12.1 packages, builds and installs NCCL from the
  # `nccl` directory, then runs the Rust tests matching `e2e`.
  e2e:
    runs-on: gpu
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - name: Show errors inline
        uses: r7kamura/rust-problem-matchers@v1

      - name: Install apt dependencies
        run: sudo apt-get update && sudo apt-get install -y pkg-config libssl-dev

      - name: Install CUDA and NCCL dependencies
        env:
          # NOTE(review): sudo may reset the environment, in which case this
          # variable never reaches apt-get/dpkg — confirm on the runner.
          DEBIAN_FRONTEND: noninteractive
        run: |
          # Quote the pattern so the shell passes it to apt unexpanded, and
          # answer prompts with -y: nothing can confirm interactively in CI.
          sudo apt-get purge -y 'nvidia-*'
          sudo apt-get autoremove -y
          wget -q https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.0-1_all.deb
          sudo dpkg -i cuda-keyring_1.0-1_all.deb
          sudo apt-get update
          sudo apt-get -y install -f \
            nvidia-dkms-555 \
            nvidia-dkms-555-open \
            nvidia-kernel-common-555 \
            nvidia-driver-555 \
            nvidia-driver-555-open \
            cuda-drivers-555 \
            cuda-drivers \
            cuda-demo-suite-12-1 \
            cuda-runtime-12-1 \
            cuda-12-1
          # NOTE(review): assumes an `nccl` source directory exists in the
          # checkout (a git submodule would need `submodules: true` on the
          # checkout step) — TODO confirm.
          cd nccl
          make -j4 pkg.debian.build
          sudo dpkg -i build/pkg/deb/libnccl*.deb

      - name: Install Rust nightly
        uses: dtolnay/rust-toolchain@master
        with:
          toolchain: nightly

      - name: E2E Tests
        run: cargo test --release e2e
        env:
          # NCCL tuning for this runner: disable direct P2P access and select
          # the socket network transport.
          NCCL_P2P_DIRECT_DISABLE: "1"
          NCCL_NET: Socket