summaryrefslogtreecommitdiff
path: root/.github
diff options
context:
space:
mode:
authorNicolas Patry <patry.nicolas@protonmail.com>2024-02-13 19:06:15 +0100
committerGitHub <noreply@github.com>2024-02-13 19:06:15 +0100
commit14010a8498af3383b004be1f55a2fa39bce5389d (patch)
treeae6e4e5b74999317b374e4a2b294bfdd7ff421f2 /.github
parent0de079522023002b74127a7767a13d6c1e8b007c (diff)
downloadcandle-14010a8498af3383b004be1f55a2fa39bce5389d.tar.gz
candle-14010a8498af3383b004be1f55a2fa39bce5389d.tar.bz2
candle-14010a8498af3383b004be1f55a2fa39bce5389d.zip
Update our cuda runner. (#1705)
* Update our cuda runner. * Fix install rust. * Simplify. * Docker in docker. * Install curl * Install curl * No sudo. * devel * Put curl again. * Add missing deps. * pkg-config. * Cleanup.
Diffstat (limited to '.github')
-rw-r--r--.github/workflows/ci_cuda.yaml74
1 files changed, 9 insertions, 65 deletions
diff --git a/.github/workflows/ci_cuda.yaml b/.github/workflows/ci_cuda.yaml
index 02814ed7..0c874e24 100644
--- a/.github/workflows/ci_cuda.yaml
+++ b/.github/workflows/ci_cuda.yaml
@@ -5,49 +5,15 @@ on:
pull_request:
jobs:
- start-runner:
- name: Start self-hosted EC2 runner
- runs-on: ubuntu-latest
- # Don't run on forks, they won't have access to secrets anyway.
- if: ${{ github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }}
- env:
- AWS_REGION: us-east-1
- EC2_AMI_ID: ami-03cfed9ea28f4b002
- EC2_INSTANCE_TYPE: g5.xlarge
- EC2_SUBNET_ID: subnet-931b34f5,subnet-ecb993cd,subnet-943dc2d8,subnet-45371f1a,subnet-ee93e0df,subnet-fddc3dfc
- EC2_SECURITY_GROUP: sg-030175c435ac141d6
- outputs:
- label: ${{ steps.start-ec2-runner.outputs.label }}
- ec2-instance-id: ${{ steps.start-ec2-runner.outputs.ec2-instance-id }}
- steps:
- - name: Configure AWS credentials
- uses: aws-actions/configure-aws-credentials@v1
- with:
- aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
- aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
- aws-region: ${{ env.AWS_REGION }}
- - name: Start EC2 runner
- id: start-ec2-runner
- uses: philschmid/philschmid-ec2-github-runner@main
- with:
- mode: start
- github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }}
- ec2-image-id: ${{ env.EC2_AMI_ID }}
- ec2-instance-type: ${{ env.EC2_INSTANCE_TYPE }}
- subnet-id: ${{ env.EC2_SUBNET_ID }}
- security-group-id: ${{ env.EC2_SECURITY_GROUP }}
- aws-resource-tags: > # optional, requires additional permissions
- [
- {"Key": "Name", "Value": "ec2-tgi-github-runner"},
- {"Key": "GitHubRepository", "Value": "${{ github.repository }}"}
- ]
-
test-cuda:
concurrency:
group: ${{ github.workflow }}-${{ github.job }}-${{ github.head_ref || github.run_id }}
cancel-in-progress: true
- needs: start-runner # required to start the main job when the runner is ready
- runs-on: ${{ needs.start-runner.outputs.label }} # run the job on the newly created runner
+ runs-on: [single-gpu, nvidia-gpu, t4, ci]
+ container:
+ image: nvidia/cuda:12.3.1-devel-ubuntu22.04
+ options: --gpus 0
+ if: ${{ github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }}
permissions:
contents: write
packages: write
@@ -58,32 +24,10 @@ jobs:
steps:
- name: Checkout repository
uses: actions/checkout@v3
+ - name: Install dependencies
+ run: apt-get update && apt install curl build-essential libssl-dev protobuf-compiler pkg-config -y
- name: Install Rust Stable
- run: curl https://sh.rustup.rs -sSf | sh -s -- -y
+ uses: actions-rust-lang/setup-rust-toolchain@v1
- uses: Swatinem/rust-cache@v2
- - run: apt-get update -y && apt-get install libssl-dev protobuf-compiler -y
- name: Test (cuda)
- run: PATH=$PATH:/usr/local/cuda-11.8/bin/ /root/.cargo/bin/cargo test --features cuda
- stop-runner:
- name: Stop self-hosted EC2 runner
- needs:
- - start-runner
- - test-cuda
- runs-on: ubuntu-latest
- env:
- AWS_REGION: us-east-1
- if: ${{ (success() || failure()) && github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }} # required to stop the runner even if the error happened in the previous jobs
- steps:
- - name: Configure AWS credentials
- uses: aws-actions/configure-aws-credentials@v1
- with:
- aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
- aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
- aws-region: ${{ env.AWS_REGION }}
- - name: Stop EC2 runner
- uses: philschmid/philschmid-ec2-github-runner@main
- with:
- mode: stop
- github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }}
- label: ${{ needs.start-runner.outputs.label }}
- ec2-instance-id: ${{ needs.start-runner.outputs.ec2-instance-id }}
+ run: cargo test --features cuda