diff options
author | Nicolas Patry <patry.nicolas@protonmail.com> | 2024-02-13 19:06:15 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-02-13 19:06:15 +0100 |
commit | 14010a8498af3383b004be1f55a2fa39bce5389d (patch) | |
tree | ae6e4e5b74999317b374e4a2b294bfdd7ff421f2 /.github | |
parent | 0de079522023002b74127a7767a13d6c1e8b007c (diff) | |
download | candle-14010a8498af3383b004be1f55a2fa39bce5389d.tar.gz candle-14010a8498af3383b004be1f55a2fa39bce5389d.tar.bz2 candle-14010a8498af3383b004be1f55a2fa39bce5389d.zip |
Update our cuda runner. (#1705)
* Update our cuda runner.
* Fix install rust.
* Simplify.
* Docker in docker.
* Install curl
* Install curl
* No sudo.
* devel
* Put curl again.
* Add missing deps.
* pkg-config.
* Cleanup.
Diffstat (limited to '.github')
-rw-r--r-- | .github/workflows/ci_cuda.yaml | 74 |
1 files changed, 9 insertions, 65 deletions
diff --git a/.github/workflows/ci_cuda.yaml b/.github/workflows/ci_cuda.yaml index 02814ed7..0c874e24 100644 --- a/.github/workflows/ci_cuda.yaml +++ b/.github/workflows/ci_cuda.yaml @@ -5,49 +5,15 @@ on: pull_request: jobs: - start-runner: - name: Start self-hosted EC2 runner - runs-on: ubuntu-latest - # Don't run on forks, they won't have access to secrets anyway. - if: ${{ github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }} - env: - AWS_REGION: us-east-1 - EC2_AMI_ID: ami-03cfed9ea28f4b002 - EC2_INSTANCE_TYPE: g5.xlarge - EC2_SUBNET_ID: subnet-931b34f5,subnet-ecb993cd,subnet-943dc2d8,subnet-45371f1a,subnet-ee93e0df,subnet-fddc3dfc - EC2_SECURITY_GROUP: sg-030175c435ac141d6 - outputs: - label: ${{ steps.start-ec2-runner.outputs.label }} - ec2-instance-id: ${{ steps.start-ec2-runner.outputs.ec2-instance-id }} - steps: - - name: Configure AWS credentials - uses: aws-actions/configure-aws-credentials@v1 - with: - aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }} - aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }} - aws-region: ${{ env.AWS_REGION }} - - name: Start EC2 runner - id: start-ec2-runner - uses: philschmid/philschmid-ec2-github-runner@main - with: - mode: start - github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }} - ec2-image-id: ${{ env.EC2_AMI_ID }} - ec2-instance-type: ${{ env.EC2_INSTANCE_TYPE }} - subnet-id: ${{ env.EC2_SUBNET_ID }} - security-group-id: ${{ env.EC2_SECURITY_GROUP }} - aws-resource-tags: > # optional, requires additional permissions - [ - {"Key": "Name", "Value": "ec2-tgi-github-runner"}, - {"Key": "GitHubRepository", "Value": "${{ github.repository }}"} - ] - test-cuda: concurrency: group: ${{ github.workflow }}-${{ github.job }}-${{ github.head_ref || github.run_id }} cancel-in-progress: true - needs: start-runner # required to start the main job when the runner is ready - runs-on: ${{ needs.start-runner.outputs.label }} # run the job on the newly created runner + runs-on: [single-gpu, nvidia-gpu, t4, ci] + container: + image: nvidia/cuda:12.3.1-devel-ubuntu22.04 + options: --gpus 0 + if: ${{ github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }} permissions: contents: write packages: write @@ -58,32 +24,10 @@ jobs: steps: - name: Checkout repository uses: actions/checkout@v3 + - name: Install dependencies + run: apt-get update && apt install curl build-essential libssl-dev protobuf-compiler pkg-config -y - name: Install Rust Stable - run: curl https://sh.rustup.rs -sSf | sh -s -- -y + uses: actions-rust-lang/setup-rust-toolchain@v1 - uses: Swatinem/rust-cache@v2 - - run: apt-get update -y && apt-get install libssl-dev protobuf-compiler -y - name: Test (cuda) - run: PATH=$PATH:/usr/local/cuda-11.8/bin/ /root/.cargo/bin/cargo test --features cuda - stop-runner: - name: Stop self-hosted EC2 runner - needs: - - start-runner - - test-cuda - runs-on: ubuntu-latest - env: - AWS_REGION: us-east-1 - if: ${{ (success() || failure()) && github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }} # required to stop the runner even if the error happened in the previous jobs - steps: - - name: Configure AWS credentials - uses: aws-actions/configure-aws-credentials@v1 - with: - aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }} - aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }} - aws-region: ${{ env.AWS_REGION }} - - name: Stop EC2 runner - uses: philschmid/philschmid-ec2-github-runner@main - with: - mode: stop - github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }} - label: ${{ needs.start-runner.outputs.label }} - ec2-instance-id: ${{ needs.start-runner.outputs.ec2-instance-id }} + run: cargo test --features cuda |