diff --git a/.github/workflows/aws_tfhe_multi_gpu_tests.yml b/.github/workflows/aws_tfhe_multi_gpu_tests.yml index 75189f05f..5edeb280d 100644 --- a/.github/workflows/aws_tfhe_multi_gpu_tests.yml +++ b/.github/workflows/aws_tfhe_multi_gpu_tests.yml @@ -48,6 +48,10 @@ jobs: - tfhe/src/high_level_api/** - tfhe/src/c_api/** - 'tfhe/docs/**.md' + - Makefile + - '.github/workflows/aws_tfhe_multi_gpu**' + - scripts/** + - ci/** setup-instance: name: Setup instance (cuda-tests-multi-gpu) diff --git a/.github/workflows/integer_multi_bit_multi_gpu_benchmark.yml b/.github/workflows/integer_multi_bit_multi_gpu_benchmark.yml index 017e15d91..ad8f43177 100644 --- a/.github/workflows/integer_multi_bit_multi_gpu_benchmark.yml +++ b/.github/workflows/integer_multi_bit_multi_gpu_benchmark.yml @@ -49,7 +49,7 @@ jobs: slab-url: ${{ secrets.SLAB_BASE_URL }} job-secret: ${{ secrets.JOB_SECRET }} backend: hyperstack - profile: multi-h100-nvlink + profile: multi-h100 cuda-integer-multi-bit-multi-gpu-benchmarks: name: Execute multi GPU integer multi-bit benchmarks @@ -153,7 +153,7 @@ jobs: run: | python3 ./ci/benchmark_parser.py target/criterion ${{ env.RESULTS_FILENAME }} \ --database tfhe_rs \ - --hardware "n3-H100x8-NVLink" \ + --hardware "n3-H100x8" \ --backend gpu \ --project-version "${{ env.COMMIT_HASH }}" \ --branch ${{ github.ref_name }} \ diff --git a/.github/workflows/integer_multi_gpu_full_benchmark.yml b/.github/workflows/integer_multi_gpu_full_benchmark.yml index b19ed9fe5..677da988f 100644 --- a/.github/workflows/integer_multi_gpu_full_benchmark.yml +++ b/.github/workflows/integer_multi_gpu_full_benchmark.yml @@ -36,7 +36,7 @@ jobs: slab-url: ${{ secrets.SLAB_BASE_URL }} job-secret: ${{ secrets.JOB_SECRET }} backend: hyperstack - profile: multi-h100-nvlink + profile: multi-h100 cuda-integer-full-multi-gpu-benchmarks: name: Execute multi GPU integer benchmarks for all operations flavor @@ -133,7 +133,7 @@ jobs: run: | python3 ./ci/benchmark_parser.py target/criterion ${{ env.RESULTS_FILENAME }} \ --database tfhe_rs \ - --hardware "n3-H100x8-NVLink" \ + --hardware "n3-H100x8" \ --backend gpu \ --project-version "${{ env.COMMIT_HASH }}" \ --branch ${{ github.ref_name }} \ diff --git a/ci/ec2_products_cost.json b/ci/ec2_products_cost.json index 3e9de534c..3ae3da8c4 100644 --- a/ci/ec2_products_cost.json +++ b/ci/ec2_products_cost.json @@ -7,5 +7,8 @@ "p5.48xlarge": 98.32, "rtx4090": 0.04, "n3-H100x1": 4.30, - "n3-H100x8-NVLink": 22.6 + "n3-H100x8-NVLink": 22.6, + "n3-H100x8": 22.016, + "n3-H100x4": 11.008, + "n3-H100x2": 5.504 } diff --git a/ci/slab.toml b/ci/slab.toml index 4d5203d43..8c6179be5 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -43,6 +43,11 @@ environment_name = "canada" image_name = "Ubuntu Server 22.04 LTS R535 CUDA 12.2" flavor_name = "n3-H100x1" +[backend.hyperstack.multi-h100] +environment_name = "canada" +image_name = "Ubuntu Server 22.04 LTS R535 CUDA 12.2" +flavor_name = "n3-H100x8" + [backend.hyperstack.multi-h100-nvlink] environment_name = "canada" image_name = "Ubuntu Server 22.04 LTS R535 CUDA 12.2"