Gpt2 benchmark with HALF and BEAM (#2636)

* benchmark gpt2 with half and beam

* BEAM=4

* optional validation

* green is good

* we care
This commit is contained in:
chenyu
2023-12-05 22:15:16 -05:00
committed by GitHub
parent a73579919f
commit 229ada5fe5
2 changed files with 18 additions and 2 deletions

View File

@@ -81,6 +81,8 @@ jobs:
run: |
CUDA=1 JIT=0 python3 examples/gpt2.py --prompt "Hello." --count 10 --temperature 0 --timing | tee gpt2_unjitted.txt
CUDA=1 JIT=1 python3 examples/gpt2.py --prompt "Hello." --count 10 --temperature 0 --timing | tee gpt2_jitted.txt
- name: Run GPT2 w HALF/BEAM
  # Runs examples/gpt2.py on CUDA with JIT=1, HALF=1 and BEAM=4 and tees the
  # --timing output into gpt2_half_beam.txt.
  # NOTE(review): CACHELEVEL=0 presumably turns caching off so every run
  # measures uncached work; confirm against the project's env-var docs.
  run: |
    # The pipeline's exit status is tee's unless pipefail is set, so without it
    # a crash in gpt2.py would still leave this step green (GitHub's default
    # `bash -e {0}` shell does not enable pipefail unless a shell is specified).
    set -o pipefail
    CUDA=1 JIT=1 HALF=1 BEAM=4 CACHELEVEL=0 python3 examples/gpt2.py --count 10 --temperature 0 --timing | tee gpt2_half_beam.txt
- uses: actions/upload-artifact@v3
with:
name: Speed (NVIDIA)
@@ -89,6 +91,7 @@ jobs:
torch_speed.txt
gpt2_unjitted.txt
gpt2_jitted.txt
gpt2_half_beam.txt
testamdbenchmark:
name: AMD Benchmark