# Patch summary (commentary only; the patch itself starts at the "diff --git" header below).
#
# Target file: .github/workflows/benchmark.yml, job `testamdbenchmark`.
#
# Hunk 1 (-96,8 +96,8):
#   - Job display name changes from "AMD Benchmark" to "tinybox Benchmark".
#   - Runner labels change from [self-hosted, Linux, ROCM] to [self-hosted, Linux, tinybox].
#   - The job key `testamdbenchmark` itself is unchanged.
#
# Hunk 2 (-107,9 +107,10):
#   - Adds a "Show off tinybox" step that runs /opt/rocm/bin/rocm-bandwidth-test
#     right after the checkout step.
#   - Removes the `ln -s` of weights/sd-v1-4.ckpt from "Symlink models and datasets".
#   - NOTE(review): the "Run Stable Diffusion" step is still present as context in hunk 3;
#     confirm examples/stable_diffusion.py can obtain its checkpoint without this symlink.
#
# Hunk 3 (-121,10 +122,11):
#   - Replaces the "Run LLaMA" step with a commented-out copy under
#     "TODO: rocm 6.0 broke this".
#   - NOTE(review): llama_unjitted.txt / llama_jitted.txt are no longer produced; any
#     later step that reads them is not visible in this patch -- verify.
#
# NOTE(review): the patch text below is stored on a single line; the per-line hunk
# layout presumably has to be restored before it can be applied -- confirm against
# the original commit.
diff --git a/.github/workflows/benchmark.yml b/.github/workflows/benchmark.yml index 40939472..286231cc 100644 --- a/.github/workflows/benchmark.yml +++ b/.github/workflows/benchmark.yml @@ -96,8 +96,8 @@ jobs: gpt2_half_beam.txt testamdbenchmark: - name: AMD Benchmark - runs-on: [self-hosted, Linux, ROCM] + name: tinybox Benchmark + runs-on: [self-hosted, Linux, tinybox] defaults: run: shell: bash -o pipefail {0} @@ -107,9 +107,10 @@ jobs: steps: - name: Checkout Code uses: actions/checkout@v3 + - name: Show off tinybox + run: /opt/rocm/bin/rocm-bandwidth-test - name: Symlink models and datasets run: | - ln -s ~/tinygrad/weights/sd-v1-4.ckpt weights/sd-v1-4.ckpt ln -s ~/tinygrad/weights/bpe_simple_vocab_16e6.txt.gz weights/bpe_simple_vocab_16e6.txt.gz ln -s ~/tinygrad/weights/LLaMA weights/LLaMA ln -s ~/tinygrad/extra/datasets/cifar-10-python.tar.gz extra/datasets/cifar-10-python.tar.gz @@ -121,10 +122,11 @@ jobs: run: HIP=1 HALF=1 DEBUG=2 python3 extra/gemm/simple_matmul.py | tee matmul.txt - name: Run Stable Diffusion run: python3 examples/stable_diffusion.py --seed 0 --noshow --timing | tee sd.txt - - name: Run LLaMA - run: | - JIT=0 python3 examples/llama.py --gen 1 --prompt "Hello." --count 10 --temperature 0 --timing | tee llama_unjitted.txt - JIT=1 python3 examples/llama.py --gen 1 --prompt "Hello." --count 10 --temperature 0 --timing | tee llama_jitted.txt + # TODO: rocm 6.0 broke this + #- name: Run LLaMA + # run: | + # JIT=0 python3 examples/llama.py --gen 1 --prompt "Hello." --count 10 --temperature 0 --timing | tee llama_unjitted.txt + # JIT=1 python3 examples/llama.py --gen 1 --prompt "Hello." --count 10 --temperature 0 --timing | tee llama_jitted.txt - name: Run GPT2 (with HIP) run: | HIP=1 JIT=0 python3 examples/gpt2.py --prompt "Hello." --count 10 --temperature 0 --timing | tee gpt2_unjitted.txt