From 89ea181fd0c08049a198bd5efbcaeed0413242f0 Mon Sep 17 00:00:00 2001 From: victor-eds Date: Mon, 18 Nov 2024 23:32:29 +0000 Subject: [PATCH] Enable long loads (IGC_EnableVector8LoadStore=1) in flash attention fwd benchmarks --- .github/workflows/triton-benchmarks.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/triton-benchmarks.yml b/.github/workflows/triton-benchmarks.yml index 29792b6af3..c4ccb37195 100644 --- a/.github/workflows/triton-benchmarks.yml +++ b/.github/workflows/triton-benchmarks.yml @@ -243,7 +243,7 @@ jobs: if: ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'flash_attention_fwd_benchmark.py') }} run: | cd benchmarks/triton_kernels_benchmark - python flash_attention_fwd_benchmark.py --reports $REPORTS + IGC_EnableVector8LoadStore=1 python flash_attention_fwd_benchmark.py --reports $REPORTS source ../../scripts/capture-hw-details.sh python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-triton-report.csv --benchmark attn --compiler triton --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG @@ -255,7 +255,7 @@ jobs: cd benchmarks/triton_kernels_benchmark TRITON_INTEL_ADVANCED_PATH=0 \ TRITON_INTEL_ENABLE_ADDRESS_PAYLOAD_OPT=1 \ - IGC_VISAOptions=" -enableBCR" \ + IGC_EnableVector8LoadStore=1 IGC_VISAOptions=" -enableBCR" \ python flash_attention_fwd_benchmark.py --reports $REPORTS TAG="${TAG}-dflt"