From dde3602046cbeb9b0ad081ab206bc9af438e767c Mon Sep 17 00:00:00 2001 From: Richard Yan Date: Thu, 30 Jan 2025 01:34:22 -0800 Subject: [PATCH 1/2] disable prints for virgo gemm --- kernels/sgemm_gemmini_dma/kernel.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/kernels/sgemm_gemmini_dma/kernel.cpp b/kernels/sgemm_gemmini_dma/kernel.cpp index 8ae36bd8..5b6c3f71 100644 --- a/kernels/sgemm_gemmini_dma/kernel.cpp +++ b/kernels/sgemm_gemmini_dma/kernel.cpp @@ -53,7 +53,7 @@ #define PRINTF(...) sprintf(PRINT_BUF, __VA_ARGS__) // #define PRINTF(...) vx_printf(__VA_ARGS__) #define SWISH(beta, x) ((x) / (1 + exp(-(beta) * (x)))) -// #define POWER +#define POWER typedef uint16_t smem_elem_t; // typedef float smem_elem_t; From 2c1ac4e938cfc123cd35c8b20ab5f2b00f7d6066 Mon Sep 17 00:00:00 2001 From: Hansung Kim Date: Thu, 30 Jan 2025 01:47:35 -0800 Subject: [PATCH 2/2] Do git pull to make sure up-to-date --- kernels/flash_attention/compile_flash.sh | 1 + kernels/sgemm_gemmini_dma/compile_virgo.sh | 4 ++++ kernels/sgemm_tcore/compile_tcore.sh | 1 + 3 files changed, 6 insertions(+) diff --git a/kernels/flash_attention/compile_flash.sh b/kernels/flash_attention/compile_flash.sh index 5808508c..a2209047 100755 --- a/kernels/flash_attention/compile_flash.sh +++ b/kernels/flash_attention/compile_flash.sh @@ -27,6 +27,7 @@ ln -sf input.c.rand.fp32.seqlen1024headdim64.row.bin input.c.bin for arch in "${archs[@]}"; do git checkout ae-flash-$arch + git pull # re-compile libvortexrt.a # FIXME after restructure diff --git a/kernels/sgemm_gemmini_dma/compile_virgo.sh b/kernels/sgemm_gemmini_dma/compile_virgo.sh index f2deb04c..de9b4b38 100755 --- a/kernels/sgemm_gemmini_dma/compile_virgo.sh +++ b/kernels/sgemm_gemmini_dma/compile_virgo.sh @@ -1,5 +1,9 @@ #!/bin/sh +# hopper and virgo have the same SIMT configurations +git checkout ae-hopper +git pull + if [ !
-f input.a.rand01.fp16.m256n256k256.row.bin ]; then echo "input binaries not found, generating operands" python3 generate_operands.py diff --git a/kernels/sgemm_tcore/compile_tcore.sh b/kernels/sgemm_tcore/compile_tcore.sh index 128eb175..d338521b 100755 --- a/kernels/sgemm_tcore/compile_tcore.sh +++ b/kernels/sgemm_tcore/compile_tcore.sh @@ -53,6 +53,7 @@ done for arch in "${archs[@]}"; do git checkout ae-$arch + git pull # re-compile libvortexrt.a # FIXME after restructure