Merge branch 'ae' into ae-hopper

2025-02-07 14:52:27 -08:00 · 2025-01-31 03:53:00 -08:00 · 2025-01-30 23:40:48 -08:00 · 2025-01-30 15:34:58 -08:00 · 2025-01-30 13:24:50 -08:00 · 2025-01-30 01:48:09 -08:00
3 changed files with 5 additions and 5 deletions
--- a/kernels/sgemm_tcore/sgemm_impl.hpp
+++ b/kernels/sgemm_tcore/sgemm_impl.hpp
@@ -6,7 +6,7 @@
 #include "include/gemmini.h"
 #include "gemmini_mmio.h"

-#define FP_SIZE 32
+#define FP_SIZE 16

 // "fake" fp16 type that only has the correct data width.
 using float16_t = uint16_t;
@@ -19,7 +19,7 @@ using float_type = float16_t;

 // Generate kernel for the Hopper-style SMEM-decoupled tensor core.  This uses
 // asynchronous HGMMA and HGMMA_WAIT instructions.
-#define TENSOR_HOPPER 0
+#define TENSOR_HOPPER 1

 // Constraints on parameters:
 // * Memory:
--- a/lib/gemmini/include/gemmini_params.h
+++ b/lib/gemmini/include/gemmini_params.h
@@ -1 +1 @@
-gemmini_params.dim8fp32.h
+gemmini_params.dim16fp16.h
--- a/lib/include/gemmini_mmio.h
+++ b/lib/include/gemmini_mmio.h
@@ -12,9 +12,9 @@
 // 64KB
 // #define SMEM_SIZE 0x10000
 // 128KB (FP16 GEMM)
-// #define SMEM_SIZE 0x20000
+#define SMEM_SIZE 0x20000
 // 256KB (FlashAttention)
-#define SMEM_SIZE 0x40000
+// #define SMEM_SIZE 0x40000

 #define SMEM_MASK (SMEM_SIZE - 1)
 #define SMEM_ADDR_END (SMEM_BASE + SMEM_SIZE)
Author	SHA1	Message	Date
Virgo-AE Eval	0884ba6fcb	Merge branch 'ae' into ae-hopper	2025-02-07 14:52:27 -08:00
Richard Yan	fd2fe71ca1	Merge branch 'ae' into ae-hopper	2025-01-31 03:53:00 -08:00
Richard Yan	8d71815809	Merge branch 'ae' into ae-hopper	2025-01-30 23:40:48 -08:00
Richard Yan	63f476eb83	Merge branch 'ae' into ae-hopper	2025-01-30 15:34:58 -08:00
Hansung Kim	0711f5f7a3	Merge branch 'ae' into ae-hopper	2025-01-30 13:24:50 -08:00
Hansung Kim	97227577b5	Merge branch 'ae' into ae-hopper	2025-01-30 01:48:09 -08:00
Richard Yan	3cd6aacc17	Merge branch 'ae' into ae-hopper	2025-01-30 01:35:10 -08:00