9 Commits

Author SHA1 Message Date
Virgo-AE Eval
c24585570d Merge branch 'ae' into ae-flash-virgo 2025-02-07 14:53:04 -08:00
Richard Yan
8071faf7c2 Merge branch 'ae' into ae-flash-virgo 2025-01-31 03:53:39 -08:00
Richard Yan
a4bd41392c Merge branch 'ae' into ae-flash-virgo 2025-01-30 23:42:05 -08:00
Hansung Kim
692f3dddff Merge branch 'ae' into ae-flash-virgo 2025-01-30 13:25:00 -08:00
Hansung Kim
c75ed0d531 Merge branch 'ae' into ae-flash-virgo 2025-01-30 01:49:05 -08:00
Hansung Kim
96500e0abc Turn off TENSOR_HOPPER for Virgo flash 2025-01-30 01:23:01 -08:00
Hansung Kim
4f12227327 Increase SMEM size for flash 2025-01-30 01:17:38 -08:00
Hansung Kim
efd2d232fe Merge branch 'ae' into ae-flash-virgo 2025-01-30 01:16:23 -08:00
Hansung Kim
b97df2ce6a Switch to fp32 for flash 2025-01-30 01:12:32 -08:00
3 changed files with 5 additions and 5 deletions

View File

@@ -6,7 +6,7 @@
#include "include/gemmini.h"
#include "gemmini_mmio.h"
-#define FP_SIZE 16
+#define FP_SIZE 32
// "fake" fp16 type that only has the correct data width.
using float16_t = uint16_t;
@@ -19,7 +19,7 @@ using float_type = float16_t;
// Generate kernel for the Hopper-style SMEM-decoupled tensor core. This uses
// asynchronous HGMMA and HGMMA_WAIT instructions.
-#define TENSOR_HOPPER 1
+#define TENSOR_HOPPER 0
// Constraints on parameters:
// * Memory:

View File

@@ -1 +1 @@
-gemmini_params.dim16fp16.h
+gemmini_params.dim8fp32.h

View File

@@ -12,9 +12,9 @@
// 64KB
// #define SMEM_SIZE 0x10000
// 128KB (FP16 GEMM)
-#define SMEM_SIZE 0x20000
+// #define SMEM_SIZE 0x20000
// 256KB (FlashAttention)
-// #define SMEM_SIZE 0x40000
+#define SMEM_SIZE 0x40000
#define SMEM_MASK (SMEM_SIZE - 1)
#define SMEM_ADDR_END (SMEM_BASE + SMEM_SIZE)