sgemm_tcore: Verify wo DMA; warn untested against K-major A + DMA

This commit is contained in:
Hansung Kim
2024-09-03 14:42:19 -07:00
parent 7aa0e6cbe4
commit f028a97f75
2 changed files with 3 additions and 2 deletions

View File

@@ -120,7 +120,6 @@ inline void thread_block_copy_tile(const float *src, float *dest,
constexpr uint32_t per_row_iter = B_COL / NUM_THREADS;
uint32_t thread_offset = first_thread_offset + tid_in_warp;
float per_thread_max = FLT_MIN;
#pragma GCC unroll
for (int i = 0; i < per_row_iter; i++) {
dest[thread_offset] = src[thread_offset];