opencl sgemm benchmark

This commit is contained in:
Blaise Tine
2019-11-21 00:41:17 -05:00
parent f3e2bacee7
commit 2dcd0ddfdc
9 changed files with 570 additions and 5 deletions

View File

@@ -0,0 +1,9 @@
/*
 * sgemm: accumulate a matrix product into C.
 *
 * For the work-item ids i (dimension 0), m (dimension 1) and n (dimension 2)
 * the kernel computes
 *
 *     C[i + n*ldc] += sum over m of A[m + n*ldc] * B[m*ldc + i]
 *
 * A   - first input operand, read only
 * B   - second input operand, read only
 * C   - accumulator; its existing contents are added to, not overwritten
 * ldc - stride used when indexing all three buffers
 *
 * Dimension 1 of the NDRange is the reduction axis. All work-items that share
 * the same (i, n) target the same element of C, so letting each of them do its
 * own read-modify-write on C is a data race: global memory is not kept
 * consistent between work-items without atomics or barriers, and partial
 * products would be lost. To keep the host-side launch geometry unchanged,
 * only the first work-item along dimension 1 performs the reduction (in a
 * private accumulator) and writes the result once; the others exit.
 */
__kernel void sgemm(__global const float *A, __global const float *B, __global float *C, int ldc)
{
    long i = get_global_id(0);
    long m = get_global_id(1);
    long n = get_global_id(2);

    /* Range of ids covered by dimension 1, honouring any global work offset. */
    long m_begin = get_global_offset(1);
    long m_end = m_begin + (long)get_global_size(1);

    /* Elect a single writer per (i, n) so C is updated without a race. */
    if (m != m_begin) {
        return;
    }

    float acc = C[i + n * ldc];
    for (long k = m_begin; k < m_end; ++k) {
        acc += A[k + n * ldc] * B[k * ldc + i];
    }
    C[i + n * ldc] = acc;
}