vortex/tests/opencl/sgemm/kernel.cl
Blaise Tine c1e168fdbe Vortex 2.0 changes:
+ Microarchitecture optimizations
+ 64-bit support
+ Xilinx FPGA support
+ LLVM-16 support
+ Refactoring and quality control fixes

minor update

minor update

minor update

minor update

minor update

minor update

cleanup

cleanup

cache bindings and memory perf refactoring

minor update

minor update

hw unit tests fixes

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor update

minor updates

minor updates

minor update

minor update

minor update

minor update

minor update

minor update

minor updates

minor updates

minor updates

minor updates

minor update

minor update
2023-11-10 02:47:05 -08:00

20 lines
471 B
Common Lisp

#include "common.h"
/*
 * sgemm - multiply two square N x N matrices, C = A * B.
 *
 * Each work-item produces exactly one element of C, selected by its global
 * IDs: dimension 0 gives the row (r), dimension 1 gives the column (c).
 *
 * All three buffers are indexed as [col * N + row], i.e. element (row, col)
 * of a matrix lives at offset col * N + row.
 *
 * A, B : input matrices, N * N elements each (read-only).
 * C    : output matrix, N * N elements.
 * N    : matrix dimension.
 *
 * TYPE is not defined in this block; presumably it comes from common.h.
 *
 * Work-items whose IDs fall outside the N x N range return without touching
 * memory, so the host may round the global work size up (e.g. to a multiple
 * of the work-group size) without causing out-of-bounds accesses.
 */
__kernel void sgemm (__global const TYPE *A,
                     __global const TYPE *B,
                     __global TYPE *C,
                     int N)
{
    // Thread identifiers
    const int r = get_global_id(0); // Row ID
    const int c = get_global_id(1); // Col ID

    // Skip padding work-items: they have no element of C to compute and
    // would otherwise read A/B and write C past the end of the buffers.
    if (r >= N || c >= N) {
        return;
    }

    // Compute a single element (loop over K)
    TYPE acc = 0;
    for (int k = 0; k < N; k++) {
        acc += A[k * N + r] * B[c * N + k];
    }

    // Store the result
    C[c * N + r] = acc;
}