#include #include #include #include #include #include #include #include typedef struct { unsigned * x; unsigned * y; unsigned * z; unsigned numColums; unsigned numRows; } mat_add_args_t; unsigned x[] = {5, 5, 5, 5, 6, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 8}; unsigned y[] = {1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}; unsigned z[] = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}; void mat_add_kernel(void * void_arguments) { mat_add_args_t * arguments = (mat_add_args_t *) void_arguments; unsigned wid = vx_warp_id(); unsigned tid = vx_thread_id(); bool valid = (wid < arguments->numRows) && (tid < arguments->numColums); __if (valid) { unsigned index = (wid * arguments->numColums) + tid; arguments->z[index] = arguments->x[index] + arguments->y[index]; } __endif } void vx_print_mat(unsigned * matPtr, int numRows, int numCols) { vx_printf("---------------------\n"); for (int i = 0; i < numRows; i++) { for (int j = 0; j < numCols; j++) { unsigned index = (i * numCols) + j; vx_printf("0x%x ", matPtr[index]); } vx_printf("\n"); } } int main() { // Main is called with all threads active of warp 0 vx_tmc(1); // void * hellp = malloc(4); vx_printf("Confirm Dev Main\n"); vx_printf("vx_spawn_warps\n"); mat_add_args_t arguments; arguments.x = x; arguments.y = y; arguments.z = z; arguments.numColums = 4; arguments.numRows = 4; int numWarps = 4; int numThreads = 4; // First kernel call vx_spawn_warps(numWarps, numThreads, mat_add_kernel, &arguments); vx_print_mat(z, arguments.numRows, arguments.numColums); arguments.x = z; arguments.y = y; arguments.z = z; arguments.numColums = 4; arguments.numRows = 4; // Second Kernel Call vx_spawn_warps(numWarps, numThreads, mat_add_kernel, &arguments); vx_print_mat(z, arguments.numRows, arguments.numColums); vx_prints("Passed!\n"); return 0; }