minor update

This commit is contained in:
Blaise Tine 2024-02-14 14:24:29 -08:00
parent f13a885815
commit a78ac7a246
4 changed files with 14 additions and 14 deletions

View file

@@ -14,7 +14,7 @@ all:
 $(MAKE) -C oclprintf
 $(MAKE) -C blackscholes
 $(MAKE) -C transpose
-$(MAKE) -C convolution
+$(MAKE) -C conv3
 run-simx:
 $(MAKE) -C vecadd run-simx
@@ -32,7 +32,7 @@ run-simx:
 $(MAKE) -C oclprintf run-simx
 $(MAKE) -C blackscholes run-simx
 $(MAKE) -C transpose run-simx
-$(MAKE) -C convolution run-simx
+$(MAKE) -C conv3 run-simx
 run-rtlsim:
 $(MAKE) -C vecadd run-rtlsim
@@ -50,7 +50,7 @@ run-rtlsim:
 $(MAKE) -C lbm run-rtlsim
 $(MAKE) -C oclprintf run-rtlsim
 $(MAKE) -C blackscholes run-rtlsim
-$(MAKE) -C convolution run-rtlsim
+$(MAKE) -C conv3 run-rtlsim
 run-opae:
 $(MAKE) -C vecadd run-opae
@@ -68,7 +68,7 @@ run-opae:
 $(MAKE) -C lbm run-opae
 $(MAKE) -C oclprintf run-opae
 $(MAKE) -C blackscholes run-opae
-$(MAKE) -C convolution run-opae
+$(MAKE) -C conv3 run-opae
 clean:
 $(MAKE) -C vecadd clean
@@ -86,7 +86,7 @@ clean:
 $(MAKE) -C lbm clean
 $(MAKE) -C oclprintf clean
 $(MAKE) -C blackscholes clean
-$(MAKE) -C convolution clean
+$(MAKE) -C conv3 clean
 clean-all:
 $(MAKE) -C vecadd clean-all
@@ -104,4 +104,4 @@ clean-all:
 $(MAKE) -C lbm clean-all
 $(MAKE) -C oclprintf clean-all
 $(MAKE) -C blackscholes clean-all
-$(MAKE) -C convolution clean-all
+$(MAKE) -C conv3 clean-all

View file

@@ -1,4 +1,4 @@
-PROJECT = convolution
+PROJECT = conv3
 SRCS = main.cc

View file

@@ -1,8 +1,8 @@
-__kernel void conv3x3(__global float* output,
-__global float* input,
-__global float* weights,
-const int width,
-const int height)
+__kernel void conv3(__global float* output,
+__global float* input,
+__global float* weights,
+const int width,
+const int height)
 {
 int x = get_global_id(0);
 int y = get_global_id(1);
@@ -12,7 +12,7 @@ __kernel void conv3x3(__global float* output,
 int paddedX = x + 1;
 int paddedY = y + 1;
-// Compute the convolution sum
+// Compute 3x3 convolution sum
 float sum = 0.0f;
 sum += input[(paddedY - 1) * paddedWidth + (paddedX - 1)] * weights[0]; // Top-left

View file

@@ -10,7 +10,7 @@
 #define FLOAT_ULP 6
-#define KERNEL_NAME "conv3x3"
+#define KERNEL_NAME "conv3"
 #define CL_CHECK(_expr) \
 do { \