mirror of
https://github.com/vortexgpgpu/vortex.git
synced 2025-04-23 21:39:10 -04:00
minor update
This commit is contained in:
parent
f13a885815
commit
a78ac7a246
4 changed files with 14 additions and 14 deletions
|
@@ -14,7 +14,7 @@ all:
 	$(MAKE) -C oclprintf
 	$(MAKE) -C blackscholes
 	$(MAKE) -C transpose
-	$(MAKE) -C convolution
+	$(MAKE) -C conv3
 
 run-simx:
 	$(MAKE) -C vecadd run-simx
@@ -32,7 +32,7 @@ run-simx:
 	$(MAKE) -C oclprintf run-simx
 	$(MAKE) -C blackscholes run-simx
 	$(MAKE) -C transpose run-simx
-	$(MAKE) -C convolution run-simx
+	$(MAKE) -C conv3 run-simx
 
 run-rtlsim:
 	$(MAKE) -C vecadd run-rtlsim
@@ -50,7 +50,7 @@ run-rtlsim:
 	$(MAKE) -C lbm run-rtlsim
 	$(MAKE) -C oclprintf run-rtlsim
 	$(MAKE) -C blackscholes run-rtlsim
-	$(MAKE) -C convolution run-rtlsim
+	$(MAKE) -C conv3 run-rtlsim
 
 run-opae:
 	$(MAKE) -C vecadd run-opae
@@ -68,7 +68,7 @@ run-opae:
 	$(MAKE) -C lbm run-opae
 	$(MAKE) -C oclprintf run-opae
 	$(MAKE) -C blackscholes run-opae
-	$(MAKE) -C convolution run-opae
+	$(MAKE) -C conv3 run-opae
 
 clean:
 	$(MAKE) -C vecadd clean
@@ -86,7 +86,7 @@ clean:
 	$(MAKE) -C lbm clean
 	$(MAKE) -C oclprintf clean
 	$(MAKE) -C blackscholes clean
-	$(MAKE) -C convolution clean
+	$(MAKE) -C conv3 clean
 
 clean-all:
 	$(MAKE) -C vecadd clean-all
@@ -104,4 +104,4 @@ clean-all:
 	$(MAKE) -C lbm clean-all
 	$(MAKE) -C oclprintf clean-all
 	$(MAKE) -C blackscholes clean-all
-	$(MAKE) -C convolution clean-all
+	$(MAKE) -C conv3 clean-all
@@ -1,4 +1,4 @@
-PROJECT = convolution
+PROJECT = conv3
 
 SRCS = main.cc
 
@@ -1,8 +1,8 @@
-__kernel void conv3x3(__global float* output,
-__global float* input,
-__global float* weights,
-const int width,
-const int height)
+__kernel void conv3(__global float* output,
+__global float* input,
+__global float* weights,
+const int width,
+const int height)
 {
 int x = get_global_id(0);
 int y = get_global_id(1);
@@ -12,7 +12,7 @@ __kernel void conv3x3(__global float* output,
 int paddedX = x + 1;
 int paddedY = y + 1;
 
-// Compute the convolution sum
+// Compute 3x3 convolution sum
 float sum = 0.0f;
 
 sum += input[(paddedY - 1) * paddedWidth + (paddedX - 1)] * weights[0]; // Top-left
@@ -10,7 +10,7 @@
 
 #define FLOAT_ULP 6
 
-#define KERNEL_NAME "conv3x3"
+#define KERNEL_NAME "conv3"
 
 #define CL_CHECK(_expr) \
 do { \
Loading…
Add table
Add a link
Reference in a new issue