forked from hughperkins/EasyCL
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathCLKernel_structs.h
53 lines (50 loc) · 1.67 KB
/
CLKernel_structs.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
// only include this if you're passing structs
// otherwise no need
// downside of including this is, increase your compile time very slightly
#pragma once
#include "CLKernel.h"
namespace easycl {
template<typename T> CLKernel *CLKernel::input(int N, const T *data) {
cl_mem buffer = clCreateBuffer(*(cl->context), CL_MEM_READ_ONLY | CL_MEM_COPY_HOST_PTR, sizeof(T) * N, (void *)data, &error);
cl->checkError(error);
error = clSetKernelArg(kernel, nextArg, sizeof(cl_mem), &buffer);
cl->checkError(error);
buffers.push_back(buffer);
nextArg++;
return this;
}
template<typename T>
CLKernel *CLKernel::in(int N, const T *data) {
return input(N, data);
}
template<typename T>
CLKernel *CLKernel::output(int N, T *data) {
cl_mem buffer = clCreateBuffer(*(cl->context), CL_MEM_WRITE_ONLY, sizeof(T) * N, 0, &error);
cl->checkError(error);
error = clSetKernelArg(kernel, nextArg, sizeof(cl_mem), &buffer);
buffers.push_back(buffer);
//outputArgNums.push_back(nextArg);
outputArgBuffers.push_back(buffer);
outputArgPointers.push_back((void *)data);
outputArgSizes.push_back(sizeof(T) * N);
nextArg++;
return this;
}
template<typename T>
CLKernel *CLKernel::out(int N, T *data) {
return output(N, data);
}
template<typename T>
CLKernel *CLKernel::inout(int N, T *data) {
cl_mem buffer = clCreateBuffer(*(cl->context), CL_MEM_READ_WRITE | CL_MEM_COPY_HOST_PTR, sizeof(T) * N, (void *)data, &error);
cl->checkError(error);
error = clSetKernelArg(kernel, nextArg, sizeof(cl_mem), &buffer);
cl->checkError(error);
buffers.push_back(buffer);
outputArgBuffers.push_back(buffer);
outputArgPointers.push_back((void *)(data) );
outputArgSizes.push_back(sizeof(T) * N);
nextArg++;
return this;
}
}