aboutsummaryrefslogtreecommitdiffstats
path: root/src
diff options
context:
space:
mode:
authorMichael Bien <[email protected]>2010-02-28 01:19:25 +0100
committerMichael Bien <[email protected]>2010-02-28 01:19:25 +0100
commitf838035d40285b9651868dbd711eb14a5ff92ad2 (patch)
tree165b0cea721194cfe696027894f4607d2b264e65 /src
parentbb92a1504c47073f5d17498607e5be9e79e20532 (diff)
added three missing workgroup info methods in CLKernel.
Diffstat (limited to 'src')
-rw-r--r--src/com/mbien/opencl/CLKernel.java40
-rw-r--r--src/com/mbien/opencl/CLProgram.java2
2 files changed, 41 insertions, 1 deletions
diff --git a/src/com/mbien/opencl/CLKernel.java b/src/com/mbien/opencl/CLKernel.java
index 865c7bf5..b661d31c 100644
--- a/src/com/mbien/opencl/CLKernel.java
+++ b/src/com/mbien/opencl/CLKernel.java
@@ -188,6 +188,46 @@ public class CLKernel extends CLObject implements CLResource, Cloneable {
}
/**
+ * Returns the amount of local memory in bytes being used by a kernel.
+ * This includes local memory that may be needed by an implementation to execute the kernel,
+ * variables declared inside the kernel with the <code>__local</code> address qualifier and local memory
+ * to be allocated for arguments to the kernel declared as pointers with the <code>__local</code> address
+ * qualifier and whose size is specified with clSetKernelArg.
+ * If the local memory size, for any pointer argument to the kernel declared with
+ * the <code>__local</code> address qualifier, is not specified, its size is assumed to be 0.
+ */
+ public long getLocalMemorySize(CLDevice device) {
+ return getWorkGroupInfo(device, CL_KERNEL_LOCAL_MEM_SIZE);
+ }
+
+ /**
+ * Returns the work group size for this kernel on the given device.
+ * This provides a mechanism for the application to query the work-group size
+ * that can be used to execute a kernel on a specific device given by device.
+ * The OpenCL implementation uses the resource requirements of the kernel
+ * (register usage etc.) to determine what this work-group size should be.
+ */
+ public long getWorkGroupSize(CLDevice device) {
+ return getWorkGroupInfo(device, CL_KERNEL_WORK_GROUP_SIZE);
+ }
+
+ /**
+ * Returns the work-group size specified by the <code>__attribute__((reqd_work_gr oup_size(X, Y, Z)))</code> qualifier in kernel sources.
+ * If the work-group size is not specified using the above attribute qualifier <code>new long[]{(0, 0, 0)}</code> is returned.
+ */
+ public long[] getCompileWorkGroupSize(CLDevice device) {
+ int ret = cl.clGetKernelWorkGroupInfo(ID, device.ID, CL_KERNEL_COMPILE_WORK_GROUP_SIZE, 8*3, buffer, null);
+ checkForError(ret, "error while asking for clGetKernelWorkGroupInfo");
+ return new long[] { buffer.getLong(0), buffer.getLong(1), buffer.getLong(2) };
+ }
+
+ private long getWorkGroupInfo(CLDevice device, int flag) {
+ int ret = cl.clGetKernelWorkGroupInfo(ID, device.ID, flag, 8, buffer, null);
+ checkForError(ret, "error while asking for clGetKernelWorkGroupInfo");
+ return buffer.getLong(0);
+ }
+
+ /**
* Releases all resources of this kernel from its context.
*/
public void release() {
diff --git a/src/com/mbien/opencl/CLProgram.java b/src/com/mbien/opencl/CLProgram.java
index a5d1311c..806383f6 100644
--- a/src/com/mbien/opencl/CLProgram.java
+++ b/src/com/mbien/opencl/CLProgram.java
@@ -506,7 +506,7 @@ public class CLProgram extends CLObject implements CLResource {
/**
* Utility method for defining macros as build options (Returns "-D name=value").
*/
- public static String define(String name, String value) {
+ public static String define(String name, Object value) {
return "-D "+name+"="+value;
}