You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
277 lines
9.1 KiB
277 lines
9.1 KiB
/*
|
|
* Copyright (c) 2009-2016 jMonkeyEngine
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are
|
|
* met:
|
|
*
|
|
* * Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
*
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
*
|
|
* * Neither the name of 'jMonkeyEngine' nor the names of its contributors
|
|
* may be used to endorse or promote products derived from this software
|
|
* without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
|
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
|
|
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
|
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
package com.jme3.opencl.lwjgl;
|
|
|
|
import com.jme3.math.Matrix4f;
|
|
import com.jme3.math.Quaternion;
|
|
import com.jme3.math.Vector2f;
|
|
import com.jme3.math.Vector4f;
|
|
import com.jme3.opencl.*;
|
|
import com.jme3.opencl.Buffer;
|
|
import java.nio.*;
|
|
import org.lwjgl.PointerBuffer;
|
|
import org.lwjgl.opencl.CL10;
|
|
import org.lwjgl.opencl.CLCommandQueue;
|
|
import org.lwjgl.opencl.CLDevice;
|
|
import org.lwjgl.opencl.CLKernel;
|
|
|
|
/**
|
|
*
|
|
* @author shaman
|
|
*/
|
|
public class LwjglKernel extends Kernel {
|
|
|
|
private final CLKernel kernel;
|
|
|
|
public LwjglKernel(CLKernel kernel) {
|
|
super(new ReleaserImpl(kernel));
|
|
this.kernel = kernel;
|
|
}
|
|
|
|
public CLKernel getKernel() {
|
|
return kernel;
|
|
}
|
|
|
|
@Override
|
|
public String getName() {
|
|
return kernel.getInfoString(CL10.CL_KERNEL_FUNCTION_NAME);
|
|
}
|
|
|
|
@Override
|
|
public int getArgCount() {
|
|
return kernel.getInfoInt(CL10.CL_KERNEL_NUM_ARGS);
|
|
}
|
|
|
|
@Override
|
|
public long getMaxWorkGroupSize(Device device) {
|
|
CLDevice d = ((LwjglDevice) device).getDevice();
|
|
return kernel.getWorkGroupInfoSize(d, CL10.CL_KERNEL_WORK_GROUP_SIZE);
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, LocalMemPerElement t) {
|
|
int ret = CL10.clSetKernelArg (kernel, index, t.getSize() * workGroupSize.getSizes()[0] * workGroupSize.getSizes()[1] * workGroupSize.getSizes()[2]);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, LocalMem t) {
|
|
int ret = CL10.clSetKernelArg (kernel, index, t.getSize());
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Buffer t) {
|
|
int ret = CL10.clSetKernelArg(kernel, index, ((LwjglBuffer) t).getBuffer());
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Image i) {
|
|
int ret = CL10.clSetKernelArg(kernel, index, ((LwjglImage) i).getImage());
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, byte b) {
|
|
ByteBuffer buf = Utils.tempBuffers[0].b16;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, b);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, short s) {
|
|
ShortBuffer buf = Utils.tempBuffers[0].b16s;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, s);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, int i) {
|
|
IntBuffer buf = Utils.tempBuffers[0].b16i;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, i);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, long l) {
|
|
LongBuffer buf = Utils.tempBuffers[0].b16l;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, l);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, float f) {
|
|
FloatBuffer buf = Utils.tempBuffers[0].b16f;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, f);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, double d) {
|
|
DoubleBuffer buf = Utils.tempBuffers[0].b16d;
|
|
buf.position(0);
|
|
buf.limit(1);
|
|
buf.put(0, d);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Vector2f v) {
|
|
FloatBuffer buf = Utils.tempBuffers[0].b16f;
|
|
buf.position(0);
|
|
buf.limit(2);
|
|
buf.put(0, v.x);
|
|
buf.put(1, v.y);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Vector4f v) {
|
|
FloatBuffer buf = Utils.tempBuffers[0].b16f;
|
|
buf.position(0);
|
|
buf.limit(4);
|
|
buf.put(0, v.x);
|
|
buf.put(1, v.y);
|
|
buf.put(2, v.z);
|
|
buf.put(3, v.w);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Quaternion q) {
|
|
FloatBuffer buf = Utils.tempBuffers[0].b16f;
|
|
buf.position(0);
|
|
buf.limit(4);
|
|
buf.put(0, q.getX());
|
|
buf.put(1, q.getY());
|
|
buf.put(2, q.getZ());
|
|
buf.put(3, q.getW());
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, Matrix4f m) {
|
|
FloatBuffer buf = Utils.b80f;
|
|
buf.position(0);
|
|
buf.limit(16);
|
|
buf.put(m.m00).put(m.m01).put(m.m02).put(m.m03);
|
|
buf.put(m.m10).put(m.m11).put(m.m12).put(m.m13);
|
|
buf.put(m.m20).put(m.m21).put(m.m22).put(m.m23);
|
|
buf.put(m.m30).put(m.m31).put(m.m32).put(m.m33);
|
|
buf.position(0);
|
|
int ret = CL10.clSetKernelArg(kernel, index, buf);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public void setArg(int index, ByteBuffer buffer, long size) {
|
|
buffer.limit((int) (buffer.position() + size));
|
|
int ret = CL10.clSetKernelArg(kernel, index, buffer);
|
|
Utils.checkError(ret, "clSetKernelArg");
|
|
}
|
|
|
|
@Override
|
|
public Event Run(CommandQueue queue) {
|
|
Utils.pointerBuffers[0].rewind();
|
|
Utils.pointerBuffers[1].rewind();
|
|
Utils.pointerBuffers[1].put(globalWorkSize.getSizes());
|
|
Utils.pointerBuffers[1].position(0);
|
|
PointerBuffer p2 = null;
|
|
if (workGroupSize.getSizes()[0] > 0) {
|
|
p2 = Utils.pointerBuffers[2].rewind();
|
|
p2.put(workGroupSize.getSizes());
|
|
p2.position(0);
|
|
}
|
|
CLCommandQueue q = ((LwjglCommandQueue) queue).getQueue();
|
|
int ret = CL10.clEnqueueNDRangeKernel(q, kernel,
|
|
globalWorkSize.getDimension(), null, Utils.pointerBuffers[1],
|
|
p2, null, Utils.pointerBuffers[0]);
|
|
Utils.checkError(ret, "clEnqueueNDRangeKernel");
|
|
return new LwjglEvent(q.getCLEvent(Utils.pointerBuffers[0].get(0)));
|
|
}
|
|
@Override
|
|
public void RunNoEvent(CommandQueue queue) {
|
|
Utils.pointerBuffers[1].rewind();
|
|
Utils.pointerBuffers[1].put(globalWorkSize.getSizes());
|
|
Utils.pointerBuffers[1].position(0);
|
|
PointerBuffer p2 = null;
|
|
if (workGroupSize.getSizes()[0] > 0) {
|
|
p2 = Utils.pointerBuffers[2].rewind();
|
|
p2.put(workGroupSize.getSizes());
|
|
p2.position(0);
|
|
}
|
|
CLCommandQueue q = ((LwjglCommandQueue) queue).getQueue();
|
|
int ret = CL10.clEnqueueNDRangeKernel(q, kernel,
|
|
globalWorkSize.getDimension(), null, Utils.pointerBuffers[1],
|
|
p2, null, null);
|
|
Utils.checkError(ret, "clEnqueueNDRangeKernel");
|
|
}
|
|
|
|
@Override
|
|
public ObjectReleaser getReleaser() {
|
|
return new ReleaserImpl(kernel);
|
|
}
|
|
private static class ReleaserImpl implements ObjectReleaser {
|
|
private CLKernel kernel;
|
|
private ReleaserImpl(CLKernel kernel) {
|
|
this.kernel = kernel;
|
|
}
|
|
@Override
|
|
public void release() {
|
|
if (kernel != null) {
|
|
int ret = CL10.clReleaseKernel(kernel);
|
|
kernel = null;
|
|
Utils.reportError(ret, "clReleaseKernel");
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|