/* * Copyright (C) 2014 Zijia Guo, Andreas Maier * CONRAD is developed as an Open Source project under the GNU General Public License (GPL). */ package edu.stanford.rsl.conrad.opencl.shapes; import java.nio.FloatBuffer; import java.util.ArrayList; import com.jogamp.opencl.CLBuffer; import com.jogamp.opencl.CLCommandQueue; import com.jogamp.opencl.CLContext; import com.jogamp.opencl.CLDevice; import com.jogamp.opencl.CLKernel; import com.jogamp.opencl.CLMemory.Mem; import edu.stanford.rsl.apps.gui.opengl.PointCloudViewer; import edu.stanford.rsl.conrad.geometry.shapes.simple.PointND; import edu.stanford.rsl.conrad.geometry.shapes.simple.Pyramid; import edu.stanford.rsl.conrad.numerics.SimpleMatrix; import edu.stanford.rsl.conrad.opencl.OpenCLEvaluatable; import edu.stanford.rsl.conrad.opencl.OpenCLUtil; public class OpenCLPyramid extends Pyramid implements OpenCLEvaluatable { /** * */ private static final long serialVersionUID = 8658765689476697398L; protected CLDevice device; protected CLContext context; protected CLBuffer<FloatBuffer> parameter; public OpenCLPyramid(CLDevice device){ super(); } public OpenCLPyramid(double dx, double dy, double dz, CLDevice device){ super(dx, dy, dz); this.device = device; this.context = device.getContext(); OpenCLUtil.initSimpleObjectEvaluator(context); handleParameter(dx, dy, dz); } public OpenCLPyramid(Pyramid p, CLDevice device){ this(-p.getMin().get(0), -p.getMin().get(1), -p.getMin().get(2), device); this.transform = p.getTransform(); } public void handleParameter(double dx, double dy, double dz){ //double a = 0.5*(max.get(0) - min.get(0))/(max.get(2) - min.get(2)); //double b = 0.5*(max.get(1) - min.get(1))/(max.get(2) - min.get(2)); float a = (float)(0.5*(max.get(0) - min.get(0))/(max.get(2) - min.get(2))); float b = (float)(0.5*(max.get(1) - min.get(1))/(max.get(2) - min.get(2))); this.parameter = context.createFloatBuffer(5, Mem.READ_ONLY); this.parameter.getBuffer().put((float)dx); // parameter[0] this.parameter.getBuffer().put((float)dy); // parameter[1] this.parameter.getBuffer().put((float)dz); // parameter[2] this.parameter.getBuffer().put(a); // parameter[3] this.parameter.getBuffer().put(b); // parameter[4] this.parameter.getBuffer().rewind(); //device.createCommandQueue().putWriteBuffer(this.parameter, true); CLCommandQueue clc = device.createCommandQueue(); clc.putWriteBuffer(this.parameter, true).finish(); clc.release(); } @Override public boolean isClockwise() { // TODO Auto-generated method stub return true; } @Override public boolean isTimeVariant() { // TODO Auto-generated method stub return false; } @Override public void evaluate(CLBuffer<FloatBuffer> samplingPoints, CLBuffer<FloatBuffer> outputBuffer) { // TODO Auto-generated method stub int elementCount = samplingPoints.getBuffer().capacity()/2; // capacity? 2 or 3? evaluate(samplingPoints, outputBuffer, (int)Math.sqrt(elementCount), (int)Math.sqrt(elementCount)); // how to calculate U and V? } @Override public void evaluate(CLBuffer<FloatBuffer> samplingPoints, CLBuffer<FloatBuffer> outputBuffer, int elementCountU, int elementCountV) { // TODO Auto-generated method stub int elementCount = samplingPoints.getBuffer().capacity()/2; int localWorkSize = Math.min(device.getMaxWorkGroupSize(), 256); int globalWorkSize = OpenCLUtil.roundUp(localWorkSize, elementCount); // to guaranty that global size is interger multiple of group size (local size) CLKernel kernel = OpenCLUtil.simpleObjects.createCLKernel("evaluatePyramid"); kernel.putArgs(parameter, samplingPoints, outputBuffer).putArg(elementCountU).putArg(elementCountV); CLCommandQueue clc = device.createCommandQueue(); clc.put1DRangeKernel(kernel, 0, globalWorkSize, localWorkSize).finish(); kernel.release(); clc.release(); // SimpleMatrix transform SimpleMatrix transform = SimpleMatrix.I_4.clone(); transform.setSubMatrixValue(0, 0, this.transform.getRotation(3)); transform.setSubColValue(0, 3, this.transform.getTranslation(3)); OpenCLUtil.transformPoints(outputBuffer, transform, context, device); } public static void main(String [] args){ CLContext context = OpenCLUtil.getStaticContext(); CLDevice device = context.getMaxFlopsDevice(); int u = 2; int v = 8; Pyramid pyramid = new Pyramid(12,12,12); ArrayList<PointND> cpu = pyramid.getPointCloud(u,v); int numPoints = u*v; OpenCLPyramid clpyramid = new OpenCLPyramid(pyramid, device); CLBuffer<FloatBuffer> samplingPoints = OpenCLUtil.generateSamplingPoints(u, v, context, device); CLBuffer<FloatBuffer> outputBuffer = context.createFloatBuffer(3*numPoints, Mem.READ_WRITE); clpyramid.evaluate(samplingPoints, outputBuffer,u,v); CLCommandQueue queue = device.createCommandQueue(); queue.putReadBuffer(outputBuffer, true); queue.release(); ArrayList<PointND> gpu = new ArrayList<PointND>(); double error =0; for (int i=0; i< numPoints; i++){ PointND point = new PointND(outputBuffer.getBuffer().get(), outputBuffer.getBuffer().get(), outputBuffer.getBuffer().get()); gpu.add(point); error += point.euclideanDistance(cpu.get(i)); } samplingPoints.release(); outputBuffer.release(); PointCloudViewer pcv = new PointCloudViewer("gpu points with error " + error/ numPoints, gpu); pcv.setVisible(true); } }