[PR]
×
[PR]上記の広告は3ヶ月以上新規記事投稿のないブログに表示されています。新しい記事を書く事で広告が消えます。
プログラミング、3DCGとその他いろいろについて
[PR]上記の広告は3ヶ月以上新規記事投稿のないブログに表示されています。新しい記事を書く事で広告が消えます。
このプログラムは実はあまりGPUの並列処理っぽくはない、シングルスレッドなプログラムです。__kernel void myKernelFunction(__global float* numbers){numbers[0] = 3;numbers[1] = 4;numbers[2] = 5;}
cl_program clCreateProgramWithSource( cl_context context, cl_uint count, const char **strings, const size_t *lengths, cl_int *errcode_ret )
cl_int clReleaseProgram(cl_program program)
cl_int clBuildProgram( cl_program program, cl_uint num_devices, const cl_device_id *device_list, const char *options, void (CL_CALLBACK *pfn_notify)(cl_program program, void *user_data), void *user_data )
using System;class MyProgram{static void Main(){IntPtr device = getDevices(getPlatforms()[0], DeviceType.Default)[0];Context context = new Context(device);CommandQueue commandQueue = new CommandQueue(context, device);Program program = new Program(context, System.IO.File.ReadAllText("myKernelProgram.cl"));program.Build(device);Buffer buffer = Buffer.FromCopiedHostMemory(context, new float[] { 1, 2, 3 });float[] readBack = new float[3];commandQueue.ReadBuffer(buffer, readBack);foreach (var number in readBack){Console.WriteLine(number);}}private static IntPtr[] getDevices(IntPtr platform, DeviceType deviceType){int deviceCount;OpenCLFunctions.clGetDeviceIDs(platform, deviceType, 0, null, out deviceCount);IntPtr[] result = new IntPtr[deviceCount];OpenCLFunctions.clGetDeviceIDs(platform, deviceType, deviceCount, result, out deviceCount);return result;}private static IntPtr[] getPlatforms(){int platformCount;OpenCLFunctions.clGetPlatformIDs(0, null, out platformCount);IntPtr[] result = new IntPtr[platformCount];OpenCLFunctions.clGetPlatformIDs(platformCount, result, out platformCount);return result;}}
using System;using System.Runtime.InteropServices;class Context{public IntPtr InternalPointer { get; private set; }public Context(params IntPtr[] devices){int error;InternalPointer = OpenCLFunctions.clCreateContext(null,devices.Length,devices,null,IntPtr.Zero,out error);}~Context(){OpenCLFunctions.clReleaseContext(InternalPointer);}}class CommandQueue{public IntPtr InternalPointer { get; private set; }public CommandQueue(Context context, IntPtr device){int error;InternalPointer = OpenCLFunctions.clCreateCommandQueue(context.InternalPointer,device,0,out error);}~CommandQueue(){OpenCLFunctions.clReleaseCommandQueue(InternalPointer);}public void ReadBuffer<T>(Buffer buffer, T[] systemBuffer) where T : struct{GCHandle handle = GCHandle.Alloc(systemBuffer, GCHandleType.Pinned);OpenCLFunctions.clEnqueueReadBuffer(InternalPointer,buffer.InternalPointer,true,0,Math.Min(buffer.SizeInBytes, Marshal.SizeOf(typeof(T)) * systemBuffer.Length),handle.AddrOfPinnedObject(),0,IntPtr.Zero,IntPtr.Zero);handle.Free();}}class Buffer{public IntPtr InternalPointer { get; private set; }public int SizeInBytes { get; private set; }private Buffer() { }~Buffer(){OpenCLFunctions.clReleaseMemObject(InternalPointer);}public static Buffer FromCopiedHostMemory<T>(Context context, T[] initialData) where T : struct{Buffer result = new Buffer();result.SizeInBytes = Marshal.SizeOf(typeof(T)) * initialData.Length;int errorCode;GCHandle handle = GCHandle.Alloc(initialData, GCHandleType.Pinned);result.InternalPointer = OpenCLFunctions.clCreateBuffer(context.InternalPointer,MemoryFlags.CopyHostMemory,result.SizeInBytes,handle.AddrOfPinnedObject(),out errorCode);handle.Free();return result;}}class Program{public IntPtr InternalPointer { get; private set; }public Program(Context context, params string[] sources){int errorCode;InternalPointer = OpenCLFunctions.clCreateProgramWithSource(context.InternalPointer,sources.Length,sources,null,out errorCode);}~Program(){OpenCLFunctions.clReleaseProgram(InternalPointer);}public void Build(params IntPtr[] devices){OpenCLFunctions.clBuildProgram(InternalPointer,devices.Length,devices,null,null,IntPtr.Zero);}}
using System;using System.Runtime.InteropServices;static class OpenCLFunctions{[DllImport("OpenCL.dll")]public static extern int clGetPlatformIDs(int entryCount, IntPtr[] platforms, out int platformCount);[DllImport("OpenCL.dll")]public static extern int clGetDeviceIDs(IntPtr platform,DeviceType deviceType,int entryCount,IntPtr[] devices,out int deviceCount);[DllImport("OpenCL.dll")]public static extern IntPtr clCreateContext(IntPtr[] properties,int deviceCount,IntPtr[] devices,NotifyContextCreated pfnNotify,IntPtr userData,out int errorCode);[DllImport("OpenCL.dll")]public static extern int clReleaseContext(IntPtr context);[DllImport("OpenCL.dll")]public static extern IntPtr clCreateCommandQueue(IntPtr context,IntPtr device,long properties,out int errorCodeReturn);[DllImport("OpenCL.dll")]public static extern int clReleaseCommandQueue(IntPtr commandQueue);[DllImport("OpenCL.dll")]public static extern IntPtr clCreateBuffer(IntPtr context,MemoryFlags allocationAndUsage,int sizeInBytes,IntPtr hostPtr,//out int errorCodeReturn);[DllImport("OpenCL.dll")]public static extern int clReleaseMemObject(IntPtr memoryObject);[DllImport("OpenCL.dll")]public static extern int clEnqueueReadBuffer(IntPtr commandQueue,IntPtr buffer,bool isBlocking,int offset,int sizeInBytes,IntPtr result,int numberOfEventsInWaitList,IntPtr eventWaitList,IntPtr eventObjectOut);[DllImport("OpenCL.dll")]public static extern IntPtr clCreateProgramWithSource(IntPtr context,int count,string[] programSources,int[] sourceLengths,out int errorCode);[DllImport("OpenCL.dll")]public static extern int clBuildProgram(IntPtr program,int deviceCount,IntPtr[] deviceList,string buildOptions,NotifyProgramBuilt notify,IntPtr userData);[DllImport("OpenCL.dll")]public static extern int clReleaseProgram(IntPtr program);}delegate void NotifyContextCreated(string errorInfo, IntPtr privateInfoSize, int cb, IntPtr userData);delegate void NotifyProgramBuilt(IntPtr program, IntPtr userData);enum DeviceType : long{Default = (1 << 0),Cpu = (1 << 1),Gpu = (1 << 2),Accelerator = (1 << 3),All = 0xFFFFFFFF}enum MemoryFlags : long{ReadWrite = (1 << 0),WriteOnly = (1 << 1),ReadOnly = (1 << 2),UseHostMemory = (1 << 3),HostAccessible = (1 << 4),CopyHostMemory = (1 << 5)}
__kernel void myKernelFunction(__global float* numbers){numbers[0] = 3;numbers[1] = 4;numbers[2] = 5;}