Sha256: 6d2b57ffc2c0f2dee9ed9e758f91fb85c3217b30199ce89f0f136d6966ef8f4a
Contents?: true
Size: 1.08 KB
Versions: 2
Compression:
Stored size: 1.08 KB
Contents
/* STARTDEF void bones_prekernel_<algorithm_name>_0(cudaStream_t kernel_stream, <devicedefinitions>, <argument_definition>); ENDDEF */ // Start of the <algorithm_name> kernel __global__ void bones_kernel_<algorithm_name>_0(<devicedefinitions>, <argument_definition>) { const int bones_global_id = blockIdx.x*blockDim.x + threadIdx.x; if (bones_global_id < (<parallelism>)) { // Calculate the global ID(s) based on the thread id <ids> // Start the computation <algorithm_code1> } } // Function to start the kernel extern "C" void bones_prekernel_<algorithm_name>_0(cudaStream_t kernel_stream, <devicedefinitions>, <argument_definition>) { int bones_block_size; if (<parallelism> >= 64*512 ) { bones_block_size = 512; } else if (<parallelism> >= 64*256 ) { bones_block_size = 256; } else { bones_block_size = 128; } dim3 bones_threads(bones_block_size); dim3 bones_grid(DIV_CEIL(<parallelism>,bones_block_size)); bones_kernel_<algorithm_name>_0<<< bones_grid, bones_threads, 0, kernel_stream >>>(<names>, <argument_name>); }
Version data entries
2 entries across 2 versions & 1 rubygems
Version | Path |
---|---|
bones-compiler-1.6.0 | skeletons/GPU-CUDA/kernel/default.kernel.cu |
bones-compiler-1.3.1 | skeletons/GPU-CUDA/kernel/default.kernel.cu |