#include "../intrinsics/vx_intrinsics.h" #include "vx_api.h" #include #ifdef __cplusplus extern "C" { #endif func_t global_function_pointer; void * global_argument_struct; unsigned global_num_threads; void setup_call() { vx_tmc(global_num_threads); global_function_pointer(global_argument_struct); unsigned wid = vx_warpID(); if (wid != 0) { vx_tmc(0); // Halt Warp Execution } else { vx_tmc(1); // Only activate one thread } } void vx_spawnWarps(unsigned numWarps, unsigned numThreads, func_t func_ptr, void * args) { global_function_pointer = func_ptr; global_argument_struct = args; global_num_threads = numThreads; vx_wspawn(numWarps, (unsigned) setup_call); setup_call(); } unsigned pocl_threads; struct context_t * pocl_ctx; vx_pocl_workgroup_func pocl_pfn; const void * pocl_args; void pocl_spawn_runonce() { vx_tmc(pocl_threads); int x = vx_threadID(); int y = vx_warpID(); (pocl_pfn)(pocl_args, pocl_ctx, x, y, 0); if (y != 0) { vx_tmc(0); } vx_tmc(1); } void pocl_spawn(struct context_t * ctx, vx_pocl_workgroup_func pfn, const void * args) { if (ctx->num_groups[2] > 1) { printf("ERROR: pocl_spawn doesn't support Z dimension yet!\n"); return; } pocl_threads = ctx->num_groups[0]; pocl_ctx = ctx; pocl_pfn = pfn; pocl_args = args; if (ctx->num_groups[1] > 1) { vx_wspawn(ctx->num_groups[1], (unsigned)&pocl_spawn_runonce); } pocl_spawn_runonce(); } #ifdef __cplusplus } #endif