#include #include #include #include "common.h" void kernel_body(int task_id, void* arg) { struct kernel_arg_t* _arg = (struct kernel_arg_t*)(arg); uint32_t stride = _arg->stride; uint32_t* addr_ptr = (uint32_t*)_arg->addr_ptr; float* src_ptr = (float*)_arg->src_ptr; float* dst_ptr = (float*)_arg->dst_ptr; uint32_t offset = task_id * stride; for (uint32_t i = 0; i < stride; ++i) { float value = 0.0f; for (uint32_t j = 0; j < NUM_LOADS; ++j) { uint32_t addr = offset + i + j; uint32_t index = addr_ptr[addr]; value *= src_ptr[index]; } dst_ptr[offset+i] = value; } } void main() { struct kernel_arg_t* arg = (struct kernel_arg_t*)KERNEL_ARG_DEV_MEM_ADDR; vx_spawn_tasks(arg->num_tasks, kernel_body, arg); }