#include #include #include #include "common.h" struct tile_arg_t { struct kernel_arg_t karg; uint32_t tile_width; uint32_t tile_height; float deltaX; float deltaY; }; void kernel_body(int task_id, void* arg) { struct tile_arg_t* _arg = (struct tile_arg_t*)(arg); uint32_t xoffset = task_id * _arg->tile_width; uint32_t yoffset = task_id * _arg->tile_height; uint32_t* dst_ptr = (uint32_t*)_arg->karg.dst_ptr + xoffset + yoffset * _arg->karg.dst_pitch; float fu = xoffset * _arg->deltaX; float fv = yoffset * _arg->deltaY; for (uint32_t y = 0; y < _arg->tile_height; ++y) { for (uint32_t x = 0; x < _arg->tile_width; ++x) { int32_t u = (int32_t)(fu * (1<<28)); int32_t v = (int32_t)(fv * (1<<28)); dst_ptr[x] = vx_tex(0, u, v, 0); fu += _arg->deltaX; } dst_ptr += _arg->karg.dst_pitch; fv += _arg->deltaY; } } int main() { struct kernel_arg_t* arg = (struct kernel_arg_t*)0x0; // configure texture unit vx_csr_write(CSR_TEX0_ADDR, arg->src_ptr); vx_csr_write(CSR_TEX0_FORMAT, 0); vx_csr_write(CSR_TEX0_WIDTH, arg->src_width); vx_csr_write(CSR_TEX0_HEIGHT, arg->src_height); vx_csr_write(CSR_TEX0_PITCH, arg->src_pitch); vx_csr_write(CSR_TEX0_WRAP_U, 0); vx_csr_write(CSR_TEX0_WRAP_V, 0); vx_csr_write(CSR_TEX0_MIN_FILTER, 0); vx_csr_write(CSR_TEX0_MAX_FILTER, 0); struct tile_arg_t targ; targ.karg = *arg; targ.tile_width = arg->dst_width; targ.tile_height = (arg->dst_height + arg->num_tasks - 1) / arg->num_tasks; targ.deltaX = 1.0f / arg->dst_width; targ.deltaY = 1.0f / arg->dst_height; vx_spawn_tasks(arg->num_tasks, kernel_body, targ); }