## Mako template producing three OpenCL kernels: equilibrilize,
## collide_and_stream and collect_moments.
##
## Names read from the template context: float_type, layout, descriptor,
## ccode, moments_subexpr, moments_assignment, collision_subexpr,
## collision_assignment, boundary_src.
##
## Mako control lines ('%') and C preprocessor directives ('#') are both
## line-oriented, so each of them must stay on a line of its own.
<%
    # Suffix appended to each rendered lattice weight to turn it into a
    # floating point literal. '.f' yields a single precision literal, which
    # would round the weights to float precision in double kernels, so '.0'
    # is used when generating double precision code.
    # NOTE(review): assumes ${w_i} renders ending in an integer token
    # (e.g. "1/3"), exactly as the previous '.f' suffix already required.
    weight_suffix = '.0' if float_type == 'double' else '.f'
%>
## Enable whichever double precision extension the device advertises.
% if float_type == 'double':
#if defined(cl_khr_fp64)
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
#elif defined(cl_amd_fp64)
#pragma OPENCL EXTENSION cl_amd_fp64 : enable
#endif
% endif

## equilibrilize: for the cell selected by layout.gid(), store every entry of
## descriptor.w into the matching population slot of both f_next and f_prev.
__kernel void equilibrilize(__global ${float_type}* f_next,
                            __global ${float_type}* f_prev)
{
    const unsigned int gid = ${layout.gid()};

    __global ${float_type}* preshifted_f_next = f_next + gid;
    __global ${float_type}* preshifted_f_prev = f_prev + gid;

% for i, w_i in enumerate(descriptor.w):
    preshifted_f_next[${layout.pop_offset(i)}] = ${w_i}${weight_suffix};
    preshifted_f_prev[${layout.pop_offset(i)}] = ${w_i}${weight_suffix};
% endfor
}

## collide_and_stream: cells whose material value is 0 are skipped. For every
## other cell, population i is read from f_prev at
## pop_offset(i) + neighbor_offset(-c_i), the moment and collision expressions
## are emitted in order (with boundary_src in between), and f_next_<i> is
## written to f_next at pop_offset(i).
## NOTE(review): f_next_<i> is presumably declared by collision_assignment;
## the `time` argument is not referenced by the code visible here (it may be
## used inside boundary_src) - confirm against the generator.
__kernel void collide_and_stream(__global ${float_type}* f_next,
                                 __global ${float_type}* f_prev,
                                 __global int* material,
                                 unsigned int time)
{
    const unsigned int gid = ${layout.gid()};

    const int m = material[gid];

    if ( m == 0 ) {
        return;
    }

    __global ${float_type}* preshifted_f_next = f_next + gid;
    __global ${float_type}* preshifted_f_prev = f_prev + gid;

% for i, c_i in enumerate(descriptor.c):
    const ${float_type} f_curr_${i} = preshifted_f_prev[${layout.pop_offset(i) + layout.neighbor_offset(-c_i)}];
% endfor

% for i, expr in enumerate(moments_subexpr):
    const ${float_type} ${expr[0]} = ${ccode(expr[1])};
% endfor

## Moment values are declared non-const; boundary_src is emitted right after.
% for i, expr in enumerate(moments_assignment):
    ${float_type} ${ccode(expr)}
% endfor

    ${boundary_src}

% for i, expr in enumerate(collision_subexpr):
    const ${float_type} ${expr[0]} = ${ccode(expr[1])};
% endfor

% for i, expr in enumerate(collision_assignment):
    const ${float_type} ${ccode(expr)}
% endfor

% for i in range(0,descriptor.q):
    preshifted_f_next[${layout.pop_offset(i)}] = f_next_${i};
% endfor
}

## collect_moments: read the cell's descriptor.q populations from f without
## any neighbor shift, evaluate the moment subexpressions and store the right
## hand side of the i-th moment assignment at moments[pop_offset(i) + gid].
__kernel void collect_moments(__global ${float_type}* f,
                              __global ${float_type}* moments)
{
    const unsigned int gid = ${layout.gid()};

    __global ${float_type}* preshifted_f = f + gid;

% for i in range(0,descriptor.q):
    const ${float_type} f_curr_${i} = preshifted_f[${layout.pop_offset(i)}];
% endfor

% for i, expr in enumerate(moments_subexpr):
    const ${float_type} ${expr[0]} = ${ccode(expr[1])};
% endfor

% for i, expr in enumerate(moments_assignment):
    moments[${layout.pop_offset(i)} + gid] = ${ccode(expr.rhs)};
% endfor
}