1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
|
import pyopencl as cl
mf = cl.mem_flags
import numpy
import sympy
from mako.template import Template
class Lattice:
def __init__(self, descriptor, nX, nY, moments, collide, geometry, pop_eq_src = '', boundary_src = ''):
self.descriptor = descriptor
self.nX = nX
self.nY = nY
self.nCells = nX * nY
self.moments = moments
self.collide = collide
self.pop_eq_src = pop_eq_src
self.boundary_src = boundary_src
self.platform = cl.get_platforms()[0]
self.context = cl.Context(properties=[(cl.context_properties.PLATFORM, self.platform)])
self.queue = cl.CommandQueue(self.context)
self.np_material = numpy.ndarray(shape=(self.nCells, 1), dtype=numpy.int32)
self.setup_geometry(geometry)
self.tick = True
self.pop_size = descriptor.q * self.nCells * numpy.float32(0).nbytes
self.moments_size = (descriptor.d+1) * self.nCells * numpy.float32(0).nbytes
self.cl_pop_a = cl.Buffer(self.context, mf.READ_WRITE, size=self.pop_size)
self.cl_pop_b = cl.Buffer(self.context, mf.READ_WRITE, size=self.pop_size)
self.cl_moments = cl.Buffer(self.context, mf.WRITE_ONLY, size=self.moments_size)
self.cl_material = cl.Buffer(self.context, mf.READ_ONLY | mf.USE_HOST_PTR, hostbuf=self.np_material)
self.build_kernel()
self.program.equilibrilize(self.queue, (self.nX,self.nY), (32,1), self.cl_pop_a, self.cl_pop_b).wait()
def idx(self, x, y):
return y * self.nX + x;
def setup_geometry(self, geometry):
for y in range(1,self.nY-1):
for x in range(1,self.nX-1):
self.np_material[self.idx(x,y)] = geometry(self.nX,self.nY,x,y)
def build_kernel(self):
program_src = Template(filename = './template/kernel.mako').render(
descriptor = self.descriptor,
nX = self.nX,
nY = self.nY,
nCells = self.nCells,
moments_helper = self.moments[0],
moments_assignment = self.moments[1],
collide_helper = self.collide[0],
collide_assignment = self.collide[1],
pop_eq_src = Template(self.pop_eq_src).render(
descriptor = self.descriptor,
nX = self.nX,
nY = self.nY,
nCells = self.nCells
),
boundary_src = Template(self.boundary_src).render(
descriptor = self.descriptor
),
ccode = sympy.ccode
)
self.program = cl.Program(self.context, program_src).build('-cl-single-precision-constant -cl-fast-relaxed-math')
def evolve(self):
if self.tick:
self.tick = False
self.program.collide_and_stream(self.queue, (self.nX,self.nY), (32,1), self.cl_pop_a, self.cl_pop_b, self.cl_material)
else:
self.tick = True
self.program.collide_and_stream(self.queue, (self.nX,self.nY), (32,1), self.cl_pop_b, self.cl_pop_a, self.cl_material)
def sync(self):
self.queue.finish()
def get_moments(self):
moments = numpy.ndarray(shape=(self.descriptor.d+1, self.nCells), dtype=numpy.float32)
if self.tick:
self.program.collect_moments(self.queue, (self.nX,self.nY), (32,1), self.cl_pop_b, self.cl_moments)
else:
self.program.collect_moments(self.queue, (self.nX,self.nY), (32,1), self.cl_pop_a, self.cl_moments)
cl.enqueue_copy(self.queue, moments, self.cl_moments).wait();
return moments
|