UniformGridGPU.py 6.27 KB
Newer Older
Martin Bauer's avatar
Martin Bauer committed
1
import sympy as sp
2
import numpy as np
3
import pystencils as ps
4
from lbmpy.creationfunctions import create_lb_method, create_lb_update_rule, create_lb_collision_rule
Martin Bauer's avatar
Martin Bauer committed
5
from lbmpy.boundaries import NoSlip, UBB
6
from lbmpy.fieldaccess import StreamPullTwoFieldsAccessor, StreamPushTwoFieldsAccessor
Martin Bauer's avatar
Martin Bauer committed
7
8
9
from pystencils_walberla import generate_pack_info_from_kernel
from lbmpy_walberla import generate_lattice_model, generate_boundary
from pystencils_walberla import CodeGeneration, generate_sweep
10
11
from pystencils.data_types import TypedSymbol
from pystencils.fast_approximation import insert_fast_sqrts, insert_fast_divisions
12
from lbmpy.macroscopic_value_kernels import macroscopic_values_getter, macroscopic_values_setter
Martin Bauer's avatar
Martin Bauer committed
13

14
# Symbolic relaxation rate shared by all method configurations below.
omega = sp.symbols("omega")
# Additional symbolic relaxation rates created from the range pattern
# "omega_:10"; individual entries are picked by index further down.
omega_fill = sp.symbols("omega_:10")
16
17
18
19
20
21
22
23
# Switch between a block size fixed in this script and a symbolic one.
compile_time_block_size = False

# Either the constant (128, 1, 1) or two int32 symbols named cudaBlockSize0 /
# cudaBlockSize1 for the first two entries; the third entry is always 1.
sweep_block_size = (
    (128, 1, 1)
    if compile_time_block_size
    else (
        TypedSymbol("cudaBlockSize0", np.int32),
        TypedSymbol("cudaBlockSize1", np.int32),
        1,
    )
)
Martin Bauer's avatar
Martin Bauer committed
24

Martin Bauer's avatar
Martin Bauer committed
25
26
# Indexing parameters handed to the GPU sweep generator (gpu_indexing_params).
sweep_params = dict(block_size=sweep_block_size)

27
# Method configurations keyed by name. The entry matching the code-generation
# config name is looked up below and forwarded as keyword arguments to the
# lbmpy creation functions.
options_dict = {
    'srt': {
        'method': 'srt',
        'stencil': 'D3Q19',
        'relaxation_rate': omega,
        'compressible': False,
    },
    'trt': {
        'method': 'trt',
        'stencil': 'D3Q19',
        'relaxation_rate': omega,
    },
    'mrt': {
        'method': 'mrt',
        'stencil': 'D3Q19',
        'relaxation_rates': [omega, 1.3, 1.4, 1.2, 1.1, 1.15, 1.234, 1.4235],
    },
    'mrt_full': {
        'method': 'mrt',
        'stencil': 'D3Q19',
        # Every rate is symbolic; `omega` is the second entry.
        'relaxation_rates': [
            omega_fill[0],
            omega,
            omega_fill[1],
            omega_fill[2],
            omega_fill[3],
            omega_fill[4],
            omega_fill[5],
        ],
    },
    'mrt3': {
        'method': 'mrt3',
        'stencil': 'D3Q19',
        'relaxation_rates': [omega, 1.1, 1.2],
    },
    'entropic': {
        'method': 'mrt3',
        'stencil': 'D3Q19',
        'compressible': True,
        'relaxation_rates': [omega, omega, sp.Symbol("omega_free")],
        'entropic': True,
    },
    'entropic_kbc_n4': {
        'method': 'trt-kbc-n4',
        'stencil': 'D3Q27',
        'compressible': True,
        'relaxation_rates': [omega, sp.Symbol("omega_free")],
        'entropic': True,
    },
    'smagorinsky': {
        'method': 'srt',
        'stencil': 'D3Q19',
        'smagorinsky': True,
        'relaxation_rate': omega,
    },
    'cumulant': {
        'stencil': 'D3Q19',
        'compressible': True,
        'method': 'mrt',
        'cumulant': True,
        'relaxation_rates': [0, omega, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1],
    },
}

83
84
85
86
87
88
89
90
91
# Template for the generated C++ defines header. It is filled via str.format
# with the keys q, stencil, configName, cse_global and cse_pdfs.
info_header = """
#include "stencil/D3Q{q}.h"\nusing Stencil_T = walberla::stencil::D3Q{q}; 
const char * infoStencil = "{stencil}";
const char * infoConfigName = "{configName}";
const bool infoCseGlobal = {cse_global};
const bool infoCsePdfs = {cse_pdfs};
"""


92
with CodeGeneration() as ctx:
    # Pull-style two-field streaming. StreamPushTwoFieldsAccessor() (imported at
    # the top of the file) is the push-style alternative.
    accessor = StreamPullTwoFieldsAccessor()
    assert not accessor.is_inplace, "This app does not work for inplace accessors"

    # Options applied on top of every method configuration.
    common_options = {
        'field_name': 'pdfs',
        'temporary_field_name': 'pdfs_tmp',
        'kernel_type': accessor,
        'optimization': {'cse_global': True,
                         'cse_pdfs': False}
    }

    # The config name may carry optional suffixes. "_noopt" is stripped first,
    # then "_d3q27"; what remains selects the entry in options_dict.
    config_name = ctx.config
    noopt = False
    d3q27 = False
    if config_name.endswith("_noopt"):
        noopt = True
        config_name = config_name[:-len("_noopt")]
    if config_name.endswith("_d3q27"):
        d3q27 = True
        config_name = config_name[:-len("_d3q27")]

    if config_name not in options_dict:
        # Same exception type as the plain lookup, but with a usable message.
        raise KeyError("Unknown configuration '{}', available configurations: {}".format(
            config_name, ", ".join(sorted(options_dict))))

    # Build a private option set. The nested 'optimization' dict is copied as
    # well, because it is modified below and a shallow copy would leak those
    # changes back into common_options (and the module-level options_dict).
    options = dict(options_dict[config_name])
    options.update(common_options)
    options['optimization'] = dict(common_options['optimization'])

    if noopt:
        options['optimization']['cse_global'] = False
        options['optimization']['cse_pdfs'] = False
    if d3q27:
        options['stencil'] = 'D3Q27'

    # The number of PDFs is the integer following the 'Q' in the stencil name.
    stencil_str = options['stencil']
    q = int(stencil_str[stencil_str.find('Q')+1:])
    pdfs, velocity_field = ps.fields("pdfs({q}), velocity(3) : double[3D]".format(q=q), layout='fzyx')
    options['optimization']['symbolic_field'] = pdfs

    # Passed as varying_parameters to the LB sweep: the symbolic relaxation
    # rates omega_0..omega_6 and the two symbolic CUDA block sizes.
    vp = [
        ('double', 'omega_0'),
        ('double', 'omega_1'),
        ('double', 'omega_2'),
        ('double', 'omega_3'),
        ('double', 'omega_4'),
        ('double', 'omega_5'),
        ('double', 'omega_6'),
        ('int32_t', 'cudaBlockSize0'),
        ('int32_t', 'cudaBlockSize1'),
    ]

    lb_method = create_lb_method(**options)
    update_rule = create_lb_update_rule(lb_method=lb_method, **options)

    if not noopt:
        # Fast-approximation rewrites are skipped for "_noopt" configurations.
        update_rule = insert_fast_divisions(update_rule)
        update_rule = insert_fast_sqrts(update_rule)

    # CPU lattice model - required for macroscopic value computation, VTK output etc.
    # It is created from the same options minus the 'optimization' entry.
    options_without_opt = options.copy()
    del options_without_opt['optimization']
    collision_rule = create_lb_collision_rule(lb_method=lb_method, **options_without_opt)
    generate_lattice_model(ctx, 'UniformGridGPU_LatticeModel', collision_rule)

    # gpu LB sweep & boundaries
    generate_sweep(ctx, 'UniformGridGPU_LbKernel', update_rule,
                   field_swaps=[('pdfs', 'pdfs_tmp')],
                   inner_outer_split=True, target='gpu', gpu_indexing_params=sweep_params,
                   varying_parameters=vp)

    generate_boundary(ctx, 'UniformGridGPU_NoSlip', NoSlip(), lb_method, target='gpu')
    generate_boundary(ctx, 'UniformGridGPU_UBB', UBB([0.05, 0, 0]), lb_method, target='gpu')

    # getter & setter
    setter_assignments = macroscopic_values_setter(lb_method, velocity=velocity_field.center_vector,
                                                   pdfs=pdfs.center_vector, density=1)
    getter_assignments = macroscopic_values_getter(lb_method, velocity=velocity_field.center_vector,
                                                   pdfs=pdfs.center_vector, density=None)
    generate_sweep(ctx, 'UniformGridGPU_MacroSetter', setter_assignments)
    generate_sweep(ctx, 'UniformGridGPU_MacroGetter', getter_assignments)

    # communication
    generate_pack_info_from_kernel(ctx, 'UniformGridGPU_PackInfo', update_rule, target='gpu')

    # Defines header. It records the full config name (suffixes included) and
    # writes the CSE flags as 0/1 into the C++ bool constants.
    info_header_params = {
        'stencil': stencil_str,
        'q': q,
        'configName': ctx.config,
        'cse_global': int(options['optimization']['cse_global']),
        'cse_pdfs': int(options['optimization']['cse_pdfs']),
    }
    ctx.write_file("UniformGridGPU_Defines.h", info_header.format(**info_header_params))