cbackend.py 24.4 KB
Newer Older
Martin Bauer's avatar
Martin Bauer committed
1
from collections import namedtuple
2
from typing import Set
3
4
5

import sympy as sp
from sympy.core import S
6
from sympy.printing.ccode import C89CodePrinter
7

8
from pystencils.astnodes import KernelFunction, Node
9
from pystencils.cpu.vectorization import vec_all, vec_any
Martin Bauer's avatar
Martin Bauer committed
10
from pystencils.data_types import (
11
12
    PointerType, VectorType, address_of, cast_func, create_type, get_type_of_expression,
    reinterpret_cast_func, vector_memory_access)
Martin Bauer's avatar
Martin Bauer committed
13
14
from pystencils.fast_approximation import fast_division, fast_inv_sqrt, fast_sqrt
from pystencils.integer_functions import (
15
16
    bit_shift_left, bit_shift_right, bitwise_and, bitwise_or, bitwise_xor,
    int_div, int_power_of_2, modulo_ceil)
17
from pystencils.kernelparameters import FieldPointerSymbol
18

Martin Bauer's avatar
Martin Bauer committed
19
20
try:
    from sympy.printing.ccode import C99CodePrinter as CCodePrinter
Martin Bauer's avatar
Martin Bauer committed
21
22
except ImportError:
    from sympy.printing.ccode import CCodePrinter  # for sympy versions < 1.1
Martin Bauer's avatar
Martin Bauer committed
23

24
__all__ = ['generate_c', 'CustomCodeNode', 'PrintNode', 'get_headers', 'CustomSympyPrinter']
25

26
27
KERNCRAFT_NO_TERNARY_MODE = False

Martin Bauer's avatar
Fixes    
Martin Bauer committed
28

29
def generate_c(ast_node: Node, signature_only: bool = False, dialect='c', custom_backend=None) -> str:
    """Prints an abstract syntax tree node as C or CUDA code.

    This function does not need to distinguish between C, C++ or CUDA code, it just prints 'C-like' code as encoded
    in the abstract syntax tree (AST). The AST is built differently for C or CUDA by calling different create_kernel
    functions.

    As a side effect, the symbols defined by all global declarations found in the tree are collected in
    ``ast_node.global_variables`` (the attribute is created if it does not exist yet).

    Args:
        ast_node: root node of the tree that should be printed
        signature_only: forwarded to the backend that is created for the chosen dialect; when set, the collected
                        global declarations are not prepended to the result
        dialect: 'c', 'cuda' or 'opencl'
        custom_backend: optional printer callable; if truthy it is used instead of the backend that would be
                        selected through ``dialect``

    Returns:
        C-like code for the ast node and its descendants

    Raises:
        ValueError: if no custom backend is given and ``dialect`` is not one of the known dialects
    """
    global_declarations = get_global_declarations(ast_node)
    for d in global_declarations:
        if hasattr(ast_node, "global_variables"):
            ast_node.global_variables.update(d.symbols_defined)
        else:
            # Copy instead of aliasing: the update() calls of later iterations must not
            # modify the set that belongs to the first declaration.
            ast_node.global_variables = set(d.symbols_defined)

    if custom_backend:
        printer = custom_backend
    elif dialect == 'c':
        # Nodes without an 'instruction_set' attribute are printed without vectorization support
        instruction_set = getattr(ast_node, 'instruction_set', None)
        printer = CBackend(signature_only=signature_only,
                           vector_instruction_set=instruction_set)
    elif dialect == 'cuda':
        from pystencils.backends.cuda_backend import CudaBackend
        printer = CudaBackend(signature_only=signature_only)
    elif dialect == 'opencl':
        from pystencils.backends.opencl_backend import OpenClBackend
        printer = OpenClBackend(signature_only=signature_only)
    else:
        raise ValueError("Unknown dialect: " + str(dialect))

    code = printer(ast_node)
    if not signature_only and isinstance(ast_node, KernelFunction):
        # Global declarations are emitted in front of the kernel, separated by a newline each
        code = "\n" + code
        for declaration in global_declarations:
            code = printer(declaration) + "\n" + code

    return code


def get_global_declarations(ast):
    """Collect the global declarations required anywhere in the given tree.

    Every visited object may contribute through a ``required_global_declarations`` attribute; children are
    reached through the ``args`` attribute. Objects lacking either attribute simply contribute nothing.

    Returns:
        set of all declarations found in ``ast`` and its descendants
    """

    def walk(current):
        # declarations requested by this node itself ...
        yield from getattr(current, "required_global_declarations", ())
        # ... followed by the ones of all of its descendants
        for child in getattr(current, "args", ()):
            yield from walk(child)

    return set(walk(ast))
90
91


Martin Bauer's avatar
Martin Bauer committed
92
93
def get_headers(ast_node: Node) -> Set[str]:
    """Return a set of header files, necessary to compile the printed C-like code.

    Headers come from three places: the instruction set of a kernel function, the optional ``headers``
    attribute of the node itself, and - recursively - all children in ``args`` that are AST nodes.
    """
    collected = set()

    uses_instruction_set = isinstance(ast_node, KernelFunction) and ast_node.instruction_set
    if uses_instruction_set:
        collected.update(ast_node.instruction_set['headers'])

    if hasattr(ast_node, 'headers'):
        collected.update(ast_node.headers)

    for child in ast_node.args:
        if not isinstance(child, Node):
            continue  # only AST nodes are descended into
        collected.update(get_headers(child))

    return collected
106
107


108
109
110
# --------------------------------------- Backend Specific Nodes -------------------------------------------------------


111
class CustomCodeNode(Node):
    """AST node that carries a fixed piece of code text.

    Args:
        code: code text; it is stored with a newline prepended
        symbols_read: iterable of symbols the code reads
        symbols_defined: iterable of symbols the code defines
        parent: forwarded to the ``Node`` constructor
    """

    def __init__(self, code, symbols_read, symbols_defined, parent=None):
        super().__init__(parent=parent)
        self.headers = []
        self._symbols_defined = set(symbols_defined)
        self._symbols_read = set(symbols_read)
        self._code = "\n" + code

    def get_code(self, dialect, vector_instruction_set):
        """Return the stored code; both arguments are ignored by this implementation."""
        return self._code

    @property
    def args(self):
        """This node never has children."""
        return []

    @property
    def symbols_defined(self):
        """Set of symbols defined by the custom code (the internal set itself, not a copy)."""
        return self._symbols_defined

    @property
    def undefined_symbols(self):
        """Symbols that are read by the custom code but not defined by it."""
        return self._symbols_read - self._symbols_defined
133
134


135
class PrintNode(CustomCodeNode):
    """Custom code node that writes name and value of a symbol to ``std::cout``."""

    # noinspection SpellCheckingInspection
    def __init__(self, symbol_to_print):
        name = symbol_to_print.name
        statement = '\nstd::cout << "%s  =  " << %s << std::endl; \n' % (name, name)
        super().__init__(statement, symbols_read=[symbol_to_print], symbols_defined=set())
        # std::cout is used by the generated statement
        self.headers.append("<iostream>")
141
142
143
144


# ------------------------------------------- Printer ------------------------------------------------------------------

145

Martin Bauer's avatar
Martin Bauer committed
146
147
# noinspection PyPep8Naming
class CBackend:
    """Printer that turns AST nodes into C-like source text.

    Printing is dispatched on the class name of the node: for a node of type ``Foo`` the method ``_print_Foo``
    is called; if it does not exist, the base classes of the node are tried in method resolution order.

    Args:
        sympy_printer: printer used for sympy expressions. If None, a ``VectorizedCustomSympyPrinter`` is created
                       when a vector instruction set is given, a ``CustomSympyPrinter`` otherwise.
        signature_only: if True, kernel functions are printed as declaration without body
        vector_instruction_set: instruction set mapping used for vectorized stores, or None
        dialect: dialect name, handed to custom code nodes; 'cuda' additionally enables launch bounds
    """

    def __init__(self, sympy_printer=None, signature_only=False, vector_instruction_set=None, dialect='c'):
        if sympy_printer is None:
            if vector_instruction_set is not None:
                self.sympy_printer = VectorizedCustomSympyPrinter(vector_instruction_set)
            else:
                self.sympy_printer = CustomSympyPrinter()
        else:
            self.sympy_printer = sympy_printer

        self._vector_instruction_set = vector_instruction_set
        self._indent = "   "
        self._dialect = dialect
        self._signatureOnly = signature_only

    def __call__(self, node):
        """Print ``node`` and return the result as string.

        While printing, ``VectorType.instruction_set`` is set to the instruction set of this backend. The previous
        value is restored afterwards - also if printing fails with an exception.
        """
        prev_is = VectorType.instruction_set
        VectorType.instruction_set = self._vector_instruction_set
        try:
            return str(self._print(node))
        finally:
            # VectorType.instruction_set is class-level state shared by everyone: never leave it modified
            VectorType.instruction_set = prev_is

    def _print(self, node):
        """Dispatch to the first ``_print_<ClassName>`` method found along the MRO of the node type.

        Raises:
            NotImplementedError: if no print method exists for any class in the MRO
        """
        for cls in type(node).__mro__:
            method_name = "_print_" + cls.__name__
            if hasattr(self, method_name):
                return getattr(self, method_name)(node)
        raise NotImplementedError(self.__class__.__name__ + " does not support node of type " + node.__class__.__name__)

    def _print_Type(self, node):
        return str(node)

    def _print_KernelFunction(self, node):
        """Print the function declaration and - unless only the signature is requested - the body."""
        function_arguments = ["%s %s" % (self._print(s.symbol.dtype), s.symbol.name) for s in node.get_parameters()]
        launch_bounds = ""
        if self._dialect == 'cuda':
            max_threads = node.indexing.max_threads_per_block()
            if max_threads:
                launch_bounds = "__launch_bounds__({}) ".format(max_threads)
        func_declaration = "FUNC_PREFIX %svoid %s(%s)" % (launch_bounds, node.function_name,
                                                          ", ".join(function_arguments))
        if self._signatureOnly:
            return func_declaration

        body = self._print(node.body)
        return func_declaration + "\n" + body

    def _print_Block(self, node):
        """Print all children, one per line, indented by one level and enclosed in braces."""
        block_contents = "\n".join([self._print(child) for child in node.args])
        # splitlines(True) keeps the line ends, so joining with the indent prefixes every line but the first,
        # which gets its indent from the explicit prefix
        return "{\n%s\n}" % (self._indent + self._indent.join(block_contents.splitlines(True)))

    def _print_PragmaBlock(self, node):
        return "%s\n%s" % (node.pragma_line, self._print_Block(node))

    def _print_LoopOverCoordinate(self, node):
        """Print a ``for`` loop with an ``int`` counter, preceded by the prefix lines of the node."""
        counter_symbol = node.loop_counter_name
        start = "int %s = %s" % (counter_symbol, self.sympy_printer.doprint(node.start))
        condition = "%s < %s" % (counter_symbol, self.sympy_printer.doprint(node.stop))
        update = "%s += %s" % (counter_symbol, self.sympy_printer.doprint(node.step),)
        loop_str = "for (%s; %s; %s)" % (start, condition, update)

        prefix = "\n".join(node.prefix_lines)
        if prefix:
            prefix += "\n"
        return "%s%s\n%s" % (prefix, loop_str, self._print(node.body))

    def _print_SympyAssignment(self, node):
        """Print a declaration, a vector store or a plain assignment, depending on the node."""
        if node.is_declaration:
            if node.is_const:
                prefix = 'const '
            else:
                prefix = ''
            data_type = prefix + self._print(node.lhs.dtype) + " "
            return "%s%s = %s;" % (data_type, self.sympy_printer.doprint(node.lhs),
                                   self.sympy_printer.doprint(node.rhs))
        else:
            lhs_type = get_type_of_expression(node.lhs)
            if type(lhs_type) is VectorType and isinstance(node.lhs, cast_func):
                # Vector store: choose the store instruction according to the alignment / non-temporal flags
                arg, data_type, aligned, nontemporal = node.lhs.args
                instr = 'storeU'
                if aligned:
                    instr = 'stream' if nontemporal else 'storeA'

                # A scalar right hand side is wrapped in a cast to a vector type before printing
                rhs_type = get_type_of_expression(node.rhs)
                if type(rhs_type) is not VectorType:
                    rhs = cast_func(node.rhs, VectorType(rhs_type))
                else:
                    rhs = node.rhs

                return self._vector_instruction_set[instr].format("&" + self.sympy_printer.doprint(node.lhs.args[0]),
                                                                  self.sympy_printer.doprint(rhs)) + ';'
            else:
                return "%s = %s;" % (self.sympy_printer.doprint(node.lhs), self.sympy_printer.doprint(node.rhs))

    def _print_TemporaryMemoryAllocation(self, node):
        """Print an ``aligned_alloc`` call; the resulting pointer is shifted by ``node.offset(align)``."""
        align = 64
        np_dtype = node.symbol.dtype.base_type.numpy_dtype
        # reserve 'align' additional bytes, then round the size up to a multiple of the alignment
        required_size = np_dtype.itemsize * node.size + align
        size = modulo_ceil(required_size, align)
        code = "{dtype} {name}=({dtype})aligned_alloc({align}, {size}) + {offset};"
        return code.format(dtype=node.symbol.dtype,
                           name=self.sympy_printer.doprint(node.symbol.name),
                           size=self.sympy_printer.doprint(size),
                           offset=int(node.offset(align)),
                           align=align)

    def _print_TemporaryMemoryFree(self, node):
        """Print the ``free`` call; the offset added at allocation is subtracted again."""
        align = 64
        return "free(%s - %d);" % (self.sympy_printer.doprint(node.symbol.name), node.offset(align))

    def _print_SkipIteration(self, _):
        return "continue;"

    def _print_CustomCodeNode(self, node):
        return node.get_code(self._dialect, self._vector_instruction_set)

    def _print_Conditional(self, node):
        """Print an ``if`` statement with optional ``else`` block.

        Raises:
            ValueError: if the condition is of vector type
        """
        cond_type = get_type_of_expression(node.condition_expr)
        if isinstance(cond_type, VectorType):
            raise ValueError("Problem with Conditional inside vectorized loop - use vec_any or vec_all")

        condition_expr = self.sympy_printer.doprint(node.condition_expr)
        true_block = self._print_Block(node.true_block)
        result = "if (%s)\n%s " % (condition_expr, true_block)
        if node.false_block:
            false_block = self._print_Block(node.false_block)
            result += "else " + false_block
        return result

    def _print_DestructuringBindingsForFieldClass(self, node):
        """Print a braced scope that first binds all symbols defined by the node, then contains the body."""
        # Define all undefined symbols
        undefined_field_symbols = node.symbols_defined
        destructuring_bindings = ["%s %s = %s.%s;" %
                                  (u.dtype,
                                   u.name,
                                   u.field_name if hasattr(u, 'field_name') else u.field_names[0],
                                   node.CLASS_TO_MEMBER_DICT[u.__class__] %
                                   (() if type(u) == FieldPointerSymbol else (u.coordinate,)))
                                  for u in undefined_field_symbols
                                  ]
        destructuring_bindings.sort()  # only for code aesthetics
        return "{\n" + self._indent + \
               ("\n" + self._indent).join(destructuring_bindings) + \
               "\n" + self._indent + \
               ("\n" + self._indent).join(self._print(node.body).splitlines()) + \
               "\n}"
293

294
295
296
297

# ------------------------------------------ Helper function & classes -------------------------------------------------


Martin Bauer's avatar
Martin Bauer committed
298
# noinspection PyPep8Naming
299
class CustomSympyPrinter(CCodePrinter):
    """C code printer for sympy expressions with additional handling for pystencils specific functions."""

    def __init__(self):
        super().__init__()
        self._float_type = create_type("float32")
        # Min and Max are printed by the C89 implementations assigned at the end of this class
        for function_name in ('Min', 'Max'):
            if function_name in self.known_functions:
                del self.known_functions[function_name]

    def _print_Pow(self, expr):
        """Don't use std::pow function, for small integer exponents, write as multiplication"""
        exponent = expr.exp
        if exponent.is_integer and exponent.is_number:
            if 0 < exponent < 8:
                product = sp.Mul(*[expr.base] * exponent, evaluate=False)
                return "(" + self._print(product) + ")"
            if - 8 < exponent < 0:
                product = sp.Mul(*[expr.base] * (-exponent), evaluate=False)
                return "1 / ({})".format(self._print(product))
        return super()._print_Pow(expr)

    def _print_Rational(self, expr):
        """Evaluate all rationals i.e. print 0.25 instead of 1.0/4.0"""
        return str(expr.evalf().num)

    def _print_Equality(self, expr):
        """Equality operator is not printable in default printer"""
        lhs = self._print(expr.lhs)
        rhs = self._print(expr.rhs)
        return '((' + lhs + ") == (" + rhs + '))'

    def _print_Piecewise(self, expr):
        """Print piecewise in one line (remove newlines)"""
        return super()._print_Piecewise(expr).replace("\n", "")

    def _print_Function(self, expr):
        """Print pystencils specific functions; everything else is left to the base class printer."""
        # objects that know how to print themselves take precedence over everything else
        if hasattr(expr, 'to_c'):
            return expr.to_c(self._print)

        if isinstance(expr, reinterpret_cast_func):
            arg, data_type = expr.args
            return "*((%s)(& %s))" % (PointerType(data_type, restrict=False), self._print(arg))
        if isinstance(expr, address_of):
            assert len(expr.args) == 1, "address_of must only have one argument"
            return "&(%s)" % self._print(expr.args[0])
        if isinstance(expr, cast_func):
            arg, data_type = expr.args
            if isinstance(arg, sp.Number):
                return self._typed_number(arg, data_type)
            return "((%s)(%s))" % (data_type, self._print(arg))
        if isinstance(expr, fast_division):
            return "({})".format(self._print(expr.args[0] / expr.args[1]))
        if isinstance(expr, fast_sqrt):
            return "({})".format(self._print(sp.sqrt(expr.args[0])))
        if isinstance(expr, (vec_any, vec_all)):
            # in this printer both are printed as their plain argument
            return self._print(expr.args[0])
        if isinstance(expr, fast_inv_sqrt):
            return "({})".format(self._print(1 / sp.sqrt(expr.args[0])))

        # binary integer functions that map directly to a C operator
        infix_operators = {
            bitwise_xor: '^',
            bit_shift_right: '>>',
            bit_shift_left: '<<',
            bitwise_or: '|',
            bitwise_and: '&',
        }
        if expr.func in infix_operators:
            first, second = self._print(expr.args[0]), self._print(expr.args[1])
            return "(%s %s %s)" % (first, infix_operators[expr.func], second)
        if expr.func == int_power_of_2:
            return "(1 << (%s))" % (self._print(expr.args[0]))
        if expr.func == int_div:
            return "((%s) / (%s))" % (self._print(expr.args[0]), self._print(expr.args[1]))

        return super()._print_Function(expr)

    def _typed_number(self, number, dtype):
        """Print a number; for the float32 type the C suffix 'f' is appended (after '.0' if no '.' is present)."""
        text = self._print(number)
        if dtype.is_float() and dtype == self._float_type:
            text += "f" if '.' in text else ".0f"
        return text

    _print_Max = C89CodePrinter._print_Max
    _print_Min = C89CodePrinter._print_Min

386

Martin Bauer's avatar
Martin Bauer committed
387
# noinspection PyPep8Naming
388
389
390
class VectorizedCustomSympyPrinter(CustomSympyPrinter):
    """Sympy printer that emits the instructions of a vector instruction set for vector-typed expressions.

    Expressions that are not of vector type are printed by the scalar base class, see ``_scalarFallback``.

    Args:
        instruction_set: mapping from operation name (e.g. '+', '*', 'loadA', 'makeVec', 'blendv') to a format
                         string of the corresponding instruction; the entry 'width' holds the vector width
    """
    SummandInfo = namedtuple("SummandInfo", ['sign', 'term'])

    def __init__(self, instruction_set):
        super(VectorizedCustomSympyPrinter, self).__init__()
        self.instruction_set = instruction_set

    def _scalarFallback(self, func_name, expr, *args, **kwargs):
        """Print ``expr`` with the base class method ``func_name`` if it is not of vector type.

        Returns:
            the printed code for non-vector expressions, None for vector expressions - the caller then has to
            print the expression with vector instructions.
        """
        expr_type = get_type_of_expression(expr)
        if type(expr_type) is not VectorType:
            return getattr(super(VectorizedCustomSympyPrinter, self), func_name)(expr, *args, **kwargs)
        else:
            assert self.instruction_set['width'] == expr_type.width
            return None

    def _print_Function(self, expr):
        """Print vector loads, vector casts and the vector versions of the fast approximation functions.

        Everything that is not handled here is passed on to the scalar printer.
        """
        if isinstance(expr, vector_memory_access):
            arg, data_type, aligned, _ = expr.args
            instruction = self.instruction_set['loadA'] if aligned else self.instruction_set['loadU']
            return instruction.format("& " + self._print(arg))
        elif isinstance(expr, cast_func):
            arg, data_type = expr.args
            if type(data_type) is VectorType:
                return self.instruction_set['makeVec'].format(self._print(arg))
            # casts to non-vector types are handled by the base class call at the end
        elif expr.func == fast_division:
            result = self._scalarFallback('_print_Function', expr)
            if not result:
                result = self.instruction_set['/'].format(self._print(expr.args[0]), self._print(expr.args[1]))
            return result
        elif expr.func == fast_sqrt:
            return "({})".format(self._print(sp.sqrt(expr.args[0])))
        elif expr.func == fast_inv_sqrt:
            result = self._scalarFallback('_print_Function', expr)
            if result:
                # scalar case: already printed, no need to print it a second time via the base class below
                return result
            if self.instruction_set['rsqrt']:
                return self.instruction_set['rsqrt'].format(self._print(expr.args[0]))
            else:
                return "({})".format(self._print(1 / sp.sqrt(expr.args[0])))
        elif isinstance(expr, vec_any):
            expr_type = get_type_of_expression(expr.args[0])
            if type(expr_type) is not VectorType:
                return self._print(expr.args[0])
            else:
                return self.instruction_set['any'].format(self._print(expr.args[0]))
        elif isinstance(expr, vec_all):
            expr_type = get_type_of_expression(expr.args[0])
            if type(expr_type) is not VectorType:
                return self._print(expr.args[0])
            else:
                return self.instruction_set['all'].format(self._print(expr.args[0]))

        return super(VectorizedCustomSympyPrinter, self)._print_Function(expr)

    def _print_And(self, expr):
        """Chain all arguments with the '&' instruction (vector case)."""
        result = self._scalarFallback('_print_And', expr)
        if result:
            return result

        arg_strings = [self._print(a) for a in expr.args]
        assert len(arg_strings) > 0
        result = arg_strings[0]
        for item in arg_strings[1:]:
            result = self.instruction_set['&'].format(result, item)
        return result

    def _print_Or(self, expr):
        """Chain all arguments with the '|' instruction (vector case)."""
        result = self._scalarFallback('_print_Or', expr)
        if result:
            return result

        arg_strings = [self._print(a) for a in expr.args]
        assert len(arg_strings) > 0
        result = arg_strings[0]
        for item in arg_strings[1:]:
            result = self.instruction_set['|'].format(result, item)
        return result

    def _print_Add(self, expr, order=None):
        """Print a sum as nested '+' and '-' instructions (vector case)."""
        result = self._scalarFallback('_print_Add', expr)
        if result:
            return result

        summands = []
        for term in expr.args:
            if term.func == sp.Mul:
                # products report their sign separately, such that a subtraction can be used
                sign, t = self._print_Mul(term, inside_add=True)
            else:
                t = self._print(term)
                sign = 1
            summands.append(self.SummandInfo(sign, t))
        # Use positive terms first
        summands.sort(key=lambda e: e.sign, reverse=True)
        # if no positive term exists, prepend a zero
        if summands[0].sign == -1:
            summands.insert(0, self.SummandInfo(1, "0"))

        assert len(summands) >= 2
        processed = summands[0].term
        for summand in summands[1:]:
            func = self.instruction_set['-'] if summand.sign == -1 else self.instruction_set['+']
            processed = func.format(processed, summand.term)
        return processed

    def _print_Pow(self, expr):
        """Print powers with integer exponents between -8 and 8 and the exponents 0.5 and -0.5 (vector case).

        Raises:
            ValueError: for all other exponents
        """
        result = self._scalarFallback('_print_Pow', expr)
        if result:
            return result

        one = self.instruction_set['makeVec'].format(1.0)

        if expr.exp.is_integer and expr.exp.is_number and 0 < expr.exp < 8:
            return "(" + self._print(sp.Mul(*[expr.base] * expr.exp, evaluate=False)) + ")"
        elif expr.exp == -1:
            return self.instruction_set['/'].format(one, self._print(expr.base))
        elif expr.exp == 0.5:
            return self.instruction_set['sqrt'].format(self._print(expr.base))
        elif expr.exp == -0.5:
            root = self.instruction_set['sqrt'].format(self._print(expr.base))
            return self.instruction_set['/'].format(one, root)
        elif expr.exp.is_integer and expr.exp.is_number and - 8 < expr.exp < 0:
            return self.instruction_set['/'].format(one,
                                                    self._print(sp.Mul(*[expr.base] * (-expr.exp), evaluate=False)))
        else:
            raise ValueError("Generic exponential not supported: " + str(expr))

    def _print_Mul(self, expr, inside_add=False):
        """Print a product as nested '*' instructions, negative powers are collected in a denominator.

        Args:
            expr: the product to print
            inside_add: if True, the sign of the coefficient is not printed but returned separately

        Returns:
            the printed code, or the tuple ``(sign, code)`` if ``inside_add`` is True
        """
        # noinspection PyProtectedMember
        from sympy.core.mul import _keep_coeff

        result = self._scalarFallback('_print_Mul', expr)
        if result:
            # Callers passing inside_add=True unpack a (sign, code) tuple - the scalar code already
            # contains its sign, so it is reported as positive term
            return (1, result) if inside_add else result

        c, e = expr.as_coeff_Mul()
        if c < 0:
            expr = _keep_coeff(-c, e)
            sign = -1
        else:
            sign = 1

        a = []  # items in the numerator
        b = []  # items that are in the denominator (if any)

        # Gather args for numerator/denominator
        for item in expr.as_ordered_factors():
            if item.is_commutative and item.is_Pow and item.exp.is_Rational and item.exp.is_negative:
                if item.exp != -1:
                    b.append(sp.Pow(item.base, -item.exp, evaluate=False))
                else:
                    b.append(sp.Pow(item.base, -item.exp))
            else:
                a.append(item)

        a = a or [S.One]

        a_str = [self._print(x) for x in a]
        b_str = [self._print(x) for x in b]

        result = a_str[0]
        for item in a_str[1:]:
            result = self.instruction_set['*'].format(result, item)

        if len(b) > 0:
            denominator_str = b_str[0]
            for item in b_str[1:]:
                denominator_str = self.instruction_set['*'].format(denominator_str, item)
            result = self.instruction_set['/'].format(result, denominator_str)

        if inside_add:
            return sign, result
        else:
            if sign < 0:
                return self.instruction_set['*'].format(self._print(S.NegativeOne), result)
            else:
                return result

    def _print_Relational(self, expr):
        """Print a comparison with the instruction registered for its relational operator (vector case)."""
        result = self._scalarFallback('_print_Relational', expr)
        if result:
            return result
        return self.instruction_set[expr.rel_op].format(self._print(expr.lhs), self._print(expr.rhs))

    def _print_Equality(self, expr):
        """Print an equality test with the '==' instruction (vector case)."""
        result = self._scalarFallback('_print_Equality', expr)
        if result:
            return result
        return self.instruction_set['=='].format(self._print(expr.lhs), self._print(expr.rhs))

    def _print_Piecewise(self, expr):
        """Print a piecewise expression as chain of blend instructions or ternary operators (vector case).

        The chain is built from the last (default) case to the first one. Conditions that are casts of a
        bool-typed expression are printed as ternary operator, all others with the 'blendv' instruction.

        Raises:
            ValueError: if the last case is not a default case with condition True
        """
        result = self._scalarFallback('_print_Piecewise', expr)
        if result:
            return result

        if expr.args[-1].cond.args[0] is not sp.sympify(True):
            # We need the last conditional to be a True, otherwise the resulting
            # function may not return a result.
            raise ValueError("All Piecewise expressions must contain an "
                             "(expr, True) statement to be used as a default "
                             "condition. Without one, the generated "
                             "expression may not evaluate to anything under "
                             "some condition.")

        result = self._print(expr.args[-1][0])
        for true_expr, condition in reversed(expr.args[:-1]):
            if isinstance(condition, cast_func) and get_type_of_expression(condition.args[0]) == create_type("bool"):
                if not KERNCRAFT_NO_TERNARY_MODE:
                    result = "(({}) ? ({}) : ({}))".format(self._print(condition.args[0]), self._print(true_expr),
                                                           result)
                else:
                    # in this mode the case is dropped from the output, only a warning is printed
                    print("Warning - skipping ternary op")
            else:
                # noinspection SpellCheckingInspection
                result = self.instruction_set['blendv'].format(result, self._print(true_expr), self._print(condition))
        return result