cbackend.py 24.2 KB
Newer Older
Martin Bauer's avatar
Martin Bauer committed
1
from collections import namedtuple
2
from typing import Set
3
4
5
6

import jinja2
import sympy as sp
from sympy.core import S
7
from sympy.printing.ccode import C89CodePrinter
8

Martin Bauer's avatar
Martin Bauer committed
9
from pystencils.astnodes import DestructuringBindingsForFieldClass, KernelFunction, Node
10
from pystencils.cpu.vectorization import vec_all, vec_any
Martin Bauer's avatar
Martin Bauer committed
11
12
13
14
15
16
17
from pystencils.data_types import (
    PointerType, VectorType, address_of, cast_func, create_type, get_type_of_expression,
    reinterpret_cast_func, vector_memory_access)
from pystencils.fast_approximation import fast_division, fast_inv_sqrt, fast_sqrt
from pystencils.integer_functions import (
    bit_shift_left, bit_shift_right, bitwise_and, bitwise_or, bitwise_xor,
    int_div, int_power_of_2, modulo_ceil)
18
from pystencils.kernelparameters import FieldPointerSymbol
19

Martin Bauer's avatar
Martin Bauer committed
20
21
try:
    from sympy.printing.ccode import C99CodePrinter as CCodePrinter
Martin Bauer's avatar
Martin Bauer committed
22
23
except ImportError:
    from sympy.printing.ccode import CCodePrinter  # for sympy versions < 1.1
Martin Bauer's avatar
Martin Bauer committed
24

25

26
__all__ = ['generate_c', 'CustomCodeNode', 'PrintNode', 'get_headers', 'CustomSympyPrinter']
27

Martin Bauer's avatar
Martin Bauer committed
28

29
30
KERNCRAFT_NO_TERNARY_MODE = False

Martin Bauer's avatar
Fixes    
Martin Bauer committed
31

32
33
34
35
36
class UnsupportedCDialect(Exception):
    """Raised by ``generate_c`` when the requested dialect is neither 'c' nor 'cuda'."""

    def __init__(self):
        super().__init__()


37
def generate_c(ast_node: Node, signature_only: bool = False, dialect='c', custom_backend=None) -> str:
    """Prints an abstract syntax tree node as C or CUDA code.

    This function does not need to distinguish between C, C++ or CUDA code, it just prints 'C-like' code as encoded
    in the abstract syntax tree (AST). The AST is built differently for C or CUDA by calling different create_kernel
    functions.

    As a side effect, the symbols defined by all global declarations required somewhere in the AST are
    collected in ``ast_node.global_variables`` (the attribute is created if it does not exist yet).

    Args:
        ast_node: root node of the AST to print
        signature_only: forwarded to the built-in backends; when true, global declarations are not
                        prepended to the returned code
        dialect: 'c' or 'cuda'; ignored if ``custom_backend`` is given
        custom_backend: optional callable that is used as printer instead of the built-in backends

    Returns:
        C-like code for the ast node and its descendants

    Raises:
        UnsupportedCDialect: if no custom backend is given and ``dialect`` is neither 'c' nor 'cuda'
    """
    global_declarations = get_global_declarations(ast_node)
    for d in global_declarations:
        if hasattr(ast_node, "global_variables"):
            ast_node.global_variables.update(d.symbols_defined)
        else:
            # Store a copy: keeping a reference to the declaration's own set would let the
            # update() calls of later iterations modify that declaration's symbols_defined.
            ast_node.global_variables = set(d.symbols_defined)

    if custom_backend:
        printer = custom_backend
    elif dialect == 'c':
        printer = CBackend(signature_only=signature_only,
                           vector_instruction_set=ast_node.instruction_set)
    elif dialect == 'cuda':
        # imported lazily, only needed when CUDA code is requested
        from pystencils.backends.cuda_backend import CudaBackend
        printer = CudaBackend(signature_only=signature_only)
    else:
        raise UnsupportedCDialect

    code = printer(ast_node)
    if not signature_only and isinstance(ast_node, KernelFunction):
        # global declarations have to appear in front of the kernel that uses them
        code = "\n" + code
        for declaration in global_declarations:
            code = printer(declaration) + "\n" + code

    return code


def get_global_declarations(ast):
    """Collect the global declarations required anywhere in an AST.

    Starting at ``ast``, every node reachable through ``args`` attributes is visited and the entries
    of its ``required_global_declarations`` attribute (if it has one) are gathered.

    Returns:
        set containing all gathered declarations
    """
    def collect(node, into):
        into.extend(getattr(node, "required_global_declarations", ()))
        for child in getattr(node, "args", ()):
            collect(child, into)
        return into

    return set(collect(ast, []))
91
92


Martin Bauer's avatar
Martin Bauer committed
93
94
def get_headers(ast_node: Node) -> Set[str]:
    """Return a set of header files, necessary to compile the printed C-like code.

    Headers come from three places: the instruction set of a ``KernelFunction`` (if it has one),
    the ``headers`` attribute of the node itself, and recursively from all ``Node`` children.
    """
    found = set()

    uses_instruction_set = isinstance(ast_node, KernelFunction) and ast_node.instruction_set
    if uses_instruction_set:
        found.update(ast_node.instruction_set['headers'])

    found.update(getattr(ast_node, 'headers', ()))

    for child in ast_node.args:
        if not isinstance(child, Node):
            continue
        found.update(get_headers(child))

    return found
107
108


109
110
111
# --------------------------------------- Backend Specific Nodes -------------------------------------------------------


112
class CustomCodeNode(Node):
    """AST node that carries a fixed piece of code together with the symbols it reads and defines."""

    def __init__(self, code, symbols_read, symbols_defined, parent=None):
        """
        Args:
            code: code string; stored with a newline prepended
            symbols_read: iterable of symbols the code reads
            symbols_defined: iterable of symbols the code defines
            parent: passed on to the ``Node`` constructor
        """
        super().__init__(parent=parent)
        self.headers = []
        self._symbols_defined = set(symbols_defined)
        self._symbols_read = set(symbols_read)
        self._code = "\n" + code

    def get_code(self, dialect, vector_instruction_set):
        """Return the stored code; both arguments are ignored by this implementation."""
        return self._code

    @property
    def args(self):
        # this node never has children
        return []

    @property
    def symbols_defined(self):
        return self._symbols_defined

    @property
    def undefined_symbols(self):
        # symbols that are read but not defined by this node itself
        return self._symbols_read.difference(self._symbols_defined)
134
135


136
class PrintNode(CustomCodeNode):
    """Custom code node that writes the name and value of a symbol to ``std::cout``."""

    # noinspection SpellCheckingInspection
    def __init__(self, symbol_to_print):
        name = symbol_to_print.name
        statement = '\nstd::cout << "%s  =  " << %s << std::endl; \n' % (name, name)
        super().__init__(statement, symbols_read=[symbol_to_print], symbols_defined=set())
        # std::cout requires the iostream header
        self.headers.append("<iostream>")
142
143
144
145


# ------------------------------------------- Printer ------------------------------------------------------------------

146

Martin Bauer's avatar
Martin Bauer committed
147
148
# noinspection PyPep8Naming
class CBackend:
    """Printer that turns AST nodes into C-like source code.

    Nodes are dispatched by class name: for a node of class ``Foo`` the method ``_print_Foo`` is called;
    if it does not exist, the classes in the node type's MRO are tried in order. Sympy expressions
    contained in the nodes are printed with ``self.sympy_printer``.
    """

    def __init__(self, sympy_printer=None, signature_only=False, vector_instruction_set=None, dialect='c'):
        """
        Args:
            sympy_printer: printer used for sympy expressions. If None, a ``VectorizedCustomSympyPrinter``
                           is created when a vector instruction set is given, a ``CustomSympyPrinter``
                           otherwise.
            signature_only: if true, kernel functions are printed as declaration only, without body
            vector_instruction_set: mapping from instruction names to format strings, or None
            dialect: dialect name, passed to custom code nodes and used to enable CUDA launch bounds
        """
        if sympy_printer is None:
            if vector_instruction_set is not None:
                self.sympy_printer = VectorizedCustomSympyPrinter(vector_instruction_set)
            else:
                self.sympy_printer = CustomSympyPrinter()
        else:
            self.sympy_printer = sympy_printer

        self._vector_instruction_set = vector_instruction_set
        self._indent = "   "
        self._dialect = dialect
        self._signatureOnly = signature_only

    def __call__(self, node):
        """Print ``node`` and return the code as string.

        While printing, ``VectorType.instruction_set`` is set to the instruction set of this backend;
        the previous value is restored afterwards, also when printing raises.
        """
        prev_is = VectorType.instruction_set
        VectorType.instruction_set = self._vector_instruction_set
        try:
            return str(self._print(node))
        finally:
            VectorType.instruction_set = prev_is

    def _print(self, node):
        """Dispatch to the ``_print_<ClassName>`` method of the first class in the node's MRO that has one.

        Raises:
            NotImplementedError: if no class in the MRO of the node type has a print method
        """
        for cls in type(node).__mro__:
            method_name = "_print_" + cls.__name__
            if hasattr(self, method_name):
                return getattr(self, method_name)(node)
        raise NotImplementedError(self.__class__.__name__ + " does not support node of type " + str(type(node)))

    def _print_KernelFunction(self, node):
        """Print the function declaration and, unless only the signature is requested, the body."""
        function_arguments = ["%s %s" % (str(s.symbol.dtype), s.symbol.name) for s in node.get_parameters()]
        launch_bounds = ""
        # launch bounds are a CUDA feature, the indexing object is only queried for that dialect
        if self._dialect == 'cuda':
            max_threads = node.indexing.max_threads_per_block()
            if max_threads:
                launch_bounds = "__launch_bounds__({}) ".format(max_threads)
        func_declaration = "FUNC_PREFIX %svoid %s(%s)" % (launch_bounds, node.function_name,
                                                          ", ".join(function_arguments))
        if self._signatureOnly:
            return func_declaration

        body = self._print(node.body)
        return func_declaration + "\n" + body

    def _print_Block(self, node):
        """Print all children, one per line, indented and enclosed in braces."""
        block_contents = "\n".join([self._print(child) for child in node.args])
        # splitlines(True) keeps the line ends, so joining with the indent string indents every line
        return "{\n%s\n}" % (self._indent + self._indent.join(block_contents.splitlines(True)))

    def _print_PragmaBlock(self, node):
        """Print the pragma line followed by the block itself."""
        return "%s\n%s" % (node.pragma_line, self._print_Block(node))

    def _print_LoopOverCoordinate(self, node):
        """Print a ``for`` loop over an ``int`` counter, preceded by the node's prefix lines."""
        counter_symbol = node.loop_counter_name
        start = "int %s = %s" % (counter_symbol, self.sympy_printer.doprint(node.start))
        condition = "%s < %s" % (counter_symbol, self.sympy_printer.doprint(node.stop))
        update = "%s += %s" % (counter_symbol, self.sympy_printer.doprint(node.step),)
        loop_str = "for (%s; %s; %s)" % (start, condition, update)

        prefix = "\n".join(node.prefix_lines)
        if prefix:
            prefix += "\n"
        return "%s%s\n%s" % (prefix, loop_str, self._print(node.body))

    def _print_SympyAssignment(self, node):
        """Print a declaration, a plain assignment or a vector store instruction."""
        if node.is_declaration:
            data_type = "const " + str(node.lhs.dtype) + " " if node.is_const else str(node.lhs.dtype) + " "
            return "%s%s = %s;" % (data_type, self.sympy_printer.doprint(node.lhs),
                                   self.sympy_printer.doprint(node.rhs))
        else:
            lhs_type = get_type_of_expression(node.lhs)
            if type(lhs_type) is VectorType and isinstance(node.lhs, cast_func):
                # the left hand side carries four arguments; only the two flags select the instruction
                _, _, aligned, nontemporal = node.lhs.args
                instr = 'storeU'
                if aligned:
                    instr = 'stream' if nontemporal else 'storeA'

                # a right hand side that is not of vector type is wrapped in a cast to a vector type
                rhs_type = get_type_of_expression(node.rhs)
                if type(rhs_type) is not VectorType:
                    rhs = cast_func(node.rhs, VectorType(rhs_type))
                else:
                    rhs = node.rhs

                return self._vector_instruction_set[instr].format("&" + self.sympy_printer.doprint(node.lhs.args[0]),
                                                                  self.sympy_printer.doprint(rhs)) + ';'
            else:
                return "%s = %s;" % (self.sympy_printer.doprint(node.lhs), self.sympy_printer.doprint(node.rhs))

    def _print_TemporaryMemoryAllocation(self, node):
        """Print an ``aligned_alloc`` call; the pointer is shifted by ``node.offset(align)``."""
        align = 64
        np_dtype = node.symbol.dtype.base_type.numpy_dtype
        # one extra alignment unit is requested, then the size is rounded with modulo_ceil
        required_size = np_dtype.itemsize * node.size + align
        size = modulo_ceil(required_size, align)
        code = "{dtype} {name}=({dtype})aligned_alloc({align}, {size}) + {offset};"
        return code.format(dtype=node.symbol.dtype,
                           name=self.sympy_printer.doprint(node.symbol.name),
                           size=self.sympy_printer.doprint(size),
                           offset=int(node.offset(align)),
                           align=align)

    def _print_TemporaryMemoryFree(self, node):
        """Print the ``free`` call; the offset added at allocation is subtracted again."""
        align = 64
        return "free(%s - %d);" % (self.sympy_printer.doprint(node.symbol.name), node.offset(align))

    def _print_SkipIteration(self, _):
        return "continue;"

    def _print_CustomCodeNode(self, node):
        """Let the node produce its own code for the dialect and instruction set of this backend."""
        return node.get_code(self._dialect, self._vector_instruction_set)

    def _print_Conditional(self, node):
        """Print an ``if`` statement with optional ``else`` block.

        Raises:
            ValueError: if the condition expression has a vector type
        """
        cond_type = get_type_of_expression(node.condition_expr)
        if isinstance(cond_type, VectorType):
            raise ValueError("Problem with Conditional inside vectorized loop - use vec_any or vec_all")
        condition_expr = self.sympy_printer.doprint(node.condition_expr)
        true_block = self._print_Block(node.true_block)
        result = "if (%s)\n%s " % (condition_expr, true_block)
        if node.false_block:
            false_block = self._print_Block(node.false_block)
            result += "else " + false_block
        return result

    def _print_DestructuringBindingsForFieldClass(self, node: 'Node'):
        """Print a braced block that first binds all symbols defined by the node, then prints the body.

        Each binding assigns a member of the field object to the symbol; symbols other than
        ``FieldPointerSymbol`` additionally get their coordinate as index.
        """
        # Define all undefined symbols
        undefined_field_symbols = node.symbols_defined
        destructuring_bindings = ["%s = %s.%s%s;" %
                                  (u.name,
                                   u.field_name if hasattr(u, 'field_name') else u.field_names[0],
                                   DestructuringBindingsForFieldClass.CLASS_TO_MEMBER_DICT[u.__class__],
                                   "" if type(u) == FieldPointerSymbol else ("[%i]" % u.coordinate))
                                  for u in undefined_field_symbols
                                  ]
        destructuring_bindings.sort()  # only for code aesthetics
        template = jinja2.Template(
            """{
   {% for binding in bindings -%}
   {{ binding | indent(3) }}
   {% endfor -%}
   {{ block | indent(3) }}
}

""")
        code = template.render(bindings=destructuring_bindings,
                               block=self._print(node.body))
        return code

294
295
296
297

# ------------------------------------------ Helper function & classes -------------------------------------------------


Martin Bauer's avatar
Martin Bauer committed
298
# noinspection PyPep8Naming
299
class CustomSympyPrinter(CCodePrinter):
    """Sympy C code printer with special handling for the additional functions imported by this module."""

    def __init__(self):
        super().__init__()
        self._float_type = create_type("float32")
        # Min and Max are printed by the methods bound at the end of this class,
        # so they are removed from the table of known functions
        for function_name in ('Min', 'Max'):
            self.known_functions.pop(function_name, None)

    def _print_Pow(self, expr):
        """Don't use std::pow function, for small integer exponents, write as multiplication"""
        exponent = expr.exp
        if exponent.is_integer and exponent.is_number and 0 < exponent < 8:
            product = sp.Mul(*[expr.base] * exponent, evaluate=False)
            return "(" + self._print(product) + ")"
        if exponent.is_integer and exponent.is_number and - 8 < exponent < 0:
            product = sp.Mul(*[expr.base] * (-exponent), evaluate=False)
            return "1 / ({})".format(self._print(product))
        return super()._print_Pow(expr)

    def _print_Rational(self, expr):
        """Evaluate all rationals i.e. print 0.25 instead of 1.0/4.0"""
        return str(expr.evalf().num)

    def _print_Equality(self, expr):
        """Equality operator is not printable in default printer"""
        left = self._print(expr.lhs)
        right = self._print(expr.rhs)
        return '((' + left + ") == (" + right + '))'

    def _print_Piecewise(self, expr):
        """Print piecewise in one line (remove newlines)"""
        multi_line = super()._print_Piecewise(expr)
        return multi_line.replace("\n", "")

    def _print_Function(self, expr):
        """Print the functions known to this printer; all others are handled by the base class.

        Expressions with a ``to_c`` attribute print themselves, they get this printer's ``_print``
        method as argument.
        """
        if hasattr(expr, 'to_c'):
            return expr.to_c(self._print)

        if isinstance(expr, reinterpret_cast_func):
            arg, data_type = expr.args
            return "*((%s)(& %s))" % (PointerType(data_type, restrict=False), self._print(arg))

        if isinstance(expr, address_of):
            assert len(expr.args) == 1, "address_of must only have one argument"
            return "&(%s)" % self._print(expr.args[0])

        if isinstance(expr, cast_func):
            arg, data_type = expr.args
            if isinstance(arg, sp.Number):
                # numbers get a type suffix instead of a cast
                return self._typed_number(arg, data_type)
            return "((%s)(%s))" % (data_type, self._print(arg))

        # the fast_* functions are printed as the ordinary operations by this printer
        if isinstance(expr, fast_division):
            return "({})".format(self._print(expr.args[0] / expr.args[1]))
        if isinstance(expr, fast_sqrt):
            return "({})".format(self._print(sp.sqrt(expr.args[0])))

        if isinstance(expr, (vec_any, vec_all)):
            # only the argument is printed here
            return self._print(expr.args[0])

        if isinstance(expr, fast_inv_sqrt):
            return "({})".format(self._print(1 / sp.sqrt(expr.args[0])))

        # binary integer functions that are written as C infix operators
        infix_functions = {
            bitwise_xor: '^',
            bit_shift_right: '>>',
            bit_shift_left: '<<',
            bitwise_or: '|',
            bitwise_and: '&',
        }
        if expr.func in infix_functions:
            return "(%s %s %s)" % (self._print(expr.args[0]), infix_functions[expr.func], self._print(expr.args[1]))

        if expr.func == int_power_of_2:
            return "(1 << (%s))" % (self._print(expr.args[0]))
        if expr.func == int_div:
            return "((%s) / (%s))" % (self._print(expr.args[0]), self._print(expr.args[1]))

        return super()._print_Function(expr)

    def _typed_number(self, number, dtype):
        """Print a number; for the float32 type a C float suffix is appended."""
        text = self._print(number)
        if dtype.is_float() and dtype == self._float_type:
            text += "f" if '.' in text else ".0f"
        return text

    _print_Max = C89CodePrinter._print_Max
    _print_Min = C89CodePrinter._print_Min

386

Martin Bauer's avatar
Martin Bauer committed
387
# noinspection PyPep8Naming
388
389
390
class VectorizedCustomSympyPrinter(CustomSympyPrinter):
    """Sympy printer that prints expressions of vector type using the templates of an instruction set.

    ``instruction_set`` is indexed with operation names (e.g. '+', '*', 'loadA', 'makeVec') and yields
    format strings into which the printed operands are inserted. Expressions whose type is not a
    ``VectorType`` are printed by the scalar ``CustomSympyPrinter``.
    """
    SummandInfo = namedtuple("SummandInfo", ['sign', 'term'])

    def __init__(self, instruction_set):
        super().__init__()
        self.instruction_set = instruction_set

    def _scalarFallback(self, func_name, expr, *args, **kwargs):
        """Print ``expr`` with the scalar printer method ``func_name`` if it is not of vector type.

        Returns:
            the printed string for non-vector expressions, None for vector expressions
        """
        expr_type = get_type_of_expression(expr)
        if type(expr_type) is not VectorType:
            return getattr(super(), func_name)(expr, *args, **kwargs)
        assert self.instruction_set['width'] == expr_type.width
        return None

    def _print_vector_reduction(self, expr, instruction_key):
        """Print vec_any / vec_all: a non-vector argument is printed as is, otherwise the instruction is used."""
        argument = expr.args[0]
        if type(get_type_of_expression(argument)) is not VectorType:
            return self._print(argument)
        return self.instruction_set[instruction_key].format(self._print(argument))

    def _print_boolean_chain(self, expr, scalar_method, instruction_key):
        """Print And / Or by combining the printed arguments pairwise, from left to right."""
        result = self._scalarFallback(scalar_method, expr)
        if result:
            return result

        arg_strings = [self._print(a) for a in expr.args]
        assert len(arg_strings) > 0
        result = arg_strings[0]
        for item in arg_strings[1:]:
            result = self.instruction_set[instruction_key].format(result, item)
        return result

    def _print_Function(self, expr):
        if isinstance(expr, vector_memory_access):
            arg, data_type, aligned, _ = expr.args
            instruction = self.instruction_set['loadA'] if aligned else self.instruction_set['loadU']
            return instruction.format("& " + self._print(arg))
        elif isinstance(expr, cast_func):
            arg, data_type = expr.args
            if type(data_type) is VectorType:
                return self.instruction_set['makeVec'].format(self._print(arg))
            # casts to other types are handled by the base class call at the end
        elif expr.func == fast_division:
            result = self._scalarFallback('_print_Function', expr)
            if not result:
                result = self.instruction_set['/'].format(self._print(expr.args[0]), self._print(expr.args[1]))
            return result
        elif expr.func == fast_sqrt:
            return "({})".format(self._print(sp.sqrt(expr.args[0])))
        elif expr.func == fast_inv_sqrt:
            result = self._scalarFallback('_print_Function', expr)
            if result:
                # the scalar result is what the base class call at the end would produce again
                return result
            if self.instruction_set['rsqrt']:
                return self.instruction_set['rsqrt'].format(self._print(expr.args[0]))
            else:
                return "({})".format(self._print(1 / sp.sqrt(expr.args[0])))
        elif isinstance(expr, vec_any):
            return self._print_vector_reduction(expr, 'any')
        elif isinstance(expr, vec_all):
            return self._print_vector_reduction(expr, 'all')

        return super()._print_Function(expr)

    def _print_And(self, expr):
        return self._print_boolean_chain(expr, '_print_And', '&')

    def _print_Or(self, expr):
        return self._print_boolean_chain(expr, '_print_Or', '|')

    def _print_Add(self, expr, order=None):
        """Print a sum as chain of '+' and '-' instructions, positive summands first."""
        result = self._scalarFallback('_print_Add', expr)
        if result:
            return result

        summands = []
        for term in expr.args:
            if term.func == sp.Mul:
                sign, t = self._print_Mul(term, inside_add=True)
            else:
                t = self._print(term)
                sign = 1
            summands.append(self.SummandInfo(sign, t))
        # Use positive terms first
        summands.sort(key=lambda e: e.sign, reverse=True)
        # if no positive term exists, prepend a zero
        if summands[0].sign == -1:
            summands.insert(0, self.SummandInfo(1, "0"))

        assert len(summands) >= 2
        processed = summands[0].term
        for summand in summands[1:]:
            func = self.instruction_set['-'] if summand.sign == -1 else self.instruction_set['+']
            processed = func.format(processed, summand.term)
        return processed

    def _print_Pow(self, expr):
        """Print powers with small integer exponents and exponents of +-0.5.

        Raises:
            ValueError: for all other exponents of vector-typed expressions
        """
        result = self._scalarFallback('_print_Pow', expr)
        if result:
            return result

        one = self.instruction_set['makeVec'].format(1.0)

        if expr.exp.is_integer and expr.exp.is_number and 0 < expr.exp < 8:
            return "(" + self._print(sp.Mul(*[expr.base] * expr.exp, evaluate=False)) + ")"
        elif expr.exp == -1:
            return self.instruction_set['/'].format(one, self._print(expr.base))
        elif expr.exp == 0.5:
            return self.instruction_set['sqrt'].format(self._print(expr.base))
        elif expr.exp == -0.5:
            root = self.instruction_set['sqrt'].format(self._print(expr.base))
            return self.instruction_set['/'].format(one, root)
        elif expr.exp.is_integer and expr.exp.is_number and - 8 < expr.exp < 0:
            return self.instruction_set['/'].format(one,
                                                    self._print(sp.Mul(*[expr.base] * (-expr.exp), evaluate=False)))
        else:
            raise ValueError("Generic exponential not supported: " + str(expr))

    def _print_Mul(self, expr, inside_add=False):
        """Print a product as chain of '*' instructions, with a '/' instruction for negative powers.

        Args:
            expr: the product to print
            inside_add: if true, a tuple ``(sign, code)`` is returned, where a negative coefficient
                        is reported as ``sign == -1`` instead of being printed

        Returns:
            the printed code, or ``(sign, code)`` if ``inside_add`` is true
        """
        # noinspection PyProtectedMember
        from sympy.core.mul import _keep_coeff

        result = self._scalarFallback('_print_Mul', expr)
        if result:
            # _print_Add unpacks the result, so the tuple form is required on this path as well;
            # the scalar printer has already put a possible sign into the string
            return (1, result) if inside_add else result

        c, e = expr.as_coeff_Mul()
        if c < 0:
            expr = _keep_coeff(-c, e)
            sign = -1
        else:
            sign = 1

        a = []  # items in the numerator
        b = []  # items that are in the denominator (if any)

        # Gather args for numerator/denominator
        for item in expr.as_ordered_factors():
            if item.is_commutative and item.is_Pow and item.exp.is_Rational and item.exp.is_negative:
                if item.exp != -1:
                    b.append(sp.Pow(item.base, -item.exp, evaluate=False))
                else:
                    b.append(sp.Pow(item.base, -item.exp))
            else:
                a.append(item)

        a = a or [S.One]

        a_str = [self._print(x) for x in a]
        b_str = [self._print(x) for x in b]

        result = a_str[0]
        for item in a_str[1:]:
            result = self.instruction_set['*'].format(result, item)

        if len(b) > 0:
            denominator_str = b_str[0]
            for item in b_str[1:]:
                denominator_str = self.instruction_set['*'].format(denominator_str, item)
            result = self.instruction_set['/'].format(result, denominator_str)

        if inside_add:
            return sign, result
        else:
            if sign < 0:
                return self.instruction_set['*'].format(self._print(S.NegativeOne), result)
            else:
                return result

    def _print_Relational(self, expr):
        result = self._scalarFallback('_print_Relational', expr)
        if result:
            return result
        # the relational operator string is the key into the instruction set
        return self.instruction_set[expr.rel_op].format(self._print(expr.lhs), self._print(expr.rhs))

    def _print_Equality(self, expr):
        result = self._scalarFallback('_print_Equality', expr)
        if result:
            return result
        return self.instruction_set['=='].format(self._print(expr.lhs), self._print(expr.rhs))

    def _print_Piecewise(self, expr):
        """Print a piecewise expression as nested 'blendv' instructions or ternary operators.

        The ternary operator is used for conditions that are a ``cast_func`` around a bool expression;
        it is skipped with a warning if ``KERNCRAFT_NO_TERNARY_MODE`` is set.

        Raises:
            ValueError: if the last condition is not True
        """
        result = self._scalarFallback('_print_Piecewise', expr)
        if result:
            return result

        if expr.args[-1].cond.args[0] is not sp.sympify(True):
            # We need the last conditional to be a True, otherwise the resulting
            # function may not return a result.
            raise ValueError("All Piecewise expressions must contain an "
                             "(expr, True) statement to be used as a default "
                             "condition. Without one, the generated "
                             "expression may not evaluate to anything under "
                             "some condition.")

        # start with the default value and wrap it, going from the last condition to the first
        result = self._print(expr.args[-1][0])
        for true_expr, condition in reversed(expr.args[:-1]):
            if isinstance(condition, cast_func) and get_type_of_expression(condition.args[0]) == create_type("bool"):
                if not KERNCRAFT_NO_TERNARY_MODE:
                    result = "(({}) ? ({}) : ({}))".format(self._print(condition.args[0]), self._print(true_expr),
                                                           result)
                else:
                    print("Warning - skipping ternary op")
            else:
                # noinspection SpellCheckingInspection
                result = self.instruction_set['blendv'].format(result, self._print(true_expr), self._print(condition))
        return result