Top

miasm2.jitter.codegen module

Module to generate C code for a given native @block

"""
Module to generate C code for a given native @block
"""

from miasm2.expression.expression import Expr, ExprId, ExprLoc, ExprInt, \
    ExprMem, ExprCond, LocKey
from miasm2.ir.ir import IRBlock, AssignBlock

from miasm2.ir.translators.C import TranslatorC, int_size_to_bn
from miasm2.core.asmblock import AsmBlockBad
from miasm2.expression.simplifications import expr_simp_high_to_explicit

TRANSLATOR_NO_SYMBOL = TranslatorC(loc_db=None)

SIZE_TO_MASK = {size: TRANSLATOR_NO_SYMBOL.from_expr(ExprInt(0, size).mask)
                for size in (1, 2, 3, 7, 8, 16, 32, 64)}






class Attributes(object):

    """
    Store an irblock attributes
    """

    def __init__(self, log_mn=False, log_regs=False):
        self.mem_read = False
        self.mem_write = False
        self.set_exception = False
        self.log_mn = log_mn
        self.log_regs = log_regs
        self.instr = None


class CGen(object):
    """
    Helper to generate C code for a given AsmBlock
    """

    """
    Translate native assembly block to C
    """

    CODE_EXCEPTION_MEM_AT_INSTR = r"""
    // except fetch mem at instr noauto
    if ((VM_exception_flag & ~EXCEPT_CODE_AUTOMOD) & EXCEPT_DO_NOT_UPDATE_PC) {
        %s = %s;
        BlockDst->address = %s;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_EXCEPTION_AT_INSTR = r"""
    if (CPU_exception_flag_at_instr) {
        %s = %s;
        BlockDst->address = %s;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_RETURN_EXCEPTION = r"""
    return JIT_RET_EXCEPTION;
    """

    CODE_RETURN_NO_EXCEPTION = r"""
    %s:
    %s = %s;
    BlockDst->address = %s;
    return JIT_RET_NO_EXCEPTION;
    """

    CODE_CPU_EXCEPTION_POST_INSTR = r"""
    if (CPU_exception_flag) {
        %s = DST_value;
        BlockDst->address = DST_value;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_VM_EXCEPTION_POST_INSTR = r"""
    check_memory_breakpoint(&(jitcpu->pyvm->vm_mngr));
    check_invalid_code_blocs(&(jitcpu->pyvm->vm_mngr));
    if (VM_exception_flag) {
        %s = DST_value;
        BlockDst->address = DST_value;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_INIT = r"""
    int DST_case;
    uint64_t DST_value;
    vm_cpu_t* mycpu = (vm_cpu_t*)jitcpu->cpu;

    goto %s;
    """

    CODE_BAD_BLOCK = r"""
    // Unknown mnemonic
    CPU_exception_flag = EXCEPT_UNK_MNEMO;
    """ + CODE_RETURN_EXCEPTION

    def __init__(self, ir_arch):
        self.ir_arch = ir_arch
        self.PC = self.ir_arch.pc
        self.translator = TranslatorC(self.ir_arch.loc_db)
        self.init_arch_C()

    def init_arch_C(self):
        """Iinitialize jitter internals"""
        self.id_to_c_id = {}
        for reg in self.ir_arch.arch.regs.all_regs_ids:
            self.id_to_c_id[reg] = ExprId('mycpu->%s' % reg, reg.size)

        self.C_PC = self.id_to_c(self.PC)

    def dst_to_c(self, src):
        """Translate Expr @src into C code"""
        if not isinstance(src, Expr):
            src = ExprInt(src, self.PC.size)
        return self.id_to_c(src)

    def patch_c_id(self, expr):
        """Replace ExprId in @expr with corresponding C variables"""
        return expr.replace_expr(self.id_to_c_id)

    def id_to_c(self, expr):
        """Translate Expr @expr into corresponding C code"""
        return self.translator.from_expr(self.patch_c_id(expr))

    def add_label_index(self, dst2index, loc_key):
        """Insert @lbl to the dictionnary @dst2index with a uniq value
        @dst2index: LocKey -> uniq value
        @loc_key: LocKey istance"""

        if loc_key not in dst2index:
            dst2index[loc_key] = len(dst2index)

    def assignblk_to_irbloc(self, instr, assignblk):
        """
        Ensure IRDst is always set in the head @assignblk of the @instr
        @instr: an instruction instance
        @assignblk: Assignblk instance
        """
        new_assignblk = dict(assignblk)
        if self.ir_arch.IRDst not in assignblk:
            offset = instr.offset + instr.l
            loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
            dst = ExprLoc(loc_key, self.ir_arch.IRDst.size)
            new_assignblk[self.ir_arch.IRDst] = dst
        irs = [AssignBlock(new_assignblk, instr)]
        return IRBlock(self.ir_arch.get_loc_key_for_instr(instr), irs)

    def block2assignblks(self, block):
        """
        Return the list of irblocks for a native @block
        @block: AsmBlock
        """
        irblocks_list = []
        for instr in block.lines:
            assignblk_head, assignblks_extra = self.ir_arch.instr2ir(instr)
            # Keep result in ordered list as first element is the assignblk head
            # The remainings order is not really important
            irblock_head = self.assignblk_to_irbloc(instr, assignblk_head)
            irblocks = [irblock_head] + assignblks_extra

            # Simplify high level operators
            out = []
            for irblock in irblocks:
                new_irblock = irblock.simplify(expr_simp_high_to_explicit)[1]
                out.append(new_irblock)
            irblocks = out

            for irblock in irblocks:
                assert irblock.dst is not None
            irblocks_list.append(irblocks)

        return irblocks_list

    def add_local_var(self, dst_var, dst_index, expr):
        """
        Add local varaible used to store temporay result
        @dst_var: dictionnary of Expr -> local_var_expr
        @dst_index : dictionnary of size -> local var count
        @expr: Expression source
        """
        size = expr.size
        if size < 8:
            size = 8
        if size not in dst_index:
            raise RuntimeError("Unsupported operand size %s", size)
        var_num = dst_index[size]
        dst = ExprId("var_%.2d_%.2d" % (size, var_num), size)
        dst_index[size] += 1
        dst_var[expr] = dst
        return dst

    def get_mem_prefetch(self, assignblk):
        """
        Generate temporary variables used to fetch memory used in the @assignblk
        Return a dictionnary: ExprMem -> temporary variable
        @assignblk: AssignBlock instance
        """
        mem_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
        mem_var = {}

        # Prefetch memory read
        for expr in assignblk.get_r(mem_read=True):
            if not isinstance(expr, ExprMem):
                continue
            var_num = mem_index[expr.size]
            mem_index[expr.size] += 1
            var = ExprId(
                "prefetch_%.2d_%.2d" % (expr.size, var_num), expr.size
            )
            mem_var[expr] = var

        # Generate memory prefetch
        return mem_var

    def gen_c_assignments(self, assignblk):
        """
        Return C informations used to generate the C code of the @assignblk
        @assignblk: an AssignBlock instance
        """
        c_var = []
        c_main = []
        c_mem = []
        c_updt = []
        c_prefetch = []

        dst_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
        dst_var = {}

        prefetchers = self.get_mem_prefetch(assignblk)

        for expr, prefetcher in sorted(prefetchers.iteritems()):
            str_src = self.id_to_c(expr)
            str_dst = self.id_to_c(prefetcher)
            c_prefetch.append('%s = %s;' % (str_dst, str_src))

        for var in prefetchers.itervalues():
            if var.size <= self.translator.NATIVE_INT_MAX_SIZE:
                c_var.append("uint%d_t %s;" % (var.size, var))
            else:
                c_var.append("bn_t %s; // %d" % (var, var.size))

        for dst, src in sorted(assignblk.iteritems()):
            src = src.replace_expr(prefetchers)
            if dst == self.ir_arch.IRDst:
                pass
            elif isinstance(dst, ExprId):
                new_dst = self.add_local_var(dst_var, dst_index, dst)
                if dst in self.ir_arch.arch.regs.regs_flt_expr:
                    # Dont mask float affectation
                    c_main.append(
                        '%s = (%s);' % (self.id_to_c(new_dst), self.id_to_c(src)))
                elif new_dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
                    c_main.append(
                        '%s = (%s)&%s;' % (self.id_to_c(new_dst),
                                           self.id_to_c(src),
                                           SIZE_TO_MASK[src.size]))
                else:
                    c_main.append(
                        '%s = bignum_mask(%s, %d);' % (
                            self.id_to_c(new_dst),
                            self.id_to_c(src),
                            src.size
                        )
                    )
            elif isinstance(dst, ExprMem):
                ptr = dst.arg.replace_expr(prefetchers)
                if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                    new_dst = ExprMem(ptr, dst.size)
                    str_dst = self.id_to_c(new_dst).replace('MEM_LOOKUP', 'MEM_WRITE')
                    c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
                else:
                    ptr_str = self.id_to_c(ptr)
                    if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                        c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
                    else:
                        if src.size <= self.translator.NATIVE_INT_MAX_SIZE:
                            c_mem.append('MEM_WRITE_BN_INT(jitcpu, %d, %s, %s);' % (
                                src.size, ptr_str, self.id_to_c(src))
                            )
                        else:
                            c_mem.append('MEM_WRITE_BN_BN(jitcpu, %d, %s, %s);' % (
                                src.size, ptr_str, self.id_to_c(src))
                            )
            else:
                raise ValueError("Unknown dst")

        for dst, new_dst in dst_var.iteritems():
            if dst == self.ir_arch.IRDst:
                continue

            c_updt.append('%s = %s;' % (self.id_to_c(dst), self.id_to_c(new_dst)))
            if dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
                c_var.append("uint%d_t %s;" % (new_dst.size, new_dst))
            else:
                c_var.append("bn_t %s; // %d" % (new_dst, new_dst.size))

        return c_prefetch, c_var, c_main, c_mem, c_updt

    def gen_check_memory_exception(self, address):
        """Generate C code to check memory exceptions
        @address: address of the faulty instruction"""
        dst = self.dst_to_c(address)
        return (self.CODE_EXCEPTION_MEM_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

    def gen_check_cpu_exception(self, address):
        """Generate C code to check cpu exceptions
        @address: address of the faulty instruction"""
        dst = self.dst_to_c(address)
        return (self.CODE_EXCEPTION_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

    def traverse_expr_dst(self, expr, dst2index):
        """
        Generate the index of the destination label for the @expr
        @dst2index: dictionnary to link label to its index
        """

        if isinstance(expr, ExprCond):
            src1, src1b = self.traverse_expr_dst(expr.src1, dst2index)
            src2, src2b = self.traverse_expr_dst(expr.src2, dst2index)
            cond = self.id_to_c(expr.cond)
            if not expr.cond.size <= self.translator.NATIVE_INT_MAX_SIZE:
                cond = "(!bignum_is_zero(%s))" % cond

            return ("((%s)?(%s):(%s))" % (cond, src1, src2),
                    "((%s)?(%s):(%s))" % (cond, src1b, src2b))
        if isinstance(expr, ExprInt):
            offset = int(expr)
            loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
            self.add_label_index(dst2index, loc_key)

            value, int_size = int_size_to_bn(offset, 64)
            out = hex(offset)

            return ("%s" % dst2index[loc_key], out)
        if expr.is_loc():
            loc_key = expr.loc_key
            offset = self.ir_arch.loc_db.get_location_offset(expr.loc_key)
            if offset is not None:
                self.add_label_index(dst2index, loc_key)

                value, int_size = int_size_to_bn(offset, 64)
                out = hex(offset)

                return ("%s" % dst2index[loc_key], out)
            self.add_label_index(dst2index, loc_key)

            value, int_size = int_size_to_bn(0, 64)
            out = hex(0)

            return ("%s" % dst2index[loc_key], out)
        dst2index[expr] = -1
        return ("-1", self.id_to_c(expr))

    def gen_assignblk_dst(self, dst):
        """Generate C code to handle instruction destination
        @dst: instruction destination Expr"""
        dst2index = {}
        (ret, retb) = self.traverse_expr_dst(dst, dst2index)
        ret = "DST_case = %s;" % ret
        retb = 'DST_value = %s;' % retb
        return ['// %s' % dst2index,
                '%s' % ret,
                '%s' % retb], dst2index

    def gen_post_instr_checks(self, attrib):
        """Generate C code for handling potential exceptions
        @attrib: Attributes instance"""
        out = []
        if attrib.mem_read | attrib.mem_write:
            out += (self.CODE_VM_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')
        if attrib.set_exception:
            out += (self.CODE_CPU_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')

        if attrib.mem_read | attrib.mem_write:
            out.append("reset_memory_access(&(jitcpu->pyvm->vm_mngr));")

        return out

    def gen_pre_code(self, instr_attrib):
        """Callback to generate code BEFORE the instruction execution
        @instr_attrib: Attributes instance"""

        out = []

        if instr_attrib.log_mn:
            out.append(
                'printf("%.8X %s\\n");' % (
                    instr_attrib.instr.offset,
                    instr_attrib.instr.to_string(self.ir_arch.loc_db)
                )
            )
        return out

    def gen_post_code(self, attrib):
        """Callback to generate code AFTER the instruction execution
        @attrib: Attributes instance"""
        out = []
        if attrib.log_regs:
            out.append('dump_gpregs(jitcpu->cpu);')
        return out

    def gen_goto_code(self, attrib, instr_offsets, dst):
        """Generate C code for a potential destination @dst
        @attrib: instruction Attributes
        @instr_offsets: instructions offsets list
        @dst: potential instruction destination"""

        out = []
        if isinstance(dst, Expr):
            out += self.gen_post_code(attrib)
            out.append('BlockDst->address = DST_value;')
            out += self.gen_post_instr_checks(attrib)
            out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
            return out

        assert isinstance(dst, LocKey)
        offset = self.ir_arch.loc_db.get_location_offset(dst)
        if offset is None:
            # Generate goto for local labels
            return ['goto %s;' % dst]
        if (offset > attrib.instr.offset and
            offset in instr_offsets):
            # Only generate goto for next instructions.
            # (consecutive instructions)
            out += self.gen_post_code(attrib)
            out += self.gen_post_instr_checks(attrib)
            out.append('goto %s;' % dst)
        else:
            out += self.gen_post_code(attrib)
            out.append('BlockDst->address = DST_value;')
            out += self.gen_post_instr_checks(attrib)
            out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
        return out

    def gen_dst_goto(self, attrib, instr_offsets, dst2index):
        """
        Generate code for possible @dst2index.

        @attrib: an Attributes instance
        @instr_offsets: list of instructions offsets
        @dst2index: link from destination to index
        """

        if not dst2index:
            return []
        out = []
        out.append('switch(DST_case) {')

        stopcase = False
        for dst, index in sorted(dst2index.iteritems(), key=lambda lblindex: lblindex[1]):
            if index == -1:
                # Handle '-1' case only once
                if not stopcase:
                    stopcase = True
                else:
                    continue

            out.append('\tcase %d:' % index)

            out += self.gen_goto_code(attrib, instr_offsets, dst)
            out.append('\t\tbreak;')
        out.append('};')
        return out

    def gen_c_code(self, attrib, c_dst, c_assignmnts):
        """
        Generate the C code for assignblk.
        @attrib: Attributes instance
        @c_dst: irdst C code
        """

        c_prefetch, c_var, c_main, c_mem, c_updt = c_assignmnts
        out = []
        out.append("{")
        out.append("// var")
        out += c_var
        out.append("// Prefetch")
        out += c_prefetch
        out.append("// Dst")
        out += c_dst
        out.append("// Main")
        out += c_main

        out.append("// Check op/mem exceptions")

        # Check memory access if assignblk has memory read
        if c_prefetch:
            out += self.gen_check_memory_exception(attrib.instr.offset)

        out.append("// Mem updt")
        out += c_mem

        out.append("// Check exception Mem write")
        # Check memory write exceptions
        if attrib.mem_write:
            out += self.gen_check_memory_exception(attrib.instr.offset)

        out.append("// Updt")
        out += c_updt

        out.append("// Checks exception")

        # Check post assignblk exception flags
        if attrib.set_exception:
            out += self.gen_check_cpu_exception(attrib.instr.offset)

        out.append("}")

        return out

    def get_caracteristics(self, assignblk, attrib):
        """
        Set the carateristics in @attrib according to the @assignblk
        @assignblk: an AssignBlock instance
        @attrib: an Attributes instance
        """

        # Check explicit exception raising
        attrib.set_exception = self.ir_arch.arch.regs.exception_flags in assignblk

        element_read = assignblk.get_r(mem_read=True)
        # Check mem read
        attrib.mem_read = any(isinstance(expr, ExprMem)
                              for expr in element_read)
        # Check mem write
        attrib.mem_write = any(isinstance(dst, ExprMem)
                               for dst in assignblk)

    def get_attributes(self, instr, irblocks, log_mn=False, log_regs=False):
        """
        Get the carateristics of each @irblocks. Returns the corresponding
        attributes object.
        @irblock: a list of irbloc instance
        @log_mn: generate code to log instructions
        @log_regs: generate code to log registers states
        """

        instr_attrib = Attributes(log_mn, log_regs)
        instr_attrib.instr = instr
        irblocks_attributes = []

        for irblock in irblocks:
            attributes = []
            irblocks_attributes.append(attributes)
            for assignblk in irblock:
                attrib = Attributes(log_mn, log_regs)
                attributes.append(attrib)
                self.get_caracteristics(assignblk, attrib)
                attrib.instr = instr
                instr_attrib.mem_read |= attrib.mem_read
                instr_attrib.mem_write |= attrib.mem_write
                instr_attrib.set_exception |= attrib.set_exception

        return instr_attrib, irblocks_attributes

    def gen_bad_block(self):
        """
        Generate the C code for a bad_block instance
        """
        return self.CODE_BAD_BLOCK.split("\n")

    def get_block_post_label(self, block):
        """Get label next to the @block
        @block: AsmBlock instance"""

        last_instr = block.lines[-1]
        offset = last_instr.offset + last_instr.l
        return self.ir_arch.loc_db.get_or_create_offset_location(offset)

    def gen_init(self, block):
        """
        Generate the init C code for a @block
        @block: an asm_bloc instance
        """

        instr_offsets = [line.offset for line in block.lines]
        post_label = self.get_block_post_label(block)
        post_offset = self.ir_arch.loc_db.get_location_offset(post_label)
        instr_offsets.append(post_offset)
        lbl_start = block.loc_key
        return (self.CODE_INIT % lbl_start).split("\n"), instr_offsets

    def gen_irblock(self, instr_attrib, attributes, instr_offsets, irblock):
        """
        Generate the C code for an @irblock
        @irblock: an irbloc instance
        @attributes: an Attributes instance list
        """

        out = []
        dst2index = None
        for index, assignblk in enumerate(irblock):
            if index == irblock.dst_linenb:
                c_dst, dst2index = self.gen_assignblk_dst(irblock.dst)
            else:
                c_dst = []

            c_assignmnts = self.gen_c_assignments(assignblk)
            out += self.gen_c_code(attributes[index], c_dst, c_assignmnts)

        if dst2index:
            out.append("// Set irdst")
            # Gen goto on irdst set
            out += self.gen_dst_goto(instr_attrib, instr_offsets, dst2index)

        return out

    def gen_finalize(self, block):
        """
        Generate the C code for the final block instruction
        """

        loc_key = self.get_block_post_label(block)
        offset = self.ir_arch.loc_db.get_location_offset(loc_key)
        dst = self.dst_to_c(offset)
        code = self.CODE_RETURN_NO_EXCEPTION % (loc_key, self.C_PC, dst, dst)
        return code.split('\n')

    def gen_c(self, block, log_mn=False, log_regs=False):
        """
        Generate the C code for the @block and return it as a list of lines
        @log_mn: log mnemonics
        @log_regs: log registers
        """

        if isinstance(block, AsmBlockBad):
            return self.gen_bad_block()
        irblocks_list = self.block2assignblks(block)
        out, instr_offsets = self.gen_init(block)
        assert len(block.lines) == len(irblocks_list)
        for instr, irblocks in zip(block.lines, irblocks_list):
            instr_attrib, irblocks_attributes = self.get_attributes(instr, irblocks, log_mn, log_regs)
            for index, irblock in enumerate(irblocks):
                new_irblock = self.ir_arch.irbloc_fix_regs_for_mode(irblock, self.ir_arch.attrib)
                label = str(new_irblock.loc_key)
                out.append("%-40s // %.16X %s" %
                           (label + ":", instr.offset, instr))
                if index == 0:
                    out += self.gen_pre_code(instr_attrib)
                out += self.gen_irblock(instr_attrib, irblocks_attributes[index], instr_offsets, new_irblock)

        out += self.gen_finalize(block)

        return ['\t' + line for line in out]

Module variables

var SIZE_TO_MASK

var TRANSLATOR_NO_SYMBOL

Classes

class Attributes

Store an irblock attributes

class Attributes(object):

    """
    Store an irblock attributes
    """

    def __init__(self, log_mn=False, log_regs=False):
        self.mem_read = False
        self.mem_write = False
        self.set_exception = False
        self.log_mn = log_mn
        self.log_regs = log_regs
        self.instr = None

Ancestors (in MRO)

Instance variables

var instr

var log_mn

var log_regs

var mem_read

var mem_write

var set_exception

Methods

def __init__(

self, log_mn=False, log_regs=False)

def __init__(self, log_mn=False, log_regs=False):
    self.mem_read = False
    self.mem_write = False
    self.set_exception = False
    self.log_mn = log_mn
    self.log_regs = log_regs
    self.instr = None

class CGen

Helper to generate C code for a given AsmBlock

class CGen(object):
    """
    Helper to generate C code for a given AsmBlock
    """

    """
    Translate native assembly block to C
    """

    CODE_EXCEPTION_MEM_AT_INSTR = r"""
    // except fetch mem at instr noauto
    if ((VM_exception_flag & ~EXCEPT_CODE_AUTOMOD) & EXCEPT_DO_NOT_UPDATE_PC) {
        %s = %s;
        BlockDst->address = %s;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_EXCEPTION_AT_INSTR = r"""
    if (CPU_exception_flag_at_instr) {
        %s = %s;
        BlockDst->address = %s;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_RETURN_EXCEPTION = r"""
    return JIT_RET_EXCEPTION;
    """

    CODE_RETURN_NO_EXCEPTION = r"""
    %s:
    %s = %s;
    BlockDst->address = %s;
    return JIT_RET_NO_EXCEPTION;
    """

    CODE_CPU_EXCEPTION_POST_INSTR = r"""
    if (CPU_exception_flag) {
        %s = DST_value;
        BlockDst->address = DST_value;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_VM_EXCEPTION_POST_INSTR = r"""
    check_memory_breakpoint(&(jitcpu->pyvm->vm_mngr));
    check_invalid_code_blocs(&(jitcpu->pyvm->vm_mngr));
    if (VM_exception_flag) {
        %s = DST_value;
        BlockDst->address = DST_value;
        return JIT_RET_EXCEPTION;
    }
    """

    CODE_INIT = r"""
    int DST_case;
    uint64_t DST_value;
    vm_cpu_t* mycpu = (vm_cpu_t*)jitcpu->cpu;

    goto %s;
    """

    CODE_BAD_BLOCK = r"""
    // Unknown mnemonic
    CPU_exception_flag = EXCEPT_UNK_MNEMO;
    """ + CODE_RETURN_EXCEPTION

    def __init__(self, ir_arch):
        self.ir_arch = ir_arch
        self.PC = self.ir_arch.pc
        self.translator = TranslatorC(self.ir_arch.loc_db)
        self.init_arch_C()

    def init_arch_C(self):
        """Iinitialize jitter internals"""
        self.id_to_c_id = {}
        for reg in self.ir_arch.arch.regs.all_regs_ids:
            self.id_to_c_id[reg] = ExprId('mycpu->%s' % reg, reg.size)

        self.C_PC = self.id_to_c(self.PC)

    def dst_to_c(self, src):
        """Translate Expr @src into C code"""
        if not isinstance(src, Expr):
            src = ExprInt(src, self.PC.size)
        return self.id_to_c(src)

    def patch_c_id(self, expr):
        """Replace ExprId in @expr with corresponding C variables"""
        return expr.replace_expr(self.id_to_c_id)

    def id_to_c(self, expr):
        """Translate Expr @expr into corresponding C code"""
        return self.translator.from_expr(self.patch_c_id(expr))

    def add_label_index(self, dst2index, loc_key):
        """Insert @lbl to the dictionnary @dst2index with a uniq value
        @dst2index: LocKey -> uniq value
        @loc_key: LocKey istance"""

        if loc_key not in dst2index:
            dst2index[loc_key] = len(dst2index)

    def assignblk_to_irbloc(self, instr, assignblk):
        """
        Ensure IRDst is always set in the head @assignblk of the @instr
        @instr: an instruction instance
        @assignblk: Assignblk instance
        """
        new_assignblk = dict(assignblk)
        if self.ir_arch.IRDst not in assignblk:
            offset = instr.offset + instr.l
            loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
            dst = ExprLoc(loc_key, self.ir_arch.IRDst.size)
            new_assignblk[self.ir_arch.IRDst] = dst
        irs = [AssignBlock(new_assignblk, instr)]
        return IRBlock(self.ir_arch.get_loc_key_for_instr(instr), irs)

    def block2assignblks(self, block):
        """
        Return the list of irblocks for a native @block
        @block: AsmBlock
        """
        irblocks_list = []
        for instr in block.lines:
            assignblk_head, assignblks_extra = self.ir_arch.instr2ir(instr)
            # Keep result in ordered list as first element is the assignblk head
            # The remainings order is not really important
            irblock_head = self.assignblk_to_irbloc(instr, assignblk_head)
            irblocks = [irblock_head] + assignblks_extra

            # Simplify high level operators
            out = []
            for irblock in irblocks:
                new_irblock = irblock.simplify(expr_simp_high_to_explicit)[1]
                out.append(new_irblock)
            irblocks = out

            for irblock in irblocks:
                assert irblock.dst is not None
            irblocks_list.append(irblocks)

        return irblocks_list

    def add_local_var(self, dst_var, dst_index, expr):
        """
        Add local varaible used to store temporay result
        @dst_var: dictionnary of Expr -> local_var_expr
        @dst_index : dictionnary of size -> local var count
        @expr: Expression source
        """
        size = expr.size
        if size < 8:
            size = 8
        if size not in dst_index:
            raise RuntimeError("Unsupported operand size %s", size)
        var_num = dst_index[size]
        dst = ExprId("var_%.2d_%.2d" % (size, var_num), size)
        dst_index[size] += 1
        dst_var[expr] = dst
        return dst

    def get_mem_prefetch(self, assignblk):
        """
        Generate temporary variables used to fetch memory used in the @assignblk
        Return a dictionnary: ExprMem -> temporary variable
        @assignblk: AssignBlock instance
        """
        mem_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
        mem_var = {}

        # Prefetch memory read
        for expr in assignblk.get_r(mem_read=True):
            if not isinstance(expr, ExprMem):
                continue
            var_num = mem_index[expr.size]
            mem_index[expr.size] += 1
            var = ExprId(
                "prefetch_%.2d_%.2d" % (expr.size, var_num), expr.size
            )
            mem_var[expr] = var

        # Generate memory prefetch
        return mem_var

    def gen_c_assignments(self, assignblk):
        """
        Return C informations used to generate the C code of the @assignblk
        @assignblk: an AssignBlock instance
        """
        c_var = []
        c_main = []
        c_mem = []
        c_updt = []
        c_prefetch = []

        dst_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
        dst_var = {}

        prefetchers = self.get_mem_prefetch(assignblk)

        for expr, prefetcher in sorted(prefetchers.iteritems()):
            str_src = self.id_to_c(expr)
            str_dst = self.id_to_c(prefetcher)
            c_prefetch.append('%s = %s;' % (str_dst, str_src))

        for var in prefetchers.itervalues():
            if var.size <= self.translator.NATIVE_INT_MAX_SIZE:
                c_var.append("uint%d_t %s;" % (var.size, var))
            else:
                c_var.append("bn_t %s; // %d" % (var, var.size))

        for dst, src in sorted(assignblk.iteritems()):
            src = src.replace_expr(prefetchers)
            if dst == self.ir_arch.IRDst:
                pass
            elif isinstance(dst, ExprId):
                new_dst = self.add_local_var(dst_var, dst_index, dst)
                if dst in self.ir_arch.arch.regs.regs_flt_expr:
                    # Dont mask float affectation
                    c_main.append(
                        '%s = (%s);' % (self.id_to_c(new_dst), self.id_to_c(src)))
                elif new_dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
                    c_main.append(
                        '%s = (%s)&%s;' % (self.id_to_c(new_dst),
                                           self.id_to_c(src),
                                           SIZE_TO_MASK[src.size]))
                else:
                    c_main.append(
                        '%s = bignum_mask(%s, %d);' % (
                            self.id_to_c(new_dst),
                            self.id_to_c(src),
                            src.size
                        )
                    )
            elif isinstance(dst, ExprMem):
                ptr = dst.arg.replace_expr(prefetchers)
                if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                    new_dst = ExprMem(ptr, dst.size)
                    str_dst = self.id_to_c(new_dst).replace('MEM_LOOKUP', 'MEM_WRITE')
                    c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
                else:
                    ptr_str = self.id_to_c(ptr)
                    if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                        c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
                    else:
                        if src.size <= self.translator.NATIVE_INT_MAX_SIZE:
                            c_mem.append('MEM_WRITE_BN_INT(jitcpu, %d, %s, %s);' % (
                                src.size, ptr_str, self.id_to_c(src))
                            )
                        else:
                            c_mem.append('MEM_WRITE_BN_BN(jitcpu, %d, %s, %s);' % (
                                src.size, ptr_str, self.id_to_c(src))
                            )
            else:
                raise ValueError("Unknown dst")

        for dst, new_dst in dst_var.iteritems():
            if dst == self.ir_arch.IRDst:
                continue

            c_updt.append('%s = %s;' % (self.id_to_c(dst), self.id_to_c(new_dst)))
            if dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
                c_var.append("uint%d_t %s;" % (new_dst.size, new_dst))
            else:
                c_var.append("bn_t %s; // %d" % (new_dst, new_dst.size))

        return c_prefetch, c_var, c_main, c_mem, c_updt

    def gen_check_memory_exception(self, address):
        """Generate C code to check memory exceptions
        @address: address of the faulty instruction"""
        dst = self.dst_to_c(address)
        return (self.CODE_EXCEPTION_MEM_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

    def gen_check_cpu_exception(self, address):
        """Generate C code to check cpu exceptions
        @address: address of the faulty instruction"""
        dst = self.dst_to_c(address)
        return (self.CODE_EXCEPTION_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

    def traverse_expr_dst(self, expr, dst2index):
        """
        Generate the index of the destination label for the @expr
        @dst2index: dictionnary to link label to its index
        """

        if isinstance(expr, ExprCond):
            src1, src1b = self.traverse_expr_dst(expr.src1, dst2index)
            src2, src2b = self.traverse_expr_dst(expr.src2, dst2index)
            cond = self.id_to_c(expr.cond)
            if not expr.cond.size <= self.translator.NATIVE_INT_MAX_SIZE:
                cond = "(!bignum_is_zero(%s))" % cond

            return ("((%s)?(%s):(%s))" % (cond, src1, src2),
                    "((%s)?(%s):(%s))" % (cond, src1b, src2b))
        if isinstance(expr, ExprInt):
            offset = int(expr)
            loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
            self.add_label_index(dst2index, loc_key)

            value, int_size = int_size_to_bn(offset, 64)
            out = hex(offset)

            return ("%s" % dst2index[loc_key], out)
        if expr.is_loc():
            loc_key = expr.loc_key
            offset = self.ir_arch.loc_db.get_location_offset(expr.loc_key)
            if offset is not None:
                self.add_label_index(dst2index, loc_key)

                value, int_size = int_size_to_bn(offset, 64)
                out = hex(offset)

                return ("%s" % dst2index[loc_key], out)
            self.add_label_index(dst2index, loc_key)

            value, int_size = int_size_to_bn(0, 64)
            out = hex(0)

            return ("%s" % dst2index[loc_key], out)
        dst2index[expr] = -1
        return ("-1", self.id_to_c(expr))

    def gen_assignblk_dst(self, dst):
        """Generate C code to handle instruction destination
        @dst: instruction destination Expr"""
        dst2index = {}
        (ret, retb) = self.traverse_expr_dst(dst, dst2index)
        ret = "DST_case = %s;" % ret
        retb = 'DST_value = %s;' % retb
        return ['// %s' % dst2index,
                '%s' % ret,
                '%s' % retb], dst2index

    def gen_post_instr_checks(self, attrib):
        """Generate C code for handling potential exceptions
        @attrib: Attributes instance"""
        out = []
        if attrib.mem_read | attrib.mem_write:
            out += (self.CODE_VM_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')
        if attrib.set_exception:
            out += (self.CODE_CPU_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')

        if attrib.mem_read | attrib.mem_write:
            out.append("reset_memory_access(&(jitcpu->pyvm->vm_mngr));")

        return out

    def gen_pre_code(self, instr_attrib):
        """Callback to generate code BEFORE the instruction execution
        @instr_attrib: Attributes instance"""

        out = []

        if instr_attrib.log_mn:
            out.append(
                'printf("%.8X %s\\n");' % (
                    instr_attrib.instr.offset,
                    instr_attrib.instr.to_string(self.ir_arch.loc_db)
                )
            )
        return out

    def gen_post_code(self, attrib):
        """Callback to generate code AFTER the instruction execution
        @attrib: Attributes instance"""
        out = []
        if attrib.log_regs:
            out.append('dump_gpregs(jitcpu->cpu);')
        return out

    def gen_goto_code(self, attrib, instr_offsets, dst):
        """Generate C code for a potential destination @dst
        @attrib: instruction Attributes
        @instr_offsets: instructions offsets list
        @dst: potential instruction destination"""

        out = []
        if isinstance(dst, Expr):
            out += self.gen_post_code(attrib)
            out.append('BlockDst->address = DST_value;')
            out += self.gen_post_instr_checks(attrib)
            out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
            return out

        assert isinstance(dst, LocKey)
        offset = self.ir_arch.loc_db.get_location_offset(dst)
        if offset is None:
            # Generate goto for local labels
            return ['goto %s;' % dst]
        if (offset > attrib.instr.offset and
            offset in instr_offsets):
            # Only generate goto for next instructions.
            # (consecutive instructions)
            out += self.gen_post_code(attrib)
            out += self.gen_post_instr_checks(attrib)
            out.append('goto %s;' % dst)
        else:
            out += self.gen_post_code(attrib)
            out.append('BlockDst->address = DST_value;')
            out += self.gen_post_instr_checks(attrib)
            out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
        return out

    def gen_dst_goto(self, attrib, instr_offsets, dst2index):
        """
        Generate code for possible @dst2index.

        @attrib: an Attributes instance
        @instr_offsets: list of instructions offsets
        @dst2index: link from destination to index
        """

        if not dst2index:
            return []
        out = []
        out.append('switch(DST_case) {')

        stopcase = False
        for dst, index in sorted(dst2index.iteritems(), key=lambda lblindex: lblindex[1]):
            if index == -1:
                # Handle '-1' case only once
                if not stopcase:
                    stopcase = True
                else:
                    continue

            out.append('\tcase %d:' % index)

            out += self.gen_goto_code(attrib, instr_offsets, dst)
            out.append('\t\tbreak;')
        out.append('};')
        return out

    def gen_c_code(self, attrib, c_dst, c_assignmnts):
        """
        Generate the C code for assignblk.
        @attrib: Attributes instance
        @c_dst: irdst C code
        """

        c_prefetch, c_var, c_main, c_mem, c_updt = c_assignmnts
        out = []
        out.append("{")
        out.append("// var")
        out += c_var
        out.append("// Prefetch")
        out += c_prefetch
        out.append("// Dst")
        out += c_dst
        out.append("// Main")
        out += c_main

        out.append("// Check op/mem exceptions")

        # Check memory access if assignblk has memory read
        if c_prefetch:
            out += self.gen_check_memory_exception(attrib.instr.offset)

        out.append("// Mem updt")
        out += c_mem

        out.append("// Check exception Mem write")
        # Check memory write exceptions
        if attrib.mem_write:
            out += self.gen_check_memory_exception(attrib.instr.offset)

        out.append("// Updt")
        out += c_updt

        out.append("// Checks exception")

        # Check post assignblk exception flags
        if attrib.set_exception:
            out += self.gen_check_cpu_exception(attrib.instr.offset)

        out.append("}")

        return out

    def get_caracteristics(self, assignblk, attrib):
        """
        Set the carateristics in @attrib according to the @assignblk
        @assignblk: an AssignBlock instance
        @attrib: an Attributes instance
        """

        # Check explicit exception raising
        attrib.set_exception = self.ir_arch.arch.regs.exception_flags in assignblk

        element_read = assignblk.get_r(mem_read=True)
        # Check mem read
        attrib.mem_read = any(isinstance(expr, ExprMem)
                              for expr in element_read)
        # Check mem write
        attrib.mem_write = any(isinstance(dst, ExprMem)
                               for dst in assignblk)

    def get_attributes(self, instr, irblocks, log_mn=False, log_regs=False):
        """
        Get the carateristics of each @irblocks. Returns the corresponding
        attributes object.
        @irblock: a list of irbloc instance
        @log_mn: generate code to log instructions
        @log_regs: generate code to log registers states
        """

        instr_attrib = Attributes(log_mn, log_regs)
        instr_attrib.instr = instr
        irblocks_attributes = []

        for irblock in irblocks:
            attributes = []
            irblocks_attributes.append(attributes)
            for assignblk in irblock:
                attrib = Attributes(log_mn, log_regs)
                attributes.append(attrib)
                self.get_caracteristics(assignblk, attrib)
                attrib.instr = instr
                instr_attrib.mem_read |= attrib.mem_read
                instr_attrib.mem_write |= attrib.mem_write
                instr_attrib.set_exception |= attrib.set_exception

        return instr_attrib, irblocks_attributes

    def gen_bad_block(self):
        """
        Generate the C code for a bad_block instance
        """
        return self.CODE_BAD_BLOCK.split("\n")

    def get_block_post_label(self, block):
        """Get label next to the @block
        @block: AsmBlock instance"""

        last_instr = block.lines[-1]
        offset = last_instr.offset + last_instr.l
        return self.ir_arch.loc_db.get_or_create_offset_location(offset)

    def gen_init(self, block):
        """
        Generate the init C code for a @block
        @block: an asm_bloc instance
        """

        instr_offsets = [line.offset for line in block.lines]
        post_label = self.get_block_post_label(block)
        post_offset = self.ir_arch.loc_db.get_location_offset(post_label)
        instr_offsets.append(post_offset)
        lbl_start = block.loc_key
        return (self.CODE_INIT % lbl_start).split("\n"), instr_offsets

    def gen_irblock(self, instr_attrib, attributes, instr_offsets, irblock):
        """
        Generate the C code for an @irblock
        @irblock: an irbloc instance
        @attributes: an Attributes instance list
        """

        out = []
        dst2index = None
        for index, assignblk in enumerate(irblock):
            if index == irblock.dst_linenb:
                c_dst, dst2index = self.gen_assignblk_dst(irblock.dst)
            else:
                c_dst = []

            c_assignmnts = self.gen_c_assignments(assignblk)
            out += self.gen_c_code(attributes[index], c_dst, c_assignmnts)

        if dst2index:
            out.append("// Set irdst")
            # Gen goto on irdst set
            out += self.gen_dst_goto(instr_attrib, instr_offsets, dst2index)

        return out

    def gen_finalize(self, block):
        """
        Generate the C code for the final block instruction
        """

        loc_key = self.get_block_post_label(block)
        offset = self.ir_arch.loc_db.get_location_offset(loc_key)
        dst = self.dst_to_c(offset)
        code = self.CODE_RETURN_NO_EXCEPTION % (loc_key, self.C_PC, dst, dst)
        return code.split('\n')

    def gen_c(self, block, log_mn=False, log_regs=False):
        """
        Generate the C code for the @block and return it as a list of lines
        @log_mn: log mnemonics
        @log_regs: log registers
        """

        if isinstance(block, AsmBlockBad):
            return self.gen_bad_block()
        irblocks_list = self.block2assignblks(block)
        out, instr_offsets = self.gen_init(block)
        assert len(block.lines) == len(irblocks_list)
        for instr, irblocks in zip(block.lines, irblocks_list):
            instr_attrib, irblocks_attributes = self.get_attributes(instr, irblocks, log_mn, log_regs)
            for index, irblock in enumerate(irblocks):
                new_irblock = self.ir_arch.irbloc_fix_regs_for_mode(irblock, self.ir_arch.attrib)
                label = str(new_irblock.loc_key)
                out.append("%-40s // %.16X %s" %
                           (label + ":", instr.offset, instr))
                if index == 0:
                    out += self.gen_pre_code(instr_attrib)
                out += self.gen_irblock(instr_attrib, irblocks_attributes[index], instr_offsets, new_irblock)

        out += self.gen_finalize(block)

        return ['\t' + line for line in out]

Ancestors (in MRO)

  • CGen
  • __builtin__.object

Class variables

var CODE_BAD_BLOCK

var CODE_CPU_EXCEPTION_POST_INSTR

var CODE_EXCEPTION_AT_INSTR

var CODE_EXCEPTION_MEM_AT_INSTR

var CODE_INIT

var CODE_RETURN_EXCEPTION

var CODE_RETURN_NO_EXCEPTION

var CODE_VM_EXCEPTION_POST_INSTR

Instance variables

var PC

var ir_arch

var translator

Methods

def __init__(

self, ir_arch)

def __init__(self, ir_arch):
    self.ir_arch = ir_arch
    self.PC = self.ir_arch.pc
    self.translator = TranslatorC(self.ir_arch.loc_db)
    self.init_arch_C()

def add_label_index(

self, dst2index, loc_key)

Insert @lbl to the dictionnary @dst2index with a uniq value @dst2index: LocKey -> uniq value @loc_key: LocKey istance

def add_label_index(self, dst2index, loc_key):
    """Insert @lbl to the dictionnary @dst2index with a uniq value
    @dst2index: LocKey -> uniq value
    @loc_key: LocKey istance"""
    if loc_key not in dst2index:
        dst2index[loc_key] = len(dst2index)

def add_local_var(

self, dst_var, dst_index, expr)

Add local varaible used to store temporay result @dst_var: dictionnary of Expr -> local_var_expr @dst_index : dictionnary of size -> local var count @expr: Expression source

def add_local_var(self, dst_var, dst_index, expr):
    """
    Add local varaible used to store temporay result
    @dst_var: dictionnary of Expr -> local_var_expr
    @dst_index : dictionnary of size -> local var count
    @expr: Expression source
    """
    size = expr.size
    if size < 8:
        size = 8
    if size not in dst_index:
        raise RuntimeError("Unsupported operand size %s", size)
    var_num = dst_index[size]
    dst = ExprId("var_%.2d_%.2d" % (size, var_num), size)
    dst_index[size] += 1
    dst_var[expr] = dst
    return dst

def assignblk_to_irbloc(

self, instr, assignblk)

Ensure IRDst is always set in the head @assignblk of the @instr @instr: an instruction instance @assignblk: Assignblk instance

def assignblk_to_irbloc(self, instr, assignblk):
    """
    Ensure IRDst is always set in the head @assignblk of the @instr
    @instr: an instruction instance
    @assignblk: Assignblk instance
    """
    new_assignblk = dict(assignblk)
    if self.ir_arch.IRDst not in assignblk:
        offset = instr.offset + instr.l
        loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
        dst = ExprLoc(loc_key, self.ir_arch.IRDst.size)
        new_assignblk[self.ir_arch.IRDst] = dst
    irs = [AssignBlock(new_assignblk, instr)]
    return IRBlock(self.ir_arch.get_loc_key_for_instr(instr), irs)

def block2assignblks(

self, block)

Return the list of irblocks for a native @block @block: AsmBlock

def block2assignblks(self, block):
    """
    Return the list of irblocks for a native @block
    @block: AsmBlock
    """
    irblocks_list = []
    for instr in block.lines:
        assignblk_head, assignblks_extra = self.ir_arch.instr2ir(instr)
        # Keep result in ordered list as first element is the assignblk head
        # The remainings order is not really important
        irblock_head = self.assignblk_to_irbloc(instr, assignblk_head)
        irblocks = [irblock_head] + assignblks_extra
        # Simplify high level operators
        out = []
        for irblock in irblocks:
            new_irblock = irblock.simplify(expr_simp_high_to_explicit)[1]
            out.append(new_irblock)
        irblocks = out
        for irblock in irblocks:
            assert irblock.dst is not None
        irblocks_list.append(irblocks)
    return irblocks_list

def dst_to_c(

self, src)

Translate Expr @src into C code

def dst_to_c(self, src):
    """Translate Expr @src into C code"""
    if not isinstance(src, Expr):
        src = ExprInt(src, self.PC.size)
    return self.id_to_c(src)

def gen_assignblk_dst(

self, dst)

Generate C code to handle instruction destination @dst: instruction destination Expr

def gen_assignblk_dst(self, dst):
    """Generate C code to handle instruction destination
    @dst: instruction destination Expr"""
    dst2index = {}
    (ret, retb) = self.traverse_expr_dst(dst, dst2index)
    ret = "DST_case = %s;" % ret
    retb = 'DST_value = %s;' % retb
    return ['// %s' % dst2index,
            '%s' % ret,
            '%s' % retb], dst2index

def gen_bad_block(

self)

Generate the C code for a bad_block instance

def gen_bad_block(self):
    """
    Generate the C code for a bad_block instance
    """
    return self.CODE_BAD_BLOCK.split("\n")

def gen_c(

self, block, log_mn=False, log_regs=False)

Generate the C code for the @block and return it as a list of lines @log_mn: log mnemonics @log_regs: log registers

def gen_c(self, block, log_mn=False, log_regs=False):
    """
    Generate the C code for the @block and return it as a list of lines
    @log_mn: log mnemonics
    @log_regs: log registers
    """
    if isinstance(block, AsmBlockBad):
        return self.gen_bad_block()
    irblocks_list = self.block2assignblks(block)
    out, instr_offsets = self.gen_init(block)
    assert len(block.lines) == len(irblocks_list)
    for instr, irblocks in zip(block.lines, irblocks_list):
        instr_attrib, irblocks_attributes = self.get_attributes(instr, irblocks, log_mn, log_regs)
        for index, irblock in enumerate(irblocks):
            new_irblock = self.ir_arch.irbloc_fix_regs_for_mode(irblock, self.ir_arch.attrib)
            label = str(new_irblock.loc_key)
            out.append("%-40s // %.16X %s" %
                       (label + ":", instr.offset, instr))
            if index == 0:
                out += self.gen_pre_code(instr_attrib)
            out += self.gen_irblock(instr_attrib, irblocks_attributes[index], instr_offsets, new_irblock)
    out += self.gen_finalize(block)
    return ['\t' + line for line in out]

def gen_c_assignments(

self, assignblk)

Return C informations used to generate the C code of the @assignblk @assignblk: an AssignBlock instance

def gen_c_assignments(self, assignblk):
    """
    Return C informations used to generate the C code of the @assignblk
    @assignblk: an AssignBlock instance
    """
    c_var = []
    c_main = []
    c_mem = []
    c_updt = []
    c_prefetch = []
    dst_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
    dst_var = {}
    prefetchers = self.get_mem_prefetch(assignblk)
    for expr, prefetcher in sorted(prefetchers.iteritems()):
        str_src = self.id_to_c(expr)
        str_dst = self.id_to_c(prefetcher)
        c_prefetch.append('%s = %s;' % (str_dst, str_src))
    for var in prefetchers.itervalues():
        if var.size <= self.translator.NATIVE_INT_MAX_SIZE:
            c_var.append("uint%d_t %s;" % (var.size, var))
        else:
            c_var.append("bn_t %s; // %d" % (var, var.size))
    for dst, src in sorted(assignblk.iteritems()):
        src = src.replace_expr(prefetchers)
        if dst == self.ir_arch.IRDst:
            pass
        elif isinstance(dst, ExprId):
            new_dst = self.add_local_var(dst_var, dst_index, dst)
            if dst in self.ir_arch.arch.regs.regs_flt_expr:
                # Dont mask float affectation
                c_main.append(
                    '%s = (%s);' % (self.id_to_c(new_dst), self.id_to_c(src)))
            elif new_dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
                c_main.append(
                    '%s = (%s)&%s;' % (self.id_to_c(new_dst),
                                       self.id_to_c(src),
                                       SIZE_TO_MASK[src.size]))
            else:
                c_main.append(
                    '%s = bignum_mask(%s, %d);' % (
                        self.id_to_c(new_dst),
                        self.id_to_c(src),
                        src.size
                    )
                )
        elif isinstance(dst, ExprMem):
            ptr = dst.arg.replace_expr(prefetchers)
            if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                new_dst = ExprMem(ptr, dst.size)
                str_dst = self.id_to_c(new_dst).replace('MEM_LOOKUP', 'MEM_WRITE')
                c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
            else:
                ptr_str = self.id_to_c(ptr)
                if ptr.size <= self.translator.NATIVE_INT_MAX_SIZE:
                    c_mem.append('%s, %s);' % (str_dst[:-1], self.id_to_c(src)))
                else:
                    if src.size <= self.translator.NATIVE_INT_MAX_SIZE:
                        c_mem.append('MEM_WRITE_BN_INT(jitcpu, %d, %s, %s);' % (
                            src.size, ptr_str, self.id_to_c(src))
                        )
                    else:
                        c_mem.append('MEM_WRITE_BN_BN(jitcpu, %d, %s, %s);' % (
                            src.size, ptr_str, self.id_to_c(src))
                        )
        else:
            raise ValueError("Unknown dst")
    for dst, new_dst in dst_var.iteritems():
        if dst == self.ir_arch.IRDst:
            continue
        c_updt.append('%s = %s;' % (self.id_to_c(dst), self.id_to_c(new_dst)))
        if dst.size <= self.translator.NATIVE_INT_MAX_SIZE:
            c_var.append("uint%d_t %s;" % (new_dst.size, new_dst))
        else:
            c_var.append("bn_t %s; // %d" % (new_dst, new_dst.size))
    return c_prefetch, c_var, c_main, c_mem, c_updt

def gen_c_code(

self, attrib, c_dst, c_assignmnts)

Generate the C code for assignblk. @attrib: Attributes instance @c_dst: irdst C code

def gen_c_code(self, attrib, c_dst, c_assignmnts):
    """
    Generate the C code for assignblk.
    @attrib: Attributes instance
    @c_dst: irdst C code
    """
    c_prefetch, c_var, c_main, c_mem, c_updt = c_assignmnts
    out = []
    out.append("{")
    out.append("// var")
    out += c_var
    out.append("// Prefetch")
    out += c_prefetch
    out.append("// Dst")
    out += c_dst
    out.append("// Main")
    out += c_main
    out.append("// Check op/mem exceptions")
    # Check memory access if assignblk has memory read
    if c_prefetch:
        out += self.gen_check_memory_exception(attrib.instr.offset)
    out.append("// Mem updt")
    out += c_mem
    out.append("// Check exception Mem write")
    # Check memory write exceptions
    if attrib.mem_write:
        out += self.gen_check_memory_exception(attrib.instr.offset)
    out.append("// Updt")
    out += c_updt
    out.append("// Checks exception")
    # Check post assignblk exception flags
    if attrib.set_exception:
        out += self.gen_check_cpu_exception(attrib.instr.offset)
    out.append("}")
    return out

def gen_check_cpu_exception(

self, address)

Generate C code to check cpu exceptions @address: address of the faulty instruction

def gen_check_cpu_exception(self, address):
    """Generate C code to check cpu exceptions
    @address: address of the faulty instruction"""
    dst = self.dst_to_c(address)
    return (self.CODE_EXCEPTION_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

def gen_check_memory_exception(

self, address)

Generate C code to check memory exceptions @address: address of the faulty instruction

def gen_check_memory_exception(self, address):
    """Generate C code to check memory exceptions
    @address: address of the faulty instruction"""
    dst = self.dst_to_c(address)
    return (self.CODE_EXCEPTION_MEM_AT_INSTR % (self.C_PC, dst, dst)).split('\n')

def gen_dst_goto(

self, attrib, instr_offsets, dst2index)

Generate code for possible @dst2index.

@attrib: an Attributes instance @instr_offsets: list of instructions offsets @dst2index: link from destination to index

def gen_dst_goto(self, attrib, instr_offsets, dst2index):
    """
    Generate code for possible @dst2index.
    @attrib: an Attributes instance
    @instr_offsets: list of instructions offsets
    @dst2index: link from destination to index
    """
    if not dst2index:
        return []
    out = []
    out.append('switch(DST_case) {')
    stopcase = False
    for dst, index in sorted(dst2index.iteritems(), key=lambda lblindex: lblindex[1]):
        if index == -1:
            # Handle '-1' case only once
            if not stopcase:
                stopcase = True
            else:
                continue
        out.append('\tcase %d:' % index)
        out += self.gen_goto_code(attrib, instr_offsets, dst)
        out.append('\t\tbreak;')
    out.append('};')
    return out

def gen_finalize(

self, block)

Generate the C code for the final block instruction

def gen_finalize(self, block):
    """
    Generate the C code for the final block instruction
    """
    loc_key = self.get_block_post_label(block)
    offset = self.ir_arch.loc_db.get_location_offset(loc_key)
    dst = self.dst_to_c(offset)
    code = self.CODE_RETURN_NO_EXCEPTION % (loc_key, self.C_PC, dst, dst)
    return code.split('\n')

def gen_goto_code(

self, attrib, instr_offsets, dst)

Generate C code for a potential destination @dst @attrib: instruction Attributes @instr_offsets: instructions offsets list @dst: potential instruction destination

def gen_goto_code(self, attrib, instr_offsets, dst):
    """Generate C code for a potential destination @dst
    @attrib: instruction Attributes
    @instr_offsets: instructions offsets list
    @dst: potential instruction destination"""
    out = []
    if isinstance(dst, Expr):
        out += self.gen_post_code(attrib)
        out.append('BlockDst->address = DST_value;')
        out += self.gen_post_instr_checks(attrib)
        out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
        return out
    assert isinstance(dst, LocKey)
    offset = self.ir_arch.loc_db.get_location_offset(dst)
    if offset is None:
        # Generate goto for local labels
        return ['goto %s;' % dst]
    if (offset > attrib.instr.offset and
        offset in instr_offsets):
        # Only generate goto for next instructions.
        # (consecutive instructions)
        out += self.gen_post_code(attrib)
        out += self.gen_post_instr_checks(attrib)
        out.append('goto %s;' % dst)
    else:
        out += self.gen_post_code(attrib)
        out.append('BlockDst->address = DST_value;')
        out += self.gen_post_instr_checks(attrib)
        out.append('\t\treturn JIT_RET_NO_EXCEPTION;')
    return out

def gen_init(

self, block)

Generate the init C code for a @block @block: an asm_bloc instance

def gen_init(self, block):
    """
    Generate the init C code for a @block
    @block: an asm_bloc instance
    """
    instr_offsets = [line.offset for line in block.lines]
    post_label = self.get_block_post_label(block)
    post_offset = self.ir_arch.loc_db.get_location_offset(post_label)
    instr_offsets.append(post_offset)
    lbl_start = block.loc_key
    return (self.CODE_INIT % lbl_start).split("\n"), instr_offsets

def gen_irblock(

self, instr_attrib, attributes, instr_offsets, irblock)

Generate the C code for an @irblock @irblock: an irbloc instance @attributes: an Attributes instance list

def gen_irblock(self, instr_attrib, attributes, instr_offsets, irblock):
    """
    Generate the C code for an @irblock
    @irblock: an irbloc instance
    @attributes: an Attributes instance list
    """
    out = []
    dst2index = None
    for index, assignblk in enumerate(irblock):
        if index == irblock.dst_linenb:
            c_dst, dst2index = self.gen_assignblk_dst(irblock.dst)
        else:
            c_dst = []
        c_assignmnts = self.gen_c_assignments(assignblk)
        out += self.gen_c_code(attributes[index], c_dst, c_assignmnts)
    if dst2index:
        out.append("// Set irdst")
        # Gen goto on irdst set
        out += self.gen_dst_goto(instr_attrib, instr_offsets, dst2index)
    return out

def gen_post_code(

self, attrib)

Callback to generate code AFTER the instruction execution @attrib: Attributes instance

def gen_post_code(self, attrib):
    """Callback to generate code AFTER the instruction execution
    @attrib: Attributes instance"""
    out = []
    if attrib.log_regs:
        out.append('dump_gpregs(jitcpu->cpu);')
    return out

def gen_post_instr_checks(

self, attrib)

Generate C code for handling potential exceptions @attrib: Attributes instance

def gen_post_instr_checks(self, attrib):
    """Generate C code for handling potential exceptions
    @attrib: Attributes instance"""
    out = []
    if attrib.mem_read | attrib.mem_write:
        out += (self.CODE_VM_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')
    if attrib.set_exception:
        out += (self.CODE_CPU_EXCEPTION_POST_INSTR % (self.C_PC)).split('\n')
    if attrib.mem_read | attrib.mem_write:
        out.append("reset_memory_access(&(jitcpu->pyvm->vm_mngr));")
    return out

def gen_pre_code(

self, instr_attrib)

Callback to generate code BEFORE the instruction execution @instr_attrib: Attributes instance

def gen_pre_code(self, instr_attrib):
    """Callback to generate code BEFORE the instruction execution
    @instr_attrib: Attributes instance"""
    out = []
    if instr_attrib.log_mn:
        out.append(
            'printf("%.8X %s\\n");' % (
                instr_attrib.instr.offset,
                instr_attrib.instr.to_string(self.ir_arch.loc_db)
            )
        )
    return out

def get_attributes(

self, instr, irblocks, log_mn=False, log_regs=False)

Get the carateristics of each @irblocks. Returns the corresponding attributes object. @irblock: a list of irbloc instance @log_mn: generate code to log instructions @log_regs: generate code to log registers states

def get_attributes(self, instr, irblocks, log_mn=False, log_regs=False):
    """
    Get the carateristics of each @irblocks. Returns the corresponding
    attributes object.
    @irblock: a list of irbloc instance
    @log_mn: generate code to log instructions
    @log_regs: generate code to log registers states
    """
    instr_attrib = Attributes(log_mn, log_regs)
    instr_attrib.instr = instr
    irblocks_attributes = []
    for irblock in irblocks:
        attributes = []
        irblocks_attributes.append(attributes)
        for assignblk in irblock:
            attrib = Attributes(log_mn, log_regs)
            attributes.append(attrib)
            self.get_caracteristics(assignblk, attrib)
            attrib.instr = instr
            instr_attrib.mem_read |= attrib.mem_read
            instr_attrib.mem_write |= attrib.mem_write
            instr_attrib.set_exception |= attrib.set_exception
    return instr_attrib, irblocks_attributes

def get_block_post_label(

self, block)

Get label next to the @block @block: AsmBlock instance

def get_block_post_label(self, block):
    """Get label next to the @block
    @block: AsmBlock instance"""
    last_instr = block.lines[-1]
    offset = last_instr.offset + last_instr.l
    return self.ir_arch.loc_db.get_or_create_offset_location(offset)

def get_caracteristics(

self, assignblk, attrib)

Set the carateristics in @attrib according to the @assignblk @assignblk: an AssignBlock instance @attrib: an Attributes instance

def get_caracteristics(self, assignblk, attrib):
    """
    Set the carateristics in @attrib according to the @assignblk
    @assignblk: an AssignBlock instance
    @attrib: an Attributes instance
    """
    # Check explicit exception raising
    attrib.set_exception = self.ir_arch.arch.regs.exception_flags in assignblk
    element_read = assignblk.get_r(mem_read=True)
    # Check mem read
    attrib.mem_read = any(isinstance(expr, ExprMem)
                          for expr in element_read)
    # Check mem write
    attrib.mem_write = any(isinstance(dst, ExprMem)
                           for dst in assignblk)

def get_mem_prefetch(

self, assignblk)

Generate temporary variables used to fetch memory used in the @assignblk Return a dictionnary: ExprMem -> temporary variable @assignblk: AssignBlock instance

def get_mem_prefetch(self, assignblk):
    """
    Generate temporary variables used to fetch memory used in the @assignblk
    Return a dictionnary: ExprMem -> temporary variable
    @assignblk: AssignBlock instance
    """
    mem_index = {8: 0, 16: 0, 32: 0, 64: 0, 128:0}
    mem_var = {}
    # Prefetch memory read
    for expr in assignblk.get_r(mem_read=True):
        if not isinstance(expr, ExprMem):
            continue
        var_num = mem_index[expr.size]
        mem_index[expr.size] += 1
        var = ExprId(
            "prefetch_%.2d_%.2d" % (expr.size, var_num), expr.size
        )
        mem_var[expr] = var
    # Generate memory prefetch
    return mem_var

def id_to_c(

self, expr)

Translate Expr @expr into corresponding C code

def id_to_c(self, expr):
    """Translate Expr @expr into corresponding C code"""
    return self.translator.from_expr(self.patch_c_id(expr))

def init_arch_C(

self)

Iinitialize jitter internals

def init_arch_C(self):
    """Iinitialize jitter internals"""
    self.id_to_c_id = {}
    for reg in self.ir_arch.arch.regs.all_regs_ids:
        self.id_to_c_id[reg] = ExprId('mycpu->%s' % reg, reg.size)
    self.C_PC = self.id_to_c(self.PC)

def patch_c_id(

self, expr)

Replace ExprId in @expr with corresponding C variables

def patch_c_id(self, expr):
    """Replace ExprId in @expr with corresponding C variables"""
    return expr.replace_expr(self.id_to_c_id)

def traverse_expr_dst(

self, expr, dst2index)

Generate the index of the destination label for the @expr @dst2index: dictionnary to link label to its index

def traverse_expr_dst(self, expr, dst2index):
    """
    Generate the index of the destination label for the @expr
    @dst2index: dictionnary to link label to its index
    """
    if isinstance(expr, ExprCond):
        src1, src1b = self.traverse_expr_dst(expr.src1, dst2index)
        src2, src2b = self.traverse_expr_dst(expr.src2, dst2index)
        cond = self.id_to_c(expr.cond)
        if not expr.cond.size <= self.translator.NATIVE_INT_MAX_SIZE:
            cond = "(!bignum_is_zero(%s))" % cond
        return ("((%s)?(%s):(%s))" % (cond, src1, src2),
                "((%s)?(%s):(%s))" % (cond, src1b, src2b))
    if isinstance(expr, ExprInt):
        offset = int(expr)
        loc_key = self.ir_arch.loc_db.get_or_create_offset_location(offset)
        self.add_label_index(dst2index, loc_key)
        value, int_size = int_size_to_bn(offset, 64)
        out = hex(offset)
        return ("%s" % dst2index[loc_key], out)
    if expr.is_loc():
        loc_key = expr.loc_key
        offset = self.ir_arch.loc_db.get_location_offset(expr.loc_key)
        if offset is not None:
            self.add_label_index(dst2index, loc_key)
            value, int_size = int_size_to_bn(offset, 64)
            out = hex(offset)
            return ("%s" % dst2index[loc_key], out)
        self.add_label_index(dst2index, loc_key)
        value, int_size = int_size_to_bn(0, 64)
        out = hex(0)
        return ("%s" % dst2index[loc_key], out)
    dst2index[expr] = -1
    return ("-1", self.id_to_c(expr))