#BEGIN_LEGAL
#
#Copyright (c) 2017 Intel Corporation
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#       http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
#END_LEGAL
import genutil
import ildutil
import ild_info
import collections
import opnds
import math
import ild_phash
import ild_codegen
import ild_eosz
import ild_easz
import ild_nt
import actions_codegen
import actions
import copy
import verbosity
import tup2int
import operand_storage  # used by get_compressed_op_getter_fn() below

# _token_2_module is for fields that might be modified in the pattern.
# If fields are modified in the pattern by some NT, then we must be
# consistent across buckets (legacy/vex/evex, opcode, map). This is
# only relevant for fields that would be used in "dynamic decode
# part 1".

# EASZ is only rarely modified, in experimental extensions.
_token_2_module = {'EOSZ': ild_eosz, 'EASZ': ild_easz}

_find_fn_pfx = 'xed3_phash_find'

def _log(f, s):
    if verbosity.vild():
        f.write(s)

def _set_state_space_from_ii(agi, ii, state_space):
    """
    state_space is a 2D dictionary; ii is a generator.instruction_info_t.
    This function sets:
    state_space[OPNAME][OPVAL] = True for every operand decider or
    prebinding with name OPNAME and value OPVAL legal for the given ii.
    """
    for bt in ii.ipattern.bits:
        if bt.is_operand_decider():
            if bt.test == 'eq':
                state_space[bt.token][bt.requirement] = True

    # Look at prebindings too, for things like ZEROING that don't have
    # all possible values mentioned in patterns.
    for (name, binding) in list(ii.prebindings.items()):
        bitnum = len(binding.bit_info_list)
        # Dirty hack: we don't want big prebindings to explode our
        # dictionaries.
        # FIXME: this assumes that all constraints used for pattern
        # dispatching (all constraints explicitly mentioned in patterns)
        # have bit widths up to 3 bits. This is true now, but might
        # change later. Should put an assertion somewhere. Also better
        # to use a genutil.max_constraint_bitwidth than 3.
        if bitnum < 4:
            if name not in state_space:
                state_space[name] = {}
            for val in range(0, 2**bitnum):
                state_space[name][val] = True
        elif binding.is_constant():
            val = int(binding.get_value(), 2)
            state_space[name][val] = True
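
# A minimal runnable sketch (not used by the generator) of how the
# prebinding branch above fills state_space: a hypothetical 2-bit
# prebinding named 'FOO' contributes every value in [0, 2**bitnum).
def _example_prebinding_expansion():
    state_space = collections.defaultdict(dict)
    bitnum = 2  # pretend binding.bit_info_list had two bits
    for val in range(0, 2**bitnum):
        state_space['FOO'][val] = True
    # state_space['FOO'] == {0: True, 1: True, 2: True, 3: True}
    return state_space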

def _set_space_from_operands(agi, operands, state_space):
    state_dict = agi.common.state_bits
    for op in operands:
        ops = []
        # if the binding operand is a macro, expand it
        if op.name.lower() in state_dict:
            op_spec = state_dict[op.name.lower()].list_of_str
            for w in op_spec:
                expanded_op = opnds.parse_one_operand(w)
                ops.append(expanded_op)
        else:
            ops.append(op)

        for op in ops:
            if (op.bits and op.name in state_space and
                op.type == 'imm_const'):
                op_val = int(op.bits, 16)
                state_space[op.name][op_val] = True

def get_all_constraints_state_space(agi):
    """
    Returns a 2D dictionary state_space:
    state_space[OPNAME][OPVAL] == True if there is an operand with
    name OPNAME and value OPVAL.
    In other words, the dictionary contains all legal values for
    operands in the grammar.
    Only operands that appear as operand deciders, prebindings, or
    instruction operands are added to the returned dictionary.
    """
    state_space = collections.defaultdict(dict)
    for g in agi.generator_list:
        for ii in g.parser_output.instructions:
            _set_state_space_from_ii(agi, ii, state_space)

    # Set state_space from operands.
    # These are the right-hand sides of NT partition tables.
    for g in agi.generator_list:
        ii = g.parser_output.instructions[0]
        if genutil.field_check(ii, 'iclass'):
            continue  # only real NTs, not instructions
        for ii in g.parser_output.instructions:
            _set_space_from_operands(agi, ii.operands, state_space)

    # In some configurations xed can be built without any AVX
    # instructions; in this case the operand VEXVALID will not be
    # added. The ILD relies on this operand, so we add it manually.
    if 'VEXVALID' not in state_space:
        state_space['VEXVALID'][0] = True
    else:  # KNC/AVX/EVEX builds...
        # 2014-10-10: when I got rid of the NTs for decoding the
        # VEX/EVEX/XOP prefixes, I ended up losing the only NTs that
        # mention ZEROING=1 and VLBAD (VL=3). So we add them here.
        # They are required for proper splattering of don't-care
        # cases in the hash function generation. For example, when
        # EVEX.RC is rounding control and co-opting the EVEX.LL field,
        # we need to have the value of VL=3 because it is not
        # "corrected" when we are still picking an instruction (aka
        # 'static decode').
        state_space['ZEROING'][1] = True
        state_space['VL'][3] = True

    return state_space
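
# Illustrative sketch (not used by the generator) of the shape the
# function above returns; operand names and values here are examples,
# not values taken from the grammar:
def _example_constraints_state_space():
    state_space = collections.defaultdict(dict)
    state_space['REXW'][0] = True   # REXW may be 0 or 1
    state_space['REXW'][1] = True
    state_space['VEXVALID'][0] = True
    return state_space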

def get_state_op_widths(agi, state_space):
    """
    Returns a dictionary from operand name to the operand's bit width.
    """
    widths_dict = {}
    for opname, val_dict in list(state_space.items()):
        if opname in agi.operand_storage.get_operands():
            opnd = agi.operand_storage.get_operand(opname)
            widths_dict[opname] = int(opnd.bitwidth)
            continue
        maxval = max(val_dict.keys())
        if maxval == 0:
            # log() doesn't work so well on 0
            width = 1
        else:
            width = int(math.floor(math.log(maxval, 2))) + 1
        widths_dict[opname] = width

    # Special, "compressed" operands.
    # FIXME: we could add these special operand widths in the grammar.
    widths_dict[_bin_MOD3] = 1
    widths_dict[_vd_token_7] = 1
    widths_dict[_rm_token_4] = 1
    widths_dict[_mask_token_n0] = 1
    widths_dict[_mask_token_zero] = 1
    # constraints on UIMM0 operands are 8 bits wide at most
    widths_dict['UIMM0'] = 8
    return widths_dict
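
# Worked example of the width computation above (a sketch, not called
# anywhere): the number of bits needed to represent maxval is
# floor(log2(maxval)) + 1.
def _example_op_width():
    maxval = 7
    width = int(math.floor(math.log(maxval, 2))) + 1
    assert width == 3  # values 0..7 fit in 3 bits
    return width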

# The following functions are for operand compression.

_bin_MOD3 = 'MOD3'
# FIXME: could have made a generic function is_binary_op_X, but it
# seems to be overkill - the most common binary ops are MOD and RM.
def _is_binary_MOD3(ptrn_list):
    mod3_eq = 'MOD=3'
    mod3_neq = 'MOD!=3'
    for ptrn in ptrn_list:
        if not (mod3_eq in ptrn.ptrn or mod3_neq in ptrn.ptrn):
            return False
    return True

def _replace_MOD_with_MOD3(cnames, ptrn_list):
    cnames.remove('MOD')
    cnames.add(_bin_MOD3)
    for ptrn in ptrn_list:
        if 'MOD=3' in ptrn.ptrn:
            ptrn.constraints[_bin_MOD3] = {1: True}
        else:
            ptrn.constraints[_bin_MOD3] = {0: True}
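
# A minimal sketch (not used by the generator) of the compression the
# two functions above perform: a 2-bit MOD constraint that is only ever
# tested against 3 collapses into the 1-bit synthetic MOD3 operand.
def _example_mod3_compression():
    constraints = {'MOD': {3: True}}  # hypothetical pattern with MOD=3
    constraints.pop('MOD')
    constraints['MOD3'] = {1: True}   # MOD3=1 means MOD was 3
    return constraints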

_vd_token = 'VEXDEST210'
_vd_token_7 = 'VEXDEST210_7'
# FIXME: too hardcoded.
# This one is different: there are two possibilities, VD=7 and VD in
# [0..7]. Hence VD7=1 will mean VD=7, and {VD7=0, VD7=1} will mean VD
# is any value.
def _is_binary_VEXDEST210_7(cnames, ptrn_list):
    found = False
    if _vd_token not in cnames:
        return False
    for ptrn in ptrn_list:
        cvals = ptrn.constraints[_vd_token]
        if (len(cvals) == 1 and 7 in cvals):
            found = True
        elif (len(cvals) != 0):
            return False
    return found

def _replace_VEXDEST210_with_VD2107(cnames, ptrn_list):
    cnames.remove(_vd_token)
    cnames.add(_vd_token_7)
    for ptrn in ptrn_list:
        found = False
        for bt in ptrn.ii.ipattern.bits:
            if bt.token == _vd_token:
                if bt.test == 'eq':
                    found = True
                    ptrn.constraints[_vd_token_7] = {1: True}
                    break
        if not found:
            # either value of VD7 means any VD
            ptrn.constraints[_vd_token_7] = {0: True, 1: True}

_rm_token = 'RM'
_rm_token_4 = 'RM4'
# FIXME: make one function for RM4 and VD7.
def _is_binary_RM_4(cnames, ptrn_list):
    found = False
    if _rm_token not in cnames:
        return False
    for ptrn in ptrn_list:
        cvals = ptrn.constraints[_rm_token]
        if (len(cvals) == 1) and 4 in cvals:
            found = True
        elif len(cvals) != 0:
            return False
        else:  # len(cvals)==0
            ptrn.constraints.pop(_rm_token)
    return found

def _replace_RM_with_RM4(cnames, ptrn_list):
    # This looks for RM=4 in the pattern. It will not find "RM[0b100]",
    # so the patterns should NOT use that for specifying RM=4
    # requirements.
    #
    # FIXME:2016-01-29: MJC I have a concern that other instructions
    # with RM[...] constraints might be being mishandled. Need to test.
    cnames.remove(_rm_token)
    cnames.add(_rm_token_4)
    for ptrn in ptrn_list:
        found = False
        #print "PATTERN BITS", "\t\n".join( [str(x) for x in ptrn.ii.ipattern.bits])
        for bt in ptrn.ii.ipattern.bits:
            if bt.token == _rm_token:
                if bt.test == 'eq':
                    found = True
                    ptrn.constraints[_rm_token_4] = {1: True}
                    break
        if not found:
            #print "X", str(cnames)
            #print "\t\n".join( [ str(x) for x in ptrn_list] )
            ptrn.constraints[_rm_token_4] = {0: True, 1: True}

# FIXME: probably should move this one to layers.
_mask_token = 'MASK'
_mask_token_n0 = 'MASK_NOT0'
_mask_token_zero = 'MASK_ZERO'
# FIXME: make one function for is_binary and replace_binary.
def _is_binary_MASK_NOT0(cnames, ptrn_list):
    found = False
    if _mask_token not in cnames:
        return False
    for ptrn in ptrn_list:
        cvals = ptrn.constraints[_mask_token]
        # 7 of the 8 possible mask values, without 0
        if (len(cvals) == 7) and 0 not in cvals:
            found = True
        elif len(cvals) == 0:  # no constraint values -> any mask is ok
            ptrn.constraints.pop(_mask_token)
        else:
            return False
    return found

def _is_binary_MASK_ZERO(cnames, ptrn_list):
    found = False
    if _mask_token not in cnames:
        return False
    for ptrn in ptrn_list:
        cvals = ptrn.constraints[_mask_token]
        if (len(cvals) == 1) and 0 in cvals:
            found = True
        elif len(cvals) == 0:  # any mask, ok
            ptrn.constraints.pop(_mask_token)
        else:
            return False
    return found

def _replace_MASK_with_MASK_NOT0(cnames, ptrn_list):
    cnames.remove(_mask_token)
    cnames.add(_mask_token_n0)
    for ptrn in ptrn_list:
        found = False
        for bt in ptrn.ii.ipattern.bits:
            if bt.token == _mask_token:
                if bt.test == 'ne':
                    found = True
                    ptrn.constraints[_mask_token_n0] = {1: True}
                    break
        if not found:
            # MASK is not in the pattern; all values of MASK_NOT0 are valid
            ptrn.constraints[_mask_token_n0] = {0: True, 1: True}

def _replace_MASK_with_MASK_ZERO(cnames, ptrn_list):
    cnames.remove(_mask_token)
    cnames.add(_mask_token_zero)
    for ptrn in ptrn_list:
        found = False
        for bt in ptrn.ii.ipattern.bits:
            if bt.token == _mask_token:
                if bt.test == 'eq':
                    found = True
                    ptrn.constraints[_mask_token_zero] = {1: True}
                    break
        if not found:
            # MASK is not in the pattern; all values of MASK_ZERO are valid
            ptrn.constraints[_mask_token_zero] = {0: True, 1: True}

_compressed_ops = [_mask_token_n0,
                   _mask_token_zero,
                   _rm_token_4,
                   _vd_token_7,
                   _bin_MOD3]

def is_compressed_op(opname):
    """
    Compressed operands are special - we do not capture them in the ILD
    and do not derive them in NTs (though we could... FIXME: is it
    worthwhile?). Hence, to get their value we cannot use the regular
    xed3_operand_get_* functions - we use special getters for them.
    is_compressed_op(opname) tells us whether we need to use a special
    getter.
    """
    return opname in _compressed_ops
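
# Usage sketch (illustrative, not called by the generator):
def _example_compressed_op_dispatch():
    # 'MOD3' is a synthetic compressed operand; 'MOD' is a regular one,
    # so only 'MOD3' survives the filter below.
    return [op for op in ('MOD3', 'MOD') if is_compressed_op(op)]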

def get_compressed_op_getter_fn(opname):
    """
    Compressed operands are special - we do not capture them in the ILD
    and do not derive them in NTs (though we could... FIXME: is it
    worthwhile?). Hence, to get their value we cannot use the regular
    xed3_operand_get_* functions - we use special getters for them.
    get_compressed_op_getter_fn(opname) returns the name of the special
    getter for a given compressed operand name.
    FIXME: right now we just use the same operand naming scheme as for
    regular operands. Do we need this function?
    """
    return operand_storage.get_op_getter_fn(opname)

def _get_united_cdict(ptrn_list, state_space, vexvalid, all_ops_widths):
    """
    @param ptrn_list: list of ild.pattern_t
    @param state_space: all legal values for xed operands:
                        state_space['REXW'][1] = True,
                        state_space['REXW'][0] = True
    @param vexvalid: VEXVALID value we want to filter by. vexvalid==0
                     will include only patterns with a vexvalid==0
                     constraint value.
    @param all_ops_widths: dict of operands to their bit widths.
    @return: ild_cdict.constraint_dict_t which unites the patterns'
             constraint dicts
    """
    cnames = []

    # take only the patterns for the requested space
    ptrns = []
    for ptrn in ptrn_list:
        if vexvalid in list(ptrn.constraints['VEXVALID'].keys()):
            ptrns.append(ptrn)

    if len(ptrns) == 0:
        return None

    for ptrn in ptrns:
        cnames.extend(list(ptrn.constraints.keys()))
    cnames = set(cnames)

    cdicts = []
    if _is_binary_MOD3(ptrns):
        _replace_MOD_with_MOD3(cnames, ptrns)

    if _is_binary_VEXDEST210_7(cnames, ptrn_list):
        _replace_VEXDEST210_with_VD2107(cnames, ptrn_list)

    if _is_binary_RM_4(cnames, ptrn_list):
        _replace_RM_with_RM4(cnames, ptrn_list)

    if _is_binary_MASK_NOT0(cnames, ptrn_list):
        _replace_MASK_with_MASK_NOT0(cnames, ptrn_list)

    if _is_binary_MASK_ZERO(cnames, ptrn_list):
        _replace_MASK_with_MASK_ZERO(cnames, ptrn_list)

    # For each pattern we have a list of constraints. ptrn.constraints
    # is the legal values for those constraints. In each map-opcode
    # bin, we have several patterns with different constraints. We
    # want to make one hash table for these different patterns. That's
    # why we take the union of all the constraints and make one
    # dictionary (and ultimately a hash table). We need to add all
    # legal variations of all constraints - a cross product (dangerous).
    # For example, if we have two patterns:
    # PATTERN1: MOD=1
    # PATTERN2: REG=2
    # then for PATTERN1 we will create a constraint dictionary with all
    # combinations (MOD=1 REG=0), (MOD=1 REG=1), ..., (MOD=1 REG=7)
    # and for PATTERN2 we will have (MOD=0 REG=2), (MOD=1 REG=2), ...
    for ptrn in ptrns:
        cdict = constraint_dict_t(cnames, ptrn.constraints, state_space,
                                  ptrn)
        cdicts.append(cdict)
    insn_map = ptrns[0].insn_map
    opcode = ptrns[0].opcode
    msg = []
    msg.append("cdict conflict in pattern")
    msg.append('MAP:%s OPCODE:%s\n' % (insn_map, opcode))
    msg = "\n".join(msg)
    # Now we unite (cross-product) after exploding/back-filling all the
    # constraints. All patterns now have the same constraints.
    united_dict = constraint_dict_t.unite_dicts(cdicts, msg, cnames)

    # generate the int value for each tuple
    united_dict.create_tuple2int(all_ops_widths)

    united_dict.strings_dict = ild_codegen._dec_strings

    # Create the default action to be taken when we do not hit a valid
    # hash entry.
    default_action = [actions.gen_return_action('0')]
    united_dict.action_codegen = actions_codegen.actions_codegen_t(
                                                united_dict.tuple2rule,
                                                default_action,
                                                united_dict.strings_dict)
    return united_dict

# FIXME: maybe it should contain the tuple2int function?
# Now tuple2int is a part of the phash object.
class constraint_dict_t(object):
    def __init__(self, cnames=[], state_space={}, all_state_space={},
                 rule=None):
        # cnames is a sorted list of strings - the constraints' names
        # that we want this cdict to have.
        self.cnames = sorted(list(cnames))

        # state_space is a dict with the constraints' values we want
        # this cdict to represent.
        # For example, if we want the cdict to allow only MODE=0 we
        # will have state_space['MODE'][0] = True.
        self.state_space = state_space

        # all_state_space is a dict with all legal values that
        # constraints have in the grammar.
        # For example:
        # all_state_space['REXW'][0]=True, all_state_space['REXW'][1]=True
        # It is used when state_space doesn't have a constraint from
        # cnames. We need this when we build a united constraint dict
        # for a set of patterns: first we build a separate constraint
        # dict for each pattern, but it includes all the cnames that
        # the set has, and then we unite those cdicts. See the
        # _get_united_cdict() function.
        self.all_state_space = all_state_space

        self.rule = rule

        # dict mapping tuples to rules.
        # Tuples are the constraint values (without the constraint names).
        self.tuple2rule = {}

        # tuple2int maps the same tuples as tuple2rule to hash key values.
        self.tuple2int = {}

        # reverse mapping from hash key to the constraint value tuple.
        self.int2tuple = {}

        # dict of all operands -> bit width.
        self.op_widths = {}

        if len(state_space) > 0:
            self.tuple2rule = self.make_cdict(self.cnames, {})

    @staticmethod
    def unite_dicts(dict_list, err_msg, cnstr_names):
        """ dict_list is a list of constraint dictionaries. The keys
        in the dictionary are the values of the constraints as tuples.
        If we see the same values in more than one pattern, we have a
        decoding conflict in the grammar. The dictionaries have been
        expanded so that they all have the same constraint names upon
        entry.
        """
        if len(dict_list) == 0:
            return None
        if len(dict_list) == 1:
            return dict_list[0]
        res = constraint_dict_t(cnames=cnstr_names)
        for cdict in dict_list:
            for key in list(cdict.tuple2rule.keys()):
                if key in res.tuple2rule:
                    msg = []
                    msg.append("key: %s" % (key,))
                    msg.append("cdict:%s" % cdict)
                    msg.append("res:%s" % res)
                    msg = "\n".join(msg)
                    ildutil.ild_err(err_msg + msg)
                    return None
                else:
                    res.tuple2rule[key] = cdict.tuple2rule[key]

        return res
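
    # Sketch of the conflict unite_dicts() reports (values are
    # illustrative): uniting {(1, 2): PATTERN1} with {(1, 2): PATTERN2}
    # calls ildutil.ild_err, because the constraint-value tuple (1, 2)
    # would map to two different patterns.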

    def make_cdict(self, cnames, tuple2rule):
        if len(cnames) == 0:
            return tuple2rule
        name = cnames[0]
        if name in self.state_space:
            vals = sorted(self.state_space[name].keys())
        else:
            vals = sorted(self.all_state_space[name].keys())
        if len(tuple2rule) == 0:
            # initialize tuple2rule with singleton tuples
            for val in vals:
                tuple2rule[(val,)] = self.rule
            return self.make_cdict(cnames[1:], tuple2rule)
        else:
            new_tuple2rule = {}
            for key_tuple in list(tuple2rule.keys()):
                for val in vals:
                    new_key = key_tuple + (val,)
                    new_tuple2rule[new_key] = self.rule
            return self.make_cdict(cnames[1:], new_tuple2rule)
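
    # A worked sketch of the recursion above (values illustrative):
    # with cnames = ['MOD', 'REG'], MOD values [0, 1] and REG values
    # [2], the tuples grow one position per recursion level:
    #   level 0: (0,) (1,)
    #   level 1: (0, 2) (1, 2)
    # so each tuple lists constraint values in sorted-cnames order.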

    def get_all_keys_by_val(self, val):
        return [k for k, v in self.tuple2rule.items() if v == val]

    def create_tuple2int(self, all_ops_widths):
        ''' create the mapping of each tuple to its int value '''
        tuple2int = {}
        int2tuple = {}
        for t in self.tuple2rule.keys():
            res = tup2int.tuple2int(t, self.cnames, all_ops_widths)
            if res in int2tuple:
                err = "the tuple %s and the tuple %s generate the same value: %d"
                genutil.die(err % (t, str(int2tuple[res]), res))
            else:
                tuple2int[t] = res
                int2tuple[res] = t

        # op_widths are used later for the code generation
        self.op_widths = all_ops_widths
        self.tuple2int = tuple2int
        self.int2tuple = int2tuple
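
    # A minimal sketch of the packing create_tuple2int() relies on
    # (assuming, as tup2int does, that each constraint value occupies a
    # field of its operand's bit width; names, widths, and field order
    # here are illustrative):
    #   cnames = ['MOD', 'REG'], widths = {'MOD': 2, 'REG': 3}
    #   (1, 2) -> 1 | (2 << 2) == 9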

    def get_ptrn(self, tuple):
        ''' return the pattern that represents the given tuple '''
        return self.tuple2rule[tuple].ptrn

    def filter_tuples(self, tuples):
        ''' From all the dictionaries in self, remove the tuples that
        are not in the input tuples list.
        Return a new instance of cdict. '''

        new_cdict = copy.copy(self)
        new_cdict.tuple2int = {}
        new_cdict.tuple2rule = {}
        for t in tuples:
            new_cdict.tuple2int[t] = self.tuple2int[t]
            new_cdict.tuple2rule[t] = self.tuple2rule[t]

        new_cdict.int2tuple = dict((i, t) for t, i in
                                   new_cdict.tuple2int.items())

        return new_cdict

    def get_operand_accessor(self, cname):
        ''' return a tuple of the operand accessor function and the
        constraint name that it represents '''

        ptrn_list = list(self.tuple2rule.values())
        if cname in list(_token_2_module.keys()):
            nt_module = _token_2_module[cname]
            getter_fn = nt_module.get_getter_fn(ptrn_list)
            if not getter_fn:
                msg = 'Failed to resolve %s getter fn for '
                msg += 'MAP:%s OPCODE:%s'
                insn_map = ptrn_list[0].insn_map
                opcode = ptrn_list[0].opcode
                ildutil.ild_err(msg % (cname, insn_map, opcode))
            access_str = '%s(%s)' % (getter_fn, self.strings_dict['obj_str'])
            nt = ild_nt.get_nt_from_lufname(getter_fn)
            return access_str, nt
        else:
            access_str = ild_codegen.emit_ild_access_call(cname,
                                          self.strings_dict['obj_str'])
            return access_str, cname

    def __str__(self):
        rows = []
        size = len(self.tuple2rule)
        rows.append("cdict_size=%d" % size)
        if size >= 100:
            rows.append('HUGE!')
        elif size >= 50:
            rows.append('BIG!')
        legend = " ".join(self.cnames)
        legend += ' \t-> VALUE'
        rows.append(legend)
        if len(self.tuple2rule) == 0:
            rows.append("_ \t-> %s" % self.rule)
        for key in sorted(self.tuple2rule.keys()):
            val = self.tuple2rule[key]
            rows.append("%s \t-> %s" % (key, str(val)))
        return "\n".join(rows)

def get_constraints_lu_table(ptrns_by_map_opcode, is_amd, state_space,
                             vexvalid, all_ops_widths):
    """
    Returns a tuple (cdict_by_map_opcode, cnames).
    cnames is a set of all constraint names used in patterns.
    cdict_by_map_opcode is a traditional 2D lookup dict from (map,
    opcode) to the constraint_dict_t objects that represent the mapping
    from constraint values to the different patterns of the
    corresponding (map, opcode, vexvalid) bin. These cdict objects can
    later be used for generating hash functions from constraint values
    to patterns (inums).
    """
    maps = ild_info.get_maps(is_amd)
    cdict_by_map_opcode = collections.defaultdict(dict)
    cnames = set()
    for insn_map in maps:
        for opcode in range(0, 256):
            opcode = hex(opcode)
            ptrns = ptrns_by_map_opcode[insn_map][opcode]
            cdict = _get_united_cdict(ptrns, state_space, vexvalid,
                                      all_ops_widths)
            cdict_by_map_opcode[insn_map][opcode] = cdict
            if cdict:
                cnames = cnames.union(set(cdict.cnames))
    return cdict_by_map_opcode, cnames
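
# Shape sketch of the returned table (illustrative keys; real map names
# come from ild_info). Note that opcode keys are hex strings because of
# the opcode = hex(opcode) rebinding above.
def _example_lu_table_shape():
    table = collections.defaultdict(dict)
    table['some_map'][hex(0x10)] = None  # a bin with no matching patterns
    return table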

def gen_ph_fos(agi, cdict_by_map_opcode, is_amd, log_fn,
               ptrn_dict, vv):
    """
    Returns a tuple (phash_lu_table, phash_fo_list, op_lu_list).
    phash_lu_table is a traditional 2D dict by (map, opcode) to a hash
    function name.
    phash_fo_list is a list of all the phash function objects created
    (we might have fos that are not in the lookup table - when we have
    2-level hash functions).
    op_lu_list is a list of all the operand lookup functions.
    Also writes a log file for debugging.
    """
    maps = ild_info.get_maps(is_amd)
    log_f = open(log_fn, 'w')
    cnames = set()
    stats = {
        '0. #map-opcodes': 0,
        '1. #entries': 0,
        '2. #hentries': 0,
        '3. #hashes': 0,
        '4. #min_hashes': 0,
        '5. #cdict_size_1_to_10': 0,
        '6. #cdict_size_10_to_20': 0,
        '7. #cdict_size_20_to_100': 0,
        '8. #cdict_size_at_least_100': 0
    }
    lu_fo_list = []
    op_lu_map = {}
    phash_lu = {}
    for insn_map in maps:
        phash_lu[insn_map] = {}
        for opcode in range(0, 256):
            opcode = hex(opcode)
            cdict = cdict_by_map_opcode[insn_map][opcode]
            if cdict:
                stats['0. #map-opcodes'] += 1
                stats['1. #entries'] += len(cdict.tuple2rule)
                cnames = cnames.union(set(cdict.cnames))
                _log(log_f, 'MAP:%s OPCODE:%s:\n%s\n' % (insn_map, opcode,
                                                         cdict))

                phash = ild_phash.gen_hash(cdict)
                if phash:
                    _log(log_f, "%s" % phash)
                    phash_id = 'map%s_opcode%s_vv%d' % (insn_map, opcode,
                                                        vv)
                    fname = "%s_%s" % (_find_fn_pfx, phash_id)
                    (fo_list, op_lu_fo) = phash.gen_find_fos(fname)
                    lu_fo_list.extend(fo_list)

                    # hold only one instance of each function
                    if op_lu_fo.function_name not in op_lu_map:
                        op_lu_map[op_lu_fo.function_name] = op_lu_fo
                    for fo in fo_list:
                        _log(log_f, '//find function:\n')
                        _log(log_f, fo.emit())
                        _log(log_f, '-----------------------------\n')
                    # FIXME: assumption: the L2 function is last in the
                    # list. Maybe return a dict or tuple to make a
                    # distinction between L2 and L1 functions?
                    phlu_fn = lu_fo_list[-1]
                    phash_lu[insn_map][opcode] = phlu_fn.function_name
                    phash.update_stats(stats)
                else:
                    _log(log_f, '---NOPHASH-----\n')
                    msg = "Failed to gen phash for map %s opcode %s"
                    ildutil.ild_err(msg % (insn_map, opcode))
            else:
                phash_lu[insn_map][opcode] = '(xed3_find_func_t)0'
    _log(log_f, "cnames: %s\n" % cnames)
    for key in sorted(stats.keys()):
        _log(log_f, "%s %s\n" % (key, stats[key]))
    log_f.close()
    return phash_lu, lu_fo_list, list(op_lu_map.values())