microasm.isa revision 4344:174e31456abe
12023SN/A// -*- mode:c++ -*-
22023SN/A
32023SN/A// Copyright (c) 2007 The Hewlett-Packard Development Company
42023SN/A// All rights reserved.
52023SN/A//
62023SN/A// Redistribution and use of this software in source and binary forms,
72023SN/A// with or without modification, are permitted provided that the
82023SN/A// following conditions are met:
92023SN/A//
102023SN/A// The software must be used only for Non-Commercial Use which means any
112023SN/A// use which is NOT directed to receiving any direct monetary
122023SN/A// compensation for, or commercial advantage from such use.  Illustrative
132023SN/A// examples of non-commercial use are academic research, personal study,
142023SN/A// teaching, education and corporate research & development.
152023SN/A// Illustrative examples of commercial use are distributing products for
162023SN/A// commercial advantage and providing services using the software for
172023SN/A// commercial advantage.
182023SN/A//
192023SN/A// If you wish to use this software or functionality therein that may be
202023SN/A// covered by patents for commercial use, please contact:
212023SN/A//     Director of Intellectual Property Licensing
222023SN/A//     Office of Strategy and Technology
232023SN/A//     Hewlett-Packard Company
242023SN/A//     1501 Page Mill Road
252023SN/A//     Palo Alto, California  94304
262023SN/A//
272665Ssaidi@eecs.umich.edu// Redistributions of source code must retain the above copyright notice,
282665Ssaidi@eecs.umich.edu// this list of conditions and the following disclaimer.  Redistributions
292665Ssaidi@eecs.umich.edu// in binary form must reproduce the above copyright notice, this list of
302023SN/A// conditions and the following disclaimer in the documentation and/or
312023SN/A// other materials provided with the distribution.  Neither the name of
322028SN/A// the COPYRIGHT HOLDER(s), HEWLETT-PACKARD COMPANY, nor the names of its
332028SN/A// contributors may be used to endorse or promote products derived from
342023SN/A// this software without specific prior written permission.  No right of
352597SN/A// sublicense is granted herewith.  Derivatives of the software and
362023SN/A// output created using the software may be prepared, but only for
372023SN/A// Non-Commercial Uses.  Derivatives of the software may be shared with
382239SN/A// others provided: (i) the others agree to abide by the list of
392239SN/A// conditions herein which includes the Non-Commercial Use restrictions;
402028SN/A// and (ii) such Derivatives of the software include the above copyright
412023SN/A// notice to acknowledge the contribution from this software where
422131SN/A// applicable, this list of conditions and the disclaimer below.
432023SN/A//
442131SN/A// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
452023SN/A// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
462525SN/A// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
472525SN/A// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
482447SN/A// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
492023SN/A// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
502972Sgblack@eecs.umich.edu// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
512972Sgblack@eecs.umich.edu// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
522972Sgblack@eecs.umich.edu// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
532972Sgblack@eecs.umich.edu// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
542239SN/A// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
552972Sgblack@eecs.umich.edu//
562972Sgblack@eecs.umich.edu// Authors: Gabe Black
572131SN/A
////////////////////////////////////////////////////////////////////
//
//  Code to "specialize" a microcode sequence to use a particular
//  variety of operands
//
632972Sgblack@eecs.umich.edu
642972Sgblack@eecs.umich.edulet {{
# Build a C++ "switch" statement that chooses between several specialized
# decodings of one instruction.
#
#   name, Name -- handed through unchanged to builder.
#   builder    -- called as builder(name, Name, *todo); it must return a
#                 (header_output, decoder_output, decode_block, exec_output)
#                 tuple.
#   switchVal  -- text placed inside "switch(...)".
#   vals       -- dict mapping each case value to the tuple of extra
#                 arguments that is exploded into builder for that case.
#   default    -- optional tuple of extra builder arguments used to generate
#                 a "default:" case. Nothing is emitted for it when it is
#                 None or otherwise false.
#
# Returns a (header_output, decoder_output, decode_block, exec_output) tuple.
# The header, decoder and exec text of every case is concatenated in the
# order the cases were built, and decode_block is the finished switch.
def doSplitDecode(name, Name, builder, switchVal, vals, default = None):
    header_parts = []
    decoder_parts = []
    exec_parts = []

    # Run builder for one case, stash the three pass-through outputs and
    # hand back the decode text so the caller can wrap it in a case label.
    def build(todo):
        header, decoder, decode, exec_code = builder(name, Name, *todo)
        header_parts.append(header)
        decoder_parts.append(decoder)
        exec_parts.append(exec_code)
        return decode

    decode_parts = ['switch(%s) {\n' % switchVal]
    for val, todo in vals.items():
        decode_parts.append('\tcase %s: %s\n' % (val, build(todo)))
    if default:
        decode_parts.append('\tdefault: %s\n' % build(default))
    decode_parts.append('}\n')

    return (''.join(header_parts),
            ''.join(decoder_parts),
            ''.join(decode_parts),
            ''.join(exec_parts))
942972Sgblack@eecs.umich.edu}};
952597SN/A
962972Sgblack@eecs.umich.edulet {{
# Parsed form of one operand type string.
#
# Two spellings are recognized by the parser regular expression:
#   * one or more capital letters followed by one or more small letters,
#     e.g. "Ev" -> tag "E", size "v";
#   * a small "r" followed by letters/digits, e.g. "rAx" -> reg "Ax".
# Exactly one of the two forms matches, so either reg is set and tag/size
# are None, or tag and size are set and reg is None.
class OpType(object):
    parser = re.compile(r"(?P<tag>[A-Z][A-Z]*)(?P<size>[a-z][a-z]*)|(r(?P<reg>[A-Za-z0-9][A-Za-z0-9]*))")

    # opTypeString is searched (not anchored) for the first operand type it
    # contains. Raises Exception if neither form is found.
    def __init__(self, opTypeString):
        match = OpType.parser.search(opTypeString)
        if match is None:
            # Call-style raise: valid in Python 2 and Python 3 alike.
            raise Exception("Problem parsing operand type %s" % opTypeString)
        self.reg = match.group("reg")
        self.tag = match.group("tag")
        self.size = match.group("size")
1062972Sgblack@eecs.umich.edu}};
1072972Sgblack@eecs.umich.edu
1082972Sgblack@eecs.umich.edulet {{
1092131SN/A
# Specialize a piece of microcode to use a particular set of argument
# types described by "opTypes". The operands are "implemented" in reverse
# order, last one first.
#
#   name, Name -- passed through to assembleMicro / doSplitDecode.
#   code       -- microcode text in which operand N appears as the
#                 placeholder "^N".
#   opTypes    -- sequence of operand type strings understood by OpType.
#                 It is not modified.
#
# Each "^N" placeholder is replaced with text selecting the concrete
# operand. An operand that may be either a register or memory (tags E, Q
# and W) splits the result into a switch on MODRM_MOD built by
# doSplitDecode, with this function called again for each alternative.
#
# Returns whatever assembleMicro (or doSplitDecode, for a split) returns.
# Raises Exception for an operand type that cannot be parsed or whose tag
# is not recognized.
def specializeInst(name, Name, code, opTypes):
    # Work on a private copy. Operands are consumed from the end, and the
    # caller's list must not be emptied (or half emptied) as a side effect.
    pending = list(opTypes)
    while pending:
        # print "Building a composite op with tags", pending
        # print "And code", code
        opNum = len(pending) - 1
        # A regular expression to find the operand placeholder we're
        # interested in. The lookahead stops "^1" from matching the front
        # of "^10".
        opRe = re.compile(r"\^(?P<operandNum>%d)(?=[^0-9]|$)" % opNum)

        # Parse the operand type string we're working with, removing it
        # from the list of operands still to be handled.
        opType = OpType(pending.pop())

        if opType.reg:
            # Figure out what to do with fixed register operands
            if opType.reg in ("Ax", "Bx", "Cx", "Dx"):
                code = opRe.sub("%%{INTREG_R%s}" % opType.reg.upper(), code)
            elif opType.reg == "Al":
                # We need a way to specify register width
                code = opRe.sub("%{INTREG_RAX}", code)
            else:
                # Best effort: report it and leave the placeholder alone.
                print("Didn't know how to encode fixed register %s!" % opType.reg)
        elif opType.tag is None or opType.size is None:
            raise Exception("Problem parsing operand tag: %s" % opType.tag)
        elif opType.tag in ("C", "D", "G", "P", "S", "T", "V"):
            # Use the "reg" field of the ModRM byte to select the register
            code = opRe.sub("%{(uint8_t)MODRM_REG}", code)
        elif opType.tag in ("E", "Q", "W"):
            # This might refer to memory or to a register. We need to
            # divide it up farther.
            regCode = opRe.sub("%{(uint8_t)MODRM_RM}", code)
            # This needs to refer to memory, but we'll fill in the details
            # later. It needs to take into account unaligned memory
            # addresses.
            memCode = opRe.sub("%0", code)
            # MODRM_MOD == 3 gets the register form, anything else the
            # memory form. Each alternative gets its own list of the
            # operands that still have to be specialized.
            return doSplitDecode(name, Name, specializeInst, "MODRM_MOD",
                {"3" : (regCode, list(pending))}, (memCode, list(pending)))
        elif opType.tag in ("I", "J"):
            # Immediates are already in the instruction, so don't leave in
            # those parameters
            code = opRe.sub("${IMMEDIATE}", code)
        elif opType.tag == "M":
            # This needs to refer to memory, but we'll fill in the details
            # later. It needs to take into account unaligned memory
            # addresses.
            code = opRe.sub("%0", code)
        elif opType.tag in ("PR", "R", "VR"):
            # There should probably be a check here to verify that mod
            # is equal to 11b
            code = opRe.sub("%{(uint8_t)MODRM_RM}", code)
        else:
            raise Exception("Unrecognized tag %s." % opType.tag)

    # At this point, we've built up "code" to have all the necessary extra
    # instructions needed to implement whatever types of operands were
    # specified. Now we'll assemble it into a StaticInst.
    return assembleMicro(name, Name, code)
175}};
176
////////////////////////////////////////////////////////////////////
//
//  The microcode assembler
//
181
182let {{
# Names of the operand kinds. Microops use these when they are set up so
# that their base class template is specialized properly.
ImmOpType = "ImmediateOperand"
RegOpType = "RegisterOperand"
187}};
188
189let {{
# One parsed statement of microcode assembly.
#
#   className -- name of the microop class to instantiate.
#   label     -- label attached to the statement, or '' if there is none.
#   args      -- list of dicts, one per operand. Each dict maps a
#                representation name ("operandImm", "operandReg",
#                "operandLabel") to that operand's value.
class MicroOpStatement(object):
    def __init__(self):
        self.className = ''
        self.label = ''
        self.args = []

    # This converts a list of python bools into a comma separated list of
    # C++ bools. Every entry, including the first, is preceded by ", " so
    # the result can be appended directly to an existing argument list.
    def microFlagsText(self, vals):
        flagText = {True: ", true", False: ", false"}
        return "".join([flagText[bool(val)] for val in vals])

    # Build the C++ "new" expression which allocates this microop.
    #
    # microFlags are python bools which are passed to the constructor as
    # C++ bools right after machInst. Each operand contributes one template
    # argument (ImmOpType or RegOpType) and one constructor argument. An
    # operand which has an "operandImm" form is treated as an immediate
    # even if it carries other forms as well.
    #
    # Raises Exception for an operand which is only a label, or which has
    # none of the known forms.
    def getAllocator(self, *microFlags):
        args = ''
        kinds = []
        for arg in self.args:
            if "operandImm" in arg:
                args += ", %s" % arg["operandImm"]
                kinds.append(ImmOpType)
            elif "operandReg" in arg:
                args += ", %s" % arg["operandReg"]
                kinds.append(RegOpType)
            elif "operandLabel" in arg:
                raise Exception("Found a label while creating allocator string.")
            else:
                raise Exception("Unrecognized operand type.")
        signature = "<%s>" % ", ".join(kinds)
        return 'new %s%s(machInst%s%s)' % (self.className, signature, self.microFlagsText(microFlags), args)
227}};
228
229let{{
# Assemble a block of microcode assembly.
#
#   name, Name -- passed through to genMacroOp.
#   code       -- the microcode text, one statement per line. Empty and
#                 whitespace-only lines are ignored.
#
# Each statement has the form
#     [label :] className [operand ...]
# and is parsed into a MicroOpStatement. Operands which name a label are
# then given an "operandImm" form holding the displacement to that label.
#
# If the code is exactly one statement the result is
# ('', '', 'return <allocator>;', ''). Otherwise the statements are handed
# to genMacroOp and its result is returned.
#
# Raises Exception if a statement has no class name or refers to a label
# that no statement defines.
def assembleMicro(name, Name, code):

    # Regular expressions to pull each piece of the statement out at a
    # time. Each expression expects the thing it's looking for to be at
    # the beginning of the line, so the previous component is stripped
    # before continuing.
    # NOTE(review): this requires exactly one space or tab between the
    # label and the ':', so "top:" is not recognized as a label -- confirm
    # that is intended.
    labelRe = re.compile(r'^[ \t]*(?P<label>\w\w*)[ \t]:')
    classRe = re.compile(r'^[ \t]*(?P<className>[a-zA-Z_]\w*)')
    # This recognizes three different flavors of operands, each either as
    # a bare word or as arbitrary text wrapped in "{" ... "}" (which
    # continues until the first "}"):
    # 1. A label, introduced by "@"
    # 2. A register, introduced by "%"
    # 3. An immediate, introduced by "$"
    opRe = re.compile(
        r'^[ \t]*((\@(?P<operandLabel0>\w\w*))|' +
                r'(\@\{(?P<operandLabel1>[^}]*)\})|' +
                r'(\%(?P<operandReg0>\w\w*))|' +
                r'(\%\{(?P<operandReg1>[^}]*)\})|' +
                r'(\$(?P<operandImm0>\w\w*))|' +
                r'(\$\{(?P<operandImm1>[^}]*)\}))')
    # The trailing digit only tells the bare and braced spellings apart;
    # it is dropped to get the key used in the operand's dict.
    operandGroups = ("operandLabel0", "operandReg0", "operandImm0",
                     "operandLabel1", "operandReg1", "operandImm1")

    # A list of the statements we've found thus far
    statements = []

    # Walk the code a line at a time. (The previous "^...$" line pattern
    # was compiled without re.MULTILINE and so could only ever match code
    # consisting of a single line.)
    for orig_line in code.split('\n'):
        if not orig_line.strip():
            continue
        line = orig_line
        statement = MicroOpStatement()
        # print "Parsing line %s" % line

        # Find the label, if any, and clear it from the statement
        labelMatch = labelRe.search(line)
        if labelMatch is not None:
            statement.label = labelMatch.group("label")
            # print "Found label %s." % statement.label
            line = line[labelMatch.end():]

        # Find the class name which is roughly equivalent to the op name
        classMatch = classRe.search(line)
        if classMatch is None:
            raise Exception("Couldn't find class name in statement: %s"
                    % orig_line)
        statement.className = classMatch.group("className")
        # print "Found class name %s." % statement.className

        # Clear the class name from the statement
        line = line[classMatch.end():]

        # Find as many arguments as you can
        statement.args = []
        opMatch = opRe.search(line)
        while opMatch is not None:
            # args is a list of dicts which collect different
            # representations of operand values. Different forms might be
            # needed in different places, for instance to replace a label
            # with an offset.
            arg = {}
            for group in operandGroups:
                value = opMatch.group(group)
                if value:
                    arg[group[:-1]] = value
            if not arg:
                # Something like an empty "%{}" matched but carried no text.
                print("Problem parsing operand in statement: %s"
                        % orig_line)
            statement.args.append(arg)
            # print "Found operand %s." % statement.args[-1]
            # The pattern is anchored, so the match is a prefix of line.
            line = line[opMatch.end():]
            opMatch = opRe.search(line)
        # print "Found operands", statement.args

        # Add this statement to our collection
        statements.append(statement)

    # Decode the labels into displacements

    # First record the micropc of every labelled statement...
    labels = {}
    for micropc, statement in enumerate(statements):
        if statement.label:
            labels[statement.label] = micropc
    # ...then turn each label operand into an immediate displacement.
    for micropc, statement in enumerate(statements):
        for arg in statement.args:
            if "operandLabel" in arg:
                target = arg["operandLabel"]
                if target not in labels:
                    raise Exception("Unrecognized label: %s." % target)
                # This is assuming that intra microcode branches go to
                # the next micropc + displacement, or
                # micropc + 1 + displacement.
                arg["operandImm"] = labels[target] - micropc - 1

    # If we can implement this instruction with exactly one microop, just
    # use that directly.
    if len(statements) == 1:
        decode_block = "return %s;" % statements[0].getAllocator()
        return ('', '', decode_block, '')

    # Build a macroop to contain the sequence of microops we've
    # been given.
    return genMacroOp(name, Name, statements)
347}};
348