microasm.isa revision 4344:174e31456abe
// -*- mode:c++ -*-

// Copyright (c) 2007 The Hewlett-Packard Development Company
// All rights reserved.
//
// Redistribution and use of this software in source and binary forms,
// with or without modification, are permitted provided that the
// following conditions are met:
//
// The software must be used only for Non-Commercial Use which means any
// use which is NOT directed to receiving any direct monetary
// compensation for, or commercial advantage from such use. Illustrative
// examples of non-commercial use are academic research, personal study,
// teaching, education and corporate research & development.
// Illustrative examples of commercial use are distributing products for
// commercial advantage and providing services using the software for
// commercial advantage.
//
// If you wish to use this software or functionality therein that may be
// covered by patents for commercial use, please contact:
// Director of Intellectual Property Licensing
// Office of Strategy and Technology
// Hewlett-Packard Company
// 1501 Page Mill Road
// Palo Alto, California 94304
//
// Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer. Redistributions
// in binary form must reproduce the above copyright notice, this list of
// conditions and the following disclaimer in the documentation and/or
// other materials provided with the distribution. Neither the name of
// the COPYRIGHT HOLDER(s), HEWLETT-PACKARD COMPANY, nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission. No right of
// sublicense is granted herewith. Derivatives of the software and
// output created using the software may be prepared, but only for
// Non-Commercial Uses. Derivatives of the software may be shared with
// others provided: (i) the others agree to abide by the list of
// conditions herein which includes the Non-Commercial Use restrictions;
// and (ii) such Derivatives of the software include the above copyright
// notice to acknowledge the contribution from this software where
// applicable, this list of conditions and the disclaimer below.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
552972Sgblack@eecs.umich.edu// 562972Sgblack@eecs.umich.edu// Authors: Gabe Black 572131SN/A 582972Sgblack@eecs.umich.edu//////////////////////////////////////////////////////////////////// 592972Sgblack@eecs.umich.edu// 602972Sgblack@eecs.umich.edu// Code to "specialize" a microcode sequence to use a particular 612972Sgblack@eecs.umich.edu// variety of operands 622972Sgblack@eecs.umich.edu// 632972Sgblack@eecs.umich.edu 642972Sgblack@eecs.umich.edulet {{ 652131SN/A # This code builds up a decode block which decodes based on switchval. 662972Sgblack@eecs.umich.edu # vals is a dict which matches case values with what should be decoded to. 672972Sgblack@eecs.umich.edu # builder is called on the exploded contents of "vals" values to generate 682972Sgblack@eecs.umich.edu # whatever code should be used. 692131SN/A def doSplitDecode(name, Name, builder, switchVal, vals, default = None): 702972Sgblack@eecs.umich.edu header_output = '' 712972Sgblack@eecs.umich.edu decoder_output = '' 722597SN/A decode_block = 'switch(%s) {\n' % switchVal 732972Sgblack@eecs.umich.edu exec_output = '' 742597SN/A for (val, todo) in vals.items(): 752972Sgblack@eecs.umich.edu (new_header_output, 762972Sgblack@eecs.umich.edu new_decoder_output, 772972Sgblack@eecs.umich.edu new_decode_block, 782597SN/A new_exec_output) = builder(name, Name, *todo) 792972Sgblack@eecs.umich.edu header_output += new_header_output 802972Sgblack@eecs.umich.edu decoder_output += new_decoder_output 812972Sgblack@eecs.umich.edu decode_block += '\tcase %s: %s\n' % (val, new_decode_block) 822972Sgblack@eecs.umich.edu exec_output += new_exec_output 832972Sgblack@eecs.umich.edu if default: 842972Sgblack@eecs.umich.edu (new_header_output, 852972Sgblack@eecs.umich.edu new_decoder_output, 862972Sgblack@eecs.umich.edu new_decode_block, 872972Sgblack@eecs.umich.edu new_exec_output) = builder(name, Name, *default) 882972Sgblack@eecs.umich.edu header_output += new_header_output 892972Sgblack@eecs.umich.edu decoder_output += 
new_decoder_output 902972Sgblack@eecs.umich.edu decode_block += '\tdefault: %s\n' % new_decode_block 912972Sgblack@eecs.umich.edu exec_output += new_exec_output 922972Sgblack@eecs.umich.edu decode_block += '}\n' 932972Sgblack@eecs.umich.edu return (header_output, decoder_output, decode_block, exec_output) 942972Sgblack@eecs.umich.edu}}; 952597SN/A 962972Sgblack@eecs.umich.edulet {{ 972972Sgblack@eecs.umich.edu class OpType(object): 982972Sgblack@eecs.umich.edu parser = re.compile(r"(?P<tag>[A-Z][A-Z]*)(?P<size>[a-z][a-z]*)|(r(?P<reg>[A-Za-z0-9][A-Za-z0-9]*))") 992131SN/A def __init__(self, opTypeString): 1002972Sgblack@eecs.umich.edu match = OpType.parser.search(opTypeString) 1012972Sgblack@eecs.umich.edu if match == None: 1022131SN/A raise Exception, "Problem parsing operand type %s" % opTypeString 1032972Sgblack@eecs.umich.edu self.reg = match.group("reg") 1042131SN/A self.tag = match.group("tag") 1052972Sgblack@eecs.umich.edu self.size = match.group("size") 1062972Sgblack@eecs.umich.edu}}; 1072972Sgblack@eecs.umich.edu 1082972Sgblack@eecs.umich.edulet {{ 1092131SN/A 1102972Sgblack@eecs.umich.edu # This function specializes the given piece of code to use a particular 1112972Sgblack@eecs.umich.edu # set of argument types described by "opTypes". These are "implemented" 1122972Sgblack@eecs.umich.edu # in reverse order. 1132131SN/A def specializeInst(name, Name, code, opTypes): 1142972Sgblack@eecs.umich.edu opNum = len(opTypes) - 1 1152972Sgblack@eecs.umich.edu while len(opTypes): 1162131SN/A # print "Building a composite op with tags", opTypes 1172023SN/A # print "And code", code 1182023SN/A opNum = len(opTypes) - 1 1192447SN/A # A regular expression to find the operand placeholders we're 1202447SN/A # interested in. 
1212028SN/A opRe = re.compile("\\^(?P<operandNum>%d)(?=[^0-9]|$)" % opNum) 122 123 # Parse the operand type strign we're working with 124 opType = OpType(opTypes[opNum]) 125 126 if opType.reg: 127 #Figure out what to do with fixed register operands 128 if opType.reg in ("Ax", "Bx", "Cx", "Dx"): 129 code = opRe.sub("%%{INTREG_R%s}" % opType.reg.upper(), code) 130 elif opType.reg == "Al": 131 # We need a way to specify register width 132 code = opRe.sub("%{INTREG_RAX}", code) 133 else: 134 print "Didn't know how to encode fixed register %s!" % opType.reg 135 elif opType.tag == None or opType.size == None: 136 raise Exception, "Problem parsing operand tag: %s" % opType.tag 137 elif opType.tag in ("C", "D", "G", "P", "S", "T", "V"): 138 # Use the "reg" field of the ModRM byte to select the register 139 code = opRe.sub("%{(uint8_t)MODRM_REG}", code) 140 elif opType.tag in ("E", "Q", "W"): 141 # This might refer to memory or to a register. We need to 142 # divide it up farther. 143 regCode = opRe.sub("%{(uint8_t)MODRM_RM}", code) 144 regTypes = copy.copy(opTypes) 145 regTypes.pop(-1) 146 # This needs to refer to memory, but we'll fill in the details 147 # later. It needs to take into account unaligned memory 148 # addresses. 149 memCode = opRe.sub("%0", code) 150 memTypes = copy.copy(opTypes) 151 memTypes.pop(-1) 152 return doSplitDecode(name, Name, specializeInst, "MODRM_MOD", 153 {"3" : (regCode, regTypes)}, (memCode, memTypes)) 154 elif opType.tag in ("I", "J"): 155 # Immediates are already in the instruction, so don't leave in 156 # those parameters 157 code = opRe.sub("${IMMEDIATE}", code) 158 elif opType.tag == "M": 159 # This needs to refer to memory, but we'll fill in the details 160 # later. It needs to take into account unaligned memory 161 # addresses. 
162 code = opRe.sub("%0", code) 163 elif opType.tag in ("PR", "R", "VR"): 164 # There should probably be a check here to verify that mod 165 # is equal to 11b 166 code = opRe.sub("%{(uint8_t)MODRM_RM}", code) 167 else: 168 raise Exception, "Unrecognized tag %s." % opType.tag 169 opTypes.pop(-1) 170 171 # At this point, we've built up "code" to have all the necessary extra 172 # instructions needed to implement whatever types of operands were 173 # specified. Now we'll assemble it it into a StaticInst. 174 return assembleMicro(name, Name, code) 175}}; 176 177//////////////////////////////////////////////////////////////////// 178// 179// The microcode assembler 180// 181 182let {{ 183 # These are used when setting up microops so that they can specialize their 184 # base class template properly. 185 RegOpType = "RegisterOperand" 186 ImmOpType = "ImmediateOperand" 187}}; 188 189let {{ 190 class MicroOpStatement(object): 191 def __init__(self): 192 self.className = '' 193 self.label = '' 194 self.args = [] 195 196 # This converts a list of python bools into 197 # a comma seperated list of C++ bools. 198 def microFlagsText(self, vals): 199 text = "" 200 for val in vals: 201 if val: 202 text += ", true" 203 else: 204 text += ", false" 205 return text 206 207 def getAllocator(self, *microFlags): 208 args = '' 209 signature = "<" 210 emptySig = True 211 for arg in self.args: 212 if not emptySig: 213 signature += ", " 214 emptySig = False 215 if arg.has_key("operandImm"): 216 args += ", %s" % arg["operandImm"] 217 signature += ImmOpType 218 elif arg.has_key("operandReg"): 219 args += ", %s" % arg["operandReg"] 220 signature += RegOpType 221 elif arg.has_key("operandLabel"): 222 raise Exception, "Found a label while creating allocator string." 223 else: 224 raise Exception, "Unrecognized operand type." 
225 signature += ">" 226 return 'new %s%s(machInst%s%s)' % (self.className, signature, self.microFlagsText(microFlags), args) 227}}; 228 229let{{ 230 def assembleMicro(name, Name, code): 231 232 # This function takes in a block of microcode assembly and returns 233 # a python list of objects which describe it. 234 235 # Keep this around in case we need it later 236 orig_code = code 237 # A list of the statements we've found thus far 238 statements = [] 239 240 # Regular expressions to pull each piece of the statement out at a 241 # time. Each expression expects the thing it's looking for to be at 242 # the beginning of the line, so the previous component is stripped 243 # before continuing. 244 labelRe = re.compile(r'^[ \t]*(?P<label>\w\w*)[ \t]:') 245 lineRe = re.compile(r'^(?P<line>[^\n][^\n]*)$') 246 classRe = re.compile(r'^[ \t]*(?P<className>[a-zA-Z_]\w*)') 247 # This recognizes three different flavors of operands: 248 # 1. Raw decimal numbers composed of digits between 0 and 9 249 # 2. Code beginning with "{" and continuing until the first "}" 250 # ^ This one might need revising 251 # 3. 
A label, which starts with a capital or small letter, or 252 # underscore, which is optionally followed by a sequence of 253 # capital or small letters, underscores, or digts between 0 and 9 254 opRe = re.compile( \ 255 r'^[ \t]*((\@(?P<operandLabel0>\w\w*))|' + 256 r'(\@\{(?P<operandLabel1>[^}]*)\})|' + 257 r'(\%(?P<operandReg0>\w\w*))|' + 258 r'(\%\{(?P<operandReg1>[^}]*)\})|' + 259 r'(\$(?P<operandImm0>\w\w*))|' + 260 r'(\$\{(?P<operandImm1>[^}]*)\}))') 261 lineMatch = lineRe.search(code) 262 while lineMatch != None: 263 statement = MicroOpStatement() 264 # Get a line and seperate it from the rest of the code 265 line = lineMatch.group("line") 266 orig_line = line 267 # print "Parsing line %s" % line 268 code = lineRe.sub('', code, 1) 269 270 # Find the label, if any 271 labelMatch = labelRe.search(line) 272 if labelMatch != None: 273 statement.label = labelMatch.group("label") 274 # print "Found label %s." % statement.label 275 # Clear the label from the statement 276 line = labelRe.sub('', line, 1) 277 278 # Find the class name which is roughly equivalent to the op name 279 classMatch = classRe.search(line) 280 if classMatch == None: 281 raise Exception, "Couldn't find class name in statement: %s" \ 282 % orig_line 283 else: 284 statement.className = classMatch.group("className") 285 # print "Found class name %s." % statement.className 286 287 # Clear the class name from the statement 288 line = classRe.sub('', line, 1) 289 290 #Find as many arguments as you can 291 statement.args = [] 292 opMatch = opRe.search(line) 293 while opMatch is not None: 294 statement.args.append({}) 295 # args is a list of dicts which collect different 296 # representations of operand values. Different forms might be 297 # needed in different places, for instance to replace a label 298 # with an offset. 
299 for opType in ("operandLabel0", "operandReg0", "operandImm0", 300 "operandLabel1", "operandReg1", "operandImm1"): 301 if opMatch.group(opType): 302 statement.args[-1][opType[:-1]] = opMatch.group(opType) 303 if len(statement.args[-1]) == 0: 304 print "Problem parsing operand in statement: %s" \ 305 % orig_line 306 line = opRe.sub('', line, 1) 307 # print "Found operand %s." % statement.args[-1] 308 opMatch = opRe.search(line) 309 # print "Found operands", statement.args 310 311 # Add this statement to our collection 312 statements.append(statement) 313 314 # Get the next line 315 lineMatch = lineRe.search(code) 316 317 # Decode the labels into displacements 318 319 labels = {} 320 micropc = 0 321 for statement in statements: 322 if statement.label: 323 labels[statement.label] = count 324 micropc += 1 325 micropc = 0 326 for statement in statements: 327 for arg in statement.args: 328 if arg.has_key("operandLabel"): 329 if not labels.has_key(arg["operandLabel"]): 330 raise Exception, "Unrecognized label: %s." % arg["operandLabel"] 331 # This is assuming that intra microcode branches go to 332 # the next micropc + displacement, or 333 # micropc + 1 + displacement. 334 arg["operandImm"] = labels[arg["operandLabel"]] - micropc - 1 335 micropc += 1 336 337 # If we can implement this instruction with exactly one microop, just 338 # use that directly. 339 if len(statements) == 1: 340 decode_block = "return %s;" % \ 341 statements[0].getAllocator() 342 return ('', '', decode_block, '') 343 else: 344 # Build a macroop to contain the sequence of microops we've 345 # been given. 346 return genMacroOp(name, Name, statements) 347}}; 348