specialize.isa revision 7087
14348Sgblack@eecs.umich.edu// -*- mode:c++ -*- 24348Sgblack@eecs.umich.edu 34348Sgblack@eecs.umich.edu// Copyright (c) 2007 The Hewlett-Packard Development Company 44348Sgblack@eecs.umich.edu// All rights reserved. 54348Sgblack@eecs.umich.edu// 67087Snate@binkert.org// The license below extends only to copyright in the software and shall 77087Snate@binkert.org// not be construed as granting a license to any other intellectual 87087Snate@binkert.org// property including but not limited to intellectual property relating 97087Snate@binkert.org// to a hardware implementation of the functionality of the software 107087Snate@binkert.org// licensed hereunder. You may use the software subject to the license 117087Snate@binkert.org// terms below provided that you ensure that this notice is replicated 127087Snate@binkert.org// unmodified and in its entirety in all distributions of the software, 137087Snate@binkert.org// modified or unmodified, in source code or in binary form. 144348Sgblack@eecs.umich.edu// 157087Snate@binkert.org// Redistribution and use in source and binary forms, with or without 167087Snate@binkert.org// modification, are permitted provided that the following conditions are 177087Snate@binkert.org// met: redistributions of source code must retain the above copyright 187087Snate@binkert.org// notice, this list of conditions and the following disclaimer; 197087Snate@binkert.org// redistributions in binary form must reproduce the above copyright 207087Snate@binkert.org// notice, this list of conditions and the following disclaimer in the 217087Snate@binkert.org// documentation and/or other materials provided with the distribution; 227087Snate@binkert.org// neither the name of the copyright holders nor the names of its 234348Sgblack@eecs.umich.edu// contributors may be used to endorse or promote products derived from 247087Snate@binkert.org// this software without specific prior written permission. 254348Sgblack@eecs.umich.edu// 264348Sgblack@eecs.umich.edu// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 274348Sgblack@eecs.umich.edu// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 284348Sgblack@eecs.umich.edu// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 294348Sgblack@eecs.umich.edu// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 304348Sgblack@eecs.umich.edu// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 314348Sgblack@eecs.umich.edu// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 324348Sgblack@eecs.umich.edu// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 334348Sgblack@eecs.umich.edu// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 344348Sgblack@eecs.umich.edu// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 354348Sgblack@eecs.umich.edu// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 364348Sgblack@eecs.umich.edu// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 374348Sgblack@eecs.umich.edu// 384348Sgblack@eecs.umich.edu// Authors: Gabe Black 394348Sgblack@eecs.umich.edu 404348Sgblack@eecs.umich.edu//////////////////////////////////////////////////////////////////// 414348Sgblack@eecs.umich.edu// 424348Sgblack@eecs.umich.edu// Code to "specialize" a microcode sequence to use a particular 434348Sgblack@eecs.umich.edu// variety of operands 444348Sgblack@eecs.umich.edu// 454348Sgblack@eecs.umich.edu 464348Sgblack@eecs.umich.edulet {{ 474348Sgblack@eecs.umich.edu # This code builds up a decode block which decodes based on switchval. 484348Sgblack@eecs.umich.edu # vals is a dict which matches case values with what should be decoded to. 494609Sgblack@eecs.umich.edu # Each element of the dict is a list containing a function and then the 504609Sgblack@eecs.umich.edu # arguments to pass to it. 514609Sgblack@eecs.umich.edu def doSplitDecode(switchVal, vals, default = None): 524542Sgblack@eecs.umich.edu blocks = OutputBlocks() 534542Sgblack@eecs.umich.edu blocks.decode_block = 'switch(%s) {\n' % switchVal 544348Sgblack@eecs.umich.edu for (val, todo) in vals.items(): 554609Sgblack@eecs.umich.edu new_blocks = todo[0](*todo[1:]) 564542Sgblack@eecs.umich.edu new_blocks.decode_block = \ 574542Sgblack@eecs.umich.edu '\tcase %s: %s\n' % (val, new_blocks.decode_block) 584542Sgblack@eecs.umich.edu blocks.append(new_blocks) 594348Sgblack@eecs.umich.edu if default: 604609Sgblack@eecs.umich.edu new_blocks = default[0](*default[1:]) 614542Sgblack@eecs.umich.edu new_blocks.decode_block = \ 624542Sgblack@eecs.umich.edu '\tdefault: %s\n' % new_blocks.decode_block 634542Sgblack@eecs.umich.edu blocks.append(new_blocks) 644542Sgblack@eecs.umich.edu blocks.decode_block += '}\n' 654542Sgblack@eecs.umich.edu return blocks 664348Sgblack@eecs.umich.edu}}; 674348Sgblack@eecs.umich.edu 684348Sgblack@eecs.umich.edulet {{ 694609Sgblack@eecs.umich.edu def doRipRelativeDecode(Name, opTypes, env): 704609Sgblack@eecs.umich.edu # print "RIPing %s with opTypes %s" % (Name, opTypes) 715788Sgblack@eecs.umich.edu env.memoryInst = True 725788Sgblack@eecs.umich.edu normEnv = copy.copy(env) 735788Sgblack@eecs.umich.edu normEnv.addToDisassembly( 745788Sgblack@eecs.umich.edu '''printMem(out, env.seg, env.scale, env.index, env.base, 755788Sgblack@eecs.umich.edu machInst.displacement, env.addressSize, false);''') 765788Sgblack@eecs.umich.edu normBlocks = specializeInst(Name + "_M", copy.copy(opTypes), normEnv) 775788Sgblack@eecs.umich.edu ripEnv = copy.copy(env) 785788Sgblack@eecs.umich.edu ripEnv.addToDisassembly( 795788Sgblack@eecs.umich.edu '''printMem(out, env.seg, 1, 0, 0, 805788Sgblack@eecs.umich.edu machInst.displacement, env.addressSize, true);''') 815788Sgblack@eecs.umich.edu ripBlocks = specializeInst(Name + "_P", copy.copy(opTypes), ripEnv) 824609Sgblack@eecs.umich.edu 834609Sgblack@eecs.umich.edu blocks = OutputBlocks() 844609Sgblack@eecs.umich.edu blocks.append(normBlocks) 854609Sgblack@eecs.umich.edu blocks.append(ripBlocks) 864609Sgblack@eecs.umich.edu 874609Sgblack@eecs.umich.edu blocks.decode_block = ''' 884609Sgblack@eecs.umich.edu if(machInst.modRM.mod == 0 && 894609Sgblack@eecs.umich.edu machInst.modRM.rm == 5 && 904609Sgblack@eecs.umich.edu machInst.mode.submode == SixtyFourBitMode) 914609Sgblack@eecs.umich.edu { %s } 924609Sgblack@eecs.umich.edu else 934609Sgblack@eecs.umich.edu { %s }''' % \ 944609Sgblack@eecs.umich.edu (ripBlocks.decode_block, normBlocks.decode_block) 954609Sgblack@eecs.umich.edu return blocks 964609Sgblack@eecs.umich.edu}}; 974609Sgblack@eecs.umich.edu 984609Sgblack@eecs.umich.edulet {{ 994348Sgblack@eecs.umich.edu class OpType(object): 1004601Sgblack@eecs.umich.edu parser = re.compile(r"(?P<tag>[A-Z]+)(?P<size>[a-z]*)|(r(?P<reg>[A-Z0-9]+)(?P<rsize>[a-z]*))") 1014348Sgblack@eecs.umich.edu def __init__(self, opTypeString): 1024348Sgblack@eecs.umich.edu match = OpType.parser.search(opTypeString) 1034348Sgblack@eecs.umich.edu if match == None: 1044348Sgblack@eecs.umich.edu raise Exception, "Problem parsing operand type %s" % opTypeString 1054348Sgblack@eecs.umich.edu self.reg = match.group("reg") 1064348Sgblack@eecs.umich.edu self.tag = match.group("tag") 1074348Sgblack@eecs.umich.edu self.size = match.group("size") 1084746Sgblack@eecs.umich.edu if not self.size: 1094746Sgblack@eecs.umich.edu self.size = match.group("rsize") 1104348Sgblack@eecs.umich.edu 1114548Sgblack@eecs.umich.edu ModRMRegIndex = "(MODRM_REG | (REX_R << 3))" 1124548Sgblack@eecs.umich.edu ModRMRMIndex = "(MODRM_RM | (REX_B << 3))" 1134716Sgblack@eecs.umich.edu InstRegIndex = "(OPCODE_OP_BOTTOM3 | (REX_B << 3))" 1144548Sgblack@eecs.umich.edu 1154348Sgblack@eecs.umich.edu # This function specializes the given piece of code to use a particular 1164528Sgblack@eecs.umich.edu # set of argument types described by "opTypes". 1174528Sgblack@eecs.umich.edu def specializeInst(Name, opTypes, env): 1184568Sgblack@eecs.umich.edu # print "Specializing %s with opTypes %s" % (Name, opTypes) 1194348Sgblack@eecs.umich.edu while len(opTypes): 1204528Sgblack@eecs.umich.edu # Parse the operand type string we're working with 1214542Sgblack@eecs.umich.edu opType = OpType(opTypes[0]) 1224601Sgblack@eecs.umich.edu opTypes.pop(0) 1234348Sgblack@eecs.umich.edu 1246519Sgblack@eecs.umich.edu if opType.tag not in ("I", "J", "P", "PR", "Q", "V", "VR", "W"): 1254746Sgblack@eecs.umich.edu if opType.size: 1264746Sgblack@eecs.umich.edu env.setSize(opType.size) 1274746Sgblack@eecs.umich.edu 1284348Sgblack@eecs.umich.edu if opType.reg: 1294348Sgblack@eecs.umich.edu #Figure out what to do with fixed register operands 1304528Sgblack@eecs.umich.edu #This is the index to use, so we should stick it some place. 1314542Sgblack@eecs.umich.edu if opType.reg in ("A", "B", "C", "D"): 1325788Sgblack@eecs.umich.edu regString = "INTREG_R%sX" % opType.reg 1334542Sgblack@eecs.umich.edu else: 1345788Sgblack@eecs.umich.edu regString = "INTREG_R%s" % opType.reg 1355788Sgblack@eecs.umich.edu env.addReg(regString) 1365788Sgblack@eecs.umich.edu env.addToDisassembly( 1375788Sgblack@eecs.umich.edu "printReg(out, %s, regSize);\n" % regString) 1384575Sgblack@eecs.umich.edu Name += "_R" 1394716Sgblack@eecs.umich.edu elif opType.tag == "B": 1404716Sgblack@eecs.umich.edu # This refers to registers whose index is encoded as part of the opcode 1415788Sgblack@eecs.umich.edu env.addToDisassembly( 1425788Sgblack@eecs.umich.edu "printReg(out, %s, regSize);\n" % InstRegIndex) 1434716Sgblack@eecs.umich.edu Name += "_R" 1444716Sgblack@eecs.umich.edu env.addReg(InstRegIndex) 1454601Sgblack@eecs.umich.edu elif opType.tag == "M": 1464601Sgblack@eecs.umich.edu # This refers to memory. The macroop constructor sets up modrm 1474601Sgblack@eecs.umich.edu # addressing. Non memory modrm settings should cause an error. 1484601Sgblack@eecs.umich.edu env.doModRM = True 1494817Sgblack@eecs.umich.edu return doRipRelativeDecode(Name, opTypes, env) 1504348Sgblack@eecs.umich.edu elif opType.tag == None or opType.size == None: 1514348Sgblack@eecs.umich.edu raise Exception, "Problem parsing operand tag: %s" % opType.tag 1525241Sgblack@eecs.umich.edu elif opType.tag == "C": 1535294Sgblack@eecs.umich.edu # A control register indexed by the "reg" field 1545241Sgblack@eecs.umich.edu env.addReg(ModRMRegIndex) 1555788Sgblack@eecs.umich.edu env.addToDisassembly( 1565788Sgblack@eecs.umich.edu "ccprintf(out, \"CR%%d\", %s);\n" % ModRMRegIndex) 1575241Sgblack@eecs.umich.edu Name += "_C" 1585241Sgblack@eecs.umich.edu elif opType.tag == "D": 1595294Sgblack@eecs.umich.edu # A debug register indexed by the "reg" field 1605241Sgblack@eecs.umich.edu env.addReg(ModRMRegIndex) 1615788Sgblack@eecs.umich.edu env.addToDisassembly( 1625788Sgblack@eecs.umich.edu "ccprintf(out, \"DR%%d\", %s);\n" % ModRMRegIndex) 1635241Sgblack@eecs.umich.edu Name += "_D" 1645294Sgblack@eecs.umich.edu elif opType.tag == "S": 1655294Sgblack@eecs.umich.edu # A segment selector register indexed by the "reg" field 1665294Sgblack@eecs.umich.edu env.addReg(ModRMRegIndex) 1675788Sgblack@eecs.umich.edu env.addToDisassembly( 1685788Sgblack@eecs.umich.edu "printSegment(out, %s);\n" % ModRMRegIndex) 1695294Sgblack@eecs.umich.edu Name += "_S" 1705294Sgblack@eecs.umich.edu elif opType.tag in ("G", "P", "T", "V"): 1714348Sgblack@eecs.umich.edu # Use the "reg" field of the ModRM byte to select the register 1724548Sgblack@eecs.umich.edu env.addReg(ModRMRegIndex) 1735788Sgblack@eecs.umich.edu env.addToDisassembly( 1745788Sgblack@eecs.umich.edu "printReg(out, %s, regSize);\n" % ModRMRegIndex) 1756518Sgblack@eecs.umich.edu if opType.tag == "P": 1766518Sgblack@eecs.umich.edu Name += "_MMX" 1776518Sgblack@eecs.umich.edu elif opType.tag == "V": 1786518Sgblack@eecs.umich.edu Name += "_XMM" 1796518Sgblack@eecs.umich.edu else: 1806518Sgblack@eecs.umich.edu Name += "_R" 1814348Sgblack@eecs.umich.edu elif opType.tag in ("E", "Q", "W"): 1824348Sgblack@eecs.umich.edu # This might refer to memory or to a register. We need to 1834348Sgblack@eecs.umich.edu # divide it up farther. 1844528Sgblack@eecs.umich.edu regEnv = copy.copy(env) 1854548Sgblack@eecs.umich.edu regEnv.addReg(ModRMRMIndex) 1865788Sgblack@eecs.umich.edu regEnv.addToDisassembly( 1875788Sgblack@eecs.umich.edu "printReg(out, %s, regSize);\n" % ModRMRMIndex) 1884601Sgblack@eecs.umich.edu # This refers to memory. The macroop constructor should set up 1894601Sgblack@eecs.umich.edu # modrm addressing. 1904528Sgblack@eecs.umich.edu memEnv = copy.copy(env) 1914601Sgblack@eecs.umich.edu memEnv.doModRM = True 1926518Sgblack@eecs.umich.edu regSuffix = "_R" 1936518Sgblack@eecs.umich.edu if opType.tag == "Q": 1946518Sgblack@eecs.umich.edu regSuffix = "_MMX" 1956518Sgblack@eecs.umich.edu elif opType.tag == "W": 1966518Sgblack@eecs.umich.edu regSuffix = "_XMM" 1974609Sgblack@eecs.umich.edu return doSplitDecode("MODRM_MOD", 1986518Sgblack@eecs.umich.edu {"3" : (specializeInst, Name + regSuffix, 1996518Sgblack@eecs.umich.edu copy.copy(opTypes), regEnv)}, 2006518Sgblack@eecs.umich.edu (doRipRelativeDecode, Name, 2016518Sgblack@eecs.umich.edu copy.copy(opTypes), memEnv)) 2024348Sgblack@eecs.umich.edu elif opType.tag in ("I", "J"): 2034532Sgblack@eecs.umich.edu # Immediates 2045788Sgblack@eecs.umich.edu env.addToDisassembly( 2055788Sgblack@eecs.umich.edu "ccprintf(out, \"%#x\", machInst.immediate);\n") 2064575Sgblack@eecs.umich.edu Name += "_I" 2075151Sgblack@eecs.umich.edu elif opType.tag == "O": 2085151Sgblack@eecs.umich.edu # Immediate containing a memory offset 2095151Sgblack@eecs.umich.edu Name += "_MI" 2104348Sgblack@eecs.umich.edu elif opType.tag in ("PR", "R", "VR"): 2114601Sgblack@eecs.umich.edu # Non register modrm settings should cause an error 2124548Sgblack@eecs.umich.edu env.addReg(ModRMRMIndex) 2135788Sgblack@eecs.umich.edu env.addToDisassembly( 2145788Sgblack@eecs.umich.edu "printReg(out, %s, regSize);\n" % ModRMRMIndex) 2156518Sgblack@eecs.umich.edu if opType.tag == "PR": 2166518Sgblack@eecs.umich.edu Name += "_MMX" 2176518Sgblack@eecs.umich.edu elif opType.tag == "VR": 2186518Sgblack@eecs.umich.edu Name += "_XMM" 2196518Sgblack@eecs.umich.edu else: 2206518Sgblack@eecs.umich.edu Name += "_R" 2214868Sgblack@eecs.umich.edu elif opType.tag in ("X", "Y"): 2224868Sgblack@eecs.umich.edu # This type of memory addressing is for string instructions. 2234868Sgblack@eecs.umich.edu # They'll use the right index and segment internally. 2245788Sgblack@eecs.umich.edu if opType.tag == "X": 2255788Sgblack@eecs.umich.edu env.addToDisassembly( 2265788Sgblack@eecs.umich.edu '''printMem(out, env.seg, 2275788Sgblack@eecs.umich.edu 1, X86ISA::ZeroReg, X86ISA::INTREG_RSI, 0, 2285788Sgblack@eecs.umich.edu env.addressSize, false);''') 2295788Sgblack@eecs.umich.edu else: 2305788Sgblack@eecs.umich.edu env.addToDisassembly( 2315788Sgblack@eecs.umich.edu '''printMem(out, SEGMENT_REG_ES, 2325788Sgblack@eecs.umich.edu 1, X86ISA::ZeroReg, X86ISA::INTREG_RDI, 0, 2335788Sgblack@eecs.umich.edu env.addressSize, false);''') 2344868Sgblack@eecs.umich.edu Name += "_M" 2354348Sgblack@eecs.umich.edu else: 2364348Sgblack@eecs.umich.edu raise Exception, "Unrecognized tag %s." % opType.tag 2374348Sgblack@eecs.umich.edu 2384532Sgblack@eecs.umich.edu # Generate code to return a macroop of the given name which will 2394559Sgblack@eecs.umich.edu # operate in the "emulation environment" env 2404528Sgblack@eecs.umich.edu return genMacroop(Name, env) 2414348Sgblack@eecs.umich.edu}}; 242