mediaop.isa revision 7620
16516Sgblack@eecs.umich.edu/// Copyright (c) 2009 The Regents of The University of Michigan
26516Sgblack@eecs.umich.edu// All rights reserved.
36516Sgblack@eecs.umich.edu//
46516Sgblack@eecs.umich.edu// Redistribution and use in source and binary forms, with or without
56516Sgblack@eecs.umich.edu// modification, are permitted provided that the following conditions are
66516Sgblack@eecs.umich.edu// met: redistributions of source code must retain the above copyright
76516Sgblack@eecs.umich.edu// notice, this list of conditions and the following disclaimer;
86516Sgblack@eecs.umich.edu// redistributions in binary form must reproduce the above copyright
96516Sgblack@eecs.umich.edu// notice, this list of conditions and the following disclaimer in the
106516Sgblack@eecs.umich.edu// documentation and/or other materials provided with the distribution;
116516Sgblack@eecs.umich.edu// neither the name of the copyright holders nor the names of its
126516Sgblack@eecs.umich.edu// contributors may be used to endorse or promote products derived from
136516Sgblack@eecs.umich.edu// this software without specific prior written permission.
146516Sgblack@eecs.umich.edu//
156516Sgblack@eecs.umich.edu// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
166516Sgblack@eecs.umich.edu// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
176516Sgblack@eecs.umich.edu// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
186516Sgblack@eecs.umich.edu// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
196516Sgblack@eecs.umich.edu// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
206516Sgblack@eecs.umich.edu// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
216516Sgblack@eecs.umich.edu// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
226516Sgblack@eecs.umich.edu// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
236516Sgblack@eecs.umich.edu// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
246516Sgblack@eecs.umich.edu// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
256516Sgblack@eecs.umich.edu// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
266516Sgblack@eecs.umich.edu//
276516Sgblack@eecs.umich.edu// Authors: Gabe Black
286516Sgblack@eecs.umich.edu
// Template for the execute() method of a media microop: declare and read the
// operands, run the microop specific code, then write the results back
// unless a fault was raised along the way.
def template MediaOpExecute {{
        Fault %(class_name)s::execute(%(CPU_exec_context)s *xc,
                Trace::InstRecord *traceData) const
        {
            Fault fault = NoFault;

            %(op_decl)s;
            %(op_rd)s;

            %(code)s;

            // Skip the write-back entirely when a fault was raised.
            if (fault != NoFault)
                return fault;

            // Write the resulting state to the execution context.
            {
                %(op_wb)s;
            }
            return fault;
        }
}};
486516Sgblack@eecs.umich.edu
// Class declaration for a media microop whose second operand is a register.
def template MediaOpRegDeclare {{
    class %(class_name)s : public %(base_class)s
    {
      protected:
        // Runs the generated constructor code; called by both constructors.
        void buildMe();

      public:
        // Constructor without an explicit set of microop flags.
        %(class_name)s(ExtMachInst _machInst, const char * instMnem,
                InstRegIndex _src1, InstRegIndex _src2, InstRegIndex _dest,
                uint8_t _srcSize, uint8_t _destSize, uint16_t _ext);

        // Constructor taking the microop flags to set.
        %(class_name)s(ExtMachInst _machInst, const char * instMnem,
                uint64_t setFlags,
                InstRegIndex _src1, InstRegIndex _src2, InstRegIndex _dest,
                uint8_t _srcSize, uint8_t _destSize, uint16_t _ext);

        %(BasicExecDeclare)s
    };
}};
696516Sgblack@eecs.umich.edu
// Class declaration for a media microop whose second operand is an immediate.
def template MediaOpImmDeclare {{

    class %(class_name)s : public %(base_class)s
    {
      protected:
        // Runs the generated constructor code; called by both constructors.
        void buildMe();

      public:
        // Constructor without an explicit set of microop flags.
        %(class_name)s(ExtMachInst _machInst, const char * instMnem,
                InstRegIndex _src1, uint16_t _imm8, InstRegIndex _dest,
                uint8_t _srcSize, uint8_t _destSize, uint16_t _ext);

        // Constructor taking the microop flags to set.
        %(class_name)s(ExtMachInst _machInst, const char * instMnem,
                uint64_t setFlags,
                InstRegIndex _src1, uint16_t _imm8, InstRegIndex _dest,
                uint8_t _srcSize, uint8_t _destSize, uint16_t _ext);

        %(BasicExecDeclare)s
    };
}};
916516Sgblack@eecs.umich.edu
// Constructor definitions for a media microop whose second operand is a
// register.
def template MediaOpRegConstructor {{

    inline void %(class_name)s::buildMe()
    {
        %(constructor)s;
    }

    // Constructor taking the microop flags to set; they are handed to the
    // base class unchanged.
    inline %(class_name)s::%(class_name)s(
            ExtMachInst machInst, const char * instMnem, uint64_t setFlags,
            InstRegIndex _src1, InstRegIndex _src2, InstRegIndex _dest,
            uint8_t _srcSize, uint8_t _destSize, uint16_t _ext) :
        %(base_class)s(machInst, "%(mnemonic)s", instMnem, setFlags,
                _src1, _src2, _dest,
                _srcSize, _destSize, _ext,
                %(op_class)s)
    {
        buildMe();
    }

    // Constructor without flags; the base class is given a flag value of 0.
    inline %(class_name)s::%(class_name)s(
            ExtMachInst machInst, const char * instMnem,
            InstRegIndex _src1, InstRegIndex _src2, InstRegIndex _dest,
            uint8_t _srcSize, uint8_t _destSize, uint16_t _ext) :
        %(base_class)s(machInst, "%(mnemonic)s", instMnem, 0,
                _src1, _src2, _dest,
                _srcSize, _destSize, _ext,
                %(op_class)s)
    {
        buildMe();
    }
}};
1216516Sgblack@eecs.umich.edu
// Constructor definitions for a media microop whose second operand is an
// immediate.
def template MediaOpImmConstructor {{

    inline void %(class_name)s::buildMe()
    {
        %(constructor)s;
    }

    // Constructor taking the microop flags to set; they are handed to the
    // base class unchanged.
    inline %(class_name)s::%(class_name)s(
            ExtMachInst machInst, const char * instMnem, uint64_t setFlags,
            InstRegIndex _src1, uint16_t _imm8, InstRegIndex _dest,
            uint8_t _srcSize, uint8_t _destSize, uint16_t _ext) :
        %(base_class)s(machInst, "%(mnemonic)s", instMnem, setFlags,
                _src1, _imm8, _dest,
                _srcSize, _destSize, _ext,
                %(op_class)s)
    {
        buildMe();
    }

    // Constructor without flags; the base class is given a flag value of 0.
    inline %(class_name)s::%(class_name)s(
            ExtMachInst machInst, const char * instMnem,
            InstRegIndex _src1, uint16_t _imm8, InstRegIndex _dest,
            uint8_t _srcSize, uint8_t _destSize, uint16_t _ext) :
        %(base_class)s(machInst, "%(mnemonic)s", instMnem, 0,
                _src1, _imm8, _dest,
                _srcSize, _destSize, _ext,
                %(op_class)s)
    {
        buildMe();
    }
}};
1516516Sgblack@eecs.umich.edu
1526516Sgblack@eecs.umich.edulet {{
1536516Sgblack@eecs.umich.edu    # Make these empty strings so that concatenating onto
1546516Sgblack@eecs.umich.edu    # them will always work.
1556516Sgblack@eecs.umich.edu    header_output = ""
1566516Sgblack@eecs.umich.edu    decoder_output = ""
1576516Sgblack@eecs.umich.edu    exec_output = ""
1586516Sgblack@eecs.umich.edu
1596516Sgblack@eecs.umich.edu    immTemplates = (
1606516Sgblack@eecs.umich.edu            MediaOpImmDeclare,
1616516Sgblack@eecs.umich.edu            MediaOpImmConstructor,
1626516Sgblack@eecs.umich.edu            MediaOpExecute)
1636516Sgblack@eecs.umich.edu
1646516Sgblack@eecs.umich.edu    regTemplates = (
1656516Sgblack@eecs.umich.edu            MediaOpRegDeclare,
1666516Sgblack@eecs.umich.edu            MediaOpRegConstructor,
1676516Sgblack@eecs.umich.edu            MediaOpExecute)
1686516Sgblack@eecs.umich.edu
1696516Sgblack@eecs.umich.edu    class MediaOpMeta(type):
1706516Sgblack@eecs.umich.edu        def buildCppClasses(self, name, Name, suffix, code):
1716516Sgblack@eecs.umich.edu
1726516Sgblack@eecs.umich.edu            # Globals to stick the output in
1736516Sgblack@eecs.umich.edu            global header_output
1746516Sgblack@eecs.umich.edu            global decoder_output
1756516Sgblack@eecs.umich.edu            global exec_output
1766516Sgblack@eecs.umich.edu
1776516Sgblack@eecs.umich.edu            # If op2 is used anywhere, make register and immediate versions
1786516Sgblack@eecs.umich.edu            # of this code.
1796516Sgblack@eecs.umich.edu            matcher = re.compile("(?<!\\w)(?P<prefix>s?)op2(?P<typeQual>\\.\\w+)?")
1806516Sgblack@eecs.umich.edu            match = matcher.search(code)
1816516Sgblack@eecs.umich.edu            if match:
1826516Sgblack@eecs.umich.edu                typeQual = ""
1836516Sgblack@eecs.umich.edu                if match.group("typeQual"):
1846516Sgblack@eecs.umich.edu                    typeQual = match.group("typeQual")
1856583Sgblack@eecs.umich.edu                src2_name = "%sFpSrcReg2%s" % (match.group("prefix"), typeQual)
1866516Sgblack@eecs.umich.edu                self.buildCppClasses(name, Name, suffix,
1876516Sgblack@eecs.umich.edu                        matcher.sub(src2_name, code))
1886516Sgblack@eecs.umich.edu                self.buildCppClasses(name + "i", Name, suffix + "Imm",
1896516Sgblack@eecs.umich.edu                        matcher.sub("imm8", code))
1906516Sgblack@eecs.umich.edu                return
1916516Sgblack@eecs.umich.edu
1926516Sgblack@eecs.umich.edu            base = "X86ISA::MediaOp"
1936516Sgblack@eecs.umich.edu
1946516Sgblack@eecs.umich.edu            # If imm8 shows up in the code, use the immediate templates, if
1956516Sgblack@eecs.umich.edu            # not, hopefully the register ones will be correct.
1966516Sgblack@eecs.umich.edu            matcher = re.compile("(?<!\w)imm8(?!\w)")
1976516Sgblack@eecs.umich.edu            if matcher.search(code):
1986516Sgblack@eecs.umich.edu                base += "Imm"
1996516Sgblack@eecs.umich.edu                templates = immTemplates
2006516Sgblack@eecs.umich.edu            else:
2016516Sgblack@eecs.umich.edu                base += "Reg"
2026516Sgblack@eecs.umich.edu                templates = regTemplates
2036516Sgblack@eecs.umich.edu
2046516Sgblack@eecs.umich.edu            # Get everything ready for the substitution
2056516Sgblack@eecs.umich.edu            iop = InstObjParams(name, Name + suffix, base, {"code" : code})
2066516Sgblack@eecs.umich.edu
2076516Sgblack@eecs.umich.edu            # Generate the actual code (finally!)
2086516Sgblack@eecs.umich.edu            header_output += templates[0].subst(iop)
2096516Sgblack@eecs.umich.edu            decoder_output += templates[1].subst(iop)
2106516Sgblack@eecs.umich.edu            exec_output += templates[2].subst(iop)
2116516Sgblack@eecs.umich.edu
2126516Sgblack@eecs.umich.edu
2136516Sgblack@eecs.umich.edu        def __new__(mcls, Name, bases, dict):
2146516Sgblack@eecs.umich.edu            abstract = False
2156516Sgblack@eecs.umich.edu            name = Name.lower()
2166516Sgblack@eecs.umich.edu            if "abstract" in dict:
2176516Sgblack@eecs.umich.edu                abstract = dict['abstract']
2186516Sgblack@eecs.umich.edu                del dict['abstract']
2196516Sgblack@eecs.umich.edu
2206516Sgblack@eecs.umich.edu            cls = super(MediaOpMeta, mcls).__new__(mcls, Name, bases, dict)
2216516Sgblack@eecs.umich.edu            if not abstract:
2226516Sgblack@eecs.umich.edu                cls.className = Name
2236516Sgblack@eecs.umich.edu                cls.base_mnemonic = name
2246516Sgblack@eecs.umich.edu                code = cls.code
2256516Sgblack@eecs.umich.edu
2266516Sgblack@eecs.umich.edu                # Set up the C++ classes
2276516Sgblack@eecs.umich.edu                mcls.buildCppClasses(cls, name, Name, "", code)
2286516Sgblack@eecs.umich.edu
2296516Sgblack@eecs.umich.edu                # Hook into the microassembler dict
2306516Sgblack@eecs.umich.edu                global microopClasses
2316516Sgblack@eecs.umich.edu                microopClasses[name] = cls
2326516Sgblack@eecs.umich.edu
2336516Sgblack@eecs.umich.edu                # If op2 is used anywhere, make register and immediate versions
2346516Sgblack@eecs.umich.edu                # of this code.
2356516Sgblack@eecs.umich.edu                matcher = re.compile("op2(?P<typeQual>\\.\\w+)?")
2366516Sgblack@eecs.umich.edu                if matcher.search(code):
2376516Sgblack@eecs.umich.edu                    microopClasses[name + 'i'] = cls
2386516Sgblack@eecs.umich.edu            return cls
2396516Sgblack@eecs.umich.edu
2406516Sgblack@eecs.umich.edu
2416516Sgblack@eecs.umich.edu    class MediaOp(X86Microop):
2426516Sgblack@eecs.umich.edu        __metaclass__ = MediaOpMeta
2436516Sgblack@eecs.umich.edu        # This class itself doesn't act as a microop
2446516Sgblack@eecs.umich.edu        abstract = True
2456516Sgblack@eecs.umich.edu
2466516Sgblack@eecs.umich.edu        def __init__(self, dest, src1, op2,
2476545Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
2486516Sgblack@eecs.umich.edu            self.dest = dest
2496516Sgblack@eecs.umich.edu            self.src1 = src1
2506516Sgblack@eecs.umich.edu            self.op2 = op2
2516516Sgblack@eecs.umich.edu            if size is not None:
2526516Sgblack@eecs.umich.edu                self.srcSize = size
2536516Sgblack@eecs.umich.edu                self.destSize = size
2546516Sgblack@eecs.umich.edu            if srcSize is not None:
2556516Sgblack@eecs.umich.edu                self.srcSize = srcSize
2566516Sgblack@eecs.umich.edu            if destSize is not None:
2576516Sgblack@eecs.umich.edu                self.destSize = destSize
2586516Sgblack@eecs.umich.edu            if self.srcSize is None:
2596516Sgblack@eecs.umich.edu                raise Exception, "Source size not set."
2606516Sgblack@eecs.umich.edu            if self.destSize is None:
2616516Sgblack@eecs.umich.edu                raise Exception, "Dest size not set."
2626545Sgblack@eecs.umich.edu            if ext is None:
2636545Sgblack@eecs.umich.edu                self.ext = 0
2646516Sgblack@eecs.umich.edu            else:
2656545Sgblack@eecs.umich.edu                self.ext = ext 
2666516Sgblack@eecs.umich.edu
2677620Sgblack@eecs.umich.edu        def getAllocator(self, microFlags):
2686516Sgblack@eecs.umich.edu            className = self.className
2696516Sgblack@eecs.umich.edu            if self.mnemonic == self.base_mnemonic + 'i':
2706516Sgblack@eecs.umich.edu                className += "Imm"
2717620Sgblack@eecs.umich.edu            allocator = '''new %(class_name)s(machInst, macrocodeBlock,
2726516Sgblack@eecs.umich.edu                    %(flags)s, %(src1)s, %(op2)s, %(dest)s,
2736545Sgblack@eecs.umich.edu                    %(srcSize)s, %(destSize)s, %(ext)s)''' % {
2746516Sgblack@eecs.umich.edu                "class_name" : className,
2756516Sgblack@eecs.umich.edu                "flags" : self.microFlagsText(microFlags),
2766516Sgblack@eecs.umich.edu                "src1" : self.src1, "op2" : self.op2,
2776516Sgblack@eecs.umich.edu                "dest" : self.dest,
2786516Sgblack@eecs.umich.edu                "srcSize" : self.srcSize,
2796516Sgblack@eecs.umich.edu                "destSize" : self.destSize,
2806545Sgblack@eecs.umich.edu                "ext" : self.ext}
2816516Sgblack@eecs.umich.edu            return allocator
2826516Sgblack@eecs.umich.edu
2836516Sgblack@eecs.umich.edu    class Mov2int(MediaOp):
2846589Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2 = 0, \
2856545Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
2866589Sgblack@eecs.umich.edu            super(Mov2int, self).__init__(dest, src1,\
2876589Sgblack@eecs.umich.edu                    src2, size, destSize, srcSize, ext)
2886516Sgblack@eecs.umich.edu        code = '''
2896589Sgblack@eecs.umich.edu            int items = sizeof(FloatRegBits) / srcSize;
2906589Sgblack@eecs.umich.edu            int offset = imm8;
2916589Sgblack@eecs.umich.edu            if (bits(src1, 0) && (ext & 0x1))
2926589Sgblack@eecs.umich.edu                offset -= items;
2936589Sgblack@eecs.umich.edu            if (offset >= 0 && offset < items) {
2946589Sgblack@eecs.umich.edu                uint64_t fpSrcReg1 =
2956589Sgblack@eecs.umich.edu                    bits(FpSrcReg1.uqw,
2966589Sgblack@eecs.umich.edu                            (offset + 1) * srcSize * 8 - 1,
2976589Sgblack@eecs.umich.edu                            (offset + 0) * srcSize * 8);
2986589Sgblack@eecs.umich.edu                DestReg = merge(0, fpSrcReg1, destSize);
2996589Sgblack@eecs.umich.edu            } else {
3006589Sgblack@eecs.umich.edu                DestReg = DestReg;
3016589Sgblack@eecs.umich.edu            }
3026516Sgblack@eecs.umich.edu        '''
3036516Sgblack@eecs.umich.edu
3046516Sgblack@eecs.umich.edu    class Mov2fp(MediaOp):
3056589Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2 = 0, \
3066545Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
3076589Sgblack@eecs.umich.edu            super(Mov2fp, self).__init__(dest, src1,\
3086589Sgblack@eecs.umich.edu                    src2, size, destSize, srcSize, ext)
3096516Sgblack@eecs.umich.edu        code = '''
3106589Sgblack@eecs.umich.edu            int items = sizeof(FloatRegBits) / destSize;
3116589Sgblack@eecs.umich.edu            int offset = imm8;
3126589Sgblack@eecs.umich.edu            if (bits(dest, 0) && (ext & 0x1))
3136589Sgblack@eecs.umich.edu                offset -= items;
3146589Sgblack@eecs.umich.edu            if (offset >= 0 && offset < items) {
3156589Sgblack@eecs.umich.edu                uint64_t srcReg1 = pick(SrcReg1, 0, srcSize);
3166589Sgblack@eecs.umich.edu                FpDestReg.uqw =
3176589Sgblack@eecs.umich.edu                    insertBits(FpDestReg.uqw,
3186589Sgblack@eecs.umich.edu                            (offset + 1) * destSize * 8 - 1,
3196589Sgblack@eecs.umich.edu                            (offset + 0) * destSize * 8, srcReg1);
3206589Sgblack@eecs.umich.edu            } else {
3216589Sgblack@eecs.umich.edu                FpDestReg.uqw = FpDestReg.uqw;
3226589Sgblack@eecs.umich.edu            }
3236516Sgblack@eecs.umich.edu        '''
3246521Sgblack@eecs.umich.edu
3256592Sgblack@eecs.umich.edu    class Movsign(MediaOp):
3266592Sgblack@eecs.umich.edu        def __init__(self, dest, src, \
3276592Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
3286592Sgblack@eecs.umich.edu            super(Movsign, self).__init__(dest, src,\
3296592Sgblack@eecs.umich.edu                    "InstRegIndex(0)", size, destSize, srcSize, ext)
3306592Sgblack@eecs.umich.edu        code = '''
3316592Sgblack@eecs.umich.edu            int items = sizeof(FloatRegBits) / srcSize;
3326592Sgblack@eecs.umich.edu            uint64_t result = 0;
3336592Sgblack@eecs.umich.edu            int offset = (ext & 0x1) ? items : 0;
3346592Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
3356592Sgblack@eecs.umich.edu                uint64_t picked =
3366592Sgblack@eecs.umich.edu                    bits(FpSrcReg1.uqw, (i + 1) * 8 * srcSize - 1);
3376592Sgblack@eecs.umich.edu                result = insertBits(result, i + offset, i + offset, picked);
3386592Sgblack@eecs.umich.edu            }
3396592Sgblack@eecs.umich.edu            DestReg = DestReg | result;
3406592Sgblack@eecs.umich.edu        '''
3416592Sgblack@eecs.umich.edu
    class Maskmov(MediaOp):
        # Masked move. Source and destination sizes must be equal. For every
        # item, the item of FpSrcReg1 replaces the corresponding item of
        # FpDestReg when the top bit of that item in FpSrcReg2 is set; all
        # other items of FpDestReg are left as they were.
        code = '''
            assert(srcSize == destSize);
            int size = srcSize;
            int sizeBits = size * 8;
            int items = numItems(size);
            uint64_t result = FpDestReg.uqw;

            for (int i = 0; i < items; i++) {
                int hiIndex = (i + 1) * sizeBits - 1;
                int loIndex = (i + 0) * sizeBits;
                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
                if (bits(FpSrcReg2.uqw, hiIndex))
                    result = insertBits(result, hiIndex, loIndex, arg1Bits);
            }
            FpDestReg.uqw = result;
        '''
3596594Sgblack@eecs.umich.edu
    class shuffle(MediaOp):
        # Builds FpDestReg item by item from FpSrcReg1 and FpSrcReg2. Source
        # and destination sizes must be equal. ext holds one selector per
        # destination item, lowest item first: 1 bit wide for 8 byte items,
        # 2 bits wide otherwise. A selector that points past the end of one
        # register picks from FpSrcReg2 (after subtracting half the number
        # of options), any other selector picks from FpSrcReg1.
        code = '''
            assert(srcSize == destSize);
            int size = srcSize;
            int sizeBits = size * 8;
            int items = sizeof(FloatRegBits) / size;
            int options;
            int optionBits;
            if (size == 8) {
                options = 2;
                optionBits = 1;
            } else {
                options = 4;
                optionBits = 2;
            }

            uint64_t result = 0;
            uint8_t sel = ext;

            for (int i = 0; i < items; i++) {
                uint64_t resBits;
                uint8_t lsel = sel & mask(optionBits);
                if (lsel * size >= sizeof(FloatRegBits)) {
                    lsel -= options / 2;
                    resBits = bits(FpSrcReg2.uqw,
                            (lsel + 1) * sizeBits - 1,
                            (lsel + 0) * sizeBits);
                }  else {
                    resBits = bits(FpSrcReg1.uqw,
                            (lsel + 1) * sizeBits - 1,
                            (lsel + 0) * sizeBits);
                }

                sel >>= optionBits;

                int hiIndex = (i + 1) * sizeBits - 1;
                int loIndex = (i + 0) * sizeBits;
                result = insertBits(result, hiIndex, loIndex, resBits);
            }
            FpDestReg.uqw = result;
        '''
4016596Sgblack@eecs.umich.edu
    class Unpack(MediaOp):
        # Interleaves items of FpSrcReg1 and FpSrcReg2 into FpDestReg. Source
        # and destination sizes must be equal. Half a register's worth of
        # items is taken from each source, starting at item 0 when ext is
        # zero and at the upper half otherwise. Items from FpSrcReg1 land in
        # the even result positions, items from FpSrcReg2 in the odd ones.
        code = '''
            assert(srcSize == destSize);
            int size = destSize;
            int items = (sizeof(FloatRegBits) / size) / 2;
            int offset = ext ? items : 0;
            uint64_t result = 0;
            for (int i = 0; i < items; i++) {
                uint64_t pickedLow =
                    bits(FpSrcReg1.uqw, (i + offset + 1) * 8 * size - 1,
                                        (i + offset) * 8 * size);
                result = insertBits(result,
                                    (2 * i + 1) * 8 * size - 1,
                                    (2 * i + 0) * 8 * size,
                                    pickedLow);
                uint64_t pickedHigh =
                    bits(FpSrcReg2.uqw, (i + offset + 1) * 8 * size - 1,
                                        (i + offset) * 8 * size);
                result = insertBits(result,
                                    (2 * i + 2) * 8 * size - 1,
                                    (2 * i + 1) * 8 * size,
                                    pickedHigh);
            }
            FpDestReg.uqw = result;
        '''
4276534Sgblack@eecs.umich.edu
4286546Sgblack@eecs.umich.edu    class Pack(MediaOp):
4296546Sgblack@eecs.umich.edu        code = '''
4306546Sgblack@eecs.umich.edu            assert(srcSize == destSize * 2);
4316546Sgblack@eecs.umich.edu            int items = (sizeof(FloatRegBits) / destSize);
4326546Sgblack@eecs.umich.edu            int destBits = destSize * 8;
4336546Sgblack@eecs.umich.edu            int srcBits = srcSize * 8;
4346546Sgblack@eecs.umich.edu            uint64_t result = 0;
4356546Sgblack@eecs.umich.edu            int i;
4366546Sgblack@eecs.umich.edu            for (i = 0; i < items / 2; i++) {
4376546Sgblack@eecs.umich.edu                uint64_t picked =
4386546Sgblack@eecs.umich.edu                    bits(FpSrcReg1.uqw, (i + 1) * srcBits - 1,
4396546Sgblack@eecs.umich.edu                                        (i + 0) * srcBits);
4406546Sgblack@eecs.umich.edu                unsigned signBit = bits(picked, srcBits - 1);
4416546Sgblack@eecs.umich.edu                uint64_t overflow = bits(picked, srcBits - 1, destBits - 1);
4426546Sgblack@eecs.umich.edu
4436546Sgblack@eecs.umich.edu                // Handle saturation.
4446546Sgblack@eecs.umich.edu                if (signBit) {
4456546Sgblack@eecs.umich.edu                    if (overflow != mask(destBits - srcBits + 1)) {
4466801Sgblack@eecs.umich.edu                        if (signedOp())
4476742Svince@csl.cornell.edu                            picked = (ULL(1) << (destBits - 1));
4486546Sgblack@eecs.umich.edu                        else
4496546Sgblack@eecs.umich.edu                            picked = 0;
4506546Sgblack@eecs.umich.edu                    }
4516546Sgblack@eecs.umich.edu                } else {
4526546Sgblack@eecs.umich.edu                    if (overflow != 0) {
4536801Sgblack@eecs.umich.edu                        if (signedOp())
4546546Sgblack@eecs.umich.edu                            picked = mask(destBits - 1);
4556546Sgblack@eecs.umich.edu                        else
4566546Sgblack@eecs.umich.edu                            picked = mask(destBits);
4576546Sgblack@eecs.umich.edu                    }
4586546Sgblack@eecs.umich.edu                }
4596546Sgblack@eecs.umich.edu                result = insertBits(result,
4606546Sgblack@eecs.umich.edu                                    (i + 1) * destBits - 1,
4616546Sgblack@eecs.umich.edu                                    (i + 0) * destBits,
4626546Sgblack@eecs.umich.edu                                    picked);
4636546Sgblack@eecs.umich.edu            }
4646546Sgblack@eecs.umich.edu            for (;i < items; i++) {
4656546Sgblack@eecs.umich.edu                uint64_t picked =
4666546Sgblack@eecs.umich.edu                    bits(FpSrcReg2.uqw, (i - items + 1) * srcBits - 1,
4676546Sgblack@eecs.umich.edu                                        (i - items + 0) * srcBits);
4686546Sgblack@eecs.umich.edu                unsigned signBit = bits(picked, srcBits - 1);
4696546Sgblack@eecs.umich.edu                uint64_t overflow = bits(picked, srcBits - 1, destBits - 1);
4706546Sgblack@eecs.umich.edu
4716546Sgblack@eecs.umich.edu                // Handle saturation.
4726546Sgblack@eecs.umich.edu                if (signBit) {
4736546Sgblack@eecs.umich.edu                    if (overflow != mask(destBits - srcBits + 1)) {
4746801Sgblack@eecs.umich.edu                        if (signedOp())
4756742Svince@csl.cornell.edu                            picked = (ULL(1) << (destBits - 1));
4766546Sgblack@eecs.umich.edu                        else
4776546Sgblack@eecs.umich.edu                            picked = 0;
4786546Sgblack@eecs.umich.edu                    }
4796546Sgblack@eecs.umich.edu                } else {
4806546Sgblack@eecs.umich.edu                    if (overflow != 0) {
4816801Sgblack@eecs.umich.edu                        if (signedOp())
4826546Sgblack@eecs.umich.edu                            picked = mask(destBits - 1);
4836546Sgblack@eecs.umich.edu                        else
4846546Sgblack@eecs.umich.edu                            picked = mask(destBits);
4856546Sgblack@eecs.umich.edu                    }
4866546Sgblack@eecs.umich.edu                }
4876546Sgblack@eecs.umich.edu                result = insertBits(result,
4886546Sgblack@eecs.umich.edu                                    (i + 1) * destBits - 1,
4896546Sgblack@eecs.umich.edu                                    (i + 0) * destBits,
4906546Sgblack@eecs.umich.edu                                    picked);
4916546Sgblack@eecs.umich.edu            }
4926546Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
4936546Sgblack@eecs.umich.edu        '''
4946546Sgblack@eecs.umich.edu
4956534Sgblack@eecs.umich.edu    class Mxor(MediaOp):
        # Bitwise XOR microop: FpDestReg.uqw receives
        # FpSrcReg1.uqw ^ FpSrcReg2.uqw.
        # The constructor forwards a fixed fourth argument of 1 to
        # MediaOp.__init__ (presumably the operand size; MediaOp is defined
        # outside this chunk -- TODO confirm).
4966534Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2):
4976534Sgblack@eecs.umich.edu            super(Mxor, self).__init__(dest, src1, src2, 1)
4986534Sgblack@eecs.umich.edu        code = '''
4996534Sgblack@eecs.umich.edu            FpDestReg.uqw = FpSrcReg1.uqw ^ FpSrcReg2.uqw;
5006534Sgblack@eecs.umich.edu        '''
5016537Sgblack@eecs.umich.edu
5026537Sgblack@eecs.umich.edu    class Mor(MediaOp):
        # Bitwise OR microop: FpDestReg.uqw receives
        # FpSrcReg1.uqw | FpSrcReg2.uqw.
        # The constructor forwards a fixed fourth argument of 1 to
        # MediaOp.__init__ (presumably the operand size; MediaOp is defined
        # outside this chunk -- TODO confirm).
5036537Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2):
5046537Sgblack@eecs.umich.edu            super(Mor, self).__init__(dest, src1, src2, 1)
5056537Sgblack@eecs.umich.edu        code = '''
5066537Sgblack@eecs.umich.edu            FpDestReg.uqw = FpSrcReg1.uqw | FpSrcReg2.uqw;
5076537Sgblack@eecs.umich.edu        '''
5086539Sgblack@eecs.umich.edu
5096539Sgblack@eecs.umich.edu    class Mand(MediaOp):
        # Bitwise AND microop: FpDestReg.uqw receives
        # FpSrcReg1.uqw & FpSrcReg2.uqw.
        # The constructor forwards a fixed fourth argument of 1 to
        # MediaOp.__init__ (presumably the operand size; MediaOp is defined
        # outside this chunk -- TODO confirm).
5106539Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2):
5116539Sgblack@eecs.umich.edu            super(Mand, self).__init__(dest, src1, src2, 1)
5126539Sgblack@eecs.umich.edu        code = '''
5136539Sgblack@eecs.umich.edu            FpDestReg.uqw = FpSrcReg1.uqw & FpSrcReg2.uqw;
5146539Sgblack@eecs.umich.edu        '''
5156541Sgblack@eecs.umich.edu
5166541Sgblack@eecs.umich.edu    class Mandn(MediaOp):
        # AND-NOT microop: FpDestReg.uqw receives
        # ~FpSrcReg1.uqw & FpSrcReg2.uqw. Note that it is the FIRST source
        # that is complemented, not the second.
        # The constructor forwards a fixed fourth argument of 1 to
        # MediaOp.__init__ (presumably the operand size; MediaOp is defined
        # outside this chunk -- TODO confirm).
5176541Sgblack@eecs.umich.edu        def __init__(self, dest, src1, src2):
5186541Sgblack@eecs.umich.edu            super(Mandn, self).__init__(dest, src1, src2, 1)
5196541Sgblack@eecs.umich.edu        code = '''
5206541Sgblack@eecs.umich.edu            FpDestReg.uqw = ~FpSrcReg1.uqw & FpSrcReg2.uqw;
5216541Sgblack@eecs.umich.edu        '''
5226548Sgblack@eecs.umich.edu
5236548Sgblack@eecs.umich.edu    class Mminf(MediaOp):
        # Lane-wise floating point minimum.
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw, reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union, and compared as a double.
        # Source 1's lane is kept only when "arg1 < arg2" is true; in every
        # other case (equal values, or an unordered comparison such as a NaN
        # operand) source 2's lane is kept. The raw bit pattern of the
        # chosen lane is inserted, not a recomputed value.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
5246548Sgblack@eecs.umich.edu        code = '''
5256548Sgblack@eecs.umich.edu            union floatInt
5266548Sgblack@eecs.umich.edu            {
5276548Sgblack@eecs.umich.edu                float f;
5286548Sgblack@eecs.umich.edu                uint32_t i;
5296548Sgblack@eecs.umich.edu            };
5306548Sgblack@eecs.umich.edu            union doubleInt
5316548Sgblack@eecs.umich.edu            {
5326548Sgblack@eecs.umich.edu                double d;
5336548Sgblack@eecs.umich.edu                uint64_t i;
5346548Sgblack@eecs.umich.edu            };
5356548Sgblack@eecs.umich.edu
5366548Sgblack@eecs.umich.edu            assert(srcSize == destSize);
5376548Sgblack@eecs.umich.edu            int size = srcSize;
5386548Sgblack@eecs.umich.edu            int sizeBits = size * 8;
5396548Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
5406799Sgblack@eecs.umich.edu            int items = numItems(size);
5416548Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
5426548Sgblack@eecs.umich.edu
5436548Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
5446548Sgblack@eecs.umich.edu                double arg1, arg2;
5456548Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
5466548Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
5476548Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
5486548Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
5496548Sgblack@eecs.umich.edu
5506548Sgblack@eecs.umich.edu                if (size == 4) {
5516548Sgblack@eecs.umich.edu                    floatInt fi;
5526548Sgblack@eecs.umich.edu                    fi.i = arg1Bits;
5536548Sgblack@eecs.umich.edu                    arg1 = fi.f;
5546548Sgblack@eecs.umich.edu                    fi.i = arg2Bits;
5556548Sgblack@eecs.umich.edu                    arg2 = fi.f;
5566548Sgblack@eecs.umich.edu                } else {
5576548Sgblack@eecs.umich.edu                    doubleInt di;
5586548Sgblack@eecs.umich.edu                    di.i = arg1Bits;
5596548Sgblack@eecs.umich.edu                    arg1 = di.d;
5606548Sgblack@eecs.umich.edu                    di.i = arg2Bits;
5616548Sgblack@eecs.umich.edu                    arg2 = di.d;
5626548Sgblack@eecs.umich.edu                }
5636548Sgblack@eecs.umich.edu
5646548Sgblack@eecs.umich.edu                if (arg1 < arg2) {
5656548Sgblack@eecs.umich.edu                    result = insertBits(result, hiIndex, loIndex, arg1Bits);
5666548Sgblack@eecs.umich.edu                } else {
5676548Sgblack@eecs.umich.edu                    result = insertBits(result, hiIndex, loIndex, arg2Bits);
5686548Sgblack@eecs.umich.edu                }
5696548Sgblack@eecs.umich.edu            }
5706548Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
5716548Sgblack@eecs.umich.edu        '''
5726550Sgblack@eecs.umich.edu
5736550Sgblack@eecs.umich.edu    class Mmaxf(MediaOp):
        # Lane-wise floating point maximum.
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw, reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union, and compared as a double.
        # Source 1's lane is kept only when "arg1 > arg2" is true; in every
        # other case (equal values, or an unordered comparison such as a NaN
        # operand) source 2's lane is kept. The raw bit pattern of the
        # chosen lane is inserted, not a recomputed value.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
5746550Sgblack@eecs.umich.edu        code = '''
5756550Sgblack@eecs.umich.edu            union floatInt
5766550Sgblack@eecs.umich.edu            {
5776550Sgblack@eecs.umich.edu                float f;
5786550Sgblack@eecs.umich.edu                uint32_t i;
5796550Sgblack@eecs.umich.edu            };
5806550Sgblack@eecs.umich.edu            union doubleInt
5816550Sgblack@eecs.umich.edu            {
5826550Sgblack@eecs.umich.edu                double d;
5836550Sgblack@eecs.umich.edu                uint64_t i;
5846550Sgblack@eecs.umich.edu            };
5856550Sgblack@eecs.umich.edu
5866550Sgblack@eecs.umich.edu            assert(srcSize == destSize);
5876550Sgblack@eecs.umich.edu            int size = srcSize;
5886550Sgblack@eecs.umich.edu            int sizeBits = size * 8;
5896550Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
5906799Sgblack@eecs.umich.edu            int items = numItems(size);
5916550Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
5926550Sgblack@eecs.umich.edu
5936550Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
5946550Sgblack@eecs.umich.edu                double arg1, arg2;
5956550Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
5966550Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
5976550Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
5986550Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
5996550Sgblack@eecs.umich.edu
6006550Sgblack@eecs.umich.edu                if (size == 4) {
6016550Sgblack@eecs.umich.edu                    floatInt fi;
6026550Sgblack@eecs.umich.edu                    fi.i = arg1Bits;
6036550Sgblack@eecs.umich.edu                    arg1 = fi.f;
6046550Sgblack@eecs.umich.edu                    fi.i = arg2Bits;
6056550Sgblack@eecs.umich.edu                    arg2 = fi.f;
6066550Sgblack@eecs.umich.edu                } else {
6076550Sgblack@eecs.umich.edu                    doubleInt di;
6086550Sgblack@eecs.umich.edu                    di.i = arg1Bits;
6096550Sgblack@eecs.umich.edu                    arg1 = di.d;
6106550Sgblack@eecs.umich.edu                    di.i = arg2Bits;
6116550Sgblack@eecs.umich.edu                    arg2 = di.d;
6126550Sgblack@eecs.umich.edu                }
6136550Sgblack@eecs.umich.edu
6146550Sgblack@eecs.umich.edu                if (arg1 > arg2) {
6156550Sgblack@eecs.umich.edu                    result = insertBits(result, hiIndex, loIndex, arg1Bits);
6166550Sgblack@eecs.umich.edu                } else {
6176550Sgblack@eecs.umich.edu                    result = insertBits(result, hiIndex, loIndex, arg2Bits);
6186550Sgblack@eecs.umich.edu                }
6196550Sgblack@eecs.umich.edu            }
6206550Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
6216550Sgblack@eecs.umich.edu        '''
6226552Sgblack@eecs.umich.edu
6236572Sgblack@eecs.umich.edu    class Mmini(MediaOp):
        # Lane-wise integer minimum.
        # srcSize must equal destSize (asserted). For each of the
        # numItems(size) lanes, the raw lane bits of both sources are also
        # sign extended into an int64_t by OR-ing in
        # 0 - (bits & (1 << (sizeBits - 1))), which sets every bit from the
        # lane's top bit upward when that top bit is set.
        # When signedOp() is true the sign extended values are compared;
        # otherwise the raw lane bits are compared as unsigned. Source 1 is
        # chosen only on a strict "<"; otherwise source 2's bits are used.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
6246572Sgblack@eecs.umich.edu        code = '''
6256572Sgblack@eecs.umich.edu
6266572Sgblack@eecs.umich.edu            assert(srcSize == destSize);
6276572Sgblack@eecs.umich.edu            int size = srcSize;
6286572Sgblack@eecs.umich.edu            int sizeBits = size * 8;
6296799Sgblack@eecs.umich.edu            int items = numItems(size);
6306572Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
6316572Sgblack@eecs.umich.edu
6326572Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
6336572Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
6346572Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
6356572Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
6366572Sgblack@eecs.umich.edu                int64_t arg1 = arg1Bits |
6376742Svince@csl.cornell.edu                    (0 - (arg1Bits & (ULL(1) << (sizeBits - 1))));
6386572Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
6396572Sgblack@eecs.umich.edu                int64_t arg2 = arg2Bits |
6406742Svince@csl.cornell.edu                    (0 - (arg2Bits & (ULL(1) << (sizeBits - 1))));
6416572Sgblack@eecs.umich.edu                uint64_t resBits;
6426572Sgblack@eecs.umich.edu
6436801Sgblack@eecs.umich.edu                if (signedOp()) {
6446572Sgblack@eecs.umich.edu                    if (arg1 < arg2) {
6456572Sgblack@eecs.umich.edu                        resBits = arg1Bits;
6466572Sgblack@eecs.umich.edu                    } else {
6476572Sgblack@eecs.umich.edu                        resBits = arg2Bits;
6486572Sgblack@eecs.umich.edu                    }
6496572Sgblack@eecs.umich.edu                } else {
6506572Sgblack@eecs.umich.edu                    if (arg1Bits < arg2Bits) {
6516572Sgblack@eecs.umich.edu                        resBits = arg1Bits;
6526572Sgblack@eecs.umich.edu                    } else {
6536572Sgblack@eecs.umich.edu                        resBits = arg2Bits;
6546572Sgblack@eecs.umich.edu                    }
6556572Sgblack@eecs.umich.edu                }
6566572Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
6576572Sgblack@eecs.umich.edu            }
6586572Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
6596572Sgblack@eecs.umich.edu        '''
6606572Sgblack@eecs.umich.edu
6616574Sgblack@eecs.umich.edu    class Mmaxi(MediaOp):
        # Lane-wise integer maximum.
        # srcSize must equal destSize (asserted). For each of the
        # numItems(size) lanes, the raw lane bits of both sources are also
        # sign extended into an int64_t by OR-ing in
        # 0 - (bits & (1 << (sizeBits - 1))), which sets every bit from the
        # lane's top bit upward when that top bit is set.
        # When signedOp() is true the sign extended values are compared;
        # otherwise the raw lane bits are compared as unsigned. Source 1 is
        # chosen only on a strict ">"; otherwise source 2's bits are used.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
6626574Sgblack@eecs.umich.edu        code = '''
6636574Sgblack@eecs.umich.edu
6646574Sgblack@eecs.umich.edu            assert(srcSize == destSize);
6656574Sgblack@eecs.umich.edu            int size = srcSize;
6666574Sgblack@eecs.umich.edu            int sizeBits = size * 8;
6676799Sgblack@eecs.umich.edu            int items = numItems(size);
6686574Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
6696574Sgblack@eecs.umich.edu
6706574Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
6716574Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
6726574Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
6736574Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
6746574Sgblack@eecs.umich.edu                int64_t arg1 = arg1Bits |
6756742Svince@csl.cornell.edu                    (0 - (arg1Bits & (ULL(1) << (sizeBits - 1))));
6766574Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
6776574Sgblack@eecs.umich.edu                int64_t arg2 = arg2Bits |
6786742Svince@csl.cornell.edu                    (0 - (arg2Bits & (ULL(1) << (sizeBits - 1))));
6796574Sgblack@eecs.umich.edu                uint64_t resBits;
6806574Sgblack@eecs.umich.edu
6816801Sgblack@eecs.umich.edu                if (signedOp()) {
6826574Sgblack@eecs.umich.edu                    if (arg1 > arg2) {
6836574Sgblack@eecs.umich.edu                        resBits = arg1Bits;
6846574Sgblack@eecs.umich.edu                    } else {
6856574Sgblack@eecs.umich.edu                        resBits = arg2Bits;
6866574Sgblack@eecs.umich.edu                    }
6876574Sgblack@eecs.umich.edu                } else {
6886574Sgblack@eecs.umich.edu                    if (arg1Bits > arg2Bits) {
6896574Sgblack@eecs.umich.edu                        resBits = arg1Bits;
6906574Sgblack@eecs.umich.edu                    } else {
6916574Sgblack@eecs.umich.edu                        resBits = arg2Bits;
6926574Sgblack@eecs.umich.edu                    }
6936574Sgblack@eecs.umich.edu                }
6946574Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
6956574Sgblack@eecs.umich.edu            }
6966574Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
6976574Sgblack@eecs.umich.edu        '''
6986574Sgblack@eecs.umich.edu
6996552Sgblack@eecs.umich.edu    class Msqrt(MediaOp):
        # Lane-wise floating point square root of a single source.
        # The constructor takes one source operand and passes the literal
        # string "InstRegIndex(0)" to MediaOp.__init__ in the position the
        # two-source microops use for their second source; the code below
        # reads only FpSrcReg1.
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is reinterpreted through the floatInt
        # (size 4) or doubleInt (otherwise) union, passed through sqrt(),
        # and the resulting bit pattern is inserted back into the same lane.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
7006552Sgblack@eecs.umich.edu        def __init__(self, dest, src, \
7016552Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
7026552Sgblack@eecs.umich.edu            super(Msqrt, self).__init__(dest, src,\
7036552Sgblack@eecs.umich.edu                    "InstRegIndex(0)", size, destSize, srcSize, ext)
7046552Sgblack@eecs.umich.edu        code = '''
7056552Sgblack@eecs.umich.edu            union floatInt
7066552Sgblack@eecs.umich.edu            {
7076552Sgblack@eecs.umich.edu                float f;
7086552Sgblack@eecs.umich.edu                uint32_t i;
7096552Sgblack@eecs.umich.edu            };
7106552Sgblack@eecs.umich.edu            union doubleInt
7116552Sgblack@eecs.umich.edu            {
7126552Sgblack@eecs.umich.edu                double d;
7136552Sgblack@eecs.umich.edu                uint64_t i;
7146552Sgblack@eecs.umich.edu            };
7156552Sgblack@eecs.umich.edu
7166552Sgblack@eecs.umich.edu            assert(srcSize == destSize);
7176552Sgblack@eecs.umich.edu            int size = srcSize;
7186552Sgblack@eecs.umich.edu            int sizeBits = size * 8;
7196552Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
7206799Sgblack@eecs.umich.edu            int items = numItems(size);
7216552Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
7226552Sgblack@eecs.umich.edu
7236552Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
7246552Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
7256552Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
7266552Sgblack@eecs.umich.edu                uint64_t argBits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
7276552Sgblack@eecs.umich.edu
7286552Sgblack@eecs.umich.edu                if (size == 4) {
7296552Sgblack@eecs.umich.edu                    floatInt fi;
7306552Sgblack@eecs.umich.edu                    fi.i = argBits;
7316552Sgblack@eecs.umich.edu                    fi.f = sqrt(fi.f);
7326552Sgblack@eecs.umich.edu                    argBits = fi.i;
7336552Sgblack@eecs.umich.edu                } else {
7346552Sgblack@eecs.umich.edu                    doubleInt di;
7356552Sgblack@eecs.umich.edu                    di.i = argBits;
7366552Sgblack@eecs.umich.edu                    di.d = sqrt(di.d);
7376552Sgblack@eecs.umich.edu                    argBits = di.i;
7386552Sgblack@eecs.umich.edu                }
7396552Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, argBits);
7406552Sgblack@eecs.umich.edu            }
7416552Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
7426552Sgblack@eecs.umich.edu        '''
7436554Sgblack@eecs.umich.edu
7446554Sgblack@eecs.umich.edu    class Maddf(MediaOp):
        # Lane-wise floating point addition (source 1 + source 2).
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw and reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union; the sum is computed in float or
        # double respectively and its bit pattern is inserted into the same
        # lane of the result.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
7456554Sgblack@eecs.umich.edu        code = '''
7466554Sgblack@eecs.umich.edu            union floatInt
7476554Sgblack@eecs.umich.edu            {
7486554Sgblack@eecs.umich.edu                float f;
7496554Sgblack@eecs.umich.edu                uint32_t i;
7506554Sgblack@eecs.umich.edu            };
7516554Sgblack@eecs.umich.edu            union doubleInt
7526554Sgblack@eecs.umich.edu            {
7536554Sgblack@eecs.umich.edu                double d;
7546554Sgblack@eecs.umich.edu                uint64_t i;
7556554Sgblack@eecs.umich.edu            };
7566554Sgblack@eecs.umich.edu
7576554Sgblack@eecs.umich.edu            assert(srcSize == destSize);
7586554Sgblack@eecs.umich.edu            int size = srcSize;
7596554Sgblack@eecs.umich.edu            int sizeBits = size * 8;
7606554Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
7616799Sgblack@eecs.umich.edu            int items = numItems(size);
7626554Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
7636554Sgblack@eecs.umich.edu
7646554Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
7656554Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
7666554Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
7676554Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
7686554Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
7696554Sgblack@eecs.umich.edu                uint64_t resBits;
7706554Sgblack@eecs.umich.edu
7716554Sgblack@eecs.umich.edu                if (size == 4) {
7726554Sgblack@eecs.umich.edu                    floatInt arg1, arg2, res;
7736554Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
7746554Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
7756554Sgblack@eecs.umich.edu                    res.f = arg1.f + arg2.f;
7766554Sgblack@eecs.umich.edu                    resBits = res.i;
7776554Sgblack@eecs.umich.edu                } else {
7786554Sgblack@eecs.umich.edu                    doubleInt arg1, arg2, res;
7796554Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
7806554Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
7816554Sgblack@eecs.umich.edu                    res.d = arg1.d + arg2.d;
7826554Sgblack@eecs.umich.edu                    resBits = res.i;
7836554Sgblack@eecs.umich.edu                }
7846554Sgblack@eecs.umich.edu
7856554Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
7866554Sgblack@eecs.umich.edu            }
7876554Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
7886554Sgblack@eecs.umich.edu        '''
7896556Sgblack@eecs.umich.edu
7906556Sgblack@eecs.umich.edu    class Msubf(MediaOp):
        # Lane-wise floating point subtraction (source 1 - source 2).
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw and reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union; the difference is computed in float
        # or double respectively and its bit pattern is inserted into the
        # same lane of the result.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
7916556Sgblack@eecs.umich.edu        code = '''
7926556Sgblack@eecs.umich.edu            union floatInt
7936556Sgblack@eecs.umich.edu            {
7946556Sgblack@eecs.umich.edu                float f;
7956556Sgblack@eecs.umich.edu                uint32_t i;
7966556Sgblack@eecs.umich.edu            };
7976556Sgblack@eecs.umich.edu            union doubleInt
7986556Sgblack@eecs.umich.edu            {
7996556Sgblack@eecs.umich.edu                double d;
8006556Sgblack@eecs.umich.edu                uint64_t i;
8016556Sgblack@eecs.umich.edu            };
8026556Sgblack@eecs.umich.edu
8036556Sgblack@eecs.umich.edu            assert(srcSize == destSize);
8046556Sgblack@eecs.umich.edu            int size = srcSize;
8056556Sgblack@eecs.umich.edu            int sizeBits = size * 8;
8066556Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
8076799Sgblack@eecs.umich.edu            int items = numItems(size);
8086556Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
8096556Sgblack@eecs.umich.edu
8106556Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
8116556Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
8126556Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
8136556Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
8146556Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
8156556Sgblack@eecs.umich.edu                uint64_t resBits;
8166556Sgblack@eecs.umich.edu
8176556Sgblack@eecs.umich.edu                if (size == 4) {
8186556Sgblack@eecs.umich.edu                    floatInt arg1, arg2, res;
8196556Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
8206556Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
8216556Sgblack@eecs.umich.edu                    res.f = arg1.f - arg2.f;
8226556Sgblack@eecs.umich.edu                    resBits = res.i;
8236556Sgblack@eecs.umich.edu                } else {
8246556Sgblack@eecs.umich.edu                    doubleInt arg1, arg2, res;
8256556Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
8266556Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
8276556Sgblack@eecs.umich.edu                    res.d = arg1.d - arg2.d;
8286556Sgblack@eecs.umich.edu                    resBits = res.i;
8296556Sgblack@eecs.umich.edu                }
8306556Sgblack@eecs.umich.edu
8316556Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
8326556Sgblack@eecs.umich.edu            }
8336556Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
8346556Sgblack@eecs.umich.edu        '''
8356558Sgblack@eecs.umich.edu
8366558Sgblack@eecs.umich.edu    class Mmulf(MediaOp):
        # Lane-wise floating point multiplication (source 1 * source 2).
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw and reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union; the product is computed in float or
        # double respectively and its bit pattern is inserted into the same
        # lane of the result.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
8376558Sgblack@eecs.umich.edu        code = '''
8386558Sgblack@eecs.umich.edu            union floatInt
8396558Sgblack@eecs.umich.edu            {
8406558Sgblack@eecs.umich.edu                float f;
8416558Sgblack@eecs.umich.edu                uint32_t i;
8426558Sgblack@eecs.umich.edu            };
8436558Sgblack@eecs.umich.edu            union doubleInt
8446558Sgblack@eecs.umich.edu            {
8456558Sgblack@eecs.umich.edu                double d;
8466558Sgblack@eecs.umich.edu                uint64_t i;
8476558Sgblack@eecs.umich.edu            };
8486558Sgblack@eecs.umich.edu
8496558Sgblack@eecs.umich.edu            assert(srcSize == destSize);
8506558Sgblack@eecs.umich.edu            int size = srcSize;
8516558Sgblack@eecs.umich.edu            int sizeBits = size * 8;
8526558Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
8536799Sgblack@eecs.umich.edu            int items = numItems(size);
8546558Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
8556558Sgblack@eecs.umich.edu
8566558Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
8576558Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
8586558Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
8596558Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
8606558Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
8616558Sgblack@eecs.umich.edu                uint64_t resBits;
8626558Sgblack@eecs.umich.edu
8636558Sgblack@eecs.umich.edu                if (size == 4) {
8646558Sgblack@eecs.umich.edu                    floatInt arg1, arg2, res;
8656558Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
8666558Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
8676558Sgblack@eecs.umich.edu                    res.f = arg1.f * arg2.f;
8686558Sgblack@eecs.umich.edu                    resBits = res.i;
8696558Sgblack@eecs.umich.edu                } else {
8706558Sgblack@eecs.umich.edu                    doubleInt arg1, arg2, res;
8716558Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
8726558Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
8736558Sgblack@eecs.umich.edu                    res.d = arg1.d * arg2.d;
8746558Sgblack@eecs.umich.edu                    resBits = res.i;
8756558Sgblack@eecs.umich.edu                }
8766558Sgblack@eecs.umich.edu
8776558Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
8786558Sgblack@eecs.umich.edu            }
8796558Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
8806558Sgblack@eecs.umich.edu        '''
8816560Sgblack@eecs.umich.edu
8826560Sgblack@eecs.umich.edu    class Mdivf(MediaOp):
        # Lane-wise floating point division (source 1 / source 2).
        # srcSize must equal destSize and be 4 or 8 (both asserted). Each of
        # the numItems(size) lanes is extracted from FpSrcReg1.uqw and
        # FpSrcReg2.uqw and reinterpreted through the floatInt (size 4) or
        # doubleInt (otherwise) union; the quotient is computed in float or
        # double respectively and its bit pattern is inserted into the same
        # lane of the result. There is no explicit check for a zero divisor;
        # the lane receives whatever the C++ division expression yields.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
8836560Sgblack@eecs.umich.edu        code = '''
8846560Sgblack@eecs.umich.edu            union floatInt
8856560Sgblack@eecs.umich.edu            {
8866560Sgblack@eecs.umich.edu                float f;
8876560Sgblack@eecs.umich.edu                uint32_t i;
8886560Sgblack@eecs.umich.edu            };
8896560Sgblack@eecs.umich.edu            union doubleInt
8906560Sgblack@eecs.umich.edu            {
8916560Sgblack@eecs.umich.edu                double d;
8926560Sgblack@eecs.umich.edu                uint64_t i;
8936560Sgblack@eecs.umich.edu            };
8946560Sgblack@eecs.umich.edu
8956560Sgblack@eecs.umich.edu            assert(srcSize == destSize);
8966560Sgblack@eecs.umich.edu            int size = srcSize;
8976560Sgblack@eecs.umich.edu            int sizeBits = size * 8;
8986560Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
8996799Sgblack@eecs.umich.edu            int items = numItems(size);
9006560Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
9016560Sgblack@eecs.umich.edu
9026560Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
9036560Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
9046560Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
9056560Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
9066560Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
9076560Sgblack@eecs.umich.edu                uint64_t resBits;
9086560Sgblack@eecs.umich.edu
9096560Sgblack@eecs.umich.edu                if (size == 4) {
9106560Sgblack@eecs.umich.edu                    floatInt arg1, arg2, res;
9116560Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
9126560Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
9136560Sgblack@eecs.umich.edu                    res.f = arg1.f / arg2.f;
9146560Sgblack@eecs.umich.edu                    resBits = res.i;
9156560Sgblack@eecs.umich.edu                } else {
9166560Sgblack@eecs.umich.edu                    doubleInt arg1, arg2, res;
9176560Sgblack@eecs.umich.edu                    arg1.i = arg1Bits;
9186560Sgblack@eecs.umich.edu                    arg2.i = arg2Bits;
9196560Sgblack@eecs.umich.edu                    res.d = arg1.d / arg2.d;
9206560Sgblack@eecs.umich.edu                    resBits = res.i;
9216560Sgblack@eecs.umich.edu                }
9226560Sgblack@eecs.umich.edu
9236560Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
9246560Sgblack@eecs.umich.edu            }
9256560Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
9266560Sgblack@eecs.umich.edu        '''
9276562Sgblack@eecs.umich.edu
9286570Sgblack@eecs.umich.edu    class Maddi(MediaOp):
        # Lane-wise integer addition with optional saturation.
        # srcSize must equal destSize (asserted). For each of the
        # numItems(size) lanes the two lane values are added as uint64_t;
        # insertBits then stores the sum into the lane's bit range.
        # When bit 0x2 of ext is set the sum is clamped first:
        #   * signedOp() true: if both operands have the same sign bit and
        #     the sum's sign bit differs, the lane becomes
        #     1 << (sizeBits - 1) when the sum's sign bit is 0 (both
        #     operands had their sign bit set) and mask(sizeBits - 1)
        #     otherwise.
        #   * signedOp() false: if findCarry() reports a carry for the lane
        #     the result becomes mask(sizeBits).
        # mask() and findCarry() are defined outside this chunk; presumably
        # mask(n) is n low one-bits and findCarry() is the carry out of the
        # lane's top bit -- TODO confirm.
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
9296570Sgblack@eecs.umich.edu        code = '''
9306570Sgblack@eecs.umich.edu            assert(srcSize == destSize);
9316570Sgblack@eecs.umich.edu            int size = srcSize;
9326570Sgblack@eecs.umich.edu            int sizeBits = size * 8;
9336799Sgblack@eecs.umich.edu            int items = numItems(size);
9346570Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
9356570Sgblack@eecs.umich.edu
9366570Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
9376570Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
9386570Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
9396570Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
9406570Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
9416570Sgblack@eecs.umich.edu                uint64_t resBits = arg1Bits + arg2Bits;
9426570Sgblack@eecs.umich.edu                
9436570Sgblack@eecs.umich.edu                if (ext & 0x2) {
9446801Sgblack@eecs.umich.edu                    if (signedOp()) {
9456801Sgblack@eecs.umich.edu                        int arg1Sign = bits(arg1Bits, sizeBits - 1);
9466801Sgblack@eecs.umich.edu                        int arg2Sign = bits(arg2Bits, sizeBits - 1);
9476801Sgblack@eecs.umich.edu                        int resSign = bits(resBits, sizeBits - 1);
9486801Sgblack@eecs.umich.edu                        if ((arg1Sign == arg2Sign) && (arg1Sign != resSign)) {
9496801Sgblack@eecs.umich.edu                            if (resSign == 0)
9506801Sgblack@eecs.umich.edu                                resBits = (ULL(1) << (sizeBits - 1));
9516801Sgblack@eecs.umich.edu                            else
9526801Sgblack@eecs.umich.edu                                resBits = mask(sizeBits - 1);
9536801Sgblack@eecs.umich.edu                        }
9546801Sgblack@eecs.umich.edu                    } else {
9556801Sgblack@eecs.umich.edu                        if (findCarry(sizeBits, resBits, arg1Bits, arg2Bits))
9566801Sgblack@eecs.umich.edu                            resBits = mask(sizeBits);
9576570Sgblack@eecs.umich.edu                    }
9586570Sgblack@eecs.umich.edu                }
9596570Sgblack@eecs.umich.edu
9606570Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
9616570Sgblack@eecs.umich.edu            }
9626570Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
9636570Sgblack@eecs.umich.edu        '''
9646570Sgblack@eecs.umich.edu
9656579Sgblack@eecs.umich.edu    class Msubi(MediaOp):
        # Lane-wise integer subtraction (source 1 - source 2) with optional
        # saturation.
        # srcSize must equal destSize (asserted). For each of the
        # numItems(size) lanes the lane values are subtracted as uint64_t;
        # insertBits then stores the difference into the lane's bit range.
        # When bit 0x2 of ext is set the difference is clamped first:
        #   * signedOp() true: arg2Sign holds the INVERTED sign bit of
        #     source 2, so the overflow test has the same shape as the one
        #     for addition. If arg1Sign equals that inverted sign and the
        #     result's sign bit differs, the lane becomes
        #     1 << (sizeBits - 1) when the result's sign bit is 0 and
        #     mask(sizeBits - 1) otherwise.
        #   * signedOp() false: the lane becomes 0 when arg2Bits > arg1Bits;
        #     otherwise it becomes mask(sizeBits) if findCarry() on
        #     (arg1Bits, ~arg2Bits) returns false.
        # mask() and findCarry() are defined outside this chunk.
        # NOTE(review): if findCarry() returns the carry out of the lane's
        # top bit, the "!findCarry" branch looks unreachable once
        # arg2Bits <= arg1Bits is known -- confirm against findCarry().
        # result starts out as the old FpDestReg.uqw, so any bits that no
        # lane overwrites keep their previous value.
9666579Sgblack@eecs.umich.edu        code = '''
9676579Sgblack@eecs.umich.edu            assert(srcSize == destSize);
9686579Sgblack@eecs.umich.edu            int size = srcSize;
9696579Sgblack@eecs.umich.edu            int sizeBits = size * 8;
9706799Sgblack@eecs.umich.edu            int items = numItems(size);
9716579Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
9726579Sgblack@eecs.umich.edu
9736579Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
9746579Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
9756579Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
9766579Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
9776579Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
9786579Sgblack@eecs.umich.edu                uint64_t resBits = arg1Bits - arg2Bits;
9796579Sgblack@eecs.umich.edu                
9806579Sgblack@eecs.umich.edu                if (ext & 0x2) {
9816801Sgblack@eecs.umich.edu                    if (signedOp()) {
9826801Sgblack@eecs.umich.edu                        int arg1Sign = bits(arg1Bits, sizeBits - 1);
9836801Sgblack@eecs.umich.edu                        int arg2Sign = !bits(arg2Bits, sizeBits - 1);
9846801Sgblack@eecs.umich.edu                        int resSign = bits(resBits, sizeBits - 1);
9856801Sgblack@eecs.umich.edu                        if ((arg1Sign == arg2Sign) && (arg1Sign != resSign)) {
9866801Sgblack@eecs.umich.edu                            if (resSign == 0)
9876801Sgblack@eecs.umich.edu                                resBits = (ULL(1) << (sizeBits - 1));
9886801Sgblack@eecs.umich.edu                            else
9896801Sgblack@eecs.umich.edu                                resBits = mask(sizeBits - 1);
9906801Sgblack@eecs.umich.edu                        }
9916801Sgblack@eecs.umich.edu                    } else {
9926801Sgblack@eecs.umich.edu                        if (arg2Bits > arg1Bits) {
9936801Sgblack@eecs.umich.edu                            resBits = 0;
9946801Sgblack@eecs.umich.edu                        } else if (!findCarry(sizeBits, resBits,
9956801Sgblack@eecs.umich.edu                                             arg1Bits, ~arg2Bits)) {
9966801Sgblack@eecs.umich.edu                            resBits = mask(sizeBits);
9976801Sgblack@eecs.umich.edu                        }
9986579Sgblack@eecs.umich.edu                    }
9996579Sgblack@eecs.umich.edu                }
10006579Sgblack@eecs.umich.edu
10016579Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
10026579Sgblack@eecs.umich.edu            }
10036579Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
10046579Sgblack@eecs.umich.edu        '''
10056579Sgblack@eecs.umich.edu
10066577Sgblack@eecs.umich.edu    class Mmuli(MediaOp):
        # Packed integer multiply. The C++ in `code` walks numItems(destSize)
        # lanes; for each lane it reads a srcBits-wide element from FpSrcReg1
        # and FpSrcReg2, multiplies them (both are sign-extended to 64 bits
        # first when signedOp() is true) and inserts the product into the
        # destBits-wide lane i of the result.
        #   ext & 16  - source elements are taken on a destBits stride instead
        #               of a srcBits stride: at i * destBits when ext & 32 is
        #               also set, otherwise at i * destBits + srcBits.
        #   ext & 0x4 - 1 << (destBits - 1) is added to the product before the
        #               optional high-half shift.
        #   multHi()  - the product is shifted right by destBits before it is
        #               inserted.
        # The result starts as a copy of FpDestReg.uqw, so bits outside the
        # processed lanes keep their previous value.
        # NOTE(review): numItems(), signedOp(), multHi() and ext are defined
        # outside this chunk; the descriptions above cover only how they are
        # used here.
10076577Sgblack@eecs.umich.edu        code = '''
10086577Sgblack@eecs.umich.edu            int srcBits = srcSize * 8;
10096577Sgblack@eecs.umich.edu            int destBits = destSize * 8;
10106577Sgblack@eecs.umich.edu            assert(destBits <= 64);
10116577Sgblack@eecs.umich.edu            assert(destSize >= srcSize);
10126799Sgblack@eecs.umich.edu            int items = numItems(destSize);
10136577Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
10146577Sgblack@eecs.umich.edu
10156577Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
10166585Sgblack@eecs.umich.edu                int offset = 0;
10176585Sgblack@eecs.umich.edu                if (ext & 16) {
10186585Sgblack@eecs.umich.edu                    if (ext & 32)
10196585Sgblack@eecs.umich.edu                        offset = i * (destBits - srcBits);
10206585Sgblack@eecs.umich.edu                    else
10216585Sgblack@eecs.umich.edu                        offset = i * (destBits - srcBits) + srcBits;
10226585Sgblack@eecs.umich.edu                }
10236585Sgblack@eecs.umich.edu                int srcHiIndex = (i + 1) * srcBits - 1 + offset;
10246585Sgblack@eecs.umich.edu                int srcLoIndex = (i + 0) * srcBits + offset;
10256577Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, srcHiIndex, srcLoIndex);
10266577Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, srcHiIndex, srcLoIndex);
10276577Sgblack@eecs.umich.edu                uint64_t resBits;
10286577Sgblack@eecs.umich.edu
10296801Sgblack@eecs.umich.edu                if (signedOp()) {
10306577Sgblack@eecs.umich.edu                    int64_t arg1 = arg1Bits |
10316742Svince@csl.cornell.edu                        (0 - (arg1Bits & (ULL(1) << (srcBits - 1))));
10326577Sgblack@eecs.umich.edu                    int64_t arg2 = arg2Bits |
10336742Svince@csl.cornell.edu                        (0 - (arg2Bits & (ULL(1) << (srcBits - 1))));
10346577Sgblack@eecs.umich.edu                    resBits = (uint64_t)(arg1 * arg2);
10356577Sgblack@eecs.umich.edu                } else {
10366577Sgblack@eecs.umich.edu                    resBits = arg1Bits * arg2Bits;
10376577Sgblack@eecs.umich.edu                }
10386577Sgblack@eecs.umich.edu
10396577Sgblack@eecs.umich.edu                if (ext & 0x4)
10406742Svince@csl.cornell.edu                    resBits += (ULL(1) << (destBits - 1));
10416577Sgblack@eecs.umich.edu                
10426800Sgblack@eecs.umich.edu                if (multHi())
10436577Sgblack@eecs.umich.edu                    resBits >>= destBits;
10446577Sgblack@eecs.umich.edu
10456577Sgblack@eecs.umich.edu                int destHiIndex = (i + 1) * destBits - 1;
10466577Sgblack@eecs.umich.edu                int destLoIndex = (i + 0) * destBits;
10476577Sgblack@eecs.umich.edu                result = insertBits(result, destHiIndex, destLoIndex, resBits);
10486577Sgblack@eecs.umich.edu            }
10496577Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
10506577Sgblack@eecs.umich.edu        '''
10516577Sgblack@eecs.umich.edu
10526587Sgblack@eecs.umich.edu    class Mavg(MediaOp):
        # Packed average. Source and destination element sizes must match
        # (asserted). For each of numItems(size) lanes the unsigned elements
        # of FpSrcReg1 and FpSrcReg2 are combined as (a + b + 1) / 2, i.e. the
        # average rounded up, and inserted into the same lane of the result.
        # The result starts as a copy of FpDestReg.uqw, so bits outside the
        # processed lanes are preserved.
10536587Sgblack@eecs.umich.edu        code = '''
10546587Sgblack@eecs.umich.edu            assert(srcSize == destSize);
10556587Sgblack@eecs.umich.edu            int size = srcSize;
10566587Sgblack@eecs.umich.edu            int sizeBits = size * 8;
10576799Sgblack@eecs.umich.edu            int items = numItems(size);
10586587Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
10596587Sgblack@eecs.umich.edu
10606587Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
10616587Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
10626587Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
10636587Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
10646587Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
10656587Sgblack@eecs.umich.edu                uint64_t resBits = (arg1Bits + arg2Bits + 1) / 2;
10666587Sgblack@eecs.umich.edu                
10676587Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
10686587Sgblack@eecs.umich.edu            }
10696587Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
10706587Sgblack@eecs.umich.edu        '''
10716587Sgblack@eecs.umich.edu
10726581Sgblack@eecs.umich.edu    class Msad(MediaOp):
        # Sum of absolute differences. Every srcSize-byte element pair of
        # FpSrcReg1 and FpSrcReg2 is subtracted, the absolute value of each
        # difference is accumulated, and the total (masked to destSize * 8
        # bits) replaces the whole of FpDestReg.uqw; previous destination
        # bits are not merged in.
        # The element count is sizeof(FloatRegBits) / srcSize, not
        # numItems(), so this op always covers the full register.
10736581Sgblack@eecs.umich.edu        code = '''
10746581Sgblack@eecs.umich.edu            int srcBits = srcSize * 8;
10756581Sgblack@eecs.umich.edu            int items = sizeof(FloatRegBits) / srcSize;
10766581Sgblack@eecs.umich.edu
10776581Sgblack@eecs.umich.edu            uint64_t sum = 0;
10786581Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
10796581Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * srcBits - 1;
10806581Sgblack@eecs.umich.edu                int loIndex = (i + 0) * srcBits;
10816581Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
10826581Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
10836581Sgblack@eecs.umich.edu                int64_t resBits = arg1Bits - arg2Bits;
10846581Sgblack@eecs.umich.edu                if (resBits < 0)
10856581Sgblack@eecs.umich.edu                    resBits = -resBits;
10866581Sgblack@eecs.umich.edu                sum += resBits;
10876581Sgblack@eecs.umich.edu            }
10886581Sgblack@eecs.umich.edu            FpDestReg.uqw = sum & mask(destSize * 8);
10896581Sgblack@eecs.umich.edu        '''
10906581Sgblack@eecs.umich.edu
10916583Sgblack@eecs.umich.edu    class Msrl(MediaOp):
        # Packed logical shift right. Source and destination element sizes
        # must match (asserted). Every lane of FpSrcReg1 is shifted right by
        # the same count, op2.uqw, with zeros shifted in; a count of sizeBits
        # or more produces 0 for the lane. The result starts as a copy of
        # FpDestReg.uqw, so bits outside the processed lanes are preserved.
        # NOTE(review): op2 is declared outside this chunk - presumably the
        # second source operand; confirm against the MediaOp templates.
10926583Sgblack@eecs.umich.edu        code = '''
10936583Sgblack@eecs.umich.edu
10946583Sgblack@eecs.umich.edu            assert(srcSize == destSize);
10956583Sgblack@eecs.umich.edu            int size = srcSize;
10966583Sgblack@eecs.umich.edu            int sizeBits = size * 8;
10976799Sgblack@eecs.umich.edu            int items = numItems(size);
10986583Sgblack@eecs.umich.edu            uint64_t shiftAmt = op2.uqw;
10996583Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
11006583Sgblack@eecs.umich.edu
11016583Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
11026583Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
11036583Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
11046583Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
11056583Sgblack@eecs.umich.edu                uint64_t resBits;
11066583Sgblack@eecs.umich.edu                if (shiftAmt >= sizeBits) {
11076583Sgblack@eecs.umich.edu                    resBits = 0;
11086583Sgblack@eecs.umich.edu                } else {
11096583Sgblack@eecs.umich.edu                    resBits = (arg1Bits >> shiftAmt) &
11106583Sgblack@eecs.umich.edu                        mask(sizeBits - shiftAmt);
11116583Sgblack@eecs.umich.edu                }
11126583Sgblack@eecs.umich.edu
11136583Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
11146583Sgblack@eecs.umich.edu            }
11156583Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
11166583Sgblack@eecs.umich.edu        '''
11176583Sgblack@eecs.umich.edu
11186583Sgblack@eecs.umich.edu    class Msra(MediaOp):
        # Packed arithmetic shift right. Source and destination element sizes
        # must match (asserted). Every lane of FpSrcReg1 is shifted right by
        # op2.uqw. A count of sizeBits or more fills the lane with its sign
        # bit (all ones or all zeros). Otherwise the lane is shifted and then
        # sign-extended from bit (sizeBits - 1 - shiftAmt), which is where the
        # original sign bit lands after the shift.
        # The result starts as a copy of FpDestReg.uqw, so bits outside the
        # processed lanes are preserved.
        # NOTE(review): the sign extension sets bits above the lane width in
        # resBits; insertBits() is presumably what trims them - confirm.
11196583Sgblack@eecs.umich.edu        code = '''
11206583Sgblack@eecs.umich.edu
11216583Sgblack@eecs.umich.edu            assert(srcSize == destSize);
11226583Sgblack@eecs.umich.edu            int size = srcSize;
11236583Sgblack@eecs.umich.edu            int sizeBits = size * 8;
11246799Sgblack@eecs.umich.edu            int items = numItems(size);
11256583Sgblack@eecs.umich.edu            uint64_t shiftAmt = op2.uqw;
11266583Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
11276583Sgblack@eecs.umich.edu
11286583Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
11296583Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
11306583Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
11316583Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
11326583Sgblack@eecs.umich.edu                uint64_t resBits;
11336583Sgblack@eecs.umich.edu                if (shiftAmt >= sizeBits) {
11346583Sgblack@eecs.umich.edu                    if (bits(arg1Bits, sizeBits - 1))
11356583Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
11366583Sgblack@eecs.umich.edu                    else
11376583Sgblack@eecs.umich.edu                        resBits = 0;
11386583Sgblack@eecs.umich.edu                } else {
11396583Sgblack@eecs.umich.edu                    resBits = (arg1Bits >> shiftAmt);
11406583Sgblack@eecs.umich.edu                    resBits = resBits |
11416742Svince@csl.cornell.edu                        (0 - (resBits & (ULL(1) << (sizeBits - 1 - shiftAmt))));
11426583Sgblack@eecs.umich.edu                }
11436583Sgblack@eecs.umich.edu
11446583Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
11456583Sgblack@eecs.umich.edu            }
11466583Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
11476583Sgblack@eecs.umich.edu        '''
11486583Sgblack@eecs.umich.edu
11496583Sgblack@eecs.umich.edu    class Msll(MediaOp):
        # Packed logical shift left. Source and destination element sizes
        # must match (asserted). Every lane of FpSrcReg1 is shifted left by
        # op2.uqw; a count of sizeBits or more produces 0 for the lane.
        # The result starts as a copy of FpDestReg.uqw, so bits outside the
        # processed lanes are preserved.
        # NOTE(review): the shifted value is not masked to the lane width
        # here; insertBits() is presumably what drops the overflow - confirm.
11506583Sgblack@eecs.umich.edu        code = '''
11516583Sgblack@eecs.umich.edu
11526583Sgblack@eecs.umich.edu            assert(srcSize == destSize);
11536583Sgblack@eecs.umich.edu            int size = srcSize;
11546583Sgblack@eecs.umich.edu            int sizeBits = size * 8;
11556799Sgblack@eecs.umich.edu            int items = numItems(size);
11566583Sgblack@eecs.umich.edu            uint64_t shiftAmt = op2.uqw;
11576583Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
11586583Sgblack@eecs.umich.edu
11596583Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
11606583Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
11616583Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
11626583Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
11636583Sgblack@eecs.umich.edu                uint64_t resBits;
11646583Sgblack@eecs.umich.edu                if (shiftAmt >= sizeBits) {
11656583Sgblack@eecs.umich.edu                    resBits = 0;
11666583Sgblack@eecs.umich.edu                } else {
11676583Sgblack@eecs.umich.edu                    resBits = (arg1Bits << shiftAmt);
11686583Sgblack@eecs.umich.edu                }
11696583Sgblack@eecs.umich.edu
11706583Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
11716583Sgblack@eecs.umich.edu            }
11726583Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
11736583Sgblack@eecs.umich.edu        '''
11746583Sgblack@eecs.umich.edu
11756605Sgblack@eecs.umich.edu    class Cvtf2i(MediaOp):
11766605Sgblack@eecs.umich.edu        def __init__(self, dest, src, \
11776605Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
11786605Sgblack@eecs.umich.edu            super(Cvtf2i, self).__init__(dest, src,\
11796605Sgblack@eecs.umich.edu                    "InstRegIndex(0)", size, destSize, srcSize, ext)
11806605Sgblack@eecs.umich.edu        code = '''
11816605Sgblack@eecs.umich.edu            union floatInt
11826605Sgblack@eecs.umich.edu            {
11836605Sgblack@eecs.umich.edu                float f;
11846605Sgblack@eecs.umich.edu                uint32_t i;
11856605Sgblack@eecs.umich.edu            };
11866605Sgblack@eecs.umich.edu            union doubleInt
11876605Sgblack@eecs.umich.edu            {
11886605Sgblack@eecs.umich.edu                double d;
11896605Sgblack@eecs.umich.edu                uint64_t i;
11906605Sgblack@eecs.umich.edu            };
11916605Sgblack@eecs.umich.edu
11926605Sgblack@eecs.umich.edu            assert(destSize == 4 || destSize == 8);
11936605Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
11946605Sgblack@eecs.umich.edu            int srcSizeBits = srcSize * 8;
11956605Sgblack@eecs.umich.edu            int destSizeBits = destSize * 8;
11966605Sgblack@eecs.umich.edu            int items;
11976605Sgblack@eecs.umich.edu            int srcStart = 0;
11986605Sgblack@eecs.umich.edu            int destStart = 0;
11996605Sgblack@eecs.umich.edu            if (srcSize == 2 * destSize) {
12006799Sgblack@eecs.umich.edu                items = numItems(srcSize);
12016605Sgblack@eecs.umich.edu                if (ext & 0x2)
12026605Sgblack@eecs.umich.edu                    destStart = destSizeBits * items;
12036605Sgblack@eecs.umich.edu            } else if (destSize == 2 * srcSize) {
12046799Sgblack@eecs.umich.edu                items = numItems(destSize);
12056605Sgblack@eecs.umich.edu                if (ext & 0x2)
12066605Sgblack@eecs.umich.edu                    srcStart = srcSizeBits * items;
12076605Sgblack@eecs.umich.edu            } else {
12086799Sgblack@eecs.umich.edu                items = numItems(destSize);
12096605Sgblack@eecs.umich.edu            }
12106605Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
12116605Sgblack@eecs.umich.edu
12126605Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
12136605Sgblack@eecs.umich.edu                int srcHiIndex = srcStart + (i + 1) * srcSizeBits - 1;
12146605Sgblack@eecs.umich.edu                int srcLoIndex = srcStart + (i + 0) * srcSizeBits;
12156605Sgblack@eecs.umich.edu                uint64_t argBits = bits(FpSrcReg1.uqw, srcHiIndex, srcLoIndex);
12166605Sgblack@eecs.umich.edu                double arg;
12176605Sgblack@eecs.umich.edu
12186605Sgblack@eecs.umich.edu                if (srcSize == 4) {
12196605Sgblack@eecs.umich.edu                    floatInt fi;
12206605Sgblack@eecs.umich.edu                    fi.i = argBits;
12216605Sgblack@eecs.umich.edu                    arg = fi.f;
12226605Sgblack@eecs.umich.edu                } else {
12236605Sgblack@eecs.umich.edu                    doubleInt di;
12246605Sgblack@eecs.umich.edu                    di.i = argBits;
12256605Sgblack@eecs.umich.edu                    arg = di.d;
12266605Sgblack@eecs.umich.edu                }
12276605Sgblack@eecs.umich.edu
12286605Sgblack@eecs.umich.edu                if (ext & 0x4) {
12296605Sgblack@eecs.umich.edu                    if (arg >= 0)
12306605Sgblack@eecs.umich.edu                        arg += 0.5;
12316605Sgblack@eecs.umich.edu                    else
12326605Sgblack@eecs.umich.edu                        arg -= 0.5;
12336605Sgblack@eecs.umich.edu                }
12346605Sgblack@eecs.umich.edu
12356605Sgblack@eecs.umich.edu                if (destSize == 4) {
12366732Svince@csl.cornell.edu                    argBits = (uint32_t)arg;
12376605Sgblack@eecs.umich.edu                } else {
12386605Sgblack@eecs.umich.edu                    argBits = (uint64_t)arg;
12396605Sgblack@eecs.umich.edu                }
12406605Sgblack@eecs.umich.edu                int destHiIndex = destStart + (i + 1) * destSizeBits - 1;
12416605Sgblack@eecs.umich.edu                int destLoIndex = destStart + (i + 0) * destSizeBits;
12426605Sgblack@eecs.umich.edu                result = insertBits(result, destHiIndex, destLoIndex, argBits);
12436605Sgblack@eecs.umich.edu            }
12446605Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
12456605Sgblack@eecs.umich.edu        '''
12466605Sgblack@eecs.umich.edu
12476562Sgblack@eecs.umich.edu    class Cvti2f(MediaOp):
        # Packed signed integer to floating point conversion.
        # The constructor takes a single source and forwards the string
        # "InstRegIndex(0)" in the argument slot after it (presumably the
        # unused second source; MediaOp.__init__ is outside this chunk).
        #
        # srcSize and destSize must each be 4 or 8 (asserted). Each source
        # element of FpSrcReg1 is sign-extended from bit srcSizeBits - 1,
        # converted to double, and stored as the bit pattern of a float
        # (destSize == 4) or a double (destSize == 8) in the result, which
        # starts as a copy of FpDestReg.uqw.
        #   ext & 0x2 - selects the upper half when the sizes differ: when
        #               narrowing, results are written after the first
        #               `items` destination elements; when widening, sources
        #               are read from after the first `items` source elements.
12486562Sgblack@eecs.umich.edu        def __init__(self, dest, src, \
12496562Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
12506562Sgblack@eecs.umich.edu            super(Cvti2f, self).__init__(dest, src,\
12516562Sgblack@eecs.umich.edu                    "InstRegIndex(0)", size, destSize, srcSize, ext)
12526562Sgblack@eecs.umich.edu        code = '''
12536562Sgblack@eecs.umich.edu            union floatInt
12546562Sgblack@eecs.umich.edu            {
12556562Sgblack@eecs.umich.edu                float f;
12566562Sgblack@eecs.umich.edu                uint32_t i;
12576562Sgblack@eecs.umich.edu            };
12586562Sgblack@eecs.umich.edu            union doubleInt
12596562Sgblack@eecs.umich.edu            {
12606562Sgblack@eecs.umich.edu                double d;
12616562Sgblack@eecs.umich.edu                uint64_t i;
12626562Sgblack@eecs.umich.edu            };
12636562Sgblack@eecs.umich.edu
12646562Sgblack@eecs.umich.edu            assert(destSize == 4 || destSize == 8);
12656562Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
12666562Sgblack@eecs.umich.edu            int srcSizeBits = srcSize * 8;
12676562Sgblack@eecs.umich.edu            int destSizeBits = destSize * 8;
12686562Sgblack@eecs.umich.edu            int items;
12696562Sgblack@eecs.umich.edu            int srcStart = 0;
12706562Sgblack@eecs.umich.edu            int destStart = 0;
12716562Sgblack@eecs.umich.edu            if (srcSize == 2 * destSize) {
12726799Sgblack@eecs.umich.edu                items = numItems(srcSize);
12736562Sgblack@eecs.umich.edu                if (ext & 0x2)
12746562Sgblack@eecs.umich.edu                    destStart = destSizeBits * items;
12756562Sgblack@eecs.umich.edu            } else if (destSize == 2 * srcSize) {
12766799Sgblack@eecs.umich.edu                items = numItems(destSize);
12776562Sgblack@eecs.umich.edu                if (ext & 0x2)
12786562Sgblack@eecs.umich.edu                    srcStart = srcSizeBits * items;
12796562Sgblack@eecs.umich.edu            } else {
12806799Sgblack@eecs.umich.edu                items = numItems(destSize);
12816562Sgblack@eecs.umich.edu            }
12826562Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
12836562Sgblack@eecs.umich.edu
12846562Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
12856562Sgblack@eecs.umich.edu                int srcHiIndex = srcStart + (i + 1) * srcSizeBits - 1;
12866562Sgblack@eecs.umich.edu                int srcLoIndex = srcStart + (i + 0) * srcSizeBits;
12876562Sgblack@eecs.umich.edu                uint64_t argBits = bits(FpSrcReg1.uqw, srcHiIndex, srcLoIndex);
12886742Svince@csl.cornell.edu
12897081Sgblack@eecs.umich.edu                int64_t sArg = argBits |
12907081Sgblack@eecs.umich.edu                    (0 - (argBits & (ULL(1) << (srcSizeBits - 1))));
12916562Sgblack@eecs.umich.edu                double arg = sArg;
12926562Sgblack@eecs.umich.edu
12936562Sgblack@eecs.umich.edu                if (destSize == 4) {
12946562Sgblack@eecs.umich.edu                    floatInt fi;
12956562Sgblack@eecs.umich.edu                    fi.f = arg;
12966562Sgblack@eecs.umich.edu                    argBits = fi.i;
12976562Sgblack@eecs.umich.edu                } else {
12986562Sgblack@eecs.umich.edu                    doubleInt di;
12996562Sgblack@eecs.umich.edu                    di.d = arg;
13006562Sgblack@eecs.umich.edu                    argBits = di.i;
13016562Sgblack@eecs.umich.edu                }
13026562Sgblack@eecs.umich.edu                int destHiIndex = destStart + (i + 1) * destSizeBits - 1;
13036562Sgblack@eecs.umich.edu                int destLoIndex = destStart + (i + 0) * destSizeBits;
13046562Sgblack@eecs.umich.edu                result = insertBits(result, destHiIndex, destLoIndex, argBits);
13056562Sgblack@eecs.umich.edu            }
13066562Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
13076562Sgblack@eecs.umich.edu        '''
13086566Sgblack@eecs.umich.edu
13096568Sgblack@eecs.umich.edu    class Cvtf2f(MediaOp):
        # Packed floating point precision conversion (float <-> double).
        # The constructor takes a single source and forwards the string
        # "InstRegIndex(0)" in the argument slot after it (presumably the
        # unused second source; MediaOp.__init__ is outside this chunk).
        #
        # srcSize and destSize must each be 4 or 8 (asserted). Each source
        # element of FpSrcReg1 is reinterpreted as a float or double
        # according to srcSize, held in a double, and stored back as the bit
        # pattern of a float or double according to destSize. The result
        # starts as a copy of FpDestReg.uqw.
        #   ext & 0x2 - selects the upper half when the sizes differ: when
        #               narrowing, results are written after the first
        #               `items` destination elements; when widening, sources
        #               are read from after the first `items` source elements.
13106568Sgblack@eecs.umich.edu        def __init__(self, dest, src, \
13116568Sgblack@eecs.umich.edu                size = None, destSize = None, srcSize = None, ext = None):
13126568Sgblack@eecs.umich.edu            super(Cvtf2f, self).__init__(dest, src,\
13136568Sgblack@eecs.umich.edu                    "InstRegIndex(0)", size, destSize, srcSize, ext)
13146568Sgblack@eecs.umich.edu        code = '''
13156568Sgblack@eecs.umich.edu            union floatInt
13166568Sgblack@eecs.umich.edu            {
13176568Sgblack@eecs.umich.edu                float f;
13186568Sgblack@eecs.umich.edu                uint32_t i;
13196568Sgblack@eecs.umich.edu            };
13206568Sgblack@eecs.umich.edu            union doubleInt
13216568Sgblack@eecs.umich.edu            {
13226568Sgblack@eecs.umich.edu                double d;
13236568Sgblack@eecs.umich.edu                uint64_t i;
13246568Sgblack@eecs.umich.edu            };
13256568Sgblack@eecs.umich.edu
13266568Sgblack@eecs.umich.edu            assert(destSize == 4 || destSize == 8);
13276568Sgblack@eecs.umich.edu            assert(srcSize == 4 || srcSize == 8);
13286568Sgblack@eecs.umich.edu            int srcSizeBits = srcSize * 8;
13296568Sgblack@eecs.umich.edu            int destSizeBits = destSize * 8;
13306568Sgblack@eecs.umich.edu            int items;
13316568Sgblack@eecs.umich.edu            int srcStart = 0;
13326568Sgblack@eecs.umich.edu            int destStart = 0;
13336568Sgblack@eecs.umich.edu            if (srcSize == 2 * destSize) {
13346799Sgblack@eecs.umich.edu                items = numItems(srcSize);
13356568Sgblack@eecs.umich.edu                if (ext & 0x2)
13366568Sgblack@eecs.umich.edu                    destStart = destSizeBits * items;
13376568Sgblack@eecs.umich.edu            } else if (destSize == 2 * srcSize) {
13386799Sgblack@eecs.umich.edu                items = numItems(destSize);
13396568Sgblack@eecs.umich.edu                if (ext & 0x2)
13406568Sgblack@eecs.umich.edu                    srcStart = srcSizeBits * items;
13416568Sgblack@eecs.umich.edu            } else {
13426799Sgblack@eecs.umich.edu                items = numItems(destSize);
13436568Sgblack@eecs.umich.edu            }
13446568Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
13456568Sgblack@eecs.umich.edu
13466568Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
13476568Sgblack@eecs.umich.edu                int srcHiIndex = srcStart + (i + 1) * srcSizeBits - 1;
13486568Sgblack@eecs.umich.edu                int srcLoIndex = srcStart + (i + 0) * srcSizeBits;
13496568Sgblack@eecs.umich.edu                uint64_t argBits = bits(FpSrcReg1.uqw, srcHiIndex, srcLoIndex);
13506568Sgblack@eecs.umich.edu                double arg;
13516568Sgblack@eecs.umich.edu
13526568Sgblack@eecs.umich.edu                if (srcSize == 4) {
13536568Sgblack@eecs.umich.edu                    floatInt fi;
13546568Sgblack@eecs.umich.edu                    fi.i = argBits;
13556568Sgblack@eecs.umich.edu                    arg = fi.f;
13566568Sgblack@eecs.umich.edu                } else {
13576568Sgblack@eecs.umich.edu                    doubleInt di;
13586568Sgblack@eecs.umich.edu                    di.i = argBits;
13596568Sgblack@eecs.umich.edu                    arg = di.d;
13606568Sgblack@eecs.umich.edu                }
13616568Sgblack@eecs.umich.edu                if (destSize == 4) {
13626568Sgblack@eecs.umich.edu                    floatInt fi;
13636568Sgblack@eecs.umich.edu                    fi.f = arg;
13646568Sgblack@eecs.umich.edu                    argBits = fi.i;
13656568Sgblack@eecs.umich.edu                } else {
13666568Sgblack@eecs.umich.edu                    doubleInt di;
13676568Sgblack@eecs.umich.edu                    di.d = arg;
13686568Sgblack@eecs.umich.edu                    argBits = di.i;
13696568Sgblack@eecs.umich.edu                }
13706568Sgblack@eecs.umich.edu                int destHiIndex = destStart + (i + 1) * destSizeBits - 1;
13716568Sgblack@eecs.umich.edu                int destLoIndex = destStart + (i + 0) * destSizeBits;
13726568Sgblack@eecs.umich.edu                result = insertBits(result, destHiIndex, destLoIndex, argBits);
13736568Sgblack@eecs.umich.edu            }
13746568Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
13756568Sgblack@eecs.umich.edu        '''
13766568Sgblack@eecs.umich.edu
13776566Sgblack@eecs.umich.edu    class Mcmpi2r(MediaOp):
13786566Sgblack@eecs.umich.edu        code = '''
13796566Sgblack@eecs.umich.edu            union floatInt
13806566Sgblack@eecs.umich.edu            {
13816566Sgblack@eecs.umich.edu                float f;
13826566Sgblack@eecs.umich.edu                uint32_t i;
13836566Sgblack@eecs.umich.edu            };
13846566Sgblack@eecs.umich.edu            union doubleInt
13856566Sgblack@eecs.umich.edu            {
13866566Sgblack@eecs.umich.edu                double d;
13876566Sgblack@eecs.umich.edu                uint64_t i;
13886566Sgblack@eecs.umich.edu            };
13896566Sgblack@eecs.umich.edu
13906566Sgblack@eecs.umich.edu            assert(srcSize == destSize);
13916566Sgblack@eecs.umich.edu            int size = srcSize;
13926566Sgblack@eecs.umich.edu            int sizeBits = size * 8;
13936799Sgblack@eecs.umich.edu            int items = numItems(size);
13946566Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
13956566Sgblack@eecs.umich.edu
13966566Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
13976566Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
13986566Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
13996566Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
14006566Sgblack@eecs.umich.edu                int64_t arg1 = arg1Bits |
14016742Svince@csl.cornell.edu                    (0 - (arg1Bits & (ULL(1) << (sizeBits - 1))));
14026566Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
14036566Sgblack@eecs.umich.edu                int64_t arg2 = arg2Bits |
14046742Svince@csl.cornell.edu                    (0 - (arg2Bits & (ULL(1) << (sizeBits - 1))));
14056566Sgblack@eecs.umich.edu
14066566Sgblack@eecs.umich.edu                uint64_t resBits = 0;
14076622Snate@binkert.org                if (((ext & 0x2) == 0 && arg1 == arg2) ||
14086622Snate@binkert.org                    ((ext & 0x2) == 0x2 && arg1 > arg2))
14096566Sgblack@eecs.umich.edu                    resBits = mask(sizeBits);
14106566Sgblack@eecs.umich.edu
14116566Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
14126566Sgblack@eecs.umich.edu            }
14136566Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
14146566Sgblack@eecs.umich.edu        '''
14156601Sgblack@eecs.umich.edu
14166603Sgblack@eecs.umich.edu    class Mcmpf2r(MediaOp):
        # Packed floating point compare that writes a per-lane mask.
        # Source and destination element sizes must match (asserted). Each
        # lane of FpSrcReg1 and FpSrcReg2 is reinterpreted as a float
        # (size == 4) or otherwise as a double, and compared; a lane is set
        # to all ones when the selected predicate holds and to zero
        # otherwise. "nanop" below means at least one operand is NaN.
        # Predicate selected by (ext & mask(3)):
        #   0 - equal and not nanop
        #   1 - less than and not nanop
        #   2 - less than or equal and not nanop
        #   3 - nanop (unordered)
        #   4 - not equal, or nanop
        #   5 - not less than, or nanop
        #   6 - not less than or equal, or nanop
        #   7 - not nanop (ordered)
        # The result starts as a copy of FpDestReg.uqw, so bits outside the
        # processed lanes are preserved.
14176603Sgblack@eecs.umich.edu        code = '''
14186603Sgblack@eecs.umich.edu            union floatInt
14196603Sgblack@eecs.umich.edu            {
14206603Sgblack@eecs.umich.edu                float f;
14216603Sgblack@eecs.umich.edu                uint32_t i;
14226603Sgblack@eecs.umich.edu            };
14236603Sgblack@eecs.umich.edu            union doubleInt
14246603Sgblack@eecs.umich.edu            {
14256603Sgblack@eecs.umich.edu                double d;
14266603Sgblack@eecs.umich.edu                uint64_t i;
14276603Sgblack@eecs.umich.edu            };
14286603Sgblack@eecs.umich.edu
14296603Sgblack@eecs.umich.edu            assert(srcSize == destSize);
14306603Sgblack@eecs.umich.edu            int size = srcSize;
14316603Sgblack@eecs.umich.edu            int sizeBits = size * 8;
14326799Sgblack@eecs.umich.edu            int items = numItems(size);
14336603Sgblack@eecs.umich.edu            uint64_t result = FpDestReg.uqw;
14346603Sgblack@eecs.umich.edu
14356603Sgblack@eecs.umich.edu            for (int i = 0; i < items; i++) {
14366603Sgblack@eecs.umich.edu                int hiIndex = (i + 1) * sizeBits - 1;
14376603Sgblack@eecs.umich.edu                int loIndex = (i + 0) * sizeBits;
14386603Sgblack@eecs.umich.edu                uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
14396603Sgblack@eecs.umich.edu                uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
14406603Sgblack@eecs.umich.edu                double arg1, arg2;
14416603Sgblack@eecs.umich.edu
14426603Sgblack@eecs.umich.edu                if (size == 4) {
14436603Sgblack@eecs.umich.edu                    floatInt fi;
14446603Sgblack@eecs.umich.edu                    fi.i = arg1Bits;
14456603Sgblack@eecs.umich.edu                    arg1 = fi.f;
14466603Sgblack@eecs.umich.edu                    fi.i = arg2Bits;
14476603Sgblack@eecs.umich.edu                    arg2 = fi.f;
14486603Sgblack@eecs.umich.edu                } else {
14496603Sgblack@eecs.umich.edu                    doubleInt di;
14506603Sgblack@eecs.umich.edu                    di.i = arg1Bits;
14516603Sgblack@eecs.umich.edu                    arg1 = di.d;
14526603Sgblack@eecs.umich.edu                    di.i = arg2Bits;
14536603Sgblack@eecs.umich.edu                    arg2 = di.d;
14546603Sgblack@eecs.umich.edu                }
14556603Sgblack@eecs.umich.edu
14566603Sgblack@eecs.umich.edu                uint64_t resBits = 0;
14576603Sgblack@eecs.umich.edu                bool nanop = isnan(arg1) || isnan(arg2);
14586603Sgblack@eecs.umich.edu                switch (ext & mask(3)) {
14596603Sgblack@eecs.umich.edu                  case 0:
14606603Sgblack@eecs.umich.edu                    if (arg1 == arg2 && !nanop)
14616603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14626603Sgblack@eecs.umich.edu                    break;
14636603Sgblack@eecs.umich.edu                  case 1:
14646603Sgblack@eecs.umich.edu                    if (arg1 < arg2 && !nanop)
14656603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14666603Sgblack@eecs.umich.edu                    break;
14676603Sgblack@eecs.umich.edu                  case 2:
14686603Sgblack@eecs.umich.edu                    if (arg1 <= arg2 && !nanop)
14696603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14706603Sgblack@eecs.umich.edu                    break;
14716603Sgblack@eecs.umich.edu                  case 3:
14726603Sgblack@eecs.umich.edu                    if (nanop)
14736603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14746603Sgblack@eecs.umich.edu                    break;
14756603Sgblack@eecs.umich.edu                  case 4:
14766603Sgblack@eecs.umich.edu                    if (arg1 != arg2 || nanop)
14776603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14786603Sgblack@eecs.umich.edu                    break;
14796603Sgblack@eecs.umich.edu                  case 5:
14806603Sgblack@eecs.umich.edu                    if (!(arg1 < arg2) || nanop)
14816603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14826603Sgblack@eecs.umich.edu                    break;
14836603Sgblack@eecs.umich.edu                  case 6:
14846603Sgblack@eecs.umich.edu                    if (!(arg1 <= arg2) || nanop)
14856603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14866603Sgblack@eecs.umich.edu                    break;
14876603Sgblack@eecs.umich.edu                  case 7:
14886603Sgblack@eecs.umich.edu                    if (!nanop)
14896603Sgblack@eecs.umich.edu                        resBits = mask(sizeBits);
14906603Sgblack@eecs.umich.edu                    break;
14916603Sgblack@eecs.umich.edu                };
14926603Sgblack@eecs.umich.edu
14936603Sgblack@eecs.umich.edu                result = insertBits(result, hiIndex, loIndex, resBits);
14946603Sgblack@eecs.umich.edu            }
14956603Sgblack@eecs.umich.edu            FpDestReg.uqw = result;
14966603Sgblack@eecs.umich.edu        '''
14976603Sgblack@eecs.umich.edu
class Mcmpf2rf(MediaOp):
    # Media microop that compares two floating point values and reports the
    # outcome through condition flags rather than through a destination
    # register.
    #
    # src1, src2 -- the two values being compared.
    # size, destSize, srcSize, ext -- forwarded untouched to
    #     MediaOp.__init__.
    #
    # The fixed string "InstRegIndex(0)" is handed to the base class ahead of
    # the sources -- presumably it fills the destination slot, which the
    # microcode below never writes; confirm against MediaOp.__init__.
    def __init__(self, src1, src2,
                 size=None, destSize=None, srcSize=None, ext=None):
        super(Mcmpf2rf, self).__init__(
            "InstRegIndex(0)", src1, src2, size, destSize, srcSize, ext)

    # NOTE(review): the flag register is updated with a plain
    # "x = (x & ...) | ..." assignment on purpose; presumably the ISA parser
    # inspects the textual form of assignments to operands -- confirm before
    # switching to a compound assignment.
    code = '''
        // Overlays used to reinterpret raw register bits as floating
        // point values: store into "raw", then read back "val".
        union RawF32
        {
            uint32_t raw;
            float val;
        };
        union RawF64
        {
            uint64_t raw;
            double val;
        };

        assert(srcSize == destSize);
        assert(srcSize == 4 || srcSize == 8);
        const int opBytes = srcSize;
        const int opBits = opBytes * 8;

        // Only the low opBits bits of each source take part.
        const uint64_t lhsRaw = bits(FpSrcReg1.uqw, opBits - 1, 0);
        const uint64_t rhsRaw = bits(FpSrcReg2.uqw, opBits - 1, 0);

        // Widen both inputs to double so that a single comparison path
        // serves both operand sizes.
        double lhs, rhs;
        if (opBytes != 4) {
            RawF64 wide;
            wide.raw = lhsRaw;
            lhs = wide.val;
            wide.raw = rhsRaw;
            rhs = wide.val;
        } else {
            RawF32 narrow;
            narrow.raw = lhsRaw;
            lhs = narrow.val;
            narrow.raw = rhsRaw;
            rhs = narrow.val;
        }

        // Outcome encoding (OF, SF and AF always end up clear):
        //   unordered (either input is NaN)  ->  ZF, PF and CF set
        //   first <  second                  ->  CF set
        //   first == second                  ->  ZF set
        //   first >  second                  ->  none set
        uint64_t outcome = 0;
        if (isnan(lhs) || isnan(rhs))
            outcome = ZFBit | PFBit | CFBit;
        else if (lhs < rhs)
            outcome = CFBit;
        else if (lhs == rhs)
            outcome = ZFBit;

        // Drop all six arithmetic flags, then raise the ones picked above.
        ccFlagBits = (ccFlagBits & ~(OFBit | SFBit | AFBit |
                                     ZFBit | PFBit | CFBit)) | outcome;
    '''
15526516Sgblack@eecs.umich.edu}};
1553