mult.isa revision 7422:feddb9077def
1// -*- mode:c++ -*-
2
3// Copyright (c) 2010 ARM Limited
4// All rights reserved
5//
6// The license below extends only to copyright in the software and shall
7// not be construed as granting a license to any other intellectual
8// property including but not limited to intellectual property relating
9// to a hardware implementation of the functionality of the software
10// licensed hereunder.  You may use the software subject to the license
11// terms below provided that you ensure that this notice is replicated
12// unmodified and in its entirety in all distributions of the software,
13// modified or unmodified, in source code or in binary form.
14//
15// Redistribution and use in source and binary forms, with or without
16// modification, are permitted provided that the following conditions are
17// met: redistributions of source code must retain the above copyright
18// notice, this list of conditions and the following disclaimer;
19// redistributions in binary form must reproduce the above copyright
20// notice, this list of conditions and the following disclaimer in the
21// documentation and/or other materials provided with the distribution;
22// neither the name of the copyright holders nor the names of its
23// contributors may be used to endorse or promote products derived from
24// this software without specific prior written permission.
25//
26// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
27// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
28// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
29// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
30// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
31// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
32// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
33// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
34// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
35// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
36// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
37//
38// Authors: Gabe Black
39
40let {{
41
42    header_output = ""
43    decoder_output = ""
44    exec_output = ""
45
46    calcQCode = '''
47        CondCodes = CondCodes | ((resTemp & 1) << 27);
48    '''
49
50    calcCcCode = '''
51        uint16_t _iz, _in;
52        _in = (resTemp >> %(negBit)d) & 1;
53        _iz = ((%(zType)s)resTemp == 0);
54
55        CondCodes =  _in << 31 | _iz << 30 | (CondCodes & 0x3FFFFFFF);
56
57        DPRINTF(Arm, "(in, iz) = (%%d, %%d)\\n", _in, _iz);
58       '''
59
60    def buildMultInst(mnem, doCc, unCc, regs, code, flagType):
61        global header_output, decoder_output, exec_output
62        cCode = carryCode[flagType]
63        vCode = overflowCode[flagType]
64        zType = "uint32_t"
65        negBit = 31
66        if flagType == "llbit":
67            zType = "uint64_t"
68            negBit = 63
69        if flagType == "overflow":
70            ccCode = calcQCode
71        else:
72            ccCode = calcCcCode % {
73                "negBit": negBit,
74                "zType": zType
75            }
76
77        if not regs in (3, 4):
78            raise Exception, "Multiplication instructions with %d " + \
79                             "registers are not implemented"
80
81        if regs == 3:
82            base = 'Mult3'
83        else:
84            base = 'Mult4'
85
86        Name = mnem.capitalize()
87
88        if unCc:
89            iop = InstObjParams(mnem, Name, base,
90                                {"code" : code,
91                                 "predicate_test": predicateTest})
92        if doCc:
93            iopCc = InstObjParams(mnem + "s", Name + "Cc", base,
94                                  {"code" : code + ccCode,
95                                   "predicate_test": condPredicateTest})
96
97        if regs == 3:
98            declare = Mult3Declare
99            constructor = Mult3Constructor
100        else:
101            declare = Mult4Declare
102            constructor = Mult4Constructor
103
104        if unCc:
105            header_output += declare.subst(iop)
106            decoder_output += constructor.subst(iop)
107            exec_output += PredOpExecute.subst(iop)
108        if doCc:
109            header_output += declare.subst(iopCc)
110            decoder_output += constructor.subst(iopCc)
111            exec_output += PredOpExecute.subst(iopCc)
112
113    def buildMult3Inst(mnem, code, flagType = "logic"):
114        buildMultInst(mnem, True, True, 3, code, flagType)
115
116    def buildMult3InstCc(mnem, code, flagType = "logic"):
117        buildMultInst(mnem, True, False, 3, code, flagType)
118
119    def buildMult3InstUnCc(mnem, code, flagType = "logic"):
120        buildMultInst(mnem, False, True, 3, code, flagType)
121
122    def buildMult4Inst(mnem, code, flagType = "logic"):
123        buildMultInst(mnem, True, True, 4, code, flagType)
124
125    def buildMult4InstCc(mnem, code, flagType = "logic"):
126        buildMultInst(mnem, True, False, 4, code, flagType)
127
128    def buildMult4InstUnCc(mnem, code, flagType = "logic"):
129        buildMultInst(mnem, False, True, 4, code, flagType)
130
131    buildMult4Inst    ("mla", "Reg0 = resTemp = Reg1 * Reg2 + Reg3;")
132    buildMult4InstUnCc("mls", "Reg0 = resTemp = Reg3 - Reg1 * Reg2;")
133    buildMult3Inst    ("mul", "Reg0 = resTemp = Reg1 * Reg2;")
134    buildMult4InstCc  ("smlabb", '''Reg0 = resTemp =
135                                        sext<16>(bits(Reg1, 15, 0)) *
136                                        sext<16>(bits(Reg2.sw, 15, 0)) +
137                                        Reg3.sw;
138                                 resTemp = bits(resTemp, 32) !=
139                                           bits(resTemp, 31);
140                                 ''', "overflow")
141    buildMult4InstCc  ("smlabt", '''Reg0 = resTemp =
142                                        sext<16>(bits(Reg1, 15, 0)) *
143                                        sext<16>(bits(Reg2.sw, 31, 16)) +
144                                        Reg3.sw;
145                                 resTemp = bits(resTemp, 32) !=
146                                           bits(resTemp, 31);
147                                 ''', "overflow")
148    buildMult4InstCc  ("smlatb", '''Reg0 = resTemp =
149                                        sext<16>(bits(Reg1, 31, 16)) *
150                                        sext<16>(bits(Reg2.sw, 15, 0)) +
151                                        Reg3.sw;
152                                 resTemp = bits(resTemp, 32) !=
153                                           bits(resTemp, 31);
154                                 ''', "overflow")
155    buildMult4InstCc  ("smlatt", '''Reg0 = resTemp =
156                                        sext<16>(bits(Reg1, 31, 16)) *
157                                        sext<16>(bits(Reg2.sw, 31, 16)) +
158                                        Reg3.sw;
159                                 resTemp = bits(resTemp, 32) !=
160                                           bits(resTemp, 31);
161                                 ''', "overflow")
162    buildMult4InstCc  ("smlad", '''Reg0 = resTemp =
163                                        sext<16>(bits(Reg1, 31, 16)) *
164                                        sext<16>(bits(Reg2, 31, 16)) +
165                                        sext<16>(bits(Reg1, 15, 0)) *
166                                        sext<16>(bits(Reg2, 15, 0)) +
167                                        Reg3.sw;
168                                    resTemp = bits(resTemp, 32) !=
169                                              bits(resTemp, 31);
170                                ''', "overflow")
171    buildMult4InstCc  ("smladx", '''Reg0 = resTemp =
172                                         sext<16>(bits(Reg1, 31, 16)) *
173                                         sext<16>(bits(Reg2, 15, 0)) +
174                                         sext<16>(bits(Reg1, 15, 0)) *
175                                         sext<16>(bits(Reg2, 31, 16)) +
176                                         Reg3.sw;
177                                    resTemp = bits(resTemp, 32) !=
178                                              bits(resTemp, 31);
179                                 ''', "overflow")
180    buildMult4Inst    ("smlal", '''resTemp = sext<32>(Reg2) * sext<32>(Reg3) +
181                                       (int64_t)((Reg1.ud << 32) | Reg0.ud);
182                                   Reg0.ud = (uint32_t)resTemp;
183                                   Reg1.ud = (uint32_t)(resTemp >> 32);
184                                ''', "llbit")
185    buildMult4InstUnCc("smlalbb", '''resTemp = sext<16>(bits(Reg2, 15, 0)) *
186                                               sext<16>(bits(Reg3, 15, 0)) +
187                                               (int64_t)((Reg1.ud << 32) |
188                                                         Reg0.ud);
189                                     Reg0.ud = (uint32_t)resTemp;
190                                     Reg1.ud = (uint32_t)(resTemp >> 32);
191                                  ''')
192    buildMult4InstUnCc("smlalbt", '''resTemp = sext<16>(bits(Reg2, 15, 0)) *
193                                               sext<16>(bits(Reg3, 31, 16)) +
194                                               (int64_t)((Reg1.ud << 32) |
195                                                         Reg0.ud);
196                                     Reg0.ud = (uint32_t)resTemp;
197                                     Reg1.ud = (uint32_t)(resTemp >> 32);
198                                  ''')
199    buildMult4InstUnCc("smlaltb", '''resTemp = sext<16>(bits(Reg2, 31, 16)) *
200                                               sext<16>(bits(Reg3, 15, 0)) +
201                                               (int64_t)((Reg1.ud << 32) |
202                                                         Reg0.ud);
203                                     Reg0.ud = (uint32_t)resTemp;
204                                     Reg1.ud = (uint32_t)(resTemp >> 32);
205                                  ''')
206    buildMult4InstUnCc("smlaltt", '''resTemp = sext<16>(bits(Reg2, 31, 16)) *
207                                               sext<16>(bits(Reg3, 31, 16)) +
208                                               (int64_t)((Reg1.ud << 32) |
209                                                         Reg0.ud);
210                                     Reg0.ud = (uint32_t)resTemp;
211                                     Reg1.ud = (uint32_t)(resTemp >> 32);
212                                  ''')
213    buildMult4InstUnCc("smlald", '''resTemp =
214                                        sext<16>(bits(Reg2, 31, 16)) *
215                                        sext<16>(bits(Reg3, 31, 16)) +
216                                        sext<16>(bits(Reg2, 15, 0)) *
217                                        sext<16>(bits(Reg3, 15, 0)) +
218                                        (int64_t)((Reg1.ud << 32) |
219                                                  Reg0.ud);
220                                    Reg0.ud = (uint32_t)resTemp;
221                                    Reg1.ud = (uint32_t)(resTemp >> 32);
222                                 ''')
223    buildMult4InstUnCc("smlaldx", '''resTemp =
224                                         sext<16>(bits(Reg2, 31, 16)) *
225                                         sext<16>(bits(Reg3, 15, 0)) +
226                                         sext<16>(bits(Reg2, 15, 0)) *
227                                         sext<16>(bits(Reg3, 31, 16)) +
228                                         (int64_t)((Reg1.ud << 32) |
229                                                   Reg0.ud);
230                                     Reg0.ud = (uint32_t)resTemp;
231                                     Reg1.ud = (uint32_t)(resTemp >> 32);
232                                  ''')
233    buildMult4InstCc  ("smlawb", '''Reg0 = resTemp =
234                                        (Reg1.sw *
235                                         sext<16>(bits(Reg2, 15, 0)) +
236                                         ((int64_t)Reg3.sw << 16)) >> 16;
237                                    resTemp = bits(resTemp, 32) !=
238                                              bits(resTemp, 31);
239                                 ''', "overflow")
240    buildMult4InstCc  ("smlawt", '''Reg0 = resTemp =
241                                        (Reg1.sw *
242                                         sext<16>(bits(Reg2, 31, 16)) +
243                                         ((int64_t)Reg3.sw << 16)) >> 16;
244                                    resTemp = bits(resTemp, 32) !=
245                                              bits(resTemp, 31);
246                                 ''', "overflow")
247    buildMult4InstCc  ("smlsd", '''Reg0 = resTemp =
248                                       sext<16>(bits(Reg1, 15, 0)) *
249                                       sext<16>(bits(Reg2, 15, 0)) -
250                                       sext<16>(bits(Reg1, 31, 16)) *
251                                       sext<16>(bits(Reg2, 31, 16)) +
252                                       Reg3.sw;
253                                    resTemp = bits(resTemp, 32) !=
254                                              bits(resTemp, 31);
255                                ''', "overflow")
256    buildMult4InstCc  ("smlsdx", '''Reg0 = resTemp =
257                                        sext<16>(bits(Reg1, 15, 0)) *
258                                        sext<16>(bits(Reg2, 31, 16)) -
259                                        sext<16>(bits(Reg1, 31, 16)) *
260                                        sext<16>(bits(Reg2, 15, 0)) +
261                                        Reg3.sw;
262                                    resTemp = bits(resTemp, 32) !=
263                                              bits(resTemp, 31);
264                                 ''', "overflow")
265    buildMult4InstUnCc("smlsld", '''resTemp =
266                                        sext<16>(bits(Reg2, 15, 0)) *
267                                        sext<16>(bits(Reg3, 15, 0)) -
268                                        sext<16>(bits(Reg2, 31, 16)) *
269                                        sext<16>(bits(Reg3, 31, 16)) +
270                                        (int64_t)((Reg1.ud << 32) |
271                                                  Reg0.ud);
272                                    Reg0.ud = (uint32_t)resTemp;
273                                    Reg1.ud = (uint32_t)(resTemp >> 32);
274                                 ''')
275    buildMult4InstUnCc("smlsldx", '''resTemp =
276                                         sext<16>(bits(Reg2, 15, 0)) *
277                                         sext<16>(bits(Reg3, 31, 16)) -
278                                         sext<16>(bits(Reg2, 31, 16)) *
279                                         sext<16>(bits(Reg3, 15, 0)) +
280                                         (int64_t)((Reg1.ud << 32) |
281                                                   Reg0.ud);
282                                     Reg0.ud = (uint32_t)resTemp;
283                                     Reg1.ud = (uint32_t)(resTemp >> 32);
284                                  ''')
285    buildMult4InstUnCc("smmla", '''Reg0 = resTemp =
286                                       ((int64_t)(Reg3.ud << 32) +
287                                        (int64_t)Reg1.sw *
288                                        (int64_t)Reg2.sw) >> 32;
289                                ''')
290    buildMult4InstUnCc("smmlar", '''Reg0 = resTemp =
291                                        ((int64_t)(Reg3.ud << 32) +
292                                         (int64_t)Reg1.sw *
293                                         (int64_t)Reg2.sw +
294                                         ULL(0x80000000)) >> 32;
295                                 ''')
296    buildMult4InstUnCc("smmls", '''Reg0 = resTemp =
297                                       ((int64_t)(Reg3.ud << 32) -
298                                        (int64_t)Reg1.sw *
299                                        (int64_t)Reg2.sw) >> 32;
300                                ''')
301    buildMult4InstUnCc("smmlsr", '''Reg0 = resTemp =
302                                        ((int64_t)(Reg3.ud << 32) -
303                                         (int64_t)Reg1.sw *
304                                         (int64_t)Reg2.sw +
305                                         ULL(0x80000000)) >> 32;
306                                 ''')
307    buildMult3InstUnCc("smmul", '''Reg0 = resTemp =
308                                       ((int64_t)Reg1.sw *
309                                        (int64_t)Reg2.sw) >> 32;
310                                ''')
311    buildMult3InstUnCc("smmulr", '''Reg0 = resTemp =
312                                        ((int64_t)Reg1.sw *
313                                         (int64_t)Reg2.sw +
314                                         ULL(0x80000000)) >> 32;
315                                 ''')
316    buildMult3InstCc  ("smuad", '''Reg0 = resTemp =
317                                        sext<16>(bits(Reg1, 15, 0)) *
318                                        sext<16>(bits(Reg2, 15, 0)) +
319                                        sext<16>(bits(Reg1, 31, 16)) *
320                                        sext<16>(bits(Reg2, 31, 16));
321                                    resTemp = bits(resTemp, 32) !=
322                                              bits(resTemp, 31);
323                                ''', "overflow")
324    buildMult3InstCc  ("smuadx", '''Reg0 = resTemp =
325                                        sext<16>(bits(Reg1, 15, 0)) *
326                                        sext<16>(bits(Reg2, 31, 16)) +
327                                        sext<16>(bits(Reg1, 31, 16)) *
328                                        sext<16>(bits(Reg2, 15, 0));
329                                    resTemp = bits(resTemp, 32) !=
330                                              bits(resTemp, 31);
331                                 ''', "overflow")
332    buildMult3InstUnCc("smulbb", '''Reg0 = resTemp =
333                                         sext<16>(bits(Reg1, 15, 0)) *
334                                         sext<16>(bits(Reg2, 15, 0));
335                                 ''')
336    buildMult3InstUnCc("smulbt", '''Reg0 = resTemp =
337                                         sext<16>(bits(Reg1, 15, 0)) *
338                                         sext<16>(bits(Reg2, 31, 16));
339                                 ''')
340    buildMult3InstUnCc("smultb", '''Reg0 = resTemp =
341                                         sext<16>(bits(Reg1, 31, 16)) *
342                                         sext<16>(bits(Reg2, 15, 0));
343                                 ''')
344    buildMult3InstUnCc("smultt", '''Reg0 = resTemp =
345                                         sext<16>(bits(Reg1, 31, 16)) *
346                                         sext<16>(bits(Reg2, 31, 16));
347                                 ''')
348    buildMult4Inst    ("smull", '''resTemp = (int64_t)Reg2.sw *
349                                             (int64_t)Reg3.sw;
350                                   Reg0 = (int32_t)resTemp;
351                                   Reg1 = (int32_t)(resTemp >> 32);
352                                ''', "llbit")
353    buildMult3InstUnCc("smulwb", '''Reg0 = resTemp =
354                                        (Reg1.sw *
355                                         sext<16>(bits(Reg2, 15, 0))) >> 16;
356                                 ''')
357    buildMult3InstUnCc("smulwt", '''Reg0 = resTemp =
358                                        (Reg1.sw *
359                                         sext<16>(bits(Reg2, 31, 16))) >> 16;
360                                 ''')
361    buildMult3InstUnCc("smusd", '''Reg0 = resTemp =
362                                        sext<16>(bits(Reg1, 15, 0)) *
363                                        sext<16>(bits(Reg2, 15, 0)) -
364                                        sext<16>(bits(Reg1, 31, 16)) *
365                                        sext<16>(bits(Reg2, 31, 16));
366                                ''')
367    buildMult3InstUnCc("smusdx", '''Reg0 = resTemp =
368                                        sext<16>(bits(Reg1, 15, 0)) *
369                                        sext<16>(bits(Reg2, 31, 16)) -
370                                        sext<16>(bits(Reg1, 31, 16)) *
371                                        sext<16>(bits(Reg2, 15, 0));
372                                 ''')
373    buildMult4InstUnCc("umaal", '''resTemp = Reg2.ud * Reg3.ud +
374                                             Reg0.ud + Reg1.ud;
375                                   Reg0.ud = (uint32_t)resTemp;
376                                   Reg1.ud = (uint32_t)(resTemp >> 32);
377                                ''')
378    buildMult4Inst    ("umlal", '''resTemp = Reg2.ud * Reg3.ud + Reg0.ud +
379                                             (Reg1.ud << 32);
380                                   Reg0.ud = (uint32_t)resTemp;
381                                   Reg1.ud = (uint32_t)(resTemp >> 32);
382                                ''', "llbit")
383    buildMult4Inst    ("umull", '''resTemp = Reg2.ud * Reg3.ud;
384                                   Reg0 = (uint32_t)resTemp;
385                                   Reg1 = (uint32_t)(resTemp >> 32);
386                                ''', "llbit")
387}};
388