fp.isa (2649:2fb859a457a2) fp.isa (2665:a124942bacb8)
1// -*- mode:c++ -*-
2
3// Copyright (c) 2003-2005 The Regents of The University of Michigan
4// All rights reserved.
5//
6// Redistribution and use in source and binary forms, with or without
7// modification, are permitted provided that the following conditions are
8// met: redistributions of source code must retain the above copyright
9// notice, this list of conditions and the following disclaimer;
10// redistributions in binary form must reproduce the above copyright
11// notice, this list of conditions and the following disclaimer in the
12// documentation and/or other materials provided with the distribution;
13// neither the name of the copyright holders nor the names of its
14// contributors may be used to endorse or promote products derived from
15// this software without specific prior written permission.
16//
17// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
1// -*- mode:c++ -*-
2
3// Copyright (c) 2003-2005 The Regents of The University of Michigan
4// All rights reserved.
5//
6// Redistribution and use in source and binary forms, with or without
7// modification, are permitted provided that the following conditions are
8// met: redistributions of source code must retain the above copyright
9// notice, this list of conditions and the following disclaimer;
10// redistributions in binary form must reproduce the above copyright
11// notice, this list of conditions and the following disclaimer in the
12// documentation and/or other materials provided with the distribution;
13// neither the name of the copyright holders nor the names of its
14// contributors may be used to endorse or promote products derived from
15// this software without specific prior written permission.
16//
17// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28//
29// Authors: Steve Reinhardt
28
29////////////////////////////////////////////////////////////////////
30//
31// Floating-point instructions
32//
33// Note that many FP-type instructions which do not support all the
34// various rounding & trapping modes use the simpler format
35// BasicOperateWithNopCheck.
36//
37
38output exec {{
39 /// Check "FP enabled" machine status bit. Called when executing any FP
40 /// instruction in full-system mode.
41 /// @retval Full-system mode: NoFault if FP is enabled, FenFault
42 /// if not. Non-full-system mode: always returns NoFault.
43#if FULL_SYSTEM
44 inline Fault checkFpEnableFault(%(CPU_exec_context)s *xc)
45 {
46 Fault fault = NoFault; // dummy... this ipr access should not fault
47 if (!EV5::ICSR_FPE(xc->readMiscRegWithEffect(AlphaISA::IPR_ICSR, fault))) {
48 fault = new FloatEnableFault;
49 }
50 return fault;
51 }
52#else
53 inline Fault checkFpEnableFault(%(CPU_exec_context)s *xc)
54 {
55 return NoFault;
56 }
57#endif
58}};
59
60output header {{
61 /**
62 * Base class for general floating-point instructions. Includes
63 * support for various Alpha rounding and trapping modes. Only FP
64 * instructions that require this support are derived from this
65 * class; the rest derive directly from AlphaStaticInst.
66 */
67 class AlphaFP : public AlphaStaticInst
68 {
69 public:
70 /// Alpha FP rounding modes.
71 enum RoundingMode {
72 Chopped = 0, ///< round toward zero
73 Minus_Infinity = 1, ///< round toward minus infinity
74 Normal = 2, ///< round to nearest (default)
75 Dynamic = 3, ///< use FPCR setting (in instruction)
76 Plus_Infinity = 3 ///< round to plus inifinity (in FPCR)
77 };
78
79 /// Alpha FP trapping modes.
80 /// For instructions that produce integer results, the
81 /// "Underflow Enable" modes really mean "Overflow Enable", and
82 /// the assembly modifier is V rather than U.
83 enum TrappingMode {
84 /// default: nothing enabled
85 Imprecise = 0, ///< no modifier
86 /// underflow/overflow traps enabled, inexact disabled
87 Underflow_Imprecise = 1, ///< /U or /V
88 Underflow_Precise = 5, ///< /SU or /SV
89 /// underflow/overflow and inexact traps enabled
90 Underflow_Inexact_Precise = 7 ///< /SUI or /SVI
91 };
92
93 protected:
94 /// Map Alpha rounding mode to C99 constants from <fenv.h>.
95 static const int alphaToC99RoundingMode[];
96
97 /// Map enum RoundingMode values to disassembly suffixes.
98 static const char *roundingModeSuffix[];
99 /// Map enum TrappingMode values to FP disassembly suffixes.
100 static const char *fpTrappingModeSuffix[];
101 /// Map enum TrappingMode values to integer disassembly suffixes.
102 static const char *intTrappingModeSuffix[];
103
104 /// This instruction's rounding mode.
105 RoundingMode roundingMode;
106 /// This instruction's trapping mode.
107 TrappingMode trappingMode;
108
109 /// Have we warned about this instruction's unsupported
110 /// rounding mode (if applicable)?
111 mutable bool warnedOnRounding;
112
113 /// Have we warned about this instruction's unsupported
114 /// trapping mode (if applicable)?
115 mutable bool warnedOnTrapping;
116
117 /// Constructor
118 AlphaFP(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
119 : AlphaStaticInst(mnem, _machInst, __opClass),
120 roundingMode((enum RoundingMode)FP_ROUNDMODE),
121 trappingMode((enum TrappingMode)FP_TRAPMODE),
122 warnedOnRounding(false),
123 warnedOnTrapping(false)
124 {
125 }
126
127 int getC99RoundingMode(uint64_t fpcr_val) const;
128
129 // This differs from the AlphaStaticInst version only in
130 // printing suffixes for non-default rounding & trapping modes.
131 std::string
132 generateDisassembly(Addr pc, const SymbolTable *symtab) const;
133 };
134
135}};
136
137
138output decoder {{
139 int
140 AlphaFP::getC99RoundingMode(uint64_t fpcr_val) const
141 {
142 if (roundingMode == Dynamic) {
143 return alphaToC99RoundingMode[bits(fpcr_val, 59, 58)];
144 }
145 else {
146 return alphaToC99RoundingMode[roundingMode];
147 }
148 }
149
150 std::string
151 AlphaFP::generateDisassembly(Addr pc, const SymbolTable *symtab) const
152 {
153 std::string mnem_str(mnemonic);
154
155#ifndef SS_COMPATIBLE_DISASSEMBLY
156 std::string suffix("");
157 suffix += ((_destRegIdx[0] >= FP_Base_DepTag)
158 ? fpTrappingModeSuffix[trappingMode]
159 : intTrappingModeSuffix[trappingMode]);
160 suffix += roundingModeSuffix[roundingMode];
161
162 if (suffix != "") {
163 mnem_str = csprintf("%s/%s", mnemonic, suffix);
164 }
165#endif
166
167 std::stringstream ss;
168 ccprintf(ss, "%-10s ", mnem_str.c_str());
169
170 // just print the first two source regs... if there's
171 // a third one, it's a read-modify-write dest (Rc),
172 // e.g. for CMOVxx
173 if (_numSrcRegs > 0) {
174 printReg(ss, _srcRegIdx[0]);
175 }
176 if (_numSrcRegs > 1) {
177 ss << ",";
178 printReg(ss, _srcRegIdx[1]);
179 }
180
181 // just print the first dest... if there's a second one,
182 // it's generally implicit
183 if (_numDestRegs > 0) {
184 if (_numSrcRegs > 0)
185 ss << ",";
186 printReg(ss, _destRegIdx[0]);
187 }
188
189 return ss.str();
190 }
191
192 const int AlphaFP::alphaToC99RoundingMode[] = {
193 FE_TOWARDZERO, // Chopped
194 FE_DOWNWARD, // Minus_Infinity
195 FE_TONEAREST, // Normal
196 FE_UPWARD // Dynamic in inst, Plus_Infinity in FPCR
197 };
198
199 const char *AlphaFP::roundingModeSuffix[] = { "c", "m", "", "d" };
200 // mark invalid trapping modes, but don't fail on them, because
201 // you could decode anything on a misspeculated path
202 const char *AlphaFP::fpTrappingModeSuffix[] =
203 { "", "u", "INVTM2", "INVTM3", "INVTM4", "su", "INVTM6", "sui" };
204 const char *AlphaFP::intTrappingModeSuffix[] =
205 { "", "v", "INVTM2", "INVTM3", "INVTM4", "sv", "INVTM6", "svi" };
206}};
207
208// FP instruction class execute method template. Handles non-standard
209// rounding modes.
210def template FloatingPointExecute {{
211 Fault %(class_name)s::execute(%(CPU_exec_context)s *xc,
212 Trace::InstRecord *traceData) const
213 {
214 if (trappingMode != Imprecise && !warnedOnTrapping) {
215 warn("%s: non-standard trapping mode not supported",
216 generateDisassembly(0, NULL));
217 warnedOnTrapping = true;
218 }
219
220 Fault fault = NoFault;
221
222 %(fp_enable_check)s;
223 %(op_decl)s;
224 %(op_rd)s;
225#if USE_FENV
226 if (roundingMode == Normal) {
227 %(code)s;
228 } else {
229 fesetround(getC99RoundingMode(
230 xc->readMiscReg(AlphaISA::Fpcr_DepTag)));
231 %(code)s;
232 fesetround(FE_TONEAREST);
233 }
234#else
235 if (roundingMode != Normal && !warnedOnRounding) {
236 warn("%s: non-standard rounding mode not supported",
237 generateDisassembly(0, NULL));
238 warnedOnRounding = true;
239 }
240 %(code)s;
241#endif
242
243 if (fault == NoFault) {
244 %(op_wb)s;
245 }
246
247 return fault;
248 }
249}};
250
251// FP instruction class execute method template where no dynamic
252// rounding mode control is needed. Like BasicExecute, but includes
253// check & warning for non-standard trapping mode.
254def template FPFixedRoundingExecute {{
255 Fault %(class_name)s::execute(%(CPU_exec_context)s *xc,
256 Trace::InstRecord *traceData) const
257 {
258 if (trappingMode != Imprecise && !warnedOnTrapping) {
259 warn("%s: non-standard trapping mode not supported",
260 generateDisassembly(0, NULL));
261 warnedOnTrapping = true;
262 }
263
264 Fault fault = NoFault;
265
266 %(fp_enable_check)s;
267 %(op_decl)s;
268 %(op_rd)s;
269 %(code)s;
270
271 if (fault == NoFault) {
272 %(op_wb)s;
273 }
274
275 return fault;
276 }
277}};
278
279def template FloatingPointDecode {{
280 {
281 AlphaStaticInst *i = new %(class_name)s(machInst);
282 if (FC == 31) {
283 i = makeNop(i);
284 }
285 return i;
286 }
287}};
288
289// General format for floating-point operate instructions:
290// - Checks trapping and rounding mode flags. Trapping modes
291// currently unimplemented (will fail).
292// - Generates NOP if FC == 31.
293def format FloatingPointOperate(code, *opt_args) {{
294 iop = InstObjParams(name, Name, 'AlphaFP', CodeBlock(code), opt_args)
295 decode_block = FloatingPointDecode.subst(iop)
296 header_output = BasicDeclare.subst(iop)
297 decoder_output = BasicConstructor.subst(iop)
298 exec_output = FloatingPointExecute.subst(iop)
299}};
300
301// Special format for cvttq where rounding mode is pre-decoded
302def format FPFixedRounding(code, class_suffix, *opt_args) {{
303 Name += class_suffix
304 iop = InstObjParams(name, Name, 'AlphaFP', CodeBlock(code), opt_args)
305 decode_block = FloatingPointDecode.subst(iop)
306 header_output = BasicDeclare.subst(iop)
307 decoder_output = BasicConstructor.subst(iop)
308 exec_output = FPFixedRoundingExecute.subst(iop)
309}};
310
30
31////////////////////////////////////////////////////////////////////
32//
33// Floating-point instructions
34//
35// Note that many FP-type instructions which do not support all the
36// various rounding & trapping modes use the simpler format
37// BasicOperateWithNopCheck.
38//
39
40output exec {{
41 /// Check "FP enabled" machine status bit. Called when executing any FP
42 /// instruction in full-system mode.
43 /// @retval Full-system mode: NoFault if FP is enabled, FenFault
44 /// if not. Non-full-system mode: always returns NoFault.
45#if FULL_SYSTEM
46 inline Fault checkFpEnableFault(%(CPU_exec_context)s *xc)
47 {
48 Fault fault = NoFault; // dummy... this ipr access should not fault
49 if (!EV5::ICSR_FPE(xc->readMiscRegWithEffect(AlphaISA::IPR_ICSR, fault))) {
50 fault = new FloatEnableFault;
51 }
52 return fault;
53 }
54#else
55 inline Fault checkFpEnableFault(%(CPU_exec_context)s *xc)
56 {
57 return NoFault;
58 }
59#endif
60}};
61
62output header {{
63 /**
64 * Base class for general floating-point instructions. Includes
65 * support for various Alpha rounding and trapping modes. Only FP
66 * instructions that require this support are derived from this
67 * class; the rest derive directly from AlphaStaticInst.
68 */
69 class AlphaFP : public AlphaStaticInst
70 {
71 public:
72 /// Alpha FP rounding modes.
73 enum RoundingMode {
74 Chopped = 0, ///< round toward zero
75 Minus_Infinity = 1, ///< round toward minus infinity
76 Normal = 2, ///< round to nearest (default)
77 Dynamic = 3, ///< use FPCR setting (in instruction)
78 Plus_Infinity = 3 ///< round to plus inifinity (in FPCR)
79 };
80
81 /// Alpha FP trapping modes.
82 /// For instructions that produce integer results, the
83 /// "Underflow Enable" modes really mean "Overflow Enable", and
84 /// the assembly modifier is V rather than U.
85 enum TrappingMode {
86 /// default: nothing enabled
87 Imprecise = 0, ///< no modifier
88 /// underflow/overflow traps enabled, inexact disabled
89 Underflow_Imprecise = 1, ///< /U or /V
90 Underflow_Precise = 5, ///< /SU or /SV
91 /// underflow/overflow and inexact traps enabled
92 Underflow_Inexact_Precise = 7 ///< /SUI or /SVI
93 };
94
95 protected:
96 /// Map Alpha rounding mode to C99 constants from <fenv.h>.
97 static const int alphaToC99RoundingMode[];
98
99 /// Map enum RoundingMode values to disassembly suffixes.
100 static const char *roundingModeSuffix[];
101 /// Map enum TrappingMode values to FP disassembly suffixes.
102 static const char *fpTrappingModeSuffix[];
103 /// Map enum TrappingMode values to integer disassembly suffixes.
104 static const char *intTrappingModeSuffix[];
105
106 /// This instruction's rounding mode.
107 RoundingMode roundingMode;
108 /// This instruction's trapping mode.
109 TrappingMode trappingMode;
110
111 /// Have we warned about this instruction's unsupported
112 /// rounding mode (if applicable)?
113 mutable bool warnedOnRounding;
114
115 /// Have we warned about this instruction's unsupported
116 /// trapping mode (if applicable)?
117 mutable bool warnedOnTrapping;
118
119 /// Constructor
120 AlphaFP(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
121 : AlphaStaticInst(mnem, _machInst, __opClass),
122 roundingMode((enum RoundingMode)FP_ROUNDMODE),
123 trappingMode((enum TrappingMode)FP_TRAPMODE),
124 warnedOnRounding(false),
125 warnedOnTrapping(false)
126 {
127 }
128
129 int getC99RoundingMode(uint64_t fpcr_val) const;
130
131 // This differs from the AlphaStaticInst version only in
132 // printing suffixes for non-default rounding & trapping modes.
133 std::string
134 generateDisassembly(Addr pc, const SymbolTable *symtab) const;
135 };
136
137}};
138
139
140output decoder {{
141 int
142 AlphaFP::getC99RoundingMode(uint64_t fpcr_val) const
143 {
144 if (roundingMode == Dynamic) {
145 return alphaToC99RoundingMode[bits(fpcr_val, 59, 58)];
146 }
147 else {
148 return alphaToC99RoundingMode[roundingMode];
149 }
150 }
151
152 std::string
153 AlphaFP::generateDisassembly(Addr pc, const SymbolTable *symtab) const
154 {
155 std::string mnem_str(mnemonic);
156
157#ifndef SS_COMPATIBLE_DISASSEMBLY
158 std::string suffix("");
159 suffix += ((_destRegIdx[0] >= FP_Base_DepTag)
160 ? fpTrappingModeSuffix[trappingMode]
161 : intTrappingModeSuffix[trappingMode]);
162 suffix += roundingModeSuffix[roundingMode];
163
164 if (suffix != "") {
165 mnem_str = csprintf("%s/%s", mnemonic, suffix);
166 }
167#endif
168
169 std::stringstream ss;
170 ccprintf(ss, "%-10s ", mnem_str.c_str());
171
172 // just print the first two source regs... if there's
173 // a third one, it's a read-modify-write dest (Rc),
174 // e.g. for CMOVxx
175 if (_numSrcRegs > 0) {
176 printReg(ss, _srcRegIdx[0]);
177 }
178 if (_numSrcRegs > 1) {
179 ss << ",";
180 printReg(ss, _srcRegIdx[1]);
181 }
182
183 // just print the first dest... if there's a second one,
184 // it's generally implicit
185 if (_numDestRegs > 0) {
186 if (_numSrcRegs > 0)
187 ss << ",";
188 printReg(ss, _destRegIdx[0]);
189 }
190
191 return ss.str();
192 }
193
194 const int AlphaFP::alphaToC99RoundingMode[] = {
195 FE_TOWARDZERO, // Chopped
196 FE_DOWNWARD, // Minus_Infinity
197 FE_TONEAREST, // Normal
198 FE_UPWARD // Dynamic in inst, Plus_Infinity in FPCR
199 };
200
201 const char *AlphaFP::roundingModeSuffix[] = { "c", "m", "", "d" };
202 // mark invalid trapping modes, but don't fail on them, because
203 // you could decode anything on a misspeculated path
204 const char *AlphaFP::fpTrappingModeSuffix[] =
205 { "", "u", "INVTM2", "INVTM3", "INVTM4", "su", "INVTM6", "sui" };
206 const char *AlphaFP::intTrappingModeSuffix[] =
207 { "", "v", "INVTM2", "INVTM3", "INVTM4", "sv", "INVTM6", "svi" };
208}};
209
210// FP instruction class execute method template. Handles non-standard
211// rounding modes.
212def template FloatingPointExecute {{
213 Fault %(class_name)s::execute(%(CPU_exec_context)s *xc,
214 Trace::InstRecord *traceData) const
215 {
216 if (trappingMode != Imprecise && !warnedOnTrapping) {
217 warn("%s: non-standard trapping mode not supported",
218 generateDisassembly(0, NULL));
219 warnedOnTrapping = true;
220 }
221
222 Fault fault = NoFault;
223
224 %(fp_enable_check)s;
225 %(op_decl)s;
226 %(op_rd)s;
227#if USE_FENV
228 if (roundingMode == Normal) {
229 %(code)s;
230 } else {
231 fesetround(getC99RoundingMode(
232 xc->readMiscReg(AlphaISA::Fpcr_DepTag)));
233 %(code)s;
234 fesetround(FE_TONEAREST);
235 }
236#else
237 if (roundingMode != Normal && !warnedOnRounding) {
238 warn("%s: non-standard rounding mode not supported",
239 generateDisassembly(0, NULL));
240 warnedOnRounding = true;
241 }
242 %(code)s;
243#endif
244
245 if (fault == NoFault) {
246 %(op_wb)s;
247 }
248
249 return fault;
250 }
251}};
252
253// FP instruction class execute method template where no dynamic
254// rounding mode control is needed. Like BasicExecute, but includes
255// check & warning for non-standard trapping mode.
256def template FPFixedRoundingExecute {{
257 Fault %(class_name)s::execute(%(CPU_exec_context)s *xc,
258 Trace::InstRecord *traceData) const
259 {
260 if (trappingMode != Imprecise && !warnedOnTrapping) {
261 warn("%s: non-standard trapping mode not supported",
262 generateDisassembly(0, NULL));
263 warnedOnTrapping = true;
264 }
265
266 Fault fault = NoFault;
267
268 %(fp_enable_check)s;
269 %(op_decl)s;
270 %(op_rd)s;
271 %(code)s;
272
273 if (fault == NoFault) {
274 %(op_wb)s;
275 }
276
277 return fault;
278 }
279}};
280
281def template FloatingPointDecode {{
282 {
283 AlphaStaticInst *i = new %(class_name)s(machInst);
284 if (FC == 31) {
285 i = makeNop(i);
286 }
287 return i;
288 }
289}};
290
291// General format for floating-point operate instructions:
292// - Checks trapping and rounding mode flags. Trapping modes
293// currently unimplemented (will fail).
294// - Generates NOP if FC == 31.
295def format FloatingPointOperate(code, *opt_args) {{
296 iop = InstObjParams(name, Name, 'AlphaFP', CodeBlock(code), opt_args)
297 decode_block = FloatingPointDecode.subst(iop)
298 header_output = BasicDeclare.subst(iop)
299 decoder_output = BasicConstructor.subst(iop)
300 exec_output = FloatingPointExecute.subst(iop)
301}};
302
303// Special format for cvttq where rounding mode is pre-decoded
304def format FPFixedRounding(code, class_suffix, *opt_args) {{
305 Name += class_suffix
306 iop = InstObjParams(name, Name, 'AlphaFP', CodeBlock(code), opt_args)
307 decode_block = FloatingPointDecode.subst(iop)
308 header_output = BasicDeclare.subst(iop)
309 decoder_output = BasicConstructor.subst(iop)
310 exec_output = FPFixedRoundingExecute.subst(iop)
311}};
312