base_dyn_inst.hh revision 12768:9a299ec956ac
1/* 2 * Copyright (c) 2011,2013,2016 ARM Limited 3 * Copyright (c) 2013 Advanced Micro Devices, Inc. 4 * All rights reserved. 5 * 6 * The license below extends only to copyright in the software and shall 7 * not be construed as granting a license to any other intellectual 8 * property including but not limited to intellectual property relating 9 * to a hardware implementation of the functionality of the software 10 * licensed hereunder. You may use the software subject to the license 11 * terms below provided that you ensure that this notice is replicated 12 * unmodified and in its entirety in all distributions of the software, 13 * modified or unmodified, in source code or in binary form. 14 * 15 * Copyright (c) 2004-2006 The Regents of The University of Michigan 16 * Copyright (c) 2009 The University of Edinburgh 17 * All rights reserved. 18 * 19 * Redistribution and use in source and binary forms, with or without 20 * modification, are permitted provided that the following conditions are 21 * met: redistributions of source code must retain the above copyright 22 * notice, this list of conditions and the following disclaimer; 23 * redistributions in binary form must reproduce the above copyright 24 * notice, this list of conditions and the following disclaimer in the 25 * documentation and/or other materials provided with the distribution; 26 * neither the name of the copyright holders nor the names of its 27 * contributors may be used to endorse or promote products derived from 28 * this software without specific prior written permission. 29 * 30 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 31 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 32 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 33 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 34 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 35 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 36 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 37 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 38 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 39 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 40 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 41 * 42 * Authors: Kevin Lim 43 * Timothy M. Jones 44 */ 45 46#ifndef __CPU_BASE_DYN_INST_HH__ 47#define __CPU_BASE_DYN_INST_HH__ 48 49#include <array> 50#include <bitset> 51#include <deque> 52#include <list> 53#include <string> 54 55#include "arch/generic/tlb.hh" 56#include "arch/utility.hh" 57#include "base/trace.hh" 58#include "config/the_isa.hh" 59#include "cpu/checker/cpu.hh" 60#include "cpu/exec_context.hh" 61#include "cpu/exetrace.hh" 62#include "cpu/inst_res.hh" 63#include "cpu/inst_seq.hh" 64#include "cpu/o3/comm.hh" 65#include "cpu/op_class.hh" 66#include "cpu/static_inst.hh" 67#include "cpu/translation.hh" 68#include "mem/packet.hh" 69#include "mem/request.hh" 70#include "sim/byteswap.hh" 71#include "sim/system.hh" 72 73/** 74 * @file 75 * Defines a dynamic instruction context. 76 */ 77 78template <class Impl> 79class BaseDynInst : public ExecContext, public RefCounted 80{ 81 public: 82 // Typedef for the CPU. 83 typedef typename Impl::CPUType ImplCPU; 84 typedef typename ImplCPU::ImplState ImplState; 85 using VecRegContainer = TheISA::VecRegContainer; 86 87 // The DynInstPtr type. 88 typedef typename Impl::DynInstPtr DynInstPtr; 89 typedef RefCountingPtr<BaseDynInst<Impl> > BaseDynInstPtr; 90 91 // The list of instructions iterator type. 92 typedef typename std::list<DynInstPtr>::iterator ListIt; 93 94 enum { 95 MaxInstSrcRegs = TheISA::MaxInstSrcRegs, /// Max source regs 96 MaxInstDestRegs = TheISA::MaxInstDestRegs /// Max dest regs 97 }; 98 99 protected: 100 enum Status { 101 IqEntry, /// Instruction is in the IQ 102 RobEntry, /// Instruction is in the ROB 103 LsqEntry, /// Instruction is in the LSQ 104 Completed, /// Instruction has completed 105 ResultReady, /// Instruction has its result 106 CanIssue, /// Instruction can issue and execute 107 Issued, /// Instruction has issued 108 Executed, /// Instruction has executed 109 CanCommit, /// Instruction can commit 110 AtCommit, /// Instruction has reached commit 111 Committed, /// Instruction has committed 112 Squashed, /// Instruction is squashed 113 SquashedInIQ, /// Instruction is squashed in the IQ 114 SquashedInLSQ, /// Instruction is squashed in the LSQ 115 SquashedInROB, /// Instruction is squashed in the ROB 116 RecoverInst, /// Is a recover instruction 117 BlockingInst, /// Is a blocking instruction 118 ThreadsyncWait, /// Is a thread synchronization instruction 119 SerializeBefore, /// Needs to serialize on 120 /// instructions ahead of it 121 SerializeAfter, /// Needs to serialize instructions behind it 122 SerializeHandled, /// Serialization has been handled 123 NumStatus 124 }; 125 126 enum Flags { 127 NotAnInst, 128 TranslationStarted, 129 TranslationCompleted, 130 PossibleLoadViolation, 131 HitExternalSnoop, 132 EffAddrValid, 133 RecordResult, 134 Predicate, 135 PredTaken, 136 IsStrictlyOrdered, 137 ReqMade, 138 MemOpDone, 139 MaxFlags 140 }; 141 142 public: 143 /** The sequence number of the instruction. */ 144 InstSeqNum seqNum; 145 146 /** The StaticInst used by this BaseDynInst. */ 147 const StaticInstPtr staticInst; 148 149 /** Pointer to the Impl's CPU object. */ 150 ImplCPU *cpu; 151 152 BaseCPU *getCpuPtr() { return cpu; } 153 154 /** Pointer to the thread state. */ 155 ImplState *thread; 156 157 /** The kind of fault this instruction has generated. */ 158 Fault fault; 159 160 /** InstRecord that tracks this instructions. */ 161 Trace::InstRecord *traceData; 162 163 protected: 164 /** The result of the instruction; assumes an instruction can have many 165 * destination registers. 166 */ 167 std::queue<InstResult> instResult; 168 169 /** PC state for this instruction. */ 170 TheISA::PCState pc; 171 172 /* An amalgamation of a lot of boolean values into one */ 173 std::bitset<MaxFlags> instFlags; 174 175 /** The status of this BaseDynInst. Several bits can be set. */ 176 std::bitset<NumStatus> status; 177 178 /** Whether or not the source register is ready. 179 * @todo: Not sure this should be here vs the derived class. 180 */ 181 std::bitset<MaxInstSrcRegs> _readySrcRegIdx; 182 183 public: 184 /** The thread this instruction is from. */ 185 ThreadID threadNumber; 186 187 /** Iterator pointing to this BaseDynInst in the list of all insts. */ 188 ListIt instListIt; 189 190 ////////////////////// Branch Data /////////////// 191 /** Predicted PC state after this instruction. */ 192 TheISA::PCState predPC; 193 194 /** The Macroop if one exists */ 195 const StaticInstPtr macroop; 196 197 /** How many source registers are ready. */ 198 uint8_t readyRegs; 199 200 public: 201 /////////////////////// Load Store Data ////////////////////// 202 /** The effective virtual address (lds & stores only). */ 203 Addr effAddr; 204 205 /** The effective physical address. */ 206 Addr physEffAddrLow; 207 208 /** The effective physical address 209 * of the second request for a split request 210 */ 211 Addr physEffAddrHigh; 212 213 /** The memory request flags (from translation). */ 214 unsigned memReqFlags; 215 216 /** data address space ID, for loads & stores. */ 217 short asid; 218 219 /** The size of the request */ 220 uint8_t effSize; 221 222 /** Pointer to the data for the memory access. */ 223 uint8_t *memData; 224 225 /** Load queue index. */ 226 int16_t lqIdx; 227 228 /** Store queue index. */ 229 int16_t sqIdx; 230 231 232 /////////////////////// TLB Miss ////////////////////// 233 /** 234 * Saved memory requests (needed when the DTB address translation is 235 * delayed due to a hw page table walk). 236 */ 237 RequestPtr savedReq; 238 RequestPtr savedSreqLow; 239 RequestPtr savedSreqHigh; 240 241 /////////////////////// Checker ////////////////////// 242 // Need a copy of main request pointer to verify on writes. 243 RequestPtr reqToVerify; 244 245 protected: 246 /** Flattened register index of the destination registers of this 247 * instruction. 248 */ 249 std::array<RegId, TheISA::MaxInstDestRegs> _flatDestRegIdx; 250 251 /** Physical register index of the destination registers of this 252 * instruction. 253 */ 254 std::array<PhysRegIdPtr, TheISA::MaxInstDestRegs> _destRegIdx; 255 256 /** Physical register index of the source registers of this 257 * instruction. 258 */ 259 std::array<PhysRegIdPtr, TheISA::MaxInstSrcRegs> _srcRegIdx; 260 261 /** Physical register index of the previous producers of the 262 * architected destinations. 263 */ 264 std::array<PhysRegIdPtr, TheISA::MaxInstDestRegs> _prevDestRegIdx; 265 266 267 public: 268 /** Records changes to result? */ 269 void recordResult(bool f) { instFlags[RecordResult] = f; } 270 271 /** Is the effective virtual address valid. */ 272 bool effAddrValid() const { return instFlags[EffAddrValid]; } 273 274 /** Whether or not the memory operation is done. */ 275 bool memOpDone() const { return instFlags[MemOpDone]; } 276 void memOpDone(bool f) { instFlags[MemOpDone] = f; } 277 278 bool notAnInst() const { return instFlags[NotAnInst]; } 279 void setNotAnInst() { instFlags[NotAnInst] = true; } 280 281 282 //////////////////////////////////////////// 283 // 284 // INSTRUCTION EXECUTION 285 // 286 //////////////////////////////////////////// 287 288 void demapPage(Addr vaddr, uint64_t asn) 289 { 290 cpu->demapPage(vaddr, asn); 291 } 292 void demapInstPage(Addr vaddr, uint64_t asn) 293 { 294 cpu->demapPage(vaddr, asn); 295 } 296 void demapDataPage(Addr vaddr, uint64_t asn) 297 { 298 cpu->demapPage(vaddr, asn); 299 } 300 301 Fault initiateMemRead(Addr addr, unsigned size, Request::Flags flags); 302 303 Fault writeMem(uint8_t *data, unsigned size, Addr addr, 304 Request::Flags flags, uint64_t *res); 305 306 /** Splits a request in two if it crosses a dcache block. */ 307 void splitRequest(const RequestPtr &req, RequestPtr &sreqLow, 308 RequestPtr &sreqHigh); 309 310 /** Initiate a DTB address translation. */ 311 void initiateTranslation(const RequestPtr &req, const RequestPtr &sreqLow, 312 const RequestPtr &sreqHigh, uint64_t *res, 313 BaseTLB::Mode mode); 314 315 /** Finish a DTB address translation. */ 316 void finishTranslation(WholeTranslationState *state); 317 318 /** True if the DTB address translation has started. */ 319 bool translationStarted() const { return instFlags[TranslationStarted]; } 320 void translationStarted(bool f) { instFlags[TranslationStarted] = f; } 321 322 /** True if the DTB address translation has completed. */ 323 bool translationCompleted() const { return instFlags[TranslationCompleted]; } 324 void translationCompleted(bool f) { instFlags[TranslationCompleted] = f; } 325 326 /** True if this address was found to match a previous load and they issued 327 * out of order. If that happend, then it's only a problem if an incoming 328 * snoop invalidate modifies the line, in which case we need to squash. 329 * If nothing modified the line the order doesn't matter. 330 */ 331 bool possibleLoadViolation() const { return instFlags[PossibleLoadViolation]; } 332 void possibleLoadViolation(bool f) { instFlags[PossibleLoadViolation] = f; } 333 334 /** True if the address hit a external snoop while sitting in the LSQ. 335 * If this is true and a older instruction sees it, this instruction must 336 * reexecute 337 */ 338 bool hitExternalSnoop() const { return instFlags[HitExternalSnoop]; } 339 void hitExternalSnoop(bool f) { instFlags[HitExternalSnoop] = f; } 340 341 /** 342 * Returns true if the DTB address translation is being delayed due to a hw 343 * page table walk. 344 */ 345 bool isTranslationDelayed() const 346 { 347 return (translationStarted() && !translationCompleted()); 348 } 349 350 public: 351#ifdef DEBUG 352 void dumpSNList(); 353#endif 354 355 /** Returns the physical register index of the i'th destination 356 * register. 357 */ 358 PhysRegIdPtr renamedDestRegIdx(int idx) const 359 { 360 return _destRegIdx[idx]; 361 } 362 363 /** Returns the physical register index of the i'th source register. */ 364 PhysRegIdPtr renamedSrcRegIdx(int idx) const 365 { 366 assert(TheISA::MaxInstSrcRegs > idx); 367 return _srcRegIdx[idx]; 368 } 369 370 /** Returns the flattened register index of the i'th destination 371 * register. 372 */ 373 const RegId& flattenedDestRegIdx(int idx) const 374 { 375 return _flatDestRegIdx[idx]; 376 } 377 378 /** Returns the physical register index of the previous physical register 379 * that remapped to the same logical register index. 380 */ 381 PhysRegIdPtr prevDestRegIdx(int idx) const 382 { 383 return _prevDestRegIdx[idx]; 384 } 385 386 /** Renames a destination register to a physical register. Also records 387 * the previous physical register that the logical register mapped to. 388 */ 389 void renameDestReg(int idx, 390 PhysRegIdPtr renamed_dest, 391 PhysRegIdPtr previous_rename) 392 { 393 _destRegIdx[idx] = renamed_dest; 394 _prevDestRegIdx[idx] = previous_rename; 395 } 396 397 /** Renames a source logical register to the physical register which 398 * has/will produce that logical register's result. 399 * @todo: add in whether or not the source register is ready. 400 */ 401 void renameSrcReg(int idx, PhysRegIdPtr renamed_src) 402 { 403 _srcRegIdx[idx] = renamed_src; 404 } 405 406 /** Flattens a destination architectural register index into a logical 407 * index. 408 */ 409 void flattenDestReg(int idx, const RegId& flattened_dest) 410 { 411 _flatDestRegIdx[idx] = flattened_dest; 412 } 413 /** BaseDynInst constructor given a binary instruction. 414 * @param staticInst A StaticInstPtr to the underlying instruction. 415 * @param pc The PC state for the instruction. 416 * @param predPC The predicted next PC state for the instruction. 417 * @param seq_num The sequence number of the instruction. 418 * @param cpu Pointer to the instruction's CPU. 419 */ 420 BaseDynInst(const StaticInstPtr &staticInst, const StaticInstPtr ¯oop, 421 TheISA::PCState pc, TheISA::PCState predPC, 422 InstSeqNum seq_num, ImplCPU *cpu); 423 424 /** BaseDynInst constructor given a StaticInst pointer. 425 * @param _staticInst The StaticInst for this BaseDynInst. 426 */ 427 BaseDynInst(const StaticInstPtr &staticInst, const StaticInstPtr ¯oop); 428 429 /** BaseDynInst destructor. */ 430 ~BaseDynInst(); 431 432 private: 433 /** Function to initialize variables in the constructors. */ 434 void initVars(); 435 436 public: 437 /** Dumps out contents of this BaseDynInst. */ 438 void dump(); 439 440 /** Dumps out contents of this BaseDynInst into given string. */ 441 void dump(std::string &outstring); 442 443 /** Read this CPU's ID. */ 444 int cpuId() const { return cpu->cpuId(); } 445 446 /** Read this CPU's Socket ID. */ 447 uint32_t socketId() const { return cpu->socketId(); } 448 449 /** Read this CPU's data requestor ID */ 450 MasterID masterId() const { return cpu->dataMasterId(); } 451 452 /** Read this context's system-wide ID **/ 453 ContextID contextId() const { return thread->contextId(); } 454 455 /** Returns the fault type. */ 456 Fault getFault() const { return fault; } 457 458 /** Checks whether or not this instruction has had its branch target 459 * calculated yet. For now it is not utilized and is hacked to be 460 * always false. 461 * @todo: Actually use this instruction. 462 */ 463 bool doneTargCalc() { return false; } 464 465 /** Set the predicted target of this current instruction. */ 466 void setPredTarg(const TheISA::PCState &_predPC) 467 { 468 predPC = _predPC; 469 } 470 471 const TheISA::PCState &readPredTarg() { return predPC; } 472 473 /** Returns the predicted PC immediately after the branch. */ 474 Addr predInstAddr() { return predPC.instAddr(); } 475 476 /** Returns the predicted PC two instructions after the branch */ 477 Addr predNextInstAddr() { return predPC.nextInstAddr(); } 478 479 /** Returns the predicted micro PC after the branch */ 480 Addr predMicroPC() { return predPC.microPC(); } 481 482 /** Returns whether the instruction was predicted taken or not. */ 483 bool readPredTaken() 484 { 485 return instFlags[PredTaken]; 486 } 487 488 void setPredTaken(bool predicted_taken) 489 { 490 instFlags[PredTaken] = predicted_taken; 491 } 492 493 /** Returns whether the instruction mispredicted. */ 494 bool mispredicted() 495 { 496 TheISA::PCState tempPC = pc; 497 TheISA::advancePC(tempPC, staticInst); 498 return !(tempPC == predPC); 499 } 500 501 // 502 // Instruction types. Forward checks to StaticInst object. 503 // 504 bool isNop() const { return staticInst->isNop(); } 505 bool isMemRef() const { return staticInst->isMemRef(); } 506 bool isLoad() const { return staticInst->isLoad(); } 507 bool isStore() const { return staticInst->isStore(); } 508 bool isAtomic() const { return staticInst->isAtomic(); } 509 bool isStoreConditional() const 510 { return staticInst->isStoreConditional(); } 511 bool isInstPrefetch() const { return staticInst->isInstPrefetch(); } 512 bool isDataPrefetch() const { return staticInst->isDataPrefetch(); } 513 bool isInteger() const { return staticInst->isInteger(); } 514 bool isFloating() const { return staticInst->isFloating(); } 515 bool isVector() const { return staticInst->isVector(); } 516 bool isControl() const { return staticInst->isControl(); } 517 bool isCall() const { return staticInst->isCall(); } 518 bool isReturn() const { return staticInst->isReturn(); } 519 bool isDirectCtrl() const { return staticInst->isDirectCtrl(); } 520 bool isIndirectCtrl() const { return staticInst->isIndirectCtrl(); } 521 bool isCondCtrl() const { return staticInst->isCondCtrl(); } 522 bool isUncondCtrl() const { return staticInst->isUncondCtrl(); } 523 bool isCondDelaySlot() const { return staticInst->isCondDelaySlot(); } 524 bool isThreadSync() const { return staticInst->isThreadSync(); } 525 bool isSerializing() const { return staticInst->isSerializing(); } 526 bool isSerializeBefore() const 527 { return staticInst->isSerializeBefore() || status[SerializeBefore]; } 528 bool isSerializeAfter() const 529 { return staticInst->isSerializeAfter() || status[SerializeAfter]; } 530 bool isSquashAfter() const { return staticInst->isSquashAfter(); } 531 bool isMemBarrier() const { return staticInst->isMemBarrier(); } 532 bool isWriteBarrier() const { return staticInst->isWriteBarrier(); } 533 bool isNonSpeculative() const { return staticInst->isNonSpeculative(); } 534 bool isQuiesce() const { return staticInst->isQuiesce(); } 535 bool isIprAccess() const { return staticInst->isIprAccess(); } 536 bool isUnverifiable() const { return staticInst->isUnverifiable(); } 537 bool isSyscall() const { return staticInst->isSyscall(); } 538 bool isMacroop() const { return staticInst->isMacroop(); } 539 bool isMicroop() const { return staticInst->isMicroop(); } 540 bool isDelayedCommit() const { return staticInst->isDelayedCommit(); } 541 bool isLastMicroop() const { return staticInst->isLastMicroop(); } 542 bool isFirstMicroop() const { return staticInst->isFirstMicroop(); } 543 bool isMicroBranch() const { return staticInst->isMicroBranch(); } 544 545 /** Temporarily sets this instruction as a serialize before instruction. */ 546 void setSerializeBefore() { status.set(SerializeBefore); } 547 548 /** Clears the serializeBefore part of this instruction. */ 549 void clearSerializeBefore() { status.reset(SerializeBefore); } 550 551 /** Checks if this serializeBefore is only temporarily set. */ 552 bool isTempSerializeBefore() { return status[SerializeBefore]; } 553 554 /** Temporarily sets this instruction as a serialize after instruction. */ 555 void setSerializeAfter() { status.set(SerializeAfter); } 556 557 /** Clears the serializeAfter part of this instruction.*/ 558 void clearSerializeAfter() { status.reset(SerializeAfter); } 559 560 /** Checks if this serializeAfter is only temporarily set. */ 561 bool isTempSerializeAfter() { return status[SerializeAfter]; } 562 563 /** Sets the serialization part of this instruction as handled. */ 564 void setSerializeHandled() { status.set(SerializeHandled); } 565 566 /** Checks if the serialization part of this instruction has been 567 * handled. This does not apply to the temporary serializing 568 * state; it only applies to this instruction's own permanent 569 * serializing state. 570 */ 571 bool isSerializeHandled() { return status[SerializeHandled]; } 572 573 /** Returns the opclass of this instruction. */ 574 OpClass opClass() const { return staticInst->opClass(); } 575 576 /** Returns the branch target address. */ 577 TheISA::PCState branchTarget() const 578 { return staticInst->branchTarget(pc); } 579 580 /** Returns the number of source registers. */ 581 int8_t numSrcRegs() const { return staticInst->numSrcRegs(); } 582 583 /** Returns the number of destination registers. */ 584 int8_t numDestRegs() const { return staticInst->numDestRegs(); } 585 586 // the following are used to track physical register usage 587 // for machines with separate int & FP reg files 588 int8_t numFPDestRegs() const { return staticInst->numFPDestRegs(); } 589 int8_t numIntDestRegs() const { return staticInst->numIntDestRegs(); } 590 int8_t numCCDestRegs() const { return staticInst->numCCDestRegs(); } 591 int8_t numVecDestRegs() const { return staticInst->numVecDestRegs(); } 592 int8_t numVecElemDestRegs() const { 593 return staticInst->numVecElemDestRegs(); 594 } 595 596 /** Returns the logical register index of the i'th destination register. */ 597 const RegId& destRegIdx(int i) const { return staticInst->destRegIdx(i); } 598 599 /** Returns the logical register index of the i'th source register. */ 600 const RegId& srcRegIdx(int i) const { return staticInst->srcRegIdx(i); } 601 602 /** Return the size of the instResult queue. */ 603 uint8_t resultSize() { return instResult.size(); } 604 605 /** Pops a result off the instResult queue. 606 * If the result stack is empty, return the default value. 607 * */ 608 InstResult popResult(InstResult dflt = InstResult()) 609 { 610 if (!instResult.empty()) { 611 InstResult t = instResult.front(); 612 instResult.pop(); 613 return t; 614 } 615 return dflt; 616 } 617 618 /** Pushes a result onto the instResult queue. */ 619 /** @{ */ 620 /** Scalar result. */ 621 template<typename T> 622 void setScalarResult(T&& t) 623 { 624 if (instFlags[RecordResult]) { 625 instResult.push(InstResult(std::forward<T>(t), 626 InstResult::ResultType::Scalar)); 627 } 628 } 629 630 /** Full vector result. */ 631 template<typename T> 632 void setVecResult(T&& t) 633 { 634 if (instFlags[RecordResult]) { 635 instResult.push(InstResult(std::forward<T>(t), 636 InstResult::ResultType::VecReg)); 637 } 638 } 639 640 /** Vector element result. */ 641 template<typename T> 642 void setVecElemResult(T&& t) 643 { 644 if (instFlags[RecordResult]) { 645 instResult.push(InstResult(std::forward<T>(t), 646 InstResult::ResultType::VecElem)); 647 } 648 } 649 /** @} */ 650 651 /** Records an integer register being set to a value. */ 652 void setIntRegOperand(const StaticInst *si, int idx, IntReg val) 653 { 654 setScalarResult(val); 655 } 656 657 /** Records a CC register being set to a value. */ 658 void setCCRegOperand(const StaticInst *si, int idx, CCReg val) 659 { 660 setScalarResult(val); 661 } 662 663 /** Records an fp register being set to a value. */ 664 void setFloatRegOperand(const StaticInst *si, int idx, FloatReg val) 665 { 666 setScalarResult(val); 667 } 668 669 /** Record a vector register being set to a value */ 670 void setVecRegOperand(const StaticInst *si, int idx, 671 const VecRegContainer& val) 672 { 673 setVecResult(val); 674 } 675 676 /** Records an fp register being set to an integer value. */ 677 void 678 setFloatRegOperandBits(const StaticInst *si, int idx, FloatRegBits val) 679 { 680 setScalarResult(val); 681 } 682 683 /** Record a vector register being set to a value */ 684 void setVecElemOperand(const StaticInst *si, int idx, const VecElem val) 685 { 686 setVecElemResult(val); 687 } 688 689 /** Records that one of the source registers is ready. */ 690 void markSrcRegReady(); 691 692 /** Marks a specific register as ready. */ 693 void markSrcRegReady(RegIndex src_idx); 694 695 /** Returns if a source register is ready. */ 696 bool isReadySrcRegIdx(int idx) const 697 { 698 return this->_readySrcRegIdx[idx]; 699 } 700 701 /** Sets this instruction as completed. */ 702 void setCompleted() { status.set(Completed); } 703 704 /** Returns whether or not this instruction is completed. */ 705 bool isCompleted() const { return status[Completed]; } 706 707 /** Marks the result as ready. */ 708 void setResultReady() { status.set(ResultReady); } 709 710 /** Returns whether or not the result is ready. */ 711 bool isResultReady() const { return status[ResultReady]; } 712 713 /** Sets this instruction as ready to issue. */ 714 void setCanIssue() { status.set(CanIssue); } 715 716 /** Returns whether or not this instruction is ready to issue. */ 717 bool readyToIssue() const { return status[CanIssue]; } 718 719 /** Clears this instruction being able to issue. */ 720 void clearCanIssue() { status.reset(CanIssue); } 721 722 /** Sets this instruction as issued from the IQ. */ 723 void setIssued() { status.set(Issued); } 724 725 /** Returns whether or not this instruction has issued. */ 726 bool isIssued() const { return status[Issued]; } 727 728 /** Clears this instruction as being issued. */ 729 void clearIssued() { status.reset(Issued); } 730 731 /** Sets this instruction as executed. */ 732 void setExecuted() { status.set(Executed); } 733 734 /** Returns whether or not this instruction has executed. */ 735 bool isExecuted() const { return status[Executed]; } 736 737 /** Sets this instruction as ready to commit. */ 738 void setCanCommit() { status.set(CanCommit); } 739 740 /** Clears this instruction as being ready to commit. */ 741 void clearCanCommit() { status.reset(CanCommit); } 742 743 /** Returns whether or not this instruction is ready to commit. */ 744 bool readyToCommit() const { return status[CanCommit]; } 745 746 void setAtCommit() { status.set(AtCommit); } 747 748 bool isAtCommit() { return status[AtCommit]; } 749 750 /** Sets this instruction as committed. */ 751 void setCommitted() { status.set(Committed); } 752 753 /** Returns whether or not this instruction is committed. */ 754 bool isCommitted() const { return status[Committed]; } 755 756 /** Sets this instruction as squashed. */ 757 void setSquashed() { status.set(Squashed); } 758 759 /** Returns whether or not this instruction is squashed. */ 760 bool isSquashed() const { return status[Squashed]; } 761 762 //Instruction Queue Entry 763 //----------------------- 764 /** Sets this instruction as a entry the IQ. */ 765 void setInIQ() { status.set(IqEntry); } 766 767 /** Sets this instruction as a entry the IQ. */ 768 void clearInIQ() { status.reset(IqEntry); } 769 770 /** Returns whether or not this instruction has issued. */ 771 bool isInIQ() const { return status[IqEntry]; } 772 773 /** Sets this instruction as squashed in the IQ. */ 774 void setSquashedInIQ() { status.set(SquashedInIQ); status.set(Squashed);} 775 776 /** Returns whether or not this instruction is squashed in the IQ. */ 777 bool isSquashedInIQ() const { return status[SquashedInIQ]; } 778 779 780 //Load / Store Queue Functions 781 //----------------------- 782 /** Sets this instruction as a entry the LSQ. */ 783 void setInLSQ() { status.set(LsqEntry); } 784 785 /** Sets this instruction as a entry the LSQ. */ 786 void removeInLSQ() { status.reset(LsqEntry); } 787 788 /** Returns whether or not this instruction is in the LSQ. */ 789 bool isInLSQ() const { return status[LsqEntry]; } 790 791 /** Sets this instruction as squashed in the LSQ. */ 792 void setSquashedInLSQ() { status.set(SquashedInLSQ);} 793 794 /** Returns whether or not this instruction is squashed in the LSQ. */ 795 bool isSquashedInLSQ() const { return status[SquashedInLSQ]; } 796 797 798 //Reorder Buffer Functions 799 //----------------------- 800 /** Sets this instruction as a entry the ROB. */ 801 void setInROB() { status.set(RobEntry); } 802 803 /** Sets this instruction as a entry the ROB. */ 804 void clearInROB() { status.reset(RobEntry); } 805 806 /** Returns whether or not this instruction is in the ROB. */ 807 bool isInROB() const { return status[RobEntry]; } 808 809 /** Sets this instruction as squashed in the ROB. */ 810 void setSquashedInROB() { status.set(SquashedInROB); } 811 812 /** Returns whether or not this instruction is squashed in the ROB. */ 813 bool isSquashedInROB() const { return status[SquashedInROB]; } 814 815 /** Read the PC state of this instruction. */ 816 TheISA::PCState pcState() const { return pc; } 817 818 /** Set the PC state of this instruction. */ 819 void pcState(const TheISA::PCState &val) { pc = val; } 820 821 /** Read the PC of this instruction. */ 822 Addr instAddr() const { return pc.instAddr(); } 823 824 /** Read the PC of the next instruction. */ 825 Addr nextInstAddr() const { return pc.nextInstAddr(); } 826 827 /**Read the micro PC of this instruction. */ 828 Addr microPC() const { return pc.microPC(); } 829 830 bool readPredicate() 831 { 832 return instFlags[Predicate]; 833 } 834 835 void setPredicate(bool val) 836 { 837 instFlags[Predicate] = val; 838 839 if (traceData) { 840 traceData->setPredicate(val); 841 } 842 } 843 844 /** Sets the ASID. */ 845 void setASID(short addr_space_id) { asid = addr_space_id; } 846 847 /** Sets the thread id. */ 848 void setTid(ThreadID tid) { threadNumber = tid; } 849 850 /** Sets the pointer to the thread state. */ 851 void setThreadState(ImplState *state) { thread = state; } 852 853 /** Returns the thread context. */ 854 ThreadContext *tcBase() { return thread->getTC(); } 855 856 public: 857 /** Returns whether or not the eff. addr. source registers are ready. */ 858 bool eaSrcsReady(); 859 860 /** Is this instruction's memory access strictly ordered? */ 861 bool strictlyOrdered() const { return instFlags[IsStrictlyOrdered]; } 862 863 /** Has this instruction generated a memory request. */ 864 bool hasRequest() { return instFlags[ReqMade]; } 865 866 /** Returns iterator to this instruction in the list of all insts. */ 867 ListIt &getInstListIt() { return instListIt; } 868 869 /** Sets iterator for this instruction in the list of all insts. */ 870 void setInstListIt(ListIt _instListIt) { instListIt = _instListIt; } 871 872 public: 873 /** Returns the number of consecutive store conditional failures. */ 874 unsigned int readStCondFailures() const 875 { return thread->storeCondFailures; } 876 877 /** Sets the number of consecutive store conditional failures. */ 878 void setStCondFailures(unsigned int sc_failures) 879 { thread->storeCondFailures = sc_failures; } 880 881 public: 882 // monitor/mwait funtions 883 void armMonitor(Addr address) { cpu->armMonitor(threadNumber, address); } 884 bool mwait(PacketPtr pkt) { return cpu->mwait(threadNumber, pkt); } 885 void mwaitAtomic(ThreadContext *tc) 886 { return cpu->mwaitAtomic(threadNumber, tc, cpu->dtb); } 887 AddressMonitor *getAddrMonitor() 888 { return cpu->getCpuAddrMonitor(threadNumber); } 889}; 890 891template<class Impl> 892Fault 893BaseDynInst<Impl>::initiateMemRead(Addr addr, unsigned size, 894 Request::Flags flags) 895{ 896 instFlags[ReqMade] = true; 897 RequestPtr req = NULL; 898 RequestPtr sreqLow = NULL; 899 RequestPtr sreqHigh = NULL; 900 901 if (instFlags[ReqMade] && translationStarted()) { 902 req = savedReq; 903 sreqLow = savedSreqLow; 904 sreqHigh = savedSreqHigh; 905 } else { 906 req = std::make_shared<Request>( 907 asid, addr, size, flags, masterId(), 908 this->pc.instAddr(), thread->contextId()); 909 910 req->taskId(cpu->taskId()); 911 912 // Only split the request if the ISA supports unaligned accesses. 913 if (TheISA::HasUnalignedMemAcc) { 914 splitRequest(req, sreqLow, sreqHigh); 915 } 916 initiateTranslation(req, sreqLow, sreqHigh, NULL, BaseTLB::Read); 917 } 918 919 if (translationCompleted()) { 920 if (fault == NoFault) { 921 effAddr = req->getVaddr(); 922 effSize = size; 923 instFlags[EffAddrValid] = true; 924 925 if (cpu->checker) { 926 reqToVerify = std::make_shared<Request>(*req); 927 } 928 fault = cpu->read(req, sreqLow, sreqHigh, lqIdx); 929 } else { 930 // Commit will have to clean up whatever happened. Set this 931 // instruction as executed. 932 this->setExecuted(); 933 } 934 } 935 936 if (traceData) 937 traceData->setMem(addr, size, flags); 938 939 return fault; 940} 941 942template<class Impl> 943Fault 944BaseDynInst<Impl>::writeMem(uint8_t *data, unsigned size, Addr addr, 945 Request::Flags flags, uint64_t *res) 946{ 947 if (traceData) 948 traceData->setMem(addr, size, flags); 949 950 instFlags[ReqMade] = true; 951 RequestPtr req = NULL; 952 RequestPtr sreqLow = NULL; 953 RequestPtr sreqHigh = NULL; 954 955 if (instFlags[ReqMade] && translationStarted()) { 956 req = savedReq; 957 sreqLow = savedSreqLow; 958 sreqHigh = savedSreqHigh; 959 } else { 960 req = std::make_shared<Request>( 961 asid, addr, size, flags, masterId(), 962 this->pc.instAddr(), thread->contextId()); 963 964 req->taskId(cpu->taskId()); 965 966 // Only split the request if the ISA supports unaligned accesses. 967 if (TheISA::HasUnalignedMemAcc) { 968 splitRequest(req, sreqLow, sreqHigh); 969 } 970 initiateTranslation(req, sreqLow, sreqHigh, res, BaseTLB::Write); 971 } 972 973 if (fault == NoFault && translationCompleted()) { 974 effAddr = req->getVaddr(); 975 effSize = size; 976 instFlags[EffAddrValid] = true; 977 978 if (cpu->checker) { 979 reqToVerify = std::make_shared<Request>(*req); 980 } 981 fault = cpu->write(req, sreqLow, sreqHigh, data, sqIdx); 982 } 983 984 return fault; 985} 986 987template<class Impl> 988inline void 989BaseDynInst<Impl>::splitRequest(const RequestPtr &req, RequestPtr &sreqLow, 990 RequestPtr &sreqHigh) 991{ 992 // Check to see if the request crosses the next level block boundary. 993 unsigned block_size = cpu->cacheLineSize(); 994 Addr addr = req->getVaddr(); 995 Addr split_addr = roundDown(addr + req->getSize() - 1, block_size); 996 assert(split_addr <= addr || split_addr - addr < block_size); 997 998 // Spans two blocks. 999 if (split_addr > addr) { 1000 req->splitOnVaddr(split_addr, sreqLow, sreqHigh); 1001 } 1002} 1003 1004template<class Impl> 1005inline void 1006BaseDynInst<Impl>::initiateTranslation(const RequestPtr &req, 1007 const RequestPtr &sreqLow, 1008 const RequestPtr &sreqHigh, 1009 uint64_t *res, 1010 BaseTLB::Mode mode) 1011{ 1012 translationStarted(true); 1013 1014 if (!TheISA::HasUnalignedMemAcc || sreqLow == NULL) { 1015 WholeTranslationState *state = 1016 new WholeTranslationState(req, NULL, res, mode); 1017 1018 // One translation if the request isn't split. 1019 DataTranslation<BaseDynInstPtr> *trans = 1020 new DataTranslation<BaseDynInstPtr>(this, state); 1021 1022 cpu->dtb->translateTiming(req, thread->getTC(), trans, mode); 1023 1024 if (!translationCompleted()) { 1025 // The translation isn't yet complete, so we can't possibly have a 1026 // fault. Overwrite any existing fault we might have from a previous 1027 // execution of this instruction (e.g. an uncachable load that 1028 // couldn't execute because it wasn't at the head of the ROB). 1029 fault = NoFault; 1030 1031 // Save memory requests. 1032 savedReq = state->mainReq; 1033 savedSreqLow = state->sreqLow; 1034 savedSreqHigh = state->sreqHigh; 1035 } 1036 } else { 1037 WholeTranslationState *state = 1038 new WholeTranslationState(req, sreqLow, sreqHigh, NULL, res, mode); 1039 1040 // Two translations when the request is split. 1041 DataTranslation<BaseDynInstPtr> *stransLow = 1042 new DataTranslation<BaseDynInstPtr>(this, state, 0); 1043 DataTranslation<BaseDynInstPtr> *stransHigh = 1044 new DataTranslation<BaseDynInstPtr>(this, state, 1); 1045 1046 cpu->dtb->translateTiming(sreqLow, thread->getTC(), stransLow, mode); 1047 cpu->dtb->translateTiming(sreqHigh, thread->getTC(), stransHigh, mode); 1048 1049 if (!translationCompleted()) { 1050 // The translation isn't yet complete, so we can't possibly have a 1051 // fault. Overwrite any existing fault we might have from a previous 1052 // execution of this instruction (e.g. an uncachable load that 1053 // couldn't execute because it wasn't at the head of the ROB). 1054 fault = NoFault; 1055 1056 // Save memory requests. 1057 savedReq = state->mainReq; 1058 savedSreqLow = state->sreqLow; 1059 savedSreqHigh = state->sreqHigh; 1060 } 1061 } 1062} 1063 1064template<class Impl> 1065inline void 1066BaseDynInst<Impl>::finishTranslation(WholeTranslationState *state) 1067{ 1068 fault = state->getFault(); 1069 1070 instFlags[IsStrictlyOrdered] = state->isStrictlyOrdered(); 1071 1072 if (fault == NoFault) { 1073 // save Paddr for a single req 1074 physEffAddrLow = state->getPaddr(); 1075 1076 // case for the request that has been split 1077 if (state->isSplit) { 1078 physEffAddrLow = state->sreqLow->getPaddr(); 1079 physEffAddrHigh = state->sreqHigh->getPaddr(); 1080 } 1081 1082 memReqFlags = state->getFlags(); 1083 1084 if (state->mainReq->isCondSwap()) { 1085 assert(state->res); 1086 state->mainReq->setExtraData(*state->res); 1087 } 1088 1089 } else { 1090 state->deleteReqs(); 1091 } 1092 delete state; 1093 1094 translationCompleted(true); 1095} 1096 1097#endif // __CPU_BASE_DYN_INST_HH__ 1098