/* * Copyright (c) 2004-2005 The Regents of The University of Michigan * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are * met: redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer; * redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution; * neither the name of the copyright holders nor the names of its * contributors may be used to endorse or promote products derived from * this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * Authors: Kevin Lim * Korey Sewell */ #ifndef __CPU_O3_CPU_HH__ #define __CPU_O3_CPU_HH__ #include #include #include #include #include #include "arch/types.hh" #include "base/statistics.hh" #include "base/timebuf.hh" #include "config/full_system.hh" #include "cpu/activity.hh" #include "cpu/base.hh" #include "cpu/simple_thread.hh" #include "cpu/o3/comm.hh" #include "cpu/o3/cpu_policy.hh" #include "cpu/o3/scoreboard.hh" #include "cpu/o3/thread_state.hh" //#include "cpu/o3/thread_context.hh" #include "sim/process.hh" template class Checker; class ThreadContext; template class O3ThreadContext; class Checkpoint; class MemObject; class Process; class BaseO3CPU : public BaseCPU { //Stuff that's pretty ISA independent will go here. public: typedef BaseCPU::Params Params; BaseO3CPU(Params *params); void regStats(); /** Sets this CPU's ID. */ void setCpuId(int id) { cpu_id = id; } /** Reads this CPU's ID. */ int readCpuId() { return cpu_id; } protected: int cpu_id; }; /** * FullO3CPU class, has each of the stages (fetch through commit) * within it, as well as all of the time buffers between stages. The * tick() function for the CPU is defined here. */ template class FullO3CPU : public BaseO3CPU { public: typedef TheISA::FloatReg FloatReg; typedef TheISA::FloatRegBits FloatRegBits; // Typedefs from the Impl here. typedef typename Impl::CPUPol CPUPolicy; typedef typename Impl::Params Params; typedef typename Impl::DynInstPtr DynInstPtr; typedef O3ThreadState Thread; typedef typename std::list::iterator ListIt; friend class O3ThreadContext; public: enum Status { Running, Idle, Halted, Blocked, SwitchedOut }; /** Overall CPU status. */ Status _status; /** Per-thread status in CPU, used for SMT. */ Status _threadStatus[Impl::MaxThreads]; private: class TickEvent : public Event { private: /** Pointer to the CPU. */ FullO3CPU *cpu; public: /** Constructs a tick event. */ TickEvent(FullO3CPU *c); /** Processes a tick event, calling tick() on the CPU. */ void process(); /** Returns the description of the tick event. */ const char *description(); }; /** The tick event used for scheduling CPU ticks. */ TickEvent tickEvent; /** Schedule tick event, regardless of its current state. */ void scheduleTickEvent(int delay) { if (tickEvent.squashed()) tickEvent.reschedule(curTick + cycles(delay)); else if (!tickEvent.scheduled()) tickEvent.schedule(curTick + cycles(delay)); } /** Unschedule tick event, regardless of its current state. */ void unscheduleTickEvent() { if (tickEvent.scheduled()) tickEvent.squash(); } class ActivateThreadEvent : public Event { private: /** Number of Thread to Activate */ int tid; /** Pointer to the CPU. */ FullO3CPU *cpu; public: /** Constructs the event. */ ActivateThreadEvent(); /** Initialize Event */ void init(int thread_num, FullO3CPU *thread_cpu); /** Processes the event, calling activateThread() on the CPU. */ void process(); /** Returns the description of the event. */ const char *description(); }; /** Schedule thread to activate , regardless of its current state. */ void scheduleActivateThreadEvent(int tid, int delay) { // Schedule thread to activate, regardless of its current state. if (activateThreadEvent[tid].squashed()) activateThreadEvent[tid].reschedule(curTick + cycles(delay)); else if (!activateThreadEvent[tid].scheduled()) activateThreadEvent[tid].schedule(curTick + cycles(delay)); } /** Unschedule actiavte thread event, regardless of its current state. */ void unscheduleActivateThreadEvent(int tid) { if (activateThreadEvent[tid].scheduled()) activateThreadEvent[tid].squash(); } /** The tick event used for scheduling CPU ticks. */ ActivateThreadEvent activateThreadEvent[Impl::MaxThreads]; class DeallocateContextEvent : public Event { private: /** Number of Thread to Activate */ int tid; /** Pointer to the CPU. */ FullO3CPU *cpu; public: /** Constructs the event. */ DeallocateContextEvent(); /** Initialize Event */ void init(int thread_num, FullO3CPU *thread_cpu); /** Processes the event, calling activateThread() on the CPU. */ void process(); /** Returns the description of the event. */ const char *description(); }; /** Schedule cpu to deallocate thread context.*/ void scheduleDeallocateContextEvent(int tid, int delay) { // Schedule thread to activate, regardless of its current state. if (deallocateContextEvent[tid].squashed()) deallocateContextEvent[tid].reschedule(curTick + cycles(delay)); else if (!deallocateContextEvent[tid].scheduled()) deallocateContextEvent[tid].schedule(curTick + cycles(delay)); } /** Unschedule thread deallocation in CPU */ void unscheduleDeallocateContextEvent(int tid) { if (deallocateContextEvent[tid].scheduled()) deallocateContextEvent[tid].squash(); } /** The tick event used for scheduling CPU ticks. */ DeallocateContextEvent deallocateContextEvent[Impl::MaxThreads]; public: /** Constructs a CPU with the given parameters. */ FullO3CPU(Params *params); /** Destructor. */ ~FullO3CPU(); /** Registers statistics. */ void fullCPURegStats(); /** Returns a specific port. */ Port *getPort(const std::string &if_name, int idx); /** Ticks CPU, calling tick() on each stage, and checking the overall * activity to see if the CPU should deschedule itself. */ void tick(); /** Initialize the CPU */ void init(); /** Returns the Number of Active Threads in the CPU */ int numActiveThreads() { return activeThreads.size(); } /** Add Thread to Active Threads List */ void activateThread(unsigned tid); /** Remove Thread from Active Threads List */ void deactivateThread(unsigned tid); /** Setup CPU to insert a thread's context */ void insertThread(unsigned tid); /** Remove all of a thread's context from CPU */ void removeThread(unsigned tid); /** Count the Total Instructions Committed in the CPU. */ virtual Counter totalInstructions() const { Counter total(0); for (int i=0; i < thread.size(); i++) total += thread[i]->numInst; return total; } /** Add Thread to Active Threads List. */ void activateContext(int tid, int delay); /** Remove Thread from Active Threads List */ void suspendContext(int tid); /** Remove Thread from Active Threads List && * Remove Thread Context from CPU. */ void deallocateContext(int tid, int delay = 1); /** Remove Thread from Active Threads List && * Remove Thread Context from CPU. */ void haltContext(int tid); /** Activate a Thread When CPU Resources are Available. */ void activateWhenReady(int tid); /** Add or Remove a Thread Context in the CPU. */ void doContextSwitch(); /** Update The Order In Which We Process Threads. */ void updateThreadPriority(); /** Serialize state. */ virtual void serialize(std::ostream &os); /** Unserialize from a checkpoint. */ virtual void unserialize(Checkpoint *cp, const std::string §ion); public: /** Executes a syscall on this cycle. * --------------------------------------- * Note: this is a virtual function. CPU-Specific * functionality defined in derived classes */ virtual void syscall(int tid) { panic("Unimplemented!"); } /** Starts draining the CPU's pipeline of all instructions in * order to stop all memory accesses. */ virtual unsigned int drain(Event *drain_event); /** Resumes execution after a drain. */ virtual void resume(); /** Signals to this CPU that a stage has completed switching out. */ void signalDrained(); /** Switches out this CPU. */ virtual void switchOut(); /** Takes over from another CPU. */ virtual void takeOverFrom(BaseCPU *oldCPU); /** Get the current instruction sequence number, and increment it. */ InstSeqNum getAndIncrementInstSeq() { return globalSeqNum++; } #if FULL_SYSTEM /** Check if this address is a valid instruction address. */ bool validInstAddr(Addr addr) { return true; } /** Check if this address is a valid data address. */ bool validDataAddr(Addr addr) { return true; } /** Get instruction asid. */ int getInstAsid(unsigned tid) { return regFile.miscRegs[tid].getInstAsid(); } /** Get data asid. */ int getDataAsid(unsigned tid) { return regFile.miscRegs[tid].getDataAsid(); } #else /** Get instruction asid. */ int getInstAsid(unsigned tid) { return thread[tid]->getInstAsid(); } /** Get data asid. */ int getDataAsid(unsigned tid) { return thread[tid]->getDataAsid(); } #endif /** Register accessors. Index refers to the physical register index. */ uint64_t readIntReg(int reg_idx); FloatReg readFloatReg(int reg_idx); FloatReg readFloatReg(int reg_idx, int width); FloatRegBits readFloatRegBits(int reg_idx); FloatRegBits readFloatRegBits(int reg_idx, int width); void setIntReg(int reg_idx, uint64_t val); void setFloatReg(int reg_idx, FloatReg val); void setFloatReg(int reg_idx, FloatReg val, int width); void setFloatRegBits(int reg_idx, FloatRegBits val); void setFloatRegBits(int reg_idx, FloatRegBits val, int width); uint64_t readArchIntReg(int reg_idx, unsigned tid); float readArchFloatRegSingle(int reg_idx, unsigned tid); double readArchFloatRegDouble(int reg_idx, unsigned tid); uint64_t readArchFloatRegInt(int reg_idx, unsigned tid); /** Architectural register accessors. Looks up in the commit * rename table to obtain the true physical index of the * architected register first, then accesses that physical * register. */ void setArchIntReg(int reg_idx, uint64_t val, unsigned tid); void setArchFloatRegSingle(int reg_idx, float val, unsigned tid); void setArchFloatRegDouble(int reg_idx, double val, unsigned tid); void setArchFloatRegInt(int reg_idx, uint64_t val, unsigned tid); /** Reads the commit PC of a specific thread. */ uint64_t readPC(unsigned tid); /** Sets the commit PC of a specific thread. */ void setPC(Addr new_PC, unsigned tid); /** Reads the next PC of a specific thread. */ uint64_t readNextPC(unsigned tid); /** Sets the next PC of a specific thread. */ void setNextPC(uint64_t val, unsigned tid); /** Reads the next NPC of a specific thread. */ uint64_t readNextNPC(unsigned tid); /** Sets the next NPC of a specific thread. */ void setNextNPC(uint64_t val, unsigned tid); /** Function to add instruction onto the head of the list of the * instructions. Used when new instructions are fetched. */ ListIt addInst(DynInstPtr &inst); /** Function to tell the CPU that an instruction has completed. */ void instDone(unsigned tid); /** Add Instructions to the CPU Remove List*/ void addToRemoveList(DynInstPtr &inst); /** Remove an instruction from the front end of the list. There's * no restriction on location of the instruction. */ void removeFrontInst(DynInstPtr &inst); /** Remove all instructions that are not currently in the ROB. * There's also an option to not squash delay slot instructions.*/ void removeInstsNotInROB(unsigned tid, bool squash_delay_slot, const InstSeqNum &delay_slot_seq_num); /** Remove all instructions younger than the given sequence number. */ void removeInstsUntil(const InstSeqNum &seq_num,unsigned tid); /** Removes the instruction pointed to by the iterator. */ inline void squashInstIt(const ListIt &instIt, const unsigned &tid); /** Cleans up all instructions on the remove list. */ void cleanUpRemovedInsts(); /** Debug function to print all instructions on the list. */ void dumpInsts(); public: /** List of all the instructions in flight. */ std::list instList; /** List of all the instructions that will be removed at the end of this * cycle. */ std::queue removeList; #ifdef DEBUG /** Debug structure to keep track of the sequence numbers still in * flight. */ std::set snList; #endif /** Records if instructions need to be removed this cycle due to * being retired or squashed. */ bool removeInstsThisCycle; protected: /** The fetch stage. */ typename CPUPolicy::Fetch fetch; /** The decode stage. */ typename CPUPolicy::Decode decode; /** The dispatch stage. */ typename CPUPolicy::Rename rename; /** The issue/execute/writeback stages. */ typename CPUPolicy::IEW iew; /** The commit stage. */ typename CPUPolicy::Commit commit; /** The register file. */ typename CPUPolicy::RegFile regFile; /** The free list. */ typename CPUPolicy::FreeList freeList; /** The rename map. */ typename CPUPolicy::RenameMap renameMap[Impl::MaxThreads]; /** The commit rename map. */ typename CPUPolicy::RenameMap commitRenameMap[Impl::MaxThreads]; /** The re-order buffer. */ typename CPUPolicy::ROB rob; /** Active Threads List */ std::list activeThreads; /** Integer Register Scoreboard */ Scoreboard scoreboard; public: /** Enum to give each stage a specific index, so when calling * activateStage() or deactivateStage(), they can specify which stage * is being activated/deactivated. */ enum StageIdx { FetchIdx, DecodeIdx, RenameIdx, IEWIdx, CommitIdx, NumStages }; /** Typedefs from the Impl to get the structs that each of the * time buffers should use. */ typedef typename CPUPolicy::TimeStruct TimeStruct; typedef typename CPUPolicy::FetchStruct FetchStruct; typedef typename CPUPolicy::DecodeStruct DecodeStruct; typedef typename CPUPolicy::RenameStruct RenameStruct; typedef typename CPUPolicy::IEWStruct IEWStruct; /** The main time buffer to do backwards communication. */ TimeBuffer timeBuffer; /** The fetch stage's instruction queue. */ TimeBuffer fetchQueue; /** The decode stage's instruction queue. */ TimeBuffer decodeQueue; /** The rename stage's instruction queue. */ TimeBuffer renameQueue; /** The IEW stage's instruction queue. */ TimeBuffer iewQueue; private: /** The activity recorder; used to tell if the CPU has any * activity remaining or if it can go to idle and deschedule * itself. */ ActivityRecorder activityRec; public: /** Records that there was time buffer activity this cycle. */ void activityThisCycle() { activityRec.activity(); } /** Changes a stage's status to active within the activity recorder. */ void activateStage(const StageIdx idx) { activityRec.activateStage(idx); } /** Changes a stage's status to inactive within the activity recorder. */ void deactivateStage(const StageIdx idx) { activityRec.deactivateStage(idx); } /** Wakes the CPU, rescheduling the CPU if it's not already active. */ void wakeCPU(); /** Gets a free thread id. Use if thread ids change across system. */ int getFreeTid(); public: /** Returns a pointer to a thread context. */ ThreadContext *tcBase(unsigned tid) { return thread[tid]->getTC(); } /** The global sequence number counter. */ InstSeqNum globalSeqNum; /** Pointer to the checker, which can dynamically verify * instruction results at run time. This can be set to NULL if it * is not being used. */ Checker *checker; #if FULL_SYSTEM /** Pointer to the system. */ System *system; /** Pointer to physical memory. */ PhysicalMemory *physmem; #endif /** Pointer to memory. */ MemObject *mem; /** Event to call process() on once draining has completed. */ Event *drainEvent; /** Counter of how many stages have completed draining. */ int drainCount; /** Pointers to all of the threads in the CPU. */ std::vector thread; /** Pointer to the icache interface. */ MemInterface *icacheInterface; /** Pointer to the dcache interface. */ MemInterface *dcacheInterface; /** Whether or not the CPU should defer its registration. */ bool deferRegistration; /** Is there a context switch pending? */ bool contextSwitch; /** Threads Scheduled to Enter CPU */ std::list cpuWaitList; /** The cycle that the CPU was last running, used for statistics. */ Tick lastRunningCycle; /** The cycle that the CPU was last activated by a new thread*/ Tick lastActivatedCycle; /** Number of Threads CPU can process */ unsigned numThreads; /** Mapping for system thread id to cpu id */ std::map threadMap; /** Available thread ids in the cpu*/ std::vector tids; /** Stat for total number of times the CPU is descheduled. */ Stats::Scalar<> timesIdled; /** Stat for total number of cycles the CPU spends descheduled. */ Stats::Scalar<> idleCycles; /** Stat for the number of committed instructions per thread. */ Stats::Vector<> committedInsts; /** Stat for the total number of committed instructions. */ Stats::Scalar<> totalCommittedInsts; /** Stat for the CPI per thread. */ Stats::Formula cpi; /** Stat for the total CPI. */ Stats::Formula totalCpi; /** Stat for the IPC per thread. */ Stats::Formula ipc; /** Stat for the total IPC. */ Stats::Formula totalIpc; }; #endif // __CPU_O3_CPU_HH__