lsq_unit.hh revision 2669
12292SN/A/* 22329SN/A * Copyright (c) 2004-2006 The Regents of The University of Michigan 32292SN/A * All rights reserved. 42292SN/A * 52292SN/A * Redistribution and use in source and binary forms, with or without 62292SN/A * modification, are permitted provided that the following conditions are 72292SN/A * met: redistributions of source code must retain the above copyright 82292SN/A * notice, this list of conditions and the following disclaimer; 92292SN/A * redistributions in binary form must reproduce the above copyright 102292SN/A * notice, this list of conditions and the following disclaimer in the 112292SN/A * documentation and/or other materials provided with the distribution; 122292SN/A * neither the name of the copyright holders nor the names of its 132292SN/A * contributors may be used to endorse or promote products derived from 142292SN/A * this software without specific prior written permission. 152292SN/A * 162292SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 172292SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 182292SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 192292SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 202292SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 212292SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 222292SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 232292SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 242292SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 252292SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 262292SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 272292SN/A */ 282292SN/A 292292SN/A#ifndef __CPU_O3_LSQ_UNIT_HH__ 302292SN/A#define __CPU_O3_LSQ_UNIT_HH__ 312292SN/A 322329SN/A#include <algorithm> 332292SN/A#include <map> 342292SN/A#include <queue> 352292SN/A 362329SN/A#include "arch/faults.hh" 372292SN/A#include "config/full_system.hh" 382292SN/A#include "base/hashmap.hh" 392292SN/A#include "cpu/inst_seq.hh" 402669Sktlim@umich.edu#include "mem/packet.hh" 412669Sktlim@umich.edu#include "mem/port.hh" 422292SN/A//#include "mem/page_table.hh" 432329SN/A//#include "sim/debug.hh" 442329SN/A//#include "sim/sim_object.hh" 452292SN/A 462292SN/A/** 472329SN/A * Class that implements the actual LQ and SQ for each specific 482329SN/A * thread. Both are circular queues; load entries are freed upon 492329SN/A * committing, while store entries are freed once they writeback. The 502329SN/A * LSQUnit tracks if there are memory ordering violations, and also 512329SN/A * detects partial load to store forwarding cases (a store only has 522329SN/A * part of a load's data) that requires the load to wait until the 532329SN/A * store writes back. In the former case it holds onto the instruction 542329SN/A * until the dependence unit looks at it, and in the latter it stalls 552329SN/A * the LSQ until the store writes back. At that point the load is 562329SN/A * replayed. 572292SN/A */ 582292SN/Atemplate <class Impl> 592292SN/Aclass LSQUnit { 602292SN/A protected: 612292SN/A typedef TheISA::IntReg IntReg; 622292SN/A public: 632292SN/A typedef typename Impl::Params Params; 642292SN/A typedef typename Impl::FullCPU FullCPU; 652292SN/A typedef typename Impl::DynInstPtr DynInstPtr; 662292SN/A typedef typename Impl::CPUPol::IEW IEW; 672292SN/A typedef typename Impl::CPUPol::IssueStruct IssueStruct; 682292SN/A 692292SN/A public: 702292SN/A /** Constructs an LSQ unit. init() must be called prior to use. */ 712292SN/A LSQUnit(); 722292SN/A 732292SN/A /** Initializes the LSQ unit with the specified number of entries. */ 742292SN/A void init(Params *params, unsigned maxLQEntries, 752292SN/A unsigned maxSQEntries, unsigned id); 762292SN/A 772292SN/A /** Returns the name of the LSQ unit. */ 782292SN/A std::string name() const; 792292SN/A 802292SN/A /** Sets the CPU pointer. */ 812669Sktlim@umich.edu void setCPU(FullCPU *cpu_ptr); 822292SN/A 832292SN/A /** Sets the IEW stage pointer. */ 842292SN/A void setIEW(IEW *iew_ptr) 852292SN/A { iewStage = iew_ptr; } 862292SN/A 872292SN/A /** Sets the page table pointer. */ 882292SN/A// void setPageTable(PageTable *pt_ptr); 892292SN/A 902307SN/A void switchOut(); 912307SN/A 922307SN/A void takeOverFrom(); 932307SN/A 942307SN/A bool isSwitchedOut() { return switchedOut; } 952307SN/A 962292SN/A /** Ticks the LSQ unit, which in this case only resets the number of 972292SN/A * used cache ports. 982292SN/A * @todo: Move the number of used ports up to the LSQ level so it can 992292SN/A * be shared by all LSQ units. 1002292SN/A */ 1012292SN/A void tick() { usedPorts = 0; } 1022292SN/A 1032292SN/A /** Inserts an instruction. */ 1042292SN/A void insert(DynInstPtr &inst); 1052292SN/A /** Inserts a load instruction. */ 1062292SN/A void insertLoad(DynInstPtr &load_inst); 1072292SN/A /** Inserts a store instruction. */ 1082292SN/A void insertStore(DynInstPtr &store_inst); 1092292SN/A 1102292SN/A /** Executes a load instruction. */ 1112292SN/A Fault executeLoad(DynInstPtr &inst); 1122292SN/A 1132329SN/A Fault executeLoad(int lq_idx) { panic("Not implemented"); return NoFault; } 1142292SN/A /** Executes a store instruction. */ 1152292SN/A Fault executeStore(DynInstPtr &inst); 1162292SN/A 1172292SN/A /** Commits the head load. */ 1182292SN/A void commitLoad(); 1192292SN/A /** Commits loads older than a specific sequence number. */ 1202292SN/A void commitLoads(InstSeqNum &youngest_inst); 1212292SN/A 1222292SN/A /** Commits stores older than a specific sequence number. */ 1232292SN/A void commitStores(InstSeqNum &youngest_inst); 1242292SN/A 1252292SN/A /** Writes back stores. */ 1262292SN/A void writebackStores(); 1272292SN/A 1282669Sktlim@umich.edu void completeDataAccess(PacketPtr pkt); 1292669Sktlim@umich.edu 1302669Sktlim@umich.edu void completeStoreDataAccess(DynInstPtr &inst); 1312669Sktlim@umich.edu 1322292SN/A // @todo: Include stats in the LSQ unit. 1332292SN/A //void regStats(); 1342292SN/A 1352292SN/A /** Clears all the entries in the LQ. */ 1362292SN/A void clearLQ(); 1372292SN/A 1382292SN/A /** Clears all the entries in the SQ. */ 1392292SN/A void clearSQ(); 1402292SN/A 1412292SN/A /** Resizes the LQ to a given size. */ 1422292SN/A void resizeLQ(unsigned size); 1432292SN/A 1442292SN/A /** Resizes the SQ to a given size. */ 1452292SN/A void resizeSQ(unsigned size); 1462292SN/A 1472292SN/A /** Squashes all instructions younger than a specific sequence number. */ 1482292SN/A void squash(const InstSeqNum &squashed_num); 1492292SN/A 1502292SN/A /** Returns if there is a memory ordering violation. Value is reset upon 1512292SN/A * call to getMemDepViolator(). 1522292SN/A */ 1532292SN/A bool violation() { return memDepViolator; } 1542292SN/A 1552292SN/A /** Returns the memory ordering violator. */ 1562292SN/A DynInstPtr getMemDepViolator(); 1572292SN/A 1582329SN/A /** Returns if a load became blocked due to the memory system. */ 1592292SN/A bool loadBlocked() 1602292SN/A { return isLoadBlocked; } 1612292SN/A 1622292SN/A void clearLoadBlocked() 1632292SN/A { isLoadBlocked = false; } 1642292SN/A 1652292SN/A bool isLoadBlockedHandled() 1662292SN/A { return loadBlockedHandled; } 1672292SN/A 1682292SN/A void setLoadBlockedHandled() 1692292SN/A { loadBlockedHandled = true; } 1702292SN/A 1712292SN/A /** Returns the number of free entries (min of free LQ and SQ entries). */ 1722292SN/A unsigned numFreeEntries(); 1732292SN/A 1742292SN/A /** Returns the number of loads ready to execute. */ 1752292SN/A int numLoadsReady(); 1762292SN/A 1772292SN/A /** Returns the number of loads in the LQ. */ 1782292SN/A int numLoads() { return loads; } 1792292SN/A 1802292SN/A /** Returns the number of stores in the SQ. */ 1812292SN/A int numStores() { return stores; } 1822292SN/A 1832292SN/A /** Returns if either the LQ or SQ is full. */ 1842292SN/A bool isFull() { return lqFull() || sqFull(); } 1852292SN/A 1862292SN/A /** Returns if the LQ is full. */ 1872292SN/A bool lqFull() { return loads >= (LQEntries - 1); } 1882292SN/A 1892292SN/A /** Returns if the SQ is full. */ 1902292SN/A bool sqFull() { return stores >= (SQEntries - 1); } 1912292SN/A 1922292SN/A /** Returns the number of instructions in the LSQ. */ 1932292SN/A unsigned getCount() { return loads + stores; } 1942292SN/A 1952292SN/A /** Returns if there are any stores to writeback. */ 1962292SN/A bool hasStoresToWB() { return storesToWB; } 1972292SN/A 1982292SN/A /** Returns the number of stores to writeback. */ 1992292SN/A int numStoresToWB() { return storesToWB; } 2002292SN/A 2012292SN/A /** Returns if the LSQ unit will writeback on this cycle. */ 2022292SN/A bool willWB() { return storeQueue[storeWBIdx].canWB && 2032669Sktlim@umich.edu !storeQueue[storeWBIdx].completed/* && 2042669Sktlim@umich.edu !dcacheInterface->isBlocked()*/; } 2052292SN/A 2062292SN/A private: 2072292SN/A /** Completes the store at the specified index. */ 2082292SN/A void completeStore(int store_idx); 2092292SN/A 2102292SN/A /** Increments the given store index (circular queue). */ 2112292SN/A inline void incrStIdx(int &store_idx); 2122292SN/A /** Decrements the given store index (circular queue). */ 2132292SN/A inline void decrStIdx(int &store_idx); 2142292SN/A /** Increments the given load index (circular queue). */ 2152292SN/A inline void incrLdIdx(int &load_idx); 2162292SN/A /** Decrements the given load index (circular queue). */ 2172292SN/A inline void decrLdIdx(int &load_idx); 2182292SN/A 2192329SN/A public: 2202329SN/A /** Debugging function to dump instructions in the LSQ. */ 2212329SN/A void dumpInsts(); 2222329SN/A 2232292SN/A private: 2242292SN/A /** Pointer to the CPU. */ 2252292SN/A FullCPU *cpu; 2262292SN/A 2272292SN/A /** Pointer to the IEW stage. */ 2282292SN/A IEW *iewStage; 2292292SN/A 2302669Sktlim@umich.edu MemObject *mem; 2312669Sktlim@umich.edu 2322669Sktlim@umich.edu class DcachePort : public Port 2332669Sktlim@umich.edu { 2342669Sktlim@umich.edu protected: 2352669Sktlim@umich.edu FullCPU *cpu; 2362669Sktlim@umich.edu LSQUnit *lsq; 2372669Sktlim@umich.edu 2382669Sktlim@umich.edu public: 2392669Sktlim@umich.edu DcachePort(FullCPU *_cpu, LSQUnit *_lsq) 2402669Sktlim@umich.edu : Port(_lsq->name() + "-dport"), cpu(_cpu), lsq(_lsq) 2412669Sktlim@umich.edu { } 2422669Sktlim@umich.edu 2432669Sktlim@umich.edu protected: 2442669Sktlim@umich.edu virtual Tick recvAtomic(PacketPtr pkt); 2452669Sktlim@umich.edu 2462669Sktlim@umich.edu virtual void recvFunctional(PacketPtr pkt); 2472669Sktlim@umich.edu 2482669Sktlim@umich.edu virtual void recvStatusChange(Status status); 2492669Sktlim@umich.edu 2502669Sktlim@umich.edu virtual void getDeviceAddressRanges(AddrRangeList &resp, 2512669Sktlim@umich.edu AddrRangeList &snoop) 2522669Sktlim@umich.edu { resp.clear(); snoop.clear(); } 2532669Sktlim@umich.edu 2542669Sktlim@umich.edu virtual bool recvTiming(PacketPtr pkt); 2552669Sktlim@umich.edu 2562669Sktlim@umich.edu virtual void recvRetry(); 2572669Sktlim@umich.edu }; 2582669Sktlim@umich.edu 2592292SN/A /** Pointer to the D-cache. */ 2602669Sktlim@umich.edu DcachePort *dcachePort; 2612292SN/A 2622292SN/A /** Pointer to the page table. */ 2632292SN/A// PageTable *pTable; 2642292SN/A 2652292SN/A public: 2662292SN/A struct SQEntry { 2672292SN/A /** Constructs an empty store queue entry. */ 2682292SN/A SQEntry() 2692292SN/A : inst(NULL), req(NULL), size(0), data(0), 2702292SN/A canWB(0), committed(0), completed(0) 2712292SN/A { } 2722292SN/A 2732292SN/A /** Constructs a store queue entry for a given instruction. */ 2742292SN/A SQEntry(DynInstPtr &_inst) 2752292SN/A : inst(_inst), req(NULL), size(0), data(0), 2762292SN/A canWB(0), committed(0), completed(0) 2772292SN/A { } 2782292SN/A 2792292SN/A /** The store instruction. */ 2802292SN/A DynInstPtr inst; 2812669Sktlim@umich.edu /** The request for the store. */ 2822669Sktlim@umich.edu RequestPtr req; 2832292SN/A /** The size of the store. */ 2842292SN/A int size; 2852292SN/A /** The store data. */ 2862292SN/A IntReg data; 2872292SN/A /** Whether or not the store can writeback. */ 2882292SN/A bool canWB; 2892292SN/A /** Whether or not the store is committed. */ 2902292SN/A bool committed; 2912292SN/A /** Whether or not the store is completed. */ 2922292SN/A bool completed; 2932292SN/A }; 2942329SN/A 2952292SN/A private: 2962292SN/A /** The LSQUnit thread id. */ 2972292SN/A unsigned lsqID; 2982292SN/A 2992292SN/A /** The store queue. */ 3002292SN/A std::vector<SQEntry> storeQueue; 3012292SN/A 3022292SN/A /** The load queue. */ 3032292SN/A std::vector<DynInstPtr> loadQueue; 3042292SN/A 3052329SN/A /** The number of LQ entries, plus a sentinel entry (circular queue). 3062329SN/A * @todo: Consider having var that records the true number of LQ entries. 3072329SN/A */ 3082292SN/A unsigned LQEntries; 3092329SN/A /** The number of SQ entries, plus a sentinel entry (circular queue). 3102329SN/A * @todo: Consider having var that records the true number of SQ entries. 3112329SN/A */ 3122292SN/A unsigned SQEntries; 3132292SN/A 3142292SN/A /** The number of load instructions in the LQ. */ 3152292SN/A int loads; 3162329SN/A /** The number of store instructions in the SQ. */ 3172292SN/A int stores; 3182292SN/A /** The number of store instructions in the SQ waiting to writeback. */ 3192292SN/A int storesToWB; 3202292SN/A 3212292SN/A /** The index of the head instruction in the LQ. */ 3222292SN/A int loadHead; 3232292SN/A /** The index of the tail instruction in the LQ. */ 3242292SN/A int loadTail; 3252292SN/A 3262292SN/A /** The index of the head instruction in the SQ. */ 3272292SN/A int storeHead; 3282329SN/A /** The index of the first instruction that may be ready to be 3292329SN/A * written back, and has not yet been written back. 3302292SN/A */ 3312292SN/A int storeWBIdx; 3322292SN/A /** The index of the tail instruction in the SQ. */ 3332292SN/A int storeTail; 3342292SN/A 3352292SN/A /// @todo Consider moving to a more advanced model with write vs read ports 3362292SN/A /** The number of cache ports available each cycle. */ 3372292SN/A int cachePorts; 3382292SN/A 3392292SN/A /** The number of used cache ports in this cycle. */ 3402292SN/A int usedPorts; 3412292SN/A 3422307SN/A bool switchedOut; 3432307SN/A 3442292SN/A //list<InstSeqNum> mshrSeqNums; 3452292SN/A 3462292SN/A /** Wire to read information from the issue stage time queue. */ 3472292SN/A typename TimeBuffer<IssueStruct>::wire fromIssue; 3482292SN/A 3492292SN/A /** Whether or not the LSQ is stalled. */ 3502292SN/A bool stalled; 3512292SN/A /** The store that causes the stall due to partial store to load 3522292SN/A * forwarding. 3532292SN/A */ 3542292SN/A InstSeqNum stallingStoreIsn; 3552292SN/A /** The index of the above store. */ 3562292SN/A int stallingLoadIdx; 3572292SN/A 3582329SN/A /** Whether or not a load is blocked due to the memory system. */ 3592292SN/A bool isLoadBlocked; 3602292SN/A 3612292SN/A bool loadBlockedHandled; 3622292SN/A 3632292SN/A InstSeqNum blockedLoadSeqNum; 3642292SN/A 3652292SN/A /** The oldest load that caused a memory ordering violation. */ 3662292SN/A DynInstPtr memDepViolator; 3672292SN/A 3682292SN/A // Will also need how many read/write ports the Dcache has. Or keep track 3692292SN/A // of that in stage that is one level up, and only call executeLoad/Store 3702292SN/A // the appropriate number of times. 3712307SN/A/* 3722307SN/A // total number of loads forwaded from LSQ stores 3732307SN/A Stats::Vector<> lsq_forw_loads; 3742292SN/A 3752307SN/A // total number of loads ignored due to invalid addresses 3762307SN/A Stats::Vector<> inv_addr_loads; 3772307SN/A 3782307SN/A // total number of software prefetches ignored due to invalid addresses 3792307SN/A Stats::Vector<> inv_addr_swpfs; 3802307SN/A 3812307SN/A // total non-speculative bogus addresses seen (debug var) 3822307SN/A Counter sim_invalid_addrs; 3832307SN/A Stats::Vector<> fu_busy; //cumulative fu busy 3842307SN/A 3852307SN/A // ready loads blocked due to memory disambiguation 3862307SN/A Stats::Vector<> lsq_blocked_loads; 3872307SN/A 3882307SN/A Stats::Scalar<> lsqInversion; 3892307SN/A*/ 3902292SN/A public: 3912292SN/A /** Executes the load at the given index. */ 3922292SN/A template <class T> 3932669Sktlim@umich.edu Fault read(Request *req, T &data, int load_idx); 3942292SN/A 3952292SN/A /** Executes the store at the given index. */ 3962292SN/A template <class T> 3972669Sktlim@umich.edu Fault write(Request *req, T &data, int store_idx); 3982292SN/A 3992292SN/A /** Returns the index of the head load instruction. */ 4002292SN/A int getLoadHead() { return loadHead; } 4012292SN/A /** Returns the sequence number of the head load instruction. */ 4022292SN/A InstSeqNum getLoadHeadSeqNum() 4032292SN/A { 4042292SN/A if (loadQueue[loadHead]) { 4052292SN/A return loadQueue[loadHead]->seqNum; 4062292SN/A } else { 4072292SN/A return 0; 4082292SN/A } 4092292SN/A 4102292SN/A } 4112292SN/A 4122292SN/A /** Returns the index of the head store instruction. */ 4132292SN/A int getStoreHead() { return storeHead; } 4142292SN/A /** Returns the sequence number of the head store instruction. */ 4152292SN/A InstSeqNum getStoreHeadSeqNum() 4162292SN/A { 4172292SN/A if (storeQueue[storeHead].inst) { 4182292SN/A return storeQueue[storeHead].inst->seqNum; 4192292SN/A } else { 4202292SN/A return 0; 4212292SN/A } 4222292SN/A 4232292SN/A } 4242292SN/A 4252292SN/A /** Returns whether or not the LSQ unit is stalled. */ 4262292SN/A bool isStalled() { return stalled; } 4272292SN/A}; 4282292SN/A 4292292SN/Atemplate <class Impl> 4302292SN/Atemplate <class T> 4312292SN/AFault 4322669Sktlim@umich.eduLSQUnit<Impl>::read(Request *req, T &data, int load_idx) 4332292SN/A{ 4342669Sktlim@umich.edu DynInstPtr load_inst = loadQueue[load_idx]; 4352292SN/A 4362669Sktlim@umich.edu assert(load_inst); 4372669Sktlim@umich.edu 4382669Sktlim@umich.edu assert(!load_inst->isExecuted()); 4392292SN/A 4402292SN/A // Make sure this isn't an uncacheable access 4412292SN/A // A bit of a hackish way to get uncached accesses to work only if they're 4422292SN/A // at the head of the LSQ and are ready to commit (at the head of the ROB 4432292SN/A // too). 4442669Sktlim@umich.edu if (req->getFlags() & UNCACHEABLE && 4452669Sktlim@umich.edu (load_idx != loadHead || !load_inst->reachedCommit)) { 4462669Sktlim@umich.edu iewStage->rescheduleMemInst(load_inst); 4472292SN/A return TheISA::genMachineCheckFault(); 4482292SN/A } 4492292SN/A 4502292SN/A // Check the SQ for any previous stores that might lead to forwarding 4512669Sktlim@umich.edu int store_idx = load_inst->sqIdx; 4522292SN/A 4532292SN/A int store_size = 0; 4542292SN/A 4552292SN/A DPRINTF(LSQUnit, "Read called, load idx: %i, store idx: %i, " 4562292SN/A "storeHead: %i addr: %#x\n", 4572669Sktlim@umich.edu load_idx, store_idx, storeHead, req->getPaddr()); 4582292SN/A 4592329SN/A#if 0 4602669Sktlim@umich.edu if (req->getFlags() & LOCKED) { 4612669Sktlim@umich.edu cpu->lockAddr = req->getPaddr(); 4622292SN/A cpu->lockFlag = true; 4632292SN/A } 4642292SN/A#endif 4652292SN/A 4662292SN/A while (store_idx != -1) { 4672292SN/A // End once we've reached the top of the LSQ 4682292SN/A if (store_idx == storeWBIdx) { 4692292SN/A break; 4702292SN/A } 4712292SN/A 4722292SN/A // Move the index to one younger 4732292SN/A if (--store_idx < 0) 4742292SN/A store_idx += SQEntries; 4752292SN/A 4762292SN/A assert(storeQueue[store_idx].inst); 4772292SN/A 4782292SN/A store_size = storeQueue[store_idx].size; 4792292SN/A 4802292SN/A if (store_size == 0) 4812292SN/A continue; 4822292SN/A 4832292SN/A // Check if the store data is within the lower and upper bounds of 4842292SN/A // addresses that the request needs. 4852292SN/A bool store_has_lower_limit = 4862669Sktlim@umich.edu req->getVaddr() >= storeQueue[store_idx].inst->effAddr; 4872292SN/A bool store_has_upper_limit = 4882669Sktlim@umich.edu (req->getVaddr() + req->getSize()) <= 4892669Sktlim@umich.edu (storeQueue[store_idx].inst->effAddr + store_size); 4902292SN/A bool lower_load_has_store_part = 4912669Sktlim@umich.edu req->getVaddr() < (storeQueue[store_idx].inst->effAddr + 4922292SN/A store_size); 4932292SN/A bool upper_load_has_store_part = 4942669Sktlim@umich.edu (req->getVaddr() + req->getSize()) > 4952669Sktlim@umich.edu storeQueue[store_idx].inst->effAddr; 4962292SN/A 4972292SN/A // If the store's data has all of the data needed, we can forward. 4982292SN/A if (store_has_lower_limit && store_has_upper_limit) { 4992329SN/A // Get shift amount for offset into the store's data. 5002669Sktlim@umich.edu int shift_amt = req->getVaddr() & (store_size - 1); 5012329SN/A // @todo: Magic number, assumes byte addressing 5022292SN/A shift_amt = shift_amt << 3; 5032292SN/A 5042292SN/A // Cast this to type T? 5052292SN/A data = storeQueue[store_idx].data >> shift_amt; 5062292SN/A 5072669Sktlim@umich.edu assert(!load_inst->memData); 5082669Sktlim@umich.edu load_inst->memData = new uint8_t[64]; 5092292SN/A 5102669Sktlim@umich.edu memcpy(load_inst->memData, &data, req->getSize()); 5112292SN/A 5122292SN/A DPRINTF(LSQUnit, "Forwarding from store idx %i to load to " 5132292SN/A "addr %#x, data %#x\n", 5142669Sktlim@umich.edu store_idx, req->getVaddr(), *(load_inst->memData)); 5152669Sktlim@umich.edu/* 5162669Sktlim@umich.edu typename LdWritebackEvent *wb = 5172669Sktlim@umich.edu new typename LdWritebackEvent(load_inst, 5182669Sktlim@umich.edu iewStage); 5192292SN/A 5202292SN/A // We'll say this has a 1 cycle load-store forwarding latency 5212292SN/A // for now. 5222292SN/A // @todo: Need to make this a parameter. 5232292SN/A wb->schedule(curTick); 5242669Sktlim@umich.edu*/ 5252292SN/A // Should keep track of stat for forwarded data 5262292SN/A return NoFault; 5272292SN/A } else if ((store_has_lower_limit && lower_load_has_store_part) || 5282292SN/A (store_has_upper_limit && upper_load_has_store_part) || 5292292SN/A (lower_load_has_store_part && upper_load_has_store_part)) { 5302292SN/A // This is the partial store-load forwarding case where a store 5312292SN/A // has only part of the load's data. 5322292SN/A 5332292SN/A // If it's already been written back, then don't worry about 5342292SN/A // stalling on it. 5352292SN/A if (storeQueue[store_idx].completed) { 5362292SN/A continue; 5372292SN/A } 5382292SN/A 5392292SN/A // Must stall load and force it to retry, so long as it's the oldest 5402292SN/A // load that needs to do so. 5412292SN/A if (!stalled || 5422292SN/A (stalled && 5432669Sktlim@umich.edu load_inst->seqNum < 5442292SN/A loadQueue[stallingLoadIdx]->seqNum)) { 5452292SN/A stalled = true; 5462292SN/A stallingStoreIsn = storeQueue[store_idx].inst->seqNum; 5472292SN/A stallingLoadIdx = load_idx; 5482292SN/A } 5492292SN/A 5502292SN/A // Tell IQ/mem dep unit that this instruction will need to be 5512292SN/A // rescheduled eventually 5522669Sktlim@umich.edu iewStage->rescheduleMemInst(load_inst); 5532292SN/A 5542292SN/A // Do not generate a writeback event as this instruction is not 5552292SN/A // complete. 5562292SN/A DPRINTF(LSQUnit, "Load-store forwarding mis-match. " 5572292SN/A "Store idx %i to load addr %#x\n", 5582669Sktlim@umich.edu store_idx, req->getVaddr()); 5592292SN/A 5602292SN/A return NoFault; 5612292SN/A } 5622292SN/A } 5632292SN/A 5642292SN/A // If there's no forwarding case, then go access memory 5652669Sktlim@umich.edu DPRINTF(LSQUnit, "Doing functional access for inst [sn:%lli] PC %#x\n", 5662669Sktlim@umich.edu load_inst->seqNum, load_inst->readPC()); 5672292SN/A 5682669Sktlim@umich.edu assert(!load_inst->memData); 5692669Sktlim@umich.edu load_inst->memData = new uint8_t[64]; 5702292SN/A 5712292SN/A ++usedPorts; 5722292SN/A 5732669Sktlim@umich.edu DPRINTF(LSQUnit, "Doing timing access for inst PC %#x\n", 5742669Sktlim@umich.edu load_inst->readPC()); 5752669Sktlim@umich.edu 5762669Sktlim@umich.edu PacketPtr data_pkt = new Packet(req, Packet::ReadReq, Packet::Broadcast); 5772669Sktlim@umich.edu data_pkt->dataStatic(load_inst->memData); 5782669Sktlim@umich.edu 5792292SN/A // if we have a cache, do cache access too 5802669Sktlim@umich.edu if (!dcachePort->sendTiming(data_pkt)) { 5812669Sktlim@umich.edu // There's an older load that's already going to squash. 5822669Sktlim@umich.edu if (isLoadBlocked && blockedLoadSeqNum < load_inst->seqNum) 5832669Sktlim@umich.edu return NoFault; 5842292SN/A 5852669Sktlim@umich.edu // Record that the load was blocked due to memory. This 5862669Sktlim@umich.edu // load will squash all instructions after it, be 5872669Sktlim@umich.edu // refetched, and re-executed. 5882669Sktlim@umich.edu isLoadBlocked = true; 5892669Sktlim@umich.edu loadBlockedHandled = false; 5902669Sktlim@umich.edu blockedLoadSeqNum = load_inst->seqNum; 5912669Sktlim@umich.edu // No fault occurred, even though the interface is blocked. 5922669Sktlim@umich.edu return NoFault; 5932292SN/A } 5942292SN/A 5952669Sktlim@umich.edu if (data_pkt->result != Packet::Success) { 5962669Sktlim@umich.edu DPRINTF(LSQUnit, "LSQUnit: D-cache miss!\n"); 5972669Sktlim@umich.edu DPRINTF(Activity, "Activity: ld accessing mem miss [sn:%lli]\n", 5982669Sktlim@umich.edu load_inst->seqNum); 5992669Sktlim@umich.edu } else { 6002669Sktlim@umich.edu DPRINTF(LSQUnit, "LSQUnit: D-cache hit!\n"); 6012669Sktlim@umich.edu DPRINTF(Activity, "Activity: ld accessing mem hit [sn:%lli]\n", 6022669Sktlim@umich.edu load_inst->seqNum); 6032669Sktlim@umich.edu } 6042669Sktlim@umich.edu 6052669Sktlim@umich.edu return NoFault; 6062292SN/A} 6072292SN/A 6082292SN/Atemplate <class Impl> 6092292SN/Atemplate <class T> 6102292SN/AFault 6112669Sktlim@umich.eduLSQUnit<Impl>::write(Request *req, T &data, int store_idx) 6122292SN/A{ 6132292SN/A assert(storeQueue[store_idx].inst); 6142292SN/A 6152292SN/A DPRINTF(LSQUnit, "Doing write to store idx %i, addr %#x data %#x" 6162292SN/A " | storeHead:%i [sn:%i]\n", 6172669Sktlim@umich.edu store_idx, req->getPaddr(), data, storeHead, 6182292SN/A storeQueue[store_idx].inst->seqNum); 6192329SN/A 6202292SN/A storeQueue[store_idx].req = req; 6212292SN/A storeQueue[store_idx].size = sizeof(T); 6222292SN/A storeQueue[store_idx].data = data; 6232329SN/A 6242292SN/A // This function only writes the data to the store queue, so no fault 6252292SN/A // can happen here. 6262292SN/A return NoFault; 6272292SN/A} 6282292SN/A 6292292SN/A#endif // __CPU_O3_LSQ_UNIT_HH__ 630