lsq_unit_impl.hh revision 2820
12292SN/A/* 22292SN/A * Copyright (c) 2004-2005 The Regents of The University of Michigan 32292SN/A * All rights reserved. 42292SN/A * 52292SN/A * Redistribution and use in source and binary forms, with or without 62292SN/A * modification, are permitted provided that the following conditions are 72292SN/A * met: redistributions of source code must retain the above copyright 82292SN/A * notice, this list of conditions and the following disclaimer; 92292SN/A * redistributions in binary form must reproduce the above copyright 102292SN/A * notice, this list of conditions and the following disclaimer in the 112292SN/A * documentation and/or other materials provided with the distribution; 122292SN/A * neither the name of the copyright holders nor the names of its 132292SN/A * contributors may be used to endorse or promote products derived from 142292SN/A * this software without specific prior written permission. 152292SN/A * 162292SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 172292SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 182292SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 192292SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 202292SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 212292SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 222292SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 232292SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 242292SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 252292SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 262292SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 272689Sktlim@umich.edu * 282689Sktlim@umich.edu * Authors: Kevin Lim 292689Sktlim@umich.edu * Korey Sewell 302292SN/A */ 312292SN/A 322733Sktlim@umich.edu#include "config/use_checker.hh" 332733Sktlim@umich.edu 342292SN/A#include "cpu/o3/lsq_unit.hh" 352292SN/A#include "base/str.hh" 362722Sktlim@umich.edu#include "mem/packet.hh" 372669Sktlim@umich.edu#include "mem/request.hh" 382292SN/A 392790Sktlim@umich.edu#if USE_CHECKER 402790Sktlim@umich.edu#include "cpu/checker/cpu.hh" 412790Sktlim@umich.edu#endif 422790Sktlim@umich.edu 432669Sktlim@umich.edutemplate<class Impl> 442678Sktlim@umich.eduLSQUnit<Impl>::WritebackEvent::WritebackEvent(DynInstPtr &_inst, PacketPtr _pkt, 452678Sktlim@umich.edu LSQUnit *lsq_ptr) 462678Sktlim@umich.edu : Event(&mainEventQueue), inst(_inst), pkt(_pkt), lsqPtr(lsq_ptr) 472292SN/A{ 482678Sktlim@umich.edu this->setFlags(Event::AutoDelete); 492292SN/A} 502292SN/A 512669Sktlim@umich.edutemplate<class Impl> 522292SN/Avoid 532678Sktlim@umich.eduLSQUnit<Impl>::WritebackEvent::process() 542292SN/A{ 552678Sktlim@umich.edu if (!lsqPtr->isSwitchedOut()) { 562678Sktlim@umich.edu lsqPtr->writeback(inst, pkt); 572678Sktlim@umich.edu } 582678Sktlim@umich.edu delete pkt; 592678Sktlim@umich.edu} 602292SN/A 612678Sktlim@umich.edutemplate<class Impl> 622678Sktlim@umich.educonst char * 632678Sktlim@umich.eduLSQUnit<Impl>::WritebackEvent::description() 642678Sktlim@umich.edu{ 652678Sktlim@umich.edu return "Store writeback event"; 662678Sktlim@umich.edu} 672292SN/A 682678Sktlim@umich.edutemplate<class Impl> 692678Sktlim@umich.eduvoid 702678Sktlim@umich.eduLSQUnit<Impl>::completeDataAccess(PacketPtr pkt) 712678Sktlim@umich.edu{ 722678Sktlim@umich.edu LSQSenderState *state = dynamic_cast<LSQSenderState *>(pkt->senderState); 732678Sktlim@umich.edu DynInstPtr inst = state->inst; 742678Sktlim@umich.edu DPRINTF(IEW, "Writeback event [sn:%lli]\n", inst->seqNum); 752698Sktlim@umich.edu DPRINTF(Activity, "Activity: Writeback event [sn:%lli]\n", inst->seqNum); 762344SN/A 772678Sktlim@umich.edu //iewStage->ldstQueue.removeMSHR(inst->threadNumber,inst->seqNum); 782678Sktlim@umich.edu 792678Sktlim@umich.edu if (isSwitchedOut() || inst->isSquashed()) { 802820Sktlim@umich.edu iewStage->decrWb(inst->seqNum); 812678Sktlim@umich.edu delete state; 822678Sktlim@umich.edu delete pkt; 832307SN/A return; 842678Sktlim@umich.edu } else { 852678Sktlim@umich.edu if (!state->noWB) { 862678Sktlim@umich.edu writeback(inst, pkt); 872678Sktlim@umich.edu } 882678Sktlim@umich.edu 892678Sktlim@umich.edu if (inst->isStore()) { 902678Sktlim@umich.edu completeStore(state->idx); 912678Sktlim@umich.edu } 922344SN/A } 932307SN/A 942678Sktlim@umich.edu delete state; 952678Sktlim@umich.edu delete pkt; 962292SN/A} 972292SN/A 982292SN/Atemplate <class Impl> 992669Sktlim@umich.eduTick 1002669Sktlim@umich.eduLSQUnit<Impl>::DcachePort::recvAtomic(PacketPtr pkt) 1012292SN/A{ 1022669Sktlim@umich.edu panic("O3CPU model does not work with atomic mode!"); 1032669Sktlim@umich.edu return curTick; 1042669Sktlim@umich.edu} 1052669Sktlim@umich.edu 1062669Sktlim@umich.edutemplate <class Impl> 1072669Sktlim@umich.eduvoid 1082669Sktlim@umich.eduLSQUnit<Impl>::DcachePort::recvFunctional(PacketPtr pkt) 1092669Sktlim@umich.edu{ 1102669Sktlim@umich.edu panic("O3CPU doesn't expect recvFunctional callback!"); 1112669Sktlim@umich.edu} 1122669Sktlim@umich.edu 1132669Sktlim@umich.edutemplate <class Impl> 1142669Sktlim@umich.eduvoid 1152669Sktlim@umich.eduLSQUnit<Impl>::DcachePort::recvStatusChange(Status status) 1162669Sktlim@umich.edu{ 1172669Sktlim@umich.edu if (status == RangeChange) 1182669Sktlim@umich.edu return; 1192669Sktlim@umich.edu 1202669Sktlim@umich.edu panic("O3CPU doesn't expect recvStatusChange callback!"); 1212669Sktlim@umich.edu} 1222669Sktlim@umich.edu 1232669Sktlim@umich.edutemplate <class Impl> 1242669Sktlim@umich.edubool 1252669Sktlim@umich.eduLSQUnit<Impl>::DcachePort::recvTiming(PacketPtr pkt) 1262669Sktlim@umich.edu{ 1272669Sktlim@umich.edu lsq->completeDataAccess(pkt); 1282669Sktlim@umich.edu return true; 1292669Sktlim@umich.edu} 1302669Sktlim@umich.edu 1312669Sktlim@umich.edutemplate <class Impl> 1322669Sktlim@umich.eduvoid 1332669Sktlim@umich.eduLSQUnit<Impl>::DcachePort::recvRetry() 1342669Sktlim@umich.edu{ 1352693Sktlim@umich.edu lsq->recvRetry(); 1362292SN/A} 1372292SN/A 1382292SN/Atemplate <class Impl> 1392292SN/ALSQUnit<Impl>::LSQUnit() 1402678Sktlim@umich.edu : loads(0), stores(0), storesToWB(0), stalled(false), 1412678Sktlim@umich.edu isStoreBlocked(false), isLoadBlocked(false), 1422292SN/A loadBlockedHandled(false) 1432292SN/A{ 1442292SN/A} 1452292SN/A 1462292SN/Atemplate<class Impl> 1472292SN/Avoid 1482292SN/ALSQUnit<Impl>::init(Params *params, unsigned maxLQEntries, 1492292SN/A unsigned maxSQEntries, unsigned id) 1502292SN/A{ 1512292SN/A DPRINTF(LSQUnit, "Creating LSQUnit%i object.\n",id); 1522292SN/A 1532307SN/A switchedOut = false; 1542307SN/A 1552292SN/A lsqID = id; 1562292SN/A 1572329SN/A // Add 1 for the sentinel entry (they are circular queues). 1582329SN/A LQEntries = maxLQEntries + 1; 1592329SN/A SQEntries = maxSQEntries + 1; 1602292SN/A 1612292SN/A loadQueue.resize(LQEntries); 1622292SN/A storeQueue.resize(SQEntries); 1632292SN/A 1642292SN/A loadHead = loadTail = 0; 1652292SN/A 1662292SN/A storeHead = storeWBIdx = storeTail = 0; 1672292SN/A 1682292SN/A usedPorts = 0; 1692292SN/A cachePorts = params->cachePorts; 1702292SN/A 1712678Sktlim@umich.edu mem = params->mem; 1722292SN/A 1732329SN/A memDepViolator = NULL; 1742292SN/A 1752292SN/A blockedLoadSeqNum = 0; 1762292SN/A} 1772292SN/A 1782292SN/Atemplate<class Impl> 1792669Sktlim@umich.eduvoid 1802733Sktlim@umich.eduLSQUnit<Impl>::setCPU(O3CPU *cpu_ptr) 1812669Sktlim@umich.edu{ 1822669Sktlim@umich.edu cpu = cpu_ptr; 1832669Sktlim@umich.edu dcachePort = new DcachePort(cpu, this); 1842678Sktlim@umich.edu 1852678Sktlim@umich.edu Port *mem_dport = mem->getPort(""); 1862678Sktlim@umich.edu dcachePort->setPeer(mem_dport); 1872678Sktlim@umich.edu mem_dport->setPeer(dcachePort); 1882679Sktlim@umich.edu 1892733Sktlim@umich.edu#if USE_CHECKER 1902679Sktlim@umich.edu if (cpu->checker) { 1912679Sktlim@umich.edu cpu->checker->setDcachePort(dcachePort); 1922679Sktlim@umich.edu } 1932733Sktlim@umich.edu#endif 1942669Sktlim@umich.edu} 1952669Sktlim@umich.edu 1962669Sktlim@umich.edutemplate<class Impl> 1972292SN/Astd::string 1982292SN/ALSQUnit<Impl>::name() const 1992292SN/A{ 2002292SN/A if (Impl::MaxThreads == 1) { 2012292SN/A return iewStage->name() + ".lsq"; 2022292SN/A } else { 2032292SN/A return iewStage->name() + ".lsq.thread." + to_string(lsqID); 2042292SN/A } 2052292SN/A} 2062292SN/A 2072292SN/Atemplate<class Impl> 2082292SN/Avoid 2092727Sktlim@umich.eduLSQUnit<Impl>::regStats() 2102727Sktlim@umich.edu{ 2112727Sktlim@umich.edu lsqForwLoads 2122727Sktlim@umich.edu .name(name() + ".forwLoads") 2132727Sktlim@umich.edu .desc("Number of loads that had data forwarded from stores"); 2142727Sktlim@umich.edu 2152727Sktlim@umich.edu invAddrLoads 2162727Sktlim@umich.edu .name(name() + ".invAddrLoads") 2172727Sktlim@umich.edu .desc("Number of loads ignored due to an invalid address"); 2182727Sktlim@umich.edu 2192727Sktlim@umich.edu lsqSquashedLoads 2202727Sktlim@umich.edu .name(name() + ".squashedLoads") 2212727Sktlim@umich.edu .desc("Number of loads squashed"); 2222727Sktlim@umich.edu 2232727Sktlim@umich.edu lsqIgnoredResponses 2242727Sktlim@umich.edu .name(name() + ".ignoredResponses") 2252727Sktlim@umich.edu .desc("Number of memory responses ignored because the instruction is squashed"); 2262727Sktlim@umich.edu 2272727Sktlim@umich.edu lsqSquashedStores 2282727Sktlim@umich.edu .name(name() + ".squashedStores") 2292727Sktlim@umich.edu .desc("Number of stores squashed"); 2302727Sktlim@umich.edu 2312727Sktlim@umich.edu invAddrSwpfs 2322727Sktlim@umich.edu .name(name() + ".invAddrSwpfs") 2332727Sktlim@umich.edu .desc("Number of software prefetches ignored due to an invalid address"); 2342727Sktlim@umich.edu 2352727Sktlim@umich.edu lsqBlockedLoads 2362727Sktlim@umich.edu .name(name() + ".blockedLoads") 2372727Sktlim@umich.edu .desc("Number of blocked loads due to partial load-store forwarding"); 2382727Sktlim@umich.edu 2392727Sktlim@umich.edu lsqRescheduledLoads 2402727Sktlim@umich.edu .name(name() + ".rescheduledLoads") 2412727Sktlim@umich.edu .desc("Number of loads that were rescheduled"); 2422727Sktlim@umich.edu 2432727Sktlim@umich.edu lsqCacheBlocked 2442727Sktlim@umich.edu .name(name() + ".cacheBlocked") 2452727Sktlim@umich.edu .desc("Number of times an access to memory failed due to the cache being blocked"); 2462727Sktlim@umich.edu} 2472727Sktlim@umich.edu 2482727Sktlim@umich.edutemplate<class Impl> 2492727Sktlim@umich.eduvoid 2502292SN/ALSQUnit<Impl>::clearLQ() 2512292SN/A{ 2522292SN/A loadQueue.clear(); 2532292SN/A} 2542292SN/A 2552292SN/Atemplate<class Impl> 2562292SN/Avoid 2572292SN/ALSQUnit<Impl>::clearSQ() 2582292SN/A{ 2592292SN/A storeQueue.clear(); 2602292SN/A} 2612292SN/A 2622292SN/Atemplate<class Impl> 2632292SN/Avoid 2642307SN/ALSQUnit<Impl>::switchOut() 2652307SN/A{ 2662307SN/A switchedOut = true; 2672307SN/A for (int i = 0; i < loadQueue.size(); ++i) 2682307SN/A loadQueue[i] = NULL; 2692307SN/A 2702329SN/A assert(storesToWB == 0); 2712307SN/A} 2722307SN/A 2732307SN/Atemplate<class Impl> 2742307SN/Avoid 2752307SN/ALSQUnit<Impl>::takeOverFrom() 2762307SN/A{ 2772307SN/A switchedOut = false; 2782307SN/A loads = stores = storesToWB = 0; 2792307SN/A 2802307SN/A loadHead = loadTail = 0; 2812307SN/A 2822307SN/A storeHead = storeWBIdx = storeTail = 0; 2832307SN/A 2842307SN/A usedPorts = 0; 2852307SN/A 2862329SN/A memDepViolator = NULL; 2872307SN/A 2882307SN/A blockedLoadSeqNum = 0; 2892307SN/A 2902307SN/A stalled = false; 2912307SN/A isLoadBlocked = false; 2922307SN/A loadBlockedHandled = false; 2932307SN/A} 2942307SN/A 2952307SN/Atemplate<class Impl> 2962307SN/Avoid 2972292SN/ALSQUnit<Impl>::resizeLQ(unsigned size) 2982292SN/A{ 2992329SN/A unsigned size_plus_sentinel = size + 1; 3002329SN/A assert(size_plus_sentinel >= LQEntries); 3012292SN/A 3022329SN/A if (size_plus_sentinel > LQEntries) { 3032329SN/A while (size_plus_sentinel > loadQueue.size()) { 3042292SN/A DynInstPtr dummy; 3052292SN/A loadQueue.push_back(dummy); 3062292SN/A LQEntries++; 3072292SN/A } 3082292SN/A } else { 3092329SN/A LQEntries = size_plus_sentinel; 3102292SN/A } 3112292SN/A 3122292SN/A} 3132292SN/A 3142292SN/Atemplate<class Impl> 3152292SN/Avoid 3162292SN/ALSQUnit<Impl>::resizeSQ(unsigned size) 3172292SN/A{ 3182329SN/A unsigned size_plus_sentinel = size + 1; 3192329SN/A if (size_plus_sentinel > SQEntries) { 3202329SN/A while (size_plus_sentinel > storeQueue.size()) { 3212292SN/A SQEntry dummy; 3222292SN/A storeQueue.push_back(dummy); 3232292SN/A SQEntries++; 3242292SN/A } 3252292SN/A } else { 3262329SN/A SQEntries = size_plus_sentinel; 3272292SN/A } 3282292SN/A} 3292292SN/A 3302292SN/Atemplate <class Impl> 3312292SN/Avoid 3322292SN/ALSQUnit<Impl>::insert(DynInstPtr &inst) 3332292SN/A{ 3342292SN/A assert(inst->isMemRef()); 3352292SN/A 3362292SN/A assert(inst->isLoad() || inst->isStore()); 3372292SN/A 3382292SN/A if (inst->isLoad()) { 3392292SN/A insertLoad(inst); 3402292SN/A } else { 3412292SN/A insertStore(inst); 3422292SN/A } 3432292SN/A 3442292SN/A inst->setInLSQ(); 3452292SN/A} 3462292SN/A 3472292SN/Atemplate <class Impl> 3482292SN/Avoid 3492292SN/ALSQUnit<Impl>::insertLoad(DynInstPtr &load_inst) 3502292SN/A{ 3512329SN/A assert((loadTail + 1) % LQEntries != loadHead); 3522329SN/A assert(loads < LQEntries); 3532292SN/A 3542292SN/A DPRINTF(LSQUnit, "Inserting load PC %#x, idx:%i [sn:%lli]\n", 3552292SN/A load_inst->readPC(), loadTail, load_inst->seqNum); 3562292SN/A 3572292SN/A load_inst->lqIdx = loadTail; 3582292SN/A 3592292SN/A if (stores == 0) { 3602292SN/A load_inst->sqIdx = -1; 3612292SN/A } else { 3622292SN/A load_inst->sqIdx = storeTail; 3632292SN/A } 3642292SN/A 3652292SN/A loadQueue[loadTail] = load_inst; 3662292SN/A 3672292SN/A incrLdIdx(loadTail); 3682292SN/A 3692292SN/A ++loads; 3702292SN/A} 3712292SN/A 3722292SN/Atemplate <class Impl> 3732292SN/Avoid 3742292SN/ALSQUnit<Impl>::insertStore(DynInstPtr &store_inst) 3752292SN/A{ 3762292SN/A // Make sure it is not full before inserting an instruction. 3772292SN/A assert((storeTail + 1) % SQEntries != storeHead); 3782292SN/A assert(stores < SQEntries); 3792292SN/A 3802292SN/A DPRINTF(LSQUnit, "Inserting store PC %#x, idx:%i [sn:%lli]\n", 3812292SN/A store_inst->readPC(), storeTail, store_inst->seqNum); 3822292SN/A 3832292SN/A store_inst->sqIdx = storeTail; 3842292SN/A store_inst->lqIdx = loadTail; 3852292SN/A 3862292SN/A storeQueue[storeTail] = SQEntry(store_inst); 3872292SN/A 3882292SN/A incrStIdx(storeTail); 3892292SN/A 3902292SN/A ++stores; 3912292SN/A} 3922292SN/A 3932292SN/Atemplate <class Impl> 3942292SN/Atypename Impl::DynInstPtr 3952292SN/ALSQUnit<Impl>::getMemDepViolator() 3962292SN/A{ 3972292SN/A DynInstPtr temp = memDepViolator; 3982292SN/A 3992292SN/A memDepViolator = NULL; 4002292SN/A 4012292SN/A return temp; 4022292SN/A} 4032292SN/A 4042292SN/Atemplate <class Impl> 4052292SN/Aunsigned 4062292SN/ALSQUnit<Impl>::numFreeEntries() 4072292SN/A{ 4082292SN/A unsigned free_lq_entries = LQEntries - loads; 4092292SN/A unsigned free_sq_entries = SQEntries - stores; 4102292SN/A 4112292SN/A // Both the LQ and SQ entries have an extra dummy entry to differentiate 4122292SN/A // empty/full conditions. Subtract 1 from the free entries. 4132292SN/A if (free_lq_entries < free_sq_entries) { 4142292SN/A return free_lq_entries - 1; 4152292SN/A } else { 4162292SN/A return free_sq_entries - 1; 4172292SN/A } 4182292SN/A} 4192292SN/A 4202292SN/Atemplate <class Impl> 4212292SN/Aint 4222292SN/ALSQUnit<Impl>::numLoadsReady() 4232292SN/A{ 4242292SN/A int load_idx = loadHead; 4252292SN/A int retval = 0; 4262292SN/A 4272292SN/A while (load_idx != loadTail) { 4282292SN/A assert(loadQueue[load_idx]); 4292292SN/A 4302292SN/A if (loadQueue[load_idx]->readyToIssue()) { 4312292SN/A ++retval; 4322292SN/A } 4332292SN/A } 4342292SN/A 4352292SN/A return retval; 4362292SN/A} 4372292SN/A 4382292SN/Atemplate <class Impl> 4392292SN/AFault 4402292SN/ALSQUnit<Impl>::executeLoad(DynInstPtr &inst) 4412292SN/A{ 4422292SN/A // Execute a specific load. 4432292SN/A Fault load_fault = NoFault; 4442292SN/A 4452292SN/A DPRINTF(LSQUnit, "Executing load PC %#x, [sn:%lli]\n", 4462292SN/A inst->readPC(),inst->seqNum); 4472292SN/A 4482669Sktlim@umich.edu load_fault = inst->initiateAcc(); 4492292SN/A 4502292SN/A // If the instruction faulted, then we need to send it along to commit 4512292SN/A // without the instruction completing. 4522292SN/A if (load_fault != NoFault) { 4532329SN/A // Send this instruction to commit, also make sure iew stage 4542329SN/A // realizes there is activity. 4552292SN/A iewStage->instToCommit(inst); 4562292SN/A iewStage->activityThisCycle(); 4572292SN/A } 4582292SN/A 4592292SN/A return load_fault; 4602292SN/A} 4612292SN/A 4622292SN/Atemplate <class Impl> 4632292SN/AFault 4642292SN/ALSQUnit<Impl>::executeStore(DynInstPtr &store_inst) 4652292SN/A{ 4662292SN/A using namespace TheISA; 4672292SN/A // Make sure that a store exists. 4682292SN/A assert(stores != 0); 4692292SN/A 4702292SN/A int store_idx = store_inst->sqIdx; 4712292SN/A 4722292SN/A DPRINTF(LSQUnit, "Executing store PC %#x [sn:%lli]\n", 4732292SN/A store_inst->readPC(), store_inst->seqNum); 4742292SN/A 4752292SN/A // Check the recently completed loads to see if any match this store's 4762292SN/A // address. If so, then we have a memory ordering violation. 4772292SN/A int load_idx = store_inst->lqIdx; 4782292SN/A 4792292SN/A Fault store_fault = store_inst->initiateAcc(); 4802292SN/A 4812329SN/A if (storeQueue[store_idx].size == 0) { 4822292SN/A DPRINTF(LSQUnit,"Fault on Store PC %#x, [sn:%lli],Size = 0\n", 4832292SN/A store_inst->readPC(),store_inst->seqNum); 4842292SN/A 4852292SN/A return store_fault; 4862292SN/A } 4872292SN/A 4882292SN/A assert(store_fault == NoFault); 4892292SN/A 4902336SN/A if (store_inst->isStoreConditional()) { 4912336SN/A // Store conditionals need to set themselves as able to 4922336SN/A // writeback if we haven't had a fault by here. 4932329SN/A storeQueue[store_idx].canWB = true; 4942292SN/A 4952329SN/A ++storesToWB; 4962292SN/A } 4972292SN/A 4982292SN/A if (!memDepViolator) { 4992292SN/A while (load_idx != loadTail) { 5002329SN/A // Really only need to check loads that have actually executed 5012329SN/A // It's safe to check all loads because effAddr is set to 5022329SN/A // InvalAddr when the dyn inst is created. 5032292SN/A 5042329SN/A // @todo: For now this is extra conservative, detecting a 5052329SN/A // violation if the addresses match assuming all accesses 5062329SN/A // are quad word accesses. 5072329SN/A 5082292SN/A // @todo: Fix this, magic number being used here 5092292SN/A if ((loadQueue[load_idx]->effAddr >> 8) == 5102292SN/A (store_inst->effAddr >> 8)) { 5112292SN/A // A load incorrectly passed this store. Squash and refetch. 5122292SN/A // For now return a fault to show that it was unsuccessful. 5132292SN/A memDepViolator = loadQueue[load_idx]; 5142292SN/A 5152292SN/A return genMachineCheckFault(); 5162292SN/A } 5172292SN/A 5182292SN/A incrLdIdx(load_idx); 5192292SN/A } 5202292SN/A 5212292SN/A // If we've reached this point, there was no violation. 5222292SN/A memDepViolator = NULL; 5232292SN/A } 5242292SN/A 5252292SN/A return store_fault; 5262292SN/A} 5272292SN/A 5282292SN/Atemplate <class Impl> 5292292SN/Avoid 5302292SN/ALSQUnit<Impl>::commitLoad() 5312292SN/A{ 5322292SN/A assert(loadQueue[loadHead]); 5332292SN/A 5342292SN/A DPRINTF(LSQUnit, "Committing head load instruction, PC %#x\n", 5352292SN/A loadQueue[loadHead]->readPC()); 5362292SN/A 5372292SN/A loadQueue[loadHead] = NULL; 5382292SN/A 5392292SN/A incrLdIdx(loadHead); 5402292SN/A 5412292SN/A --loads; 5422292SN/A} 5432292SN/A 5442292SN/Atemplate <class Impl> 5452292SN/Avoid 5462292SN/ALSQUnit<Impl>::commitLoads(InstSeqNum &youngest_inst) 5472292SN/A{ 5482292SN/A assert(loads == 0 || loadQueue[loadHead]); 5492292SN/A 5502292SN/A while (loads != 0 && loadQueue[loadHead]->seqNum <= youngest_inst) { 5512292SN/A commitLoad(); 5522292SN/A } 5532292SN/A} 5542292SN/A 5552292SN/Atemplate <class Impl> 5562292SN/Avoid 5572292SN/ALSQUnit<Impl>::commitStores(InstSeqNum &youngest_inst) 5582292SN/A{ 5592292SN/A assert(stores == 0 || storeQueue[storeHead].inst); 5602292SN/A 5612292SN/A int store_idx = storeHead; 5622292SN/A 5632292SN/A while (store_idx != storeTail) { 5642292SN/A assert(storeQueue[store_idx].inst); 5652329SN/A // Mark any stores that are now committed and have not yet 5662329SN/A // been marked as able to write back. 5672292SN/A if (!storeQueue[store_idx].canWB) { 5682292SN/A if (storeQueue[store_idx].inst->seqNum > youngest_inst) { 5692292SN/A break; 5702292SN/A } 5712292SN/A DPRINTF(LSQUnit, "Marking store as able to write back, PC " 5722292SN/A "%#x [sn:%lli]\n", 5732292SN/A storeQueue[store_idx].inst->readPC(), 5742292SN/A storeQueue[store_idx].inst->seqNum); 5752292SN/A 5762292SN/A storeQueue[store_idx].canWB = true; 5772292SN/A 5782292SN/A ++storesToWB; 5792292SN/A } 5802292SN/A 5812292SN/A incrStIdx(store_idx); 5822292SN/A } 5832292SN/A} 5842292SN/A 5852292SN/Atemplate <class Impl> 5862292SN/Avoid 5872292SN/ALSQUnit<Impl>::writebackStores() 5882292SN/A{ 5892292SN/A while (storesToWB > 0 && 5902292SN/A storeWBIdx != storeTail && 5912292SN/A storeQueue[storeWBIdx].inst && 5922292SN/A storeQueue[storeWBIdx].canWB && 5932292SN/A usedPorts < cachePorts) { 5942292SN/A 5952678Sktlim@umich.edu if (isStoreBlocked) { 5962678Sktlim@umich.edu DPRINTF(LSQUnit, "Unable to write back any more stores, cache" 5972678Sktlim@umich.edu " is blocked!\n"); 5982678Sktlim@umich.edu break; 5992678Sktlim@umich.edu } 6002678Sktlim@umich.edu 6012329SN/A // Store didn't write any data so no need to write it back to 6022329SN/A // memory. 6032292SN/A if (storeQueue[storeWBIdx].size == 0) { 6042292SN/A completeStore(storeWBIdx); 6052292SN/A 6062292SN/A incrStIdx(storeWBIdx); 6072292SN/A 6082292SN/A continue; 6092292SN/A } 6102678Sktlim@umich.edu 6112292SN/A ++usedPorts; 6122292SN/A 6132292SN/A if (storeQueue[storeWBIdx].inst->isDataPrefetch()) { 6142292SN/A incrStIdx(storeWBIdx); 6152292SN/A 6162292SN/A continue; 6172292SN/A } 6182292SN/A 6192292SN/A assert(storeQueue[storeWBIdx].req); 6202292SN/A assert(!storeQueue[storeWBIdx].committed); 6212292SN/A 6222669Sktlim@umich.edu DynInstPtr inst = storeQueue[storeWBIdx].inst; 6232669Sktlim@umich.edu 6242669Sktlim@umich.edu Request *req = storeQueue[storeWBIdx].req; 6252292SN/A storeQueue[storeWBIdx].committed = true; 6262292SN/A 6272669Sktlim@umich.edu assert(!inst->memData); 6282669Sktlim@umich.edu inst->memData = new uint8_t[64]; 6292678Sktlim@umich.edu memcpy(inst->memData, (uint8_t *)&storeQueue[storeWBIdx].data, 6302678Sktlim@umich.edu req->getSize()); 6312669Sktlim@umich.edu 6322669Sktlim@umich.edu PacketPtr data_pkt = new Packet(req, Packet::WriteReq, Packet::Broadcast); 6332669Sktlim@umich.edu data_pkt->dataStatic(inst->memData); 6342292SN/A 6352678Sktlim@umich.edu LSQSenderState *state = new LSQSenderState; 6362678Sktlim@umich.edu state->isLoad = false; 6372678Sktlim@umich.edu state->idx = storeWBIdx; 6382678Sktlim@umich.edu state->inst = inst; 6392678Sktlim@umich.edu data_pkt->senderState = state; 6402678Sktlim@umich.edu 6412292SN/A DPRINTF(LSQUnit, "D-Cache: Writing back store idx:%i PC:%#x " 6422292SN/A "to Addr:%#x, data:%#x [sn:%lli]\n", 6432669Sktlim@umich.edu storeWBIdx, storeQueue[storeWBIdx].inst->readPC(), 6442669Sktlim@umich.edu req->getPaddr(), *(inst->memData), 6452292SN/A storeQueue[storeWBIdx].inst->seqNum); 6462292SN/A 6472693Sktlim@umich.edu // @todo: Remove this SC hack once the memory system handles it. 6482693Sktlim@umich.edu if (req->getFlags() & LOCKED) { 6492693Sktlim@umich.edu if (req->getFlags() & UNCACHEABLE) { 6502693Sktlim@umich.edu req->setScResult(2); 6512693Sktlim@umich.edu } else { 6522693Sktlim@umich.edu if (cpu->lockFlag) { 6532693Sktlim@umich.edu req->setScResult(1); 6542693Sktlim@umich.edu } else { 6552693Sktlim@umich.edu req->setScResult(0); 6562693Sktlim@umich.edu // Hack: Instantly complete this store. 6572693Sktlim@umich.edu completeDataAccess(data_pkt); 6582693Sktlim@umich.edu incrStIdx(storeWBIdx); 6592693Sktlim@umich.edu continue; 6602693Sktlim@umich.edu } 6612693Sktlim@umich.edu } 6622693Sktlim@umich.edu } else { 6632693Sktlim@umich.edu // Non-store conditionals do not need a writeback. 6642693Sktlim@umich.edu state->noWB = true; 6652693Sktlim@umich.edu } 6662693Sktlim@umich.edu 6672669Sktlim@umich.edu if (!dcachePort->sendTiming(data_pkt)) { 6682669Sktlim@umich.edu // Need to handle becoming blocked on a store. 6692678Sktlim@umich.edu isStoreBlocked = true; 6702727Sktlim@umich.edu ++lsqCacheBlocked; 6712698Sktlim@umich.edu assert(retryPkt == NULL); 6722698Sktlim@umich.edu retryPkt = data_pkt; 6732669Sktlim@umich.edu } else { 6742693Sktlim@umich.edu storePostSend(data_pkt); 6752292SN/A } 6762292SN/A } 6772292SN/A 6782292SN/A // Not sure this should set it to 0. 6792292SN/A usedPorts = 0; 6802292SN/A 6812292SN/A assert(stores >= 0 && storesToWB >= 0); 6822292SN/A} 6832292SN/A 6842292SN/A/*template <class Impl> 6852292SN/Avoid 6862292SN/ALSQUnit<Impl>::removeMSHR(InstSeqNum seqNum) 6872292SN/A{ 6882292SN/A list<InstSeqNum>::iterator mshr_it = find(mshrSeqNums.begin(), 6892292SN/A mshrSeqNums.end(), 6902292SN/A seqNum); 6912292SN/A 6922292SN/A if (mshr_it != mshrSeqNums.end()) { 6932292SN/A mshrSeqNums.erase(mshr_it); 6942292SN/A DPRINTF(LSQUnit, "Removing MSHR. count = %i\n",mshrSeqNums.size()); 6952292SN/A } 6962292SN/A}*/ 6972292SN/A 6982292SN/Atemplate <class Impl> 6992292SN/Avoid 7002292SN/ALSQUnit<Impl>::squash(const InstSeqNum &squashed_num) 7012292SN/A{ 7022292SN/A DPRINTF(LSQUnit, "Squashing until [sn:%lli]!" 7032329SN/A "(Loads:%i Stores:%i)\n", squashed_num, loads, stores); 7042292SN/A 7052292SN/A int load_idx = loadTail; 7062292SN/A decrLdIdx(load_idx); 7072292SN/A 7082292SN/A while (loads != 0 && loadQueue[load_idx]->seqNum > squashed_num) { 7092292SN/A DPRINTF(LSQUnit,"Load Instruction PC %#x squashed, " 7102292SN/A "[sn:%lli]\n", 7112292SN/A loadQueue[load_idx]->readPC(), 7122292SN/A loadQueue[load_idx]->seqNum); 7132292SN/A 7142292SN/A if (isStalled() && load_idx == stallingLoadIdx) { 7152292SN/A stalled = false; 7162292SN/A stallingStoreIsn = 0; 7172292SN/A stallingLoadIdx = 0; 7182292SN/A } 7192292SN/A 7202329SN/A // Clear the smart pointer to make sure it is decremented. 7212731Sktlim@umich.edu loadQueue[load_idx]->setSquashed(); 7222292SN/A loadQueue[load_idx] = NULL; 7232292SN/A --loads; 7242292SN/A 7252292SN/A // Inefficient! 7262292SN/A loadTail = load_idx; 7272292SN/A 7282292SN/A decrLdIdx(load_idx); 7292727Sktlim@umich.edu ++lsqSquashedLoads; 7302292SN/A } 7312292SN/A 7322292SN/A if (isLoadBlocked) { 7332292SN/A if (squashed_num < blockedLoadSeqNum) { 7342292SN/A isLoadBlocked = false; 7352292SN/A loadBlockedHandled = false; 7362292SN/A blockedLoadSeqNum = 0; 7372292SN/A } 7382292SN/A } 7392292SN/A 7402292SN/A int store_idx = storeTail; 7412292SN/A decrStIdx(store_idx); 7422292SN/A 7432292SN/A while (stores != 0 && 7442292SN/A storeQueue[store_idx].inst->seqNum > squashed_num) { 7452329SN/A // Instructions marked as can WB are already committed. 7462292SN/A if (storeQueue[store_idx].canWB) { 7472292SN/A break; 7482292SN/A } 7492292SN/A 7502292SN/A DPRINTF(LSQUnit,"Store Instruction PC %#x squashed, " 7512292SN/A "idx:%i [sn:%lli]\n", 7522292SN/A storeQueue[store_idx].inst->readPC(), 7532292SN/A store_idx, storeQueue[store_idx].inst->seqNum); 7542292SN/A 7552329SN/A // I don't think this can happen. It should have been cleared 7562329SN/A // by the stalling load. 7572292SN/A if (isStalled() && 7582292SN/A storeQueue[store_idx].inst->seqNum == stallingStoreIsn) { 7592292SN/A panic("Is stalled should have been cleared by stalling load!\n"); 7602292SN/A stalled = false; 7612292SN/A stallingStoreIsn = 0; 7622292SN/A } 7632292SN/A 7642329SN/A // Clear the smart pointer to make sure it is decremented. 7652731Sktlim@umich.edu storeQueue[store_idx].inst->setSquashed(); 7662292SN/A storeQueue[store_idx].inst = NULL; 7672292SN/A storeQueue[store_idx].canWB = 0; 7682292SN/A 7692292SN/A storeQueue[store_idx].req = NULL; 7702292SN/A --stores; 7712292SN/A 7722292SN/A // Inefficient! 7732292SN/A storeTail = store_idx; 7742292SN/A 7752292SN/A decrStIdx(store_idx); 7762727Sktlim@umich.edu ++lsqSquashedStores; 7772292SN/A } 7782292SN/A} 7792292SN/A 7802292SN/Atemplate <class Impl> 7812292SN/Avoid 7822693Sktlim@umich.eduLSQUnit<Impl>::storePostSend(Packet *pkt) 7832693Sktlim@umich.edu{ 7842693Sktlim@umich.edu if (isStalled() && 7852693Sktlim@umich.edu storeQueue[storeWBIdx].inst->seqNum == stallingStoreIsn) { 7862693Sktlim@umich.edu DPRINTF(LSQUnit, "Unstalling, stalling store [sn:%lli] " 7872693Sktlim@umich.edu "load idx:%i\n", 7882693Sktlim@umich.edu stallingStoreIsn, stallingLoadIdx); 7892693Sktlim@umich.edu stalled = false; 7902693Sktlim@umich.edu stallingStoreIsn = 0; 7912693Sktlim@umich.edu iewStage->replayMemInst(loadQueue[stallingLoadIdx]); 7922693Sktlim@umich.edu } 7932693Sktlim@umich.edu 7942693Sktlim@umich.edu if (!storeQueue[storeWBIdx].inst->isStoreConditional()) { 7952693Sktlim@umich.edu // The store is basically completed at this time. This 7962693Sktlim@umich.edu // only works so long as the checker doesn't try to 7972693Sktlim@umich.edu // verify the value in memory for stores. 7982693Sktlim@umich.edu storeQueue[storeWBIdx].inst->setCompleted(); 7992733Sktlim@umich.edu#if USE_CHECKER 8002693Sktlim@umich.edu if (cpu->checker) { 8012732Sktlim@umich.edu cpu->checker->verify(storeQueue[storeWBIdx].inst); 8022693Sktlim@umich.edu } 8032733Sktlim@umich.edu#endif 8042693Sktlim@umich.edu } 8052693Sktlim@umich.edu 8062693Sktlim@umich.edu if (pkt->result != Packet::Success) { 8072693Sktlim@umich.edu DPRINTF(LSQUnit,"D-Cache Write Miss on idx:%i!\n", 8082693Sktlim@umich.edu storeWBIdx); 8092693Sktlim@umich.edu 8102693Sktlim@umich.edu DPRINTF(Activity, "Active st accessing mem miss [sn:%lli]\n", 8112693Sktlim@umich.edu storeQueue[storeWBIdx].inst->seqNum); 8122693Sktlim@umich.edu 8132693Sktlim@umich.edu //mshrSeqNums.push_back(storeQueue[storeWBIdx].inst->seqNum); 8142693Sktlim@umich.edu 8152693Sktlim@umich.edu //DPRINTF(LSQUnit, "Added MSHR. count = %i\n",mshrSeqNums.size()); 8162693Sktlim@umich.edu 8172693Sktlim@umich.edu // @todo: Increment stat here. 8182693Sktlim@umich.edu } else { 8192693Sktlim@umich.edu DPRINTF(LSQUnit,"D-Cache: Write Hit on idx:%i !\n", 8202693Sktlim@umich.edu storeWBIdx); 8212693Sktlim@umich.edu 8222693Sktlim@umich.edu DPRINTF(Activity, "Active st accessing mem hit [sn:%lli]\n", 8232693Sktlim@umich.edu storeQueue[storeWBIdx].inst->seqNum); 8242693Sktlim@umich.edu } 8252693Sktlim@umich.edu 8262693Sktlim@umich.edu incrStIdx(storeWBIdx); 8272693Sktlim@umich.edu} 8282693Sktlim@umich.edu 8292693Sktlim@umich.edutemplate <class Impl> 8302693Sktlim@umich.eduvoid 8312678Sktlim@umich.eduLSQUnit<Impl>::writeback(DynInstPtr &inst, PacketPtr pkt) 8322678Sktlim@umich.edu{ 8332678Sktlim@umich.edu iewStage->wakeCPU(); 8342678Sktlim@umich.edu 8352678Sktlim@umich.edu // Squashed instructions do not need to complete their access. 8362678Sktlim@umich.edu if (inst->isSquashed()) { 8372678Sktlim@umich.edu assert(!inst->isStore()); 8382727Sktlim@umich.edu ++lsqIgnoredResponses; 8392678Sktlim@umich.edu return; 8402678Sktlim@umich.edu } 8412678Sktlim@umich.edu 8422678Sktlim@umich.edu if (!inst->isExecuted()) { 8432678Sktlim@umich.edu inst->setExecuted(); 8442678Sktlim@umich.edu 8452678Sktlim@umich.edu // Complete access to copy data to proper place. 8462678Sktlim@umich.edu inst->completeAcc(pkt); 8472678Sktlim@umich.edu } 8482678Sktlim@umich.edu 8492678Sktlim@umich.edu // Need to insert instruction into queue to commit 8502678Sktlim@umich.edu iewStage->instToCommit(inst); 8512678Sktlim@umich.edu 8522678Sktlim@umich.edu iewStage->activityThisCycle(); 8532678Sktlim@umich.edu} 8542678Sktlim@umich.edu 8552678Sktlim@umich.edutemplate <class Impl> 8562678Sktlim@umich.eduvoid 8572292SN/ALSQUnit<Impl>::completeStore(int store_idx) 8582292SN/A{ 8592292SN/A assert(storeQueue[store_idx].inst); 8602292SN/A storeQueue[store_idx].completed = true; 8612292SN/A --storesToWB; 8622292SN/A // A bit conservative because a store completion may not free up entries, 8632292SN/A // but hopefully avoids two store completions in one cycle from making 8642292SN/A // the CPU tick twice. 8652292SN/A cpu->activityThisCycle(); 8662292SN/A 8672292SN/A if (store_idx == storeHead) { 8682292SN/A do { 8692292SN/A incrStIdx(storeHead); 8702292SN/A 8712292SN/A --stores; 8722292SN/A } while (storeQueue[storeHead].completed && 8732292SN/A storeHead != storeTail); 8742292SN/A 8752292SN/A iewStage->updateLSQNextCycle = true; 8762292SN/A } 8772292SN/A 8782329SN/A DPRINTF(LSQUnit, "Completing store [sn:%lli], idx:%i, store head " 8792329SN/A "idx:%i\n", 8802329SN/A storeQueue[store_idx].inst->seqNum, store_idx, storeHead); 8812292SN/A 8822292SN/A if (isStalled() && 8832292SN/A storeQueue[store_idx].inst->seqNum == stallingStoreIsn) { 8842292SN/A DPRINTF(LSQUnit, "Unstalling, stalling store [sn:%lli] " 8852292SN/A "load idx:%i\n", 8862292SN/A stallingStoreIsn, stallingLoadIdx); 8872292SN/A stalled = false; 8882292SN/A stallingStoreIsn = 0; 8892292SN/A iewStage->replayMemInst(loadQueue[stallingLoadIdx]); 8902292SN/A } 8912316SN/A 8922316SN/A storeQueue[store_idx].inst->setCompleted(); 8932329SN/A 8942329SN/A // Tell the checker we've completed this instruction. Some stores 8952329SN/A // may get reported twice to the checker, but the checker can 8962329SN/A // handle that case. 8972733Sktlim@umich.edu#if USE_CHECKER 8982316SN/A if (cpu->checker) { 8992732Sktlim@umich.edu cpu->checker->verify(storeQueue[store_idx].inst); 9002316SN/A } 9012733Sktlim@umich.edu#endif 9022292SN/A} 9032292SN/A 9042292SN/Atemplate <class Impl> 9052693Sktlim@umich.eduvoid 9062693Sktlim@umich.eduLSQUnit<Impl>::recvRetry() 9072693Sktlim@umich.edu{ 9082698Sktlim@umich.edu if (isStoreBlocked) { 9092698Sktlim@umich.edu assert(retryPkt != NULL); 9102693Sktlim@umich.edu 9112698Sktlim@umich.edu if (dcachePort->sendTiming(retryPkt)) { 9122698Sktlim@umich.edu storePostSend(retryPkt); 9132699Sktlim@umich.edu retryPkt = NULL; 9142693Sktlim@umich.edu isStoreBlocked = false; 9152693Sktlim@umich.edu } else { 9162693Sktlim@umich.edu // Still blocked! 9172727Sktlim@umich.edu ++lsqCacheBlocked; 9182693Sktlim@umich.edu } 9192693Sktlim@umich.edu } else if (isLoadBlocked) { 9202693Sktlim@umich.edu DPRINTF(LSQUnit, "Loads squash themselves and all younger insts, " 9212693Sktlim@umich.edu "no need to resend packet.\n"); 9222693Sktlim@umich.edu } else { 9232693Sktlim@umich.edu DPRINTF(LSQUnit, "Retry received but LSQ is no longer blocked.\n"); 9242693Sktlim@umich.edu } 9252693Sktlim@umich.edu} 9262693Sktlim@umich.edu 9272693Sktlim@umich.edutemplate <class Impl> 9282292SN/Ainline void 9292292SN/ALSQUnit<Impl>::incrStIdx(int &store_idx) 9302292SN/A{ 9312292SN/A if (++store_idx >= SQEntries) 9322292SN/A store_idx = 0; 9332292SN/A} 9342292SN/A 9352292SN/Atemplate <class Impl> 9362292SN/Ainline void 9372292SN/ALSQUnit<Impl>::decrStIdx(int &store_idx) 9382292SN/A{ 9392292SN/A if (--store_idx < 0) 9402292SN/A store_idx += SQEntries; 9412292SN/A} 9422292SN/A 9432292SN/Atemplate <class Impl> 9442292SN/Ainline void 9452292SN/ALSQUnit<Impl>::incrLdIdx(int &load_idx) 9462292SN/A{ 9472292SN/A if (++load_idx >= LQEntries) 9482292SN/A load_idx = 0; 9492292SN/A} 9502292SN/A 9512292SN/Atemplate <class Impl> 9522292SN/Ainline void 9532292SN/ALSQUnit<Impl>::decrLdIdx(int &load_idx) 9542292SN/A{ 9552292SN/A if (--load_idx < 0) 9562292SN/A load_idx += LQEntries; 9572292SN/A} 9582329SN/A 9592329SN/Atemplate <class Impl> 9602329SN/Avoid 9612329SN/ALSQUnit<Impl>::dumpInsts() 9622329SN/A{ 9632329SN/A cprintf("Load store queue: Dumping instructions.\n"); 9642329SN/A cprintf("Load queue size: %i\n", loads); 9652329SN/A cprintf("Load queue: "); 9662329SN/A 9672329SN/A int load_idx = loadHead; 9682329SN/A 9692329SN/A while (load_idx != loadTail && loadQueue[load_idx]) { 9702329SN/A cprintf("%#x ", loadQueue[load_idx]->readPC()); 9712329SN/A 9722329SN/A incrLdIdx(load_idx); 9732329SN/A } 9742329SN/A 9752329SN/A cprintf("Store queue size: %i\n", stores); 9762329SN/A cprintf("Store queue: "); 9772329SN/A 9782329SN/A int store_idx = storeHead; 9792329SN/A 9802329SN/A while (store_idx != storeTail && storeQueue[store_idx].inst) { 9812329SN/A cprintf("%#x ", storeQueue[store_idx].inst->readPC()); 9822329SN/A 9832329SN/A incrStIdx(store_idx); 9842329SN/A } 9852329SN/A 9862329SN/A cprintf("\n"); 9872329SN/A} 988