lsq_unit.hh revision 10239
12292SN/A/* 210031SAli.Saidi@ARM.com * Copyright (c) 2012-2013 ARM Limited 39444SAndreas.Sandberg@ARM.com * All rights reserved 49444SAndreas.Sandberg@ARM.com * 59444SAndreas.Sandberg@ARM.com * The license below extends only to copyright in the software and shall 69444SAndreas.Sandberg@ARM.com * not be construed as granting a license to any other intellectual 79444SAndreas.Sandberg@ARM.com * property including but not limited to intellectual property relating 89444SAndreas.Sandberg@ARM.com * to a hardware implementation of the functionality of the software 99444SAndreas.Sandberg@ARM.com * licensed hereunder. You may use the software subject to the license 109444SAndreas.Sandberg@ARM.com * terms below provided that you ensure that this notice is replicated 119444SAndreas.Sandberg@ARM.com * unmodified and in its entirety in all distributions of the software, 129444SAndreas.Sandberg@ARM.com * modified or unmodified, in source code or in binary form. 139444SAndreas.Sandberg@ARM.com * 142329SN/A * Copyright (c) 2004-2006 The Regents of The University of Michigan 1510239Sbinhpham@cs.rutgers.edu * Copyright (c) 2013 Advanced Micro Devices, Inc. 162292SN/A * All rights reserved. 172292SN/A * 182292SN/A * Redistribution and use in source and binary forms, with or without 192292SN/A * modification, are permitted provided that the following conditions are 202292SN/A * met: redistributions of source code must retain the above copyright 212292SN/A * notice, this list of conditions and the following disclaimer; 222292SN/A * redistributions in binary form must reproduce the above copyright 232292SN/A * notice, this list of conditions and the following disclaimer in the 242292SN/A * documentation and/or other materials provided with the distribution; 252292SN/A * neither the name of the copyright holders nor the names of its 262292SN/A * contributors may be used to endorse or promote products derived from 272292SN/A * this software without specific prior written permission. 282292SN/A * 292292SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 302292SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 312292SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 322292SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 332292SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 342292SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 352292SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 362292SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 372292SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 382292SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 392292SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 402689Sktlim@umich.edu * 412689Sktlim@umich.edu * Authors: Kevin Lim 422689Sktlim@umich.edu * Korey Sewell 432292SN/A */ 442292SN/A 452292SN/A#ifndef __CPU_O3_LSQ_UNIT_HH__ 462292SN/A#define __CPU_O3_LSQ_UNIT_HH__ 472292SN/A 482329SN/A#include <algorithm> 494395Ssaidi@eecs.umich.edu#include <cstring> 502292SN/A#include <map> 512292SN/A#include <queue> 522292SN/A 538591Sgblack@eecs.umich.edu#include "arch/generic/debugfaults.hh" 548506Sgblack@eecs.umich.edu#include "arch/isa_traits.hh" 553326Sktlim@umich.edu#include "arch/locked_mem.hh" 568481Sgblack@eecs.umich.edu#include "arch/mmapped_ipr.hh" 578229Snate@binkert.org#include "base/hashmap.hh" 586658Snate@binkert.org#include "config/the_isa.hh" 592292SN/A#include "cpu/inst_seq.hh" 608230Snate@binkert.org#include "cpu/timebuf.hh" 618232Snate@binkert.org#include "debug/LSQUnit.hh" 623348Sbinkertn@umich.edu#include "mem/packet.hh" 632669Sktlim@umich.edu#include "mem/port.hh" 648817Sgblack@eecs.umich.edu#include "sim/fault_fwd.hh" 652292SN/A 668737Skoansin.tan@gmail.comstruct DerivO3CPUParams; 675529Snate@binkert.org 682292SN/A/** 692329SN/A * Class that implements the actual LQ and SQ for each specific 702329SN/A * thread. Both are circular queues; load entries are freed upon 712329SN/A * committing, while store entries are freed once they writeback. The 722329SN/A * LSQUnit tracks if there are memory ordering violations, and also 732329SN/A * detects partial load to store forwarding cases (a store only has 742329SN/A * part of a load's data) that requires the load to wait until the 752329SN/A * store writes back. In the former case it holds onto the instruction 762329SN/A * until the dependence unit looks at it, and in the latter it stalls 772329SN/A * the LSQ until the store writes back. At that point the load is 782329SN/A * replayed. 792292SN/A */ 802292SN/Atemplate <class Impl> 812292SN/Aclass LSQUnit { 822292SN/A public: 832733Sktlim@umich.edu typedef typename Impl::O3CPU O3CPU; 842292SN/A typedef typename Impl::DynInstPtr DynInstPtr; 852292SN/A typedef typename Impl::CPUPol::IEW IEW; 862907Sktlim@umich.edu typedef typename Impl::CPUPol::LSQ LSQ; 872292SN/A typedef typename Impl::CPUPol::IssueStruct IssueStruct; 882292SN/A 892292SN/A public: 902292SN/A /** Constructs an LSQ unit. init() must be called prior to use. */ 912292SN/A LSQUnit(); 922292SN/A 932292SN/A /** Initializes the LSQ unit with the specified number of entries. */ 945529Snate@binkert.org void init(O3CPU *cpu_ptr, IEW *iew_ptr, DerivO3CPUParams *params, 955529Snate@binkert.org LSQ *lsq_ptr, unsigned maxLQEntries, unsigned maxSQEntries, 965529Snate@binkert.org unsigned id); 972292SN/A 982292SN/A /** Returns the name of the LSQ unit. */ 992292SN/A std::string name() const; 1002292SN/A 1012727Sktlim@umich.edu /** Registers statistics. */ 1022727Sktlim@umich.edu void regStats(); 1032727Sktlim@umich.edu 1042907Sktlim@umich.edu /** Sets the pointer to the dcache port. */ 1058922Swilliam.wang@arm.com void setDcachePort(MasterPort *dcache_port); 1062907Sktlim@umich.edu 1079444SAndreas.Sandberg@ARM.com /** Perform sanity checks after a drain. */ 1089444SAndreas.Sandberg@ARM.com void drainSanityCheck() const; 1092307SN/A 1102348SN/A /** Takes over from another CPU's thread. */ 1112307SN/A void takeOverFrom(); 1122307SN/A 1132292SN/A /** Ticks the LSQ unit, which in this case only resets the number of 1142292SN/A * used cache ports. 1152292SN/A * @todo: Move the number of used ports up to the LSQ level so it can 1162292SN/A * be shared by all LSQ units. 1172292SN/A */ 1182292SN/A void tick() { usedPorts = 0; } 1192292SN/A 1202292SN/A /** Inserts an instruction. */ 1212292SN/A void insert(DynInstPtr &inst); 1222292SN/A /** Inserts a load instruction. */ 1232292SN/A void insertLoad(DynInstPtr &load_inst); 1242292SN/A /** Inserts a store instruction. */ 1252292SN/A void insertStore(DynInstPtr &store_inst); 1262292SN/A 1278545Ssaidi@eecs.umich.edu /** Check for ordering violations in the LSQ. For a store squash if we 1288545Ssaidi@eecs.umich.edu * ever find a conflicting load. For a load, only squash if we 1298545Ssaidi@eecs.umich.edu * an external snoop invalidate has been seen for that load address 1308199SAli.Saidi@ARM.com * @param load_idx index to start checking at 1318199SAli.Saidi@ARM.com * @param inst the instruction to check 1328199SAli.Saidi@ARM.com */ 1338199SAli.Saidi@ARM.com Fault checkViolations(int load_idx, DynInstPtr &inst); 1348199SAli.Saidi@ARM.com 1358545Ssaidi@eecs.umich.edu /** Check if an incoming invalidate hits in the lsq on a load 1368545Ssaidi@eecs.umich.edu * that might have issued out of order wrt another load beacuse 1378545Ssaidi@eecs.umich.edu * of the intermediate invalidate. 1388545Ssaidi@eecs.umich.edu */ 1398545Ssaidi@eecs.umich.edu void checkSnoop(PacketPtr pkt); 1408545Ssaidi@eecs.umich.edu 1412292SN/A /** Executes a load instruction. */ 1422292SN/A Fault executeLoad(DynInstPtr &inst); 1432292SN/A 1442329SN/A Fault executeLoad(int lq_idx) { panic("Not implemented"); return NoFault; } 1452292SN/A /** Executes a store instruction. */ 1462292SN/A Fault executeStore(DynInstPtr &inst); 1472292SN/A 1482292SN/A /** Commits the head load. */ 1492292SN/A void commitLoad(); 1502292SN/A /** Commits loads older than a specific sequence number. */ 1512292SN/A void commitLoads(InstSeqNum &youngest_inst); 1522292SN/A 1532292SN/A /** Commits stores older than a specific sequence number. */ 1542292SN/A void commitStores(InstSeqNum &youngest_inst); 1552292SN/A 1562292SN/A /** Writes back stores. */ 1572292SN/A void writebackStores(); 1582292SN/A 1592790Sktlim@umich.edu /** Completes the data access that has been returned from the 1602790Sktlim@umich.edu * memory system. */ 1612669Sktlim@umich.edu void completeDataAccess(PacketPtr pkt); 1622669Sktlim@umich.edu 1632292SN/A /** Clears all the entries in the LQ. */ 1642292SN/A void clearLQ(); 1652292SN/A 1662292SN/A /** Clears all the entries in the SQ. */ 1672292SN/A void clearSQ(); 1682292SN/A 1692292SN/A /** Resizes the LQ to a given size. */ 1702292SN/A void resizeLQ(unsigned size); 1712292SN/A 1722292SN/A /** Resizes the SQ to a given size. */ 1732292SN/A void resizeSQ(unsigned size); 1742292SN/A 1752292SN/A /** Squashes all instructions younger than a specific sequence number. */ 1762292SN/A void squash(const InstSeqNum &squashed_num); 1772292SN/A 1782292SN/A /** Returns if there is a memory ordering violation. Value is reset upon 1792292SN/A * call to getMemDepViolator(). 1802292SN/A */ 1812292SN/A bool violation() { return memDepViolator; } 1822292SN/A 1832292SN/A /** Returns the memory ordering violator. */ 1842292SN/A DynInstPtr getMemDepViolator(); 1852292SN/A 1862329SN/A /** Returns if a load became blocked due to the memory system. */ 1872292SN/A bool loadBlocked() 1882292SN/A { return isLoadBlocked; } 1892292SN/A 1902348SN/A /** Clears the signal that a load became blocked. */ 1912292SN/A void clearLoadBlocked() 1922292SN/A { isLoadBlocked = false; } 1932292SN/A 1942348SN/A /** Returns if the blocked load was handled. */ 1952292SN/A bool isLoadBlockedHandled() 1962292SN/A { return loadBlockedHandled; } 1972292SN/A 1982348SN/A /** Records the blocked load as being handled. */ 1992292SN/A void setLoadBlockedHandled() 2002292SN/A { loadBlockedHandled = true; } 2012292SN/A 20210239Sbinhpham@cs.rutgers.edu /** Returns the number of free LQ entries. */ 20310239Sbinhpham@cs.rutgers.edu unsigned numFreeLoadEntries(); 20410239Sbinhpham@cs.rutgers.edu 20510239Sbinhpham@cs.rutgers.edu /** Returns the number of free SQ entries. */ 20610239Sbinhpham@cs.rutgers.edu unsigned numFreeStoreEntries(); 2072292SN/A 2082292SN/A /** Returns the number of loads in the LQ. */ 2092292SN/A int numLoads() { return loads; } 2102292SN/A 2112292SN/A /** Returns the number of stores in the SQ. */ 2122292SN/A int numStores() { return stores; } 2132292SN/A 2142292SN/A /** Returns if either the LQ or SQ is full. */ 2152292SN/A bool isFull() { return lqFull() || sqFull(); } 2162292SN/A 2179444SAndreas.Sandberg@ARM.com /** Returns if both the LQ and SQ are empty. */ 2189444SAndreas.Sandberg@ARM.com bool isEmpty() const { return lqEmpty() && sqEmpty(); } 2199444SAndreas.Sandberg@ARM.com 2202292SN/A /** Returns if the LQ is full. */ 2212292SN/A bool lqFull() { return loads >= (LQEntries - 1); } 2222292SN/A 2232292SN/A /** Returns if the SQ is full. */ 2242292SN/A bool sqFull() { return stores >= (SQEntries - 1); } 2252292SN/A 2269444SAndreas.Sandberg@ARM.com /** Returns if the LQ is empty. */ 2279444SAndreas.Sandberg@ARM.com bool lqEmpty() const { return loads == 0; } 2289444SAndreas.Sandberg@ARM.com 2299444SAndreas.Sandberg@ARM.com /** Returns if the SQ is empty. */ 2309444SAndreas.Sandberg@ARM.com bool sqEmpty() const { return stores == 0; } 2319444SAndreas.Sandberg@ARM.com 2322292SN/A /** Returns the number of instructions in the LSQ. */ 2332292SN/A unsigned getCount() { return loads + stores; } 2342292SN/A 2352292SN/A /** Returns if there are any stores to writeback. */ 2362292SN/A bool hasStoresToWB() { return storesToWB; } 2372292SN/A 2382292SN/A /** Returns the number of stores to writeback. */ 2392292SN/A int numStoresToWB() { return storesToWB; } 2402292SN/A 2412292SN/A /** Returns if the LSQ unit will writeback on this cycle. */ 2422292SN/A bool willWB() { return storeQueue[storeWBIdx].canWB && 2432678Sktlim@umich.edu !storeQueue[storeWBIdx].completed && 2442678Sktlim@umich.edu !isStoreBlocked; } 2452292SN/A 2462907Sktlim@umich.edu /** Handles doing the retry. */ 2472907Sktlim@umich.edu void recvRetry(); 2482907Sktlim@umich.edu 2492292SN/A private: 2509444SAndreas.Sandberg@ARM.com /** Reset the LSQ state */ 2519444SAndreas.Sandberg@ARM.com void resetState(); 2529444SAndreas.Sandberg@ARM.com 2532698Sktlim@umich.edu /** Writes back the instruction, sending it to IEW. */ 2542678Sktlim@umich.edu void writeback(DynInstPtr &inst, PacketPtr pkt); 2552678Sktlim@umich.edu 2566974Stjones1@inf.ed.ac.uk /** Writes back a store that couldn't be completed the previous cycle. */ 2576974Stjones1@inf.ed.ac.uk void writebackPendingStore(); 2586974Stjones1@inf.ed.ac.uk 2592698Sktlim@umich.edu /** Handles completing the send of a store to memory. */ 2603349Sbinkertn@umich.edu void storePostSend(PacketPtr pkt); 2612693Sktlim@umich.edu 2622292SN/A /** Completes the store at the specified index. */ 2632292SN/A void completeStore(int store_idx); 2642292SN/A 2656974Stjones1@inf.ed.ac.uk /** Attempts to send a store to the cache. */ 2666974Stjones1@inf.ed.ac.uk bool sendStore(PacketPtr data_pkt); 2676974Stjones1@inf.ed.ac.uk 2682292SN/A /** Increments the given store index (circular queue). */ 2699440SAndreas.Sandberg@ARM.com inline void incrStIdx(int &store_idx) const; 2702292SN/A /** Decrements the given store index (circular queue). */ 2719440SAndreas.Sandberg@ARM.com inline void decrStIdx(int &store_idx) const; 2722292SN/A /** Increments the given load index (circular queue). */ 2739440SAndreas.Sandberg@ARM.com inline void incrLdIdx(int &load_idx) const; 2742292SN/A /** Decrements the given load index (circular queue). */ 2759440SAndreas.Sandberg@ARM.com inline void decrLdIdx(int &load_idx) const; 2762292SN/A 2772329SN/A public: 2782329SN/A /** Debugging function to dump instructions in the LSQ. */ 2799440SAndreas.Sandberg@ARM.com void dumpInsts() const; 2802329SN/A 2812292SN/A private: 2822292SN/A /** Pointer to the CPU. */ 2832733Sktlim@umich.edu O3CPU *cpu; 2842292SN/A 2852292SN/A /** Pointer to the IEW stage. */ 2862292SN/A IEW *iewStage; 2872292SN/A 2882907Sktlim@umich.edu /** Pointer to the LSQ. */ 2892907Sktlim@umich.edu LSQ *lsq; 2902669Sktlim@umich.edu 2912907Sktlim@umich.edu /** Pointer to the dcache port. Used only for sending. */ 2928922Swilliam.wang@arm.com MasterPort *dcachePort; 2932292SN/A 2942698Sktlim@umich.edu /** Derived class to hold any sender state the LSQ needs. */ 2959044SAli.Saidi@ARM.com class LSQSenderState : public Packet::SenderState 2962678Sktlim@umich.edu { 2972678Sktlim@umich.edu public: 2982698Sktlim@umich.edu /** Default constructor. */ 2992678Sktlim@umich.edu LSQSenderState() 3009046SAli.Saidi@ARM.com : mainPkt(NULL), pendingPacket(NULL), outstanding(1), 3019046SAli.Saidi@ARM.com noWB(false), isSplit(false), pktToSend(false) 3029046SAli.Saidi@ARM.com { } 3032678Sktlim@umich.edu 3042698Sktlim@umich.edu /** Instruction who initiated the access to memory. */ 3052678Sktlim@umich.edu DynInstPtr inst; 3069046SAli.Saidi@ARM.com /** The main packet from a split load, used during writeback. */ 3079046SAli.Saidi@ARM.com PacketPtr mainPkt; 3089046SAli.Saidi@ARM.com /** A second packet from a split store that needs sending. */ 3099046SAli.Saidi@ARM.com PacketPtr pendingPacket; 3109046SAli.Saidi@ARM.com /** The LQ/SQ index of the instruction. */ 3119046SAli.Saidi@ARM.com uint8_t idx; 3129046SAli.Saidi@ARM.com /** Number of outstanding packets to complete. */ 3139046SAli.Saidi@ARM.com uint8_t outstanding; 3142698Sktlim@umich.edu /** Whether or not it is a load. */ 3152678Sktlim@umich.edu bool isLoad; 3162698Sktlim@umich.edu /** Whether or not the instruction will need to writeback. */ 3172678Sktlim@umich.edu bool noWB; 3186974Stjones1@inf.ed.ac.uk /** Whether or not this access is split in two. */ 3196974Stjones1@inf.ed.ac.uk bool isSplit; 3206974Stjones1@inf.ed.ac.uk /** Whether or not there is a packet that needs sending. */ 3216974Stjones1@inf.ed.ac.uk bool pktToSend; 3226974Stjones1@inf.ed.ac.uk 3236974Stjones1@inf.ed.ac.uk /** Completes a packet and returns whether the access is finished. */ 3246974Stjones1@inf.ed.ac.uk inline bool complete() { return --outstanding == 0; } 3252678Sktlim@umich.edu }; 3262678Sktlim@umich.edu 3272698Sktlim@umich.edu /** Writeback event, specifically for when stores forward data to loads. */ 3282678Sktlim@umich.edu class WritebackEvent : public Event { 3292678Sktlim@umich.edu public: 3302678Sktlim@umich.edu /** Constructs a writeback event. */ 3312678Sktlim@umich.edu WritebackEvent(DynInstPtr &_inst, PacketPtr pkt, LSQUnit *lsq_ptr); 3322678Sktlim@umich.edu 3332678Sktlim@umich.edu /** Processes the writeback event. */ 3342678Sktlim@umich.edu void process(); 3352678Sktlim@umich.edu 3362678Sktlim@umich.edu /** Returns the description of this event. */ 3375336Shines@cs.fsu.edu const char *description() const; 3382678Sktlim@umich.edu 3392678Sktlim@umich.edu private: 3402698Sktlim@umich.edu /** Instruction whose results are being written back. */ 3412678Sktlim@umich.edu DynInstPtr inst; 3422678Sktlim@umich.edu 3432698Sktlim@umich.edu /** The packet that would have been sent to memory. */ 3442678Sktlim@umich.edu PacketPtr pkt; 3452678Sktlim@umich.edu 3462678Sktlim@umich.edu /** The pointer to the LSQ unit that issued the store. */ 3472678Sktlim@umich.edu LSQUnit<Impl> *lsqPtr; 3482678Sktlim@umich.edu }; 3492678Sktlim@umich.edu 3502292SN/A public: 3512292SN/A struct SQEntry { 3522292SN/A /** Constructs an empty store queue entry. */ 3532292SN/A SQEntry() 3544326Sgblack@eecs.umich.edu : inst(NULL), req(NULL), size(0), 3552292SN/A canWB(0), committed(0), completed(0) 3564326Sgblack@eecs.umich.edu { 3574395Ssaidi@eecs.umich.edu std::memset(data, 0, sizeof(data)); 3584326Sgblack@eecs.umich.edu } 3592292SN/A 3609152Satgutier@umich.edu ~SQEntry() 3619152Satgutier@umich.edu { 3629152Satgutier@umich.edu inst = NULL; 3639152Satgutier@umich.edu } 3649152Satgutier@umich.edu 3652292SN/A /** Constructs a store queue entry for a given instruction. */ 3662292SN/A SQEntry(DynInstPtr &_inst) 3676974Stjones1@inf.ed.ac.uk : inst(_inst), req(NULL), sreqLow(NULL), sreqHigh(NULL), size(0), 36810031SAli.Saidi@ARM.com isSplit(0), canWB(0), committed(0), completed(0), isAllZeros(0) 3694326Sgblack@eecs.umich.edu { 3704395Ssaidi@eecs.umich.edu std::memset(data, 0, sizeof(data)); 3714326Sgblack@eecs.umich.edu } 3729046SAli.Saidi@ARM.com /** The store data. */ 3739046SAli.Saidi@ARM.com char data[16]; 3742292SN/A /** The store instruction. */ 3752292SN/A DynInstPtr inst; 3762669Sktlim@umich.edu /** The request for the store. */ 3772669Sktlim@umich.edu RequestPtr req; 3786974Stjones1@inf.ed.ac.uk /** The split requests for the store. */ 3796974Stjones1@inf.ed.ac.uk RequestPtr sreqLow; 3806974Stjones1@inf.ed.ac.uk RequestPtr sreqHigh; 3812292SN/A /** The size of the store. */ 3829046SAli.Saidi@ARM.com uint8_t size; 3836974Stjones1@inf.ed.ac.uk /** Whether or not the store is split into two requests. */ 3846974Stjones1@inf.ed.ac.uk bool isSplit; 3852292SN/A /** Whether or not the store can writeback. */ 3862292SN/A bool canWB; 3872292SN/A /** Whether or not the store is committed. */ 3882292SN/A bool committed; 3892292SN/A /** Whether or not the store is completed. */ 3902292SN/A bool completed; 39110031SAli.Saidi@ARM.com /** Does this request write all zeros and thus doesn't 39210031SAli.Saidi@ARM.com * have any data attached to it. Used for cache block zero 39310031SAli.Saidi@ARM.com * style instructs (ARM DC ZVA; ALPHA WH64) 39410031SAli.Saidi@ARM.com */ 39510031SAli.Saidi@ARM.com bool isAllZeros; 3962292SN/A }; 3972329SN/A 3982292SN/A private: 3992292SN/A /** The LSQUnit thread id. */ 4006221Snate@binkert.org ThreadID lsqID; 4012292SN/A 4022292SN/A /** The store queue. */ 4032292SN/A std::vector<SQEntry> storeQueue; 4042292SN/A 4052292SN/A /** The load queue. */ 4062292SN/A std::vector<DynInstPtr> loadQueue; 4072292SN/A 4082329SN/A /** The number of LQ entries, plus a sentinel entry (circular queue). 4092329SN/A * @todo: Consider having var that records the true number of LQ entries. 4102329SN/A */ 4112292SN/A unsigned LQEntries; 4122329SN/A /** The number of SQ entries, plus a sentinel entry (circular queue). 4132329SN/A * @todo: Consider having var that records the true number of SQ entries. 4142329SN/A */ 4152292SN/A unsigned SQEntries; 4162292SN/A 4178199SAli.Saidi@ARM.com /** The number of places to shift addresses in the LSQ before checking 4188199SAli.Saidi@ARM.com * for dependency violations 4198199SAli.Saidi@ARM.com */ 4208199SAli.Saidi@ARM.com unsigned depCheckShift; 4218199SAli.Saidi@ARM.com 4228199SAli.Saidi@ARM.com /** Should loads be checked for dependency issues */ 4238199SAli.Saidi@ARM.com bool checkLoads; 4248199SAli.Saidi@ARM.com 4252292SN/A /** The number of load instructions in the LQ. */ 4262292SN/A int loads; 4272329SN/A /** The number of store instructions in the SQ. */ 4282292SN/A int stores; 4292292SN/A /** The number of store instructions in the SQ waiting to writeback. */ 4302292SN/A int storesToWB; 4312292SN/A 4322292SN/A /** The index of the head instruction in the LQ. */ 4332292SN/A int loadHead; 4342292SN/A /** The index of the tail instruction in the LQ. */ 4352292SN/A int loadTail; 4362292SN/A 4372292SN/A /** The index of the head instruction in the SQ. */ 4382292SN/A int storeHead; 4392329SN/A /** The index of the first instruction that may be ready to be 4402329SN/A * written back, and has not yet been written back. 4412292SN/A */ 4422292SN/A int storeWBIdx; 4432292SN/A /** The index of the tail instruction in the SQ. */ 4442292SN/A int storeTail; 4452292SN/A 4462292SN/A /// @todo Consider moving to a more advanced model with write vs read ports 4472292SN/A /** The number of cache ports available each cycle. */ 4482292SN/A int cachePorts; 4492292SN/A 4502292SN/A /** The number of used cache ports in this cycle. */ 4512292SN/A int usedPorts; 4522292SN/A 4532292SN/A //list<InstSeqNum> mshrSeqNums; 4542292SN/A 4558545Ssaidi@eecs.umich.edu /** Address Mask for a cache block (e.g. ~(cache_block_size-1)) */ 4568545Ssaidi@eecs.umich.edu Addr cacheBlockMask; 4578545Ssaidi@eecs.umich.edu 4582292SN/A /** Wire to read information from the issue stage time queue. */ 4592292SN/A typename TimeBuffer<IssueStruct>::wire fromIssue; 4602292SN/A 4612292SN/A /** Whether or not the LSQ is stalled. */ 4622292SN/A bool stalled; 4632292SN/A /** The store that causes the stall due to partial store to load 4642292SN/A * forwarding. 4652292SN/A */ 4662292SN/A InstSeqNum stallingStoreIsn; 4672292SN/A /** The index of the above store. */ 4682292SN/A int stallingLoadIdx; 4692292SN/A 4702698Sktlim@umich.edu /** The packet that needs to be retried. */ 4712698Sktlim@umich.edu PacketPtr retryPkt; 4722693Sktlim@umich.edu 4732698Sktlim@umich.edu /** Whehter or not a store is blocked due to the memory system. */ 4742678Sktlim@umich.edu bool isStoreBlocked; 4752678Sktlim@umich.edu 4762329SN/A /** Whether or not a load is blocked due to the memory system. */ 4772292SN/A bool isLoadBlocked; 4782292SN/A 4792348SN/A /** Has the blocked load been handled. */ 4802292SN/A bool loadBlockedHandled; 4812292SN/A 4828727Snilay@cs.wisc.edu /** Whether or not a store is in flight. */ 4838727Snilay@cs.wisc.edu bool storeInFlight; 4848727Snilay@cs.wisc.edu 4852348SN/A /** The sequence number of the blocked load. */ 4862292SN/A InstSeqNum blockedLoadSeqNum; 4872292SN/A 4882292SN/A /** The oldest load that caused a memory ordering violation. */ 4892292SN/A DynInstPtr memDepViolator; 4902292SN/A 4916974Stjones1@inf.ed.ac.uk /** Whether or not there is a packet that couldn't be sent because of 4926974Stjones1@inf.ed.ac.uk * a lack of cache ports. */ 4936974Stjones1@inf.ed.ac.uk bool hasPendingPkt; 4946974Stjones1@inf.ed.ac.uk 4956974Stjones1@inf.ed.ac.uk /** The packet that is pending free cache ports. */ 4966974Stjones1@inf.ed.ac.uk PacketPtr pendingPkt; 4976974Stjones1@inf.ed.ac.uk 4988727Snilay@cs.wisc.edu /** Flag for memory model. */ 4998727Snilay@cs.wisc.edu bool needsTSO; 5008727Snilay@cs.wisc.edu 5012292SN/A // Will also need how many read/write ports the Dcache has. Or keep track 5022292SN/A // of that in stage that is one level up, and only call executeLoad/Store 5032292SN/A // the appropriate number of times. 5042727Sktlim@umich.edu /** Total number of loads forwaded from LSQ stores. */ 5055999Snate@binkert.org Stats::Scalar lsqForwLoads; 5062307SN/A 5073126Sktlim@umich.edu /** Total number of loads ignored due to invalid addresses. */ 5085999Snate@binkert.org Stats::Scalar invAddrLoads; 5093126Sktlim@umich.edu 5103126Sktlim@umich.edu /** Total number of squashed loads. */ 5115999Snate@binkert.org Stats::Scalar lsqSquashedLoads; 5123126Sktlim@umich.edu 5133126Sktlim@umich.edu /** Total number of responses from the memory system that are 5143126Sktlim@umich.edu * ignored due to the instruction already being squashed. */ 5155999Snate@binkert.org Stats::Scalar lsqIgnoredResponses; 5163126Sktlim@umich.edu 5173126Sktlim@umich.edu /** Tota number of memory ordering violations. */ 5185999Snate@binkert.org Stats::Scalar lsqMemOrderViolation; 5193126Sktlim@umich.edu 5202727Sktlim@umich.edu /** Total number of squashed stores. */ 5215999Snate@binkert.org Stats::Scalar lsqSquashedStores; 5222727Sktlim@umich.edu 5232727Sktlim@umich.edu /** Total number of software prefetches ignored due to invalid addresses. */ 5245999Snate@binkert.org Stats::Scalar invAddrSwpfs; 5252727Sktlim@umich.edu 5262727Sktlim@umich.edu /** Ready loads blocked due to partial store-forwarding. */ 5275999Snate@binkert.org Stats::Scalar lsqBlockedLoads; 5282727Sktlim@umich.edu 5292727Sktlim@umich.edu /** Number of loads that were rescheduled. */ 5305999Snate@binkert.org Stats::Scalar lsqRescheduledLoads; 5312727Sktlim@umich.edu 5322727Sktlim@umich.edu /** Number of times the LSQ is blocked due to the cache. */ 5335999Snate@binkert.org Stats::Scalar lsqCacheBlocked; 5342727Sktlim@umich.edu 5352292SN/A public: 5362292SN/A /** Executes the load at the given index. */ 5377520Sgblack@eecs.umich.edu Fault read(Request *req, Request *sreqLow, Request *sreqHigh, 5387520Sgblack@eecs.umich.edu uint8_t *data, int load_idx); 5392292SN/A 5402292SN/A /** Executes the store at the given index. */ 5417520Sgblack@eecs.umich.edu Fault write(Request *req, Request *sreqLow, Request *sreqHigh, 5427520Sgblack@eecs.umich.edu uint8_t *data, int store_idx); 5432292SN/A 5442292SN/A /** Returns the index of the head load instruction. */ 5452292SN/A int getLoadHead() { return loadHead; } 5462292SN/A /** Returns the sequence number of the head load instruction. */ 5472292SN/A InstSeqNum getLoadHeadSeqNum() 5482292SN/A { 5492292SN/A if (loadQueue[loadHead]) { 5502292SN/A return loadQueue[loadHead]->seqNum; 5512292SN/A } else { 5522292SN/A return 0; 5532292SN/A } 5542292SN/A 5552292SN/A } 5562292SN/A 5572292SN/A /** Returns the index of the head store instruction. */ 5582292SN/A int getStoreHead() { return storeHead; } 5592292SN/A /** Returns the sequence number of the head store instruction. */ 5602292SN/A InstSeqNum getStoreHeadSeqNum() 5612292SN/A { 5622292SN/A if (storeQueue[storeHead].inst) { 5632292SN/A return storeQueue[storeHead].inst->seqNum; 5642292SN/A } else { 5652292SN/A return 0; 5662292SN/A } 5672292SN/A 5682292SN/A } 5692292SN/A 5702292SN/A /** Returns whether or not the LSQ unit is stalled. */ 5712292SN/A bool isStalled() { return stalled; } 5722292SN/A}; 5732292SN/A 5742292SN/Atemplate <class Impl> 5752292SN/AFault 5766974Stjones1@inf.ed.ac.ukLSQUnit<Impl>::read(Request *req, Request *sreqLow, Request *sreqHigh, 5777520Sgblack@eecs.umich.edu uint8_t *data, int load_idx) 5782292SN/A{ 5792669Sktlim@umich.edu DynInstPtr load_inst = loadQueue[load_idx]; 5802292SN/A 5812669Sktlim@umich.edu assert(load_inst); 5822669Sktlim@umich.edu 5832669Sktlim@umich.edu assert(!load_inst->isExecuted()); 5842292SN/A 5852292SN/A // Make sure this isn't an uncacheable access 5862292SN/A // A bit of a hackish way to get uncached accesses to work only if they're 5872292SN/A // at the head of the LSQ and are ready to commit (at the head of the ROB 5882292SN/A // too). 5893172Sstever@eecs.umich.edu if (req->isUncacheable() && 5902731Sktlim@umich.edu (load_idx != loadHead || !load_inst->isAtCommit())) { 5912669Sktlim@umich.edu iewStage->rescheduleMemInst(load_inst); 5922727Sktlim@umich.edu ++lsqRescheduledLoads; 5937720Sgblack@eecs.umich.edu DPRINTF(LSQUnit, "Uncachable load [sn:%lli] PC %s\n", 5947720Sgblack@eecs.umich.edu load_inst->seqNum, load_inst->pcState()); 5954032Sktlim@umich.edu 5964032Sktlim@umich.edu // Must delete request now that it wasn't handed off to 5974032Sktlim@umich.edu // memory. This is quite ugly. @todo: Figure out the proper 5984032Sktlim@umich.edu // place to really handle request deletes. 5994032Sktlim@umich.edu delete req; 6006974Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow) { 6016974Stjones1@inf.ed.ac.uk delete sreqLow; 6026974Stjones1@inf.ed.ac.uk delete sreqHigh; 6036974Stjones1@inf.ed.ac.uk } 6048591Sgblack@eecs.umich.edu return new GenericISA::M5PanicFault( 6058591Sgblack@eecs.umich.edu "Uncachable load [sn:%llx] PC %s\n", 6068591Sgblack@eecs.umich.edu load_inst->seqNum, load_inst->pcState()); 6072292SN/A } 6082292SN/A 6092292SN/A // Check the SQ for any previous stores that might lead to forwarding 6102669Sktlim@umich.edu int store_idx = load_inst->sqIdx; 6112292SN/A 6122292SN/A int store_size = 0; 6132292SN/A 6142292SN/A DPRINTF(LSQUnit, "Read called, load idx: %i, store idx: %i, " 6156974Stjones1@inf.ed.ac.uk "storeHead: %i addr: %#x%s\n", 6166974Stjones1@inf.ed.ac.uk load_idx, store_idx, storeHead, req->getPaddr(), 6176974Stjones1@inf.ed.ac.uk sreqLow ? " split" : ""); 6182292SN/A 6196102Sgblack@eecs.umich.edu if (req->isLLSC()) { 6206974Stjones1@inf.ed.ac.uk assert(!sreqLow); 6213326Sktlim@umich.edu // Disable recording the result temporarily. Writing to misc 6223326Sktlim@umich.edu // regs normally updates the result, but this is not the 6233326Sktlim@umich.edu // desired behavior when handling store conditionals. 6249046SAli.Saidi@ARM.com load_inst->recordResult(false); 6253326Sktlim@umich.edu TheISA::handleLockedRead(load_inst.get(), req); 6269046SAli.Saidi@ARM.com load_inst->recordResult(true); 6272292SN/A } 6282292SN/A 6298481Sgblack@eecs.umich.edu if (req->isMmappedIpr()) { 6308481Sgblack@eecs.umich.edu assert(!load_inst->memData); 6318481Sgblack@eecs.umich.edu load_inst->memData = new uint8_t[64]; 6328481Sgblack@eecs.umich.edu 6338481Sgblack@eecs.umich.edu ThreadContext *thread = cpu->tcBase(lsqID); 6349180Sandreas.hansson@arm.com Cycles delay(0); 6358949Sandreas.hansson@arm.com PacketPtr data_pkt = new Packet(req, MemCmd::ReadReq); 6368481Sgblack@eecs.umich.edu 6378481Sgblack@eecs.umich.edu if (!TheISA::HasUnalignedMemAcc || !sreqLow) { 6388481Sgblack@eecs.umich.edu data_pkt->dataStatic(load_inst->memData); 6398481Sgblack@eecs.umich.edu delay = TheISA::handleIprRead(thread, data_pkt); 6408481Sgblack@eecs.umich.edu } else { 6418481Sgblack@eecs.umich.edu assert(sreqLow->isMmappedIpr() && sreqHigh->isMmappedIpr()); 6428949Sandreas.hansson@arm.com PacketPtr fst_data_pkt = new Packet(sreqLow, MemCmd::ReadReq); 6438949Sandreas.hansson@arm.com PacketPtr snd_data_pkt = new Packet(sreqHigh, MemCmd::ReadReq); 6448481Sgblack@eecs.umich.edu 6458481Sgblack@eecs.umich.edu fst_data_pkt->dataStatic(load_inst->memData); 6468481Sgblack@eecs.umich.edu snd_data_pkt->dataStatic(load_inst->memData + sreqLow->getSize()); 6478481Sgblack@eecs.umich.edu 6488481Sgblack@eecs.umich.edu delay = TheISA::handleIprRead(thread, fst_data_pkt); 6499180Sandreas.hansson@arm.com Cycles delay2 = TheISA::handleIprRead(thread, snd_data_pkt); 6508481Sgblack@eecs.umich.edu if (delay2 > delay) 6518481Sgblack@eecs.umich.edu delay = delay2; 6528481Sgblack@eecs.umich.edu 6538481Sgblack@eecs.umich.edu delete sreqLow; 6548481Sgblack@eecs.umich.edu delete sreqHigh; 6558481Sgblack@eecs.umich.edu delete fst_data_pkt; 6568481Sgblack@eecs.umich.edu delete snd_data_pkt; 6578481Sgblack@eecs.umich.edu } 6588481Sgblack@eecs.umich.edu WritebackEvent *wb = new WritebackEvent(load_inst, data_pkt, this); 6599179Sandreas.hansson@arm.com cpu->schedule(wb, cpu->clockEdge(delay)); 6608481Sgblack@eecs.umich.edu return NoFault; 6618481Sgblack@eecs.umich.edu } 6628481Sgblack@eecs.umich.edu 6632292SN/A while (store_idx != -1) { 6642292SN/A // End once we've reached the top of the LSQ 6652292SN/A if (store_idx == storeWBIdx) { 6662292SN/A break; 6672292SN/A } 6682292SN/A 6692292SN/A // Move the index to one younger 6702292SN/A if (--store_idx < 0) 6712292SN/A store_idx += SQEntries; 6722292SN/A 6732292SN/A assert(storeQueue[store_idx].inst); 6742292SN/A 6752292SN/A store_size = storeQueue[store_idx].size; 6762292SN/A 6772292SN/A if (store_size == 0) 6782292SN/A continue; 6794032Sktlim@umich.edu else if (storeQueue[store_idx].inst->uncacheable()) 6804032Sktlim@umich.edu continue; 6814032Sktlim@umich.edu 6829046SAli.Saidi@ARM.com assert(storeQueue[store_idx].inst->effAddrValid()); 6832292SN/A 6842292SN/A // Check if the store data is within the lower and upper bounds of 6852292SN/A // addresses that the request needs. 6862292SN/A bool store_has_lower_limit = 6872669Sktlim@umich.edu req->getVaddr() >= storeQueue[store_idx].inst->effAddr; 6882292SN/A bool store_has_upper_limit = 6892669Sktlim@umich.edu (req->getVaddr() + req->getSize()) <= 6902669Sktlim@umich.edu (storeQueue[store_idx].inst->effAddr + store_size); 6912292SN/A bool lower_load_has_store_part = 6922669Sktlim@umich.edu req->getVaddr() < (storeQueue[store_idx].inst->effAddr + 6932292SN/A store_size); 6942292SN/A bool upper_load_has_store_part = 6952669Sktlim@umich.edu (req->getVaddr() + req->getSize()) > 6962669Sktlim@umich.edu storeQueue[store_idx].inst->effAddr; 6972292SN/A 6982292SN/A // If the store's data has all of the data needed, we can forward. 6994032Sktlim@umich.edu if ((store_has_lower_limit && store_has_upper_limit)) { 7002329SN/A // Get shift amount for offset into the store's data. 7018316Sgeoffrey.blake@arm.com int shift_amt = req->getVaddr() - storeQueue[store_idx].inst->effAddr; 7022292SN/A 70310031SAli.Saidi@ARM.com if (storeQueue[store_idx].isAllZeros) 70410031SAli.Saidi@ARM.com memset(data, 0, req->getSize()); 70510031SAli.Saidi@ARM.com else 70610031SAli.Saidi@ARM.com memcpy(data, storeQueue[store_idx].data + shift_amt, 7077520Sgblack@eecs.umich.edu req->getSize()); 7083803Sgblack@eecs.umich.edu 7092669Sktlim@umich.edu assert(!load_inst->memData); 71010031SAli.Saidi@ARM.com load_inst->memData = new uint8_t[req->getSize()]; 71110031SAli.Saidi@ARM.com if (storeQueue[store_idx].isAllZeros) 71210031SAli.Saidi@ARM.com memset(load_inst->memData, 0, req->getSize()); 71310031SAli.Saidi@ARM.com else 71410031SAli.Saidi@ARM.com memcpy(load_inst->memData, 7154326Sgblack@eecs.umich.edu storeQueue[store_idx].data + shift_amt, req->getSize()); 7162292SN/A 7172292SN/A DPRINTF(LSQUnit, "Forwarding from store idx %i to load to " 71810175SMitch.Hayenga@ARM.com "addr %#x\n", store_idx, req->getVaddr()); 7192678Sktlim@umich.edu 7208949Sandreas.hansson@arm.com PacketPtr data_pkt = new Packet(req, MemCmd::ReadReq); 7212678Sktlim@umich.edu data_pkt->dataStatic(load_inst->memData); 7222678Sktlim@umich.edu 7232678Sktlim@umich.edu WritebackEvent *wb = new WritebackEvent(load_inst, data_pkt, this); 7242292SN/A 7252292SN/A // We'll say this has a 1 cycle load-store forwarding latency 7262292SN/A // for now. 7272292SN/A // @todo: Need to make this a parameter. 7287823Ssteve.reinhardt@amd.com cpu->schedule(wb, curTick()); 7292678Sktlim@umich.edu 7306974Stjones1@inf.ed.ac.uk // Don't need to do anything special for split loads. 7316974Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow) { 7326974Stjones1@inf.ed.ac.uk delete sreqLow; 7336974Stjones1@inf.ed.ac.uk delete sreqHigh; 7346974Stjones1@inf.ed.ac.uk } 7356974Stjones1@inf.ed.ac.uk 7362727Sktlim@umich.edu ++lsqForwLoads; 7372292SN/A return NoFault; 7382292SN/A } else if ((store_has_lower_limit && lower_load_has_store_part) || 7392292SN/A (store_has_upper_limit && upper_load_has_store_part) || 7402292SN/A (lower_load_has_store_part && upper_load_has_store_part)) { 7412292SN/A // This is the partial store-load forwarding case where a store 7422292SN/A // has only part of the load's data. 7432292SN/A 7442292SN/A // If it's already been written back, then don't worry about 7452292SN/A // stalling on it. 7462292SN/A if (storeQueue[store_idx].completed) { 7474032Sktlim@umich.edu panic("Should not check one of these"); 7482292SN/A continue; 7492292SN/A } 7502292SN/A 7512292SN/A // Must stall load and force it to retry, so long as it's the oldest 7522292SN/A // load that needs to do so. 7532292SN/A if (!stalled || 7542292SN/A (stalled && 7552669Sktlim@umich.edu load_inst->seqNum < 7562292SN/A loadQueue[stallingLoadIdx]->seqNum)) { 7572292SN/A stalled = true; 7582292SN/A stallingStoreIsn = storeQueue[store_idx].inst->seqNum; 7592292SN/A stallingLoadIdx = load_idx; 7602292SN/A } 7612292SN/A 7622292SN/A // Tell IQ/mem dep unit that this instruction will need to be 7632292SN/A // rescheduled eventually 7642669Sktlim@umich.edu iewStage->rescheduleMemInst(load_inst); 7652927Sktlim@umich.edu iewStage->decrWb(load_inst->seqNum); 7664032Sktlim@umich.edu load_inst->clearIssued(); 7672727Sktlim@umich.edu ++lsqRescheduledLoads; 7682292SN/A 7692292SN/A // Do not generate a writeback event as this instruction is not 7702292SN/A // complete. 7712292SN/A DPRINTF(LSQUnit, "Load-store forwarding mis-match. " 7722292SN/A "Store idx %i to load addr %#x\n", 7732669Sktlim@umich.edu store_idx, req->getVaddr()); 7742292SN/A 7754032Sktlim@umich.edu // Must delete request now that it wasn't handed off to 7764032Sktlim@umich.edu // memory. This is quite ugly. @todo: Figure out the 7774032Sktlim@umich.edu // proper place to really handle request deletes. 7784032Sktlim@umich.edu delete req; 7796974Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow) { 7806974Stjones1@inf.ed.ac.uk delete sreqLow; 7816974Stjones1@inf.ed.ac.uk delete sreqHigh; 7826974Stjones1@inf.ed.ac.uk } 7834032Sktlim@umich.edu 7842292SN/A return NoFault; 7852292SN/A } 7862292SN/A } 7872292SN/A 7882292SN/A // If there's no forwarding case, then go access memory 7897720Sgblack@eecs.umich.edu DPRINTF(LSQUnit, "Doing memory access for inst [sn:%lli] PC %s\n", 7907720Sgblack@eecs.umich.edu load_inst->seqNum, load_inst->pcState()); 7912292SN/A 7922669Sktlim@umich.edu assert(!load_inst->memData); 79310031SAli.Saidi@ARM.com load_inst->memData = new uint8_t[req->getSize()]; 7942292SN/A 7952292SN/A ++usedPorts; 7962292SN/A 7972907Sktlim@umich.edu // if we the cache is not blocked, do cache access 7986974Stjones1@inf.ed.ac.uk bool completedFirst = false; 7992907Sktlim@umich.edu if (!lsq->cacheBlocked()) { 8006974Stjones1@inf.ed.ac.uk MemCmd command = 8016974Stjones1@inf.ed.ac.uk req->isLLSC() ? MemCmd::LoadLockedReq : MemCmd::ReadReq; 8028949Sandreas.hansson@arm.com PacketPtr data_pkt = new Packet(req, command); 8036974Stjones1@inf.ed.ac.uk PacketPtr fst_data_pkt = NULL; 8046974Stjones1@inf.ed.ac.uk PacketPtr snd_data_pkt = NULL; 8056974Stjones1@inf.ed.ac.uk 8063228Sktlim@umich.edu data_pkt->dataStatic(load_inst->memData); 8073228Sktlim@umich.edu 8083228Sktlim@umich.edu LSQSenderState *state = new LSQSenderState; 8093228Sktlim@umich.edu state->isLoad = true; 8103228Sktlim@umich.edu state->idx = load_idx; 8113228Sktlim@umich.edu state->inst = load_inst; 8123228Sktlim@umich.edu data_pkt->senderState = state; 8133228Sktlim@umich.edu 8146974Stjones1@inf.ed.ac.uk if (!TheISA::HasUnalignedMemAcc || !sreqLow) { 8156974Stjones1@inf.ed.ac.uk 8166974Stjones1@inf.ed.ac.uk // Point the first packet at the main data packet. 8176974Stjones1@inf.ed.ac.uk fst_data_pkt = data_pkt; 8186974Stjones1@inf.ed.ac.uk } else { 8196974Stjones1@inf.ed.ac.uk 8206974Stjones1@inf.ed.ac.uk // Create the split packets. 8218949Sandreas.hansson@arm.com fst_data_pkt = new Packet(sreqLow, command); 8228949Sandreas.hansson@arm.com snd_data_pkt = new Packet(sreqHigh, command); 8236974Stjones1@inf.ed.ac.uk 8246974Stjones1@inf.ed.ac.uk fst_data_pkt->dataStatic(load_inst->memData); 8256974Stjones1@inf.ed.ac.uk snd_data_pkt->dataStatic(load_inst->memData + sreqLow->getSize()); 8266974Stjones1@inf.ed.ac.uk 8276974Stjones1@inf.ed.ac.uk fst_data_pkt->senderState = state; 8286974Stjones1@inf.ed.ac.uk snd_data_pkt->senderState = state; 8296974Stjones1@inf.ed.ac.uk 8306974Stjones1@inf.ed.ac.uk state->isSplit = true; 8316974Stjones1@inf.ed.ac.uk state->outstanding = 2; 8326974Stjones1@inf.ed.ac.uk state->mainPkt = data_pkt; 8336974Stjones1@inf.ed.ac.uk } 8346974Stjones1@inf.ed.ac.uk 8358975Sandreas.hansson@arm.com if (!dcachePort->sendTimingReq(fst_data_pkt)) { 8363228Sktlim@umich.edu // Delete state and data packet because a load retry 8373228Sktlim@umich.edu // initiates a pipeline restart; it does not retry. 8383228Sktlim@umich.edu delete state; 8394032Sktlim@umich.edu delete data_pkt->req; 8403228Sktlim@umich.edu delete data_pkt; 8416974Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow) { 8426974Stjones1@inf.ed.ac.uk delete fst_data_pkt->req; 8436974Stjones1@inf.ed.ac.uk delete fst_data_pkt; 8446974Stjones1@inf.ed.ac.uk delete snd_data_pkt->req; 8456974Stjones1@inf.ed.ac.uk delete snd_data_pkt; 8467511Stjones1@inf.ed.ac.uk sreqLow = NULL; 8477511Stjones1@inf.ed.ac.uk sreqHigh = NULL; 8486974Stjones1@inf.ed.ac.uk } 8493228Sktlim@umich.edu 8504032Sktlim@umich.edu req = NULL; 8514032Sktlim@umich.edu 8522907Sktlim@umich.edu // If the access didn't succeed, tell the LSQ by setting 8532907Sktlim@umich.edu // the retry thread id. 8542907Sktlim@umich.edu lsq->setRetryTid(lsqID); 8556974Stjones1@inf.ed.ac.uk } else if (TheISA::HasUnalignedMemAcc && sreqLow) { 8566974Stjones1@inf.ed.ac.uk completedFirst = true; 8576974Stjones1@inf.ed.ac.uk 8586974Stjones1@inf.ed.ac.uk // The first packet was sent without problems, so send this one 8596974Stjones1@inf.ed.ac.uk // too. If there is a problem with this packet then the whole 8606974Stjones1@inf.ed.ac.uk // load will be squashed, so indicate this to the state object. 8616974Stjones1@inf.ed.ac.uk // The first packet will return in completeDataAccess and be 8626974Stjones1@inf.ed.ac.uk // handled there. 8636974Stjones1@inf.ed.ac.uk ++usedPorts; 8648975Sandreas.hansson@arm.com if (!dcachePort->sendTimingReq(snd_data_pkt)) { 8656974Stjones1@inf.ed.ac.uk 8666974Stjones1@inf.ed.ac.uk // The main packet will be deleted in completeDataAccess. 8676974Stjones1@inf.ed.ac.uk delete snd_data_pkt->req; 8686974Stjones1@inf.ed.ac.uk delete snd_data_pkt; 8696974Stjones1@inf.ed.ac.uk 8706974Stjones1@inf.ed.ac.uk state->complete(); 8716974Stjones1@inf.ed.ac.uk 8726974Stjones1@inf.ed.ac.uk req = NULL; 8737511Stjones1@inf.ed.ac.uk sreqHigh = NULL; 8746974Stjones1@inf.ed.ac.uk 8756974Stjones1@inf.ed.ac.uk lsq->setRetryTid(lsqID); 8766974Stjones1@inf.ed.ac.uk } 8772907Sktlim@umich.edu } 8782907Sktlim@umich.edu } 8792907Sktlim@umich.edu 8802907Sktlim@umich.edu // If the cache was blocked, or has become blocked due to the access, 8812907Sktlim@umich.edu // handle it. 8822907Sktlim@umich.edu if (lsq->cacheBlocked()) { 8834032Sktlim@umich.edu if (req) 8844032Sktlim@umich.edu delete req; 8856974Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow && !completedFirst) { 8866974Stjones1@inf.ed.ac.uk delete sreqLow; 8876974Stjones1@inf.ed.ac.uk delete sreqHigh; 8886974Stjones1@inf.ed.ac.uk } 8894032Sktlim@umich.edu 8902727Sktlim@umich.edu ++lsqCacheBlocked; 8913014Srdreslin@umich.edu 8928315Sgeoffrey.blake@arm.com // If the first part of a split access succeeds, then let the LSQ 8938315Sgeoffrey.blake@arm.com // handle the decrWb when completeDataAccess is called upon return 8948315Sgeoffrey.blake@arm.com // of the requested first part of data 8958315Sgeoffrey.blake@arm.com if (!completedFirst) 8968315Sgeoffrey.blake@arm.com iewStage->decrWb(load_inst->seqNum); 8978315Sgeoffrey.blake@arm.com 8982669Sktlim@umich.edu // There's an older load that's already going to squash. 8992669Sktlim@umich.edu if (isLoadBlocked && blockedLoadSeqNum < load_inst->seqNum) 9002669Sktlim@umich.edu return NoFault; 9012292SN/A 9022669Sktlim@umich.edu // Record that the load was blocked due to memory. This 9032669Sktlim@umich.edu // load will squash all instructions after it, be 9042669Sktlim@umich.edu // refetched, and re-executed. 9052669Sktlim@umich.edu isLoadBlocked = true; 9062669Sktlim@umich.edu loadBlockedHandled = false; 9072669Sktlim@umich.edu blockedLoadSeqNum = load_inst->seqNum; 9082669Sktlim@umich.edu // No fault occurred, even though the interface is blocked. 9092669Sktlim@umich.edu return NoFault; 9102292SN/A } 9112292SN/A 9122669Sktlim@umich.edu return NoFault; 9132292SN/A} 9142292SN/A 9152292SN/Atemplate <class Impl> 9162292SN/AFault 9176974Stjones1@inf.ed.ac.ukLSQUnit<Impl>::write(Request *req, Request *sreqLow, Request *sreqHigh, 9187520Sgblack@eecs.umich.edu uint8_t *data, int store_idx) 9192292SN/A{ 9202292SN/A assert(storeQueue[store_idx].inst); 9212292SN/A 92210175SMitch.Hayenga@ARM.com DPRINTF(LSQUnit, "Doing write to store idx %i, addr %#x" 9232292SN/A " | storeHead:%i [sn:%i]\n", 92410175SMitch.Hayenga@ARM.com store_idx, req->getPaddr(), storeHead, 9252292SN/A storeQueue[store_idx].inst->seqNum); 9262329SN/A 9272292SN/A storeQueue[store_idx].req = req; 9286974Stjones1@inf.ed.ac.uk storeQueue[store_idx].sreqLow = sreqLow; 9296974Stjones1@inf.ed.ac.uk storeQueue[store_idx].sreqHigh = sreqHigh; 9307520Sgblack@eecs.umich.edu unsigned size = req->getSize(); 9317520Sgblack@eecs.umich.edu storeQueue[store_idx].size = size; 93210031SAli.Saidi@ARM.com storeQueue[store_idx].isAllZeros = req->getFlags() & Request::CACHE_BLOCK_ZERO; 93310031SAli.Saidi@ARM.com assert(size <= sizeof(storeQueue[store_idx].data) || 93410031SAli.Saidi@ARM.com (req->getFlags() & Request::CACHE_BLOCK_ZERO)); 9357509Stjones1@inf.ed.ac.uk 9367509Stjones1@inf.ed.ac.uk // Split stores can only occur in ISAs with unaligned memory accesses. If 9377509Stjones1@inf.ed.ac.uk // a store request has been split, sreqLow and sreqHigh will be non-null. 9387509Stjones1@inf.ed.ac.uk if (TheISA::HasUnalignedMemAcc && sreqLow) { 9397509Stjones1@inf.ed.ac.uk storeQueue[store_idx].isSplit = true; 9407509Stjones1@inf.ed.ac.uk } 9414326Sgblack@eecs.umich.edu 94210031SAli.Saidi@ARM.com if (!(req->getFlags() & Request::CACHE_BLOCK_ZERO)) 94310031SAli.Saidi@ARM.com memcpy(storeQueue[store_idx].data, data, size); 9442329SN/A 9452292SN/A // This function only writes the data to the store queue, so no fault 9462292SN/A // can happen here. 9472292SN/A return NoFault; 9482292SN/A} 9492292SN/A 9502292SN/A#endif // __CPU_O3_LSQ_UNIT_HH__ 951