// coherent_xbar.cc revision 11334
12497SN/A/* 210719SMarco.Balboni@ARM.com * Copyright (c) 2011-2015 ARM Limited 38711SN/A * All rights reserved 48711SN/A * 58711SN/A * The license below extends only to copyright in the software and shall 68711SN/A * not be construed as granting a license to any other intellectual 78711SN/A * property including but not limited to intellectual property relating 88711SN/A * to a hardware implementation of the functionality of the software 98711SN/A * licensed hereunder. You may use the software subject to the license 108711SN/A * terms below provided that you ensure that this notice is replicated 118711SN/A * unmodified and in its entirety in all distributions of the software, 128711SN/A * modified or unmodified, in source code or in binary form. 138711SN/A * 142497SN/A * Copyright (c) 2006 The Regents of The University of Michigan 152497SN/A * All rights reserved. 162497SN/A * 172497SN/A * Redistribution and use in source and binary forms, with or without 182497SN/A * modification, are permitted provided that the following conditions are 192497SN/A * met: redistributions of source code must retain the above copyright 202497SN/A * notice, this list of conditions and the following disclaimer; 212497SN/A * redistributions in binary form must reproduce the above copyright 222497SN/A * notice, this list of conditions and the following disclaimer in the 232497SN/A * documentation and/or other materials provided with the distribution; 242497SN/A * neither the name of the copyright holders nor the names of its 252497SN/A * contributors may be used to endorse or promote products derived from 262497SN/A * this software without specific prior written permission. 272497SN/A * 282497SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 292497SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 302497SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 312497SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT 322497SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 332497SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 342497SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 352497SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 362497SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 372497SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 382497SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 392665SN/A * 402665SN/A * Authors: Ali Saidi 418715SN/A * Andreas Hansson 428922SN/A * William Wang 432497SN/A */ 442497SN/A 452497SN/A/** 462982SN/A * @file 4710405Sandreas.hansson@arm.com * Definition of a crossbar object. 482497SN/A */ 492497SN/A 502846SN/A#include "base/misc.hh" 512548SN/A#include "base/trace.hh" 5210405Sandreas.hansson@arm.com#include "debug/AddrRanges.hh" 5310405Sandreas.hansson@arm.com#include "debug/CoherentXBar.hh" 5410405Sandreas.hansson@arm.com#include "mem/coherent_xbar.hh" 559524SN/A#include "sim/system.hh" 562497SN/A 5710405Sandreas.hansson@arm.comCoherentXBar::CoherentXBar(const CoherentXBarParams *p) 5810719SMarco.Balboni@ARM.com : BaseXBar(p), system(p->system), snoopFilter(p->snoop_filter), 5911334Sandreas.hansson@arm.com snoopResponseLatency(p->snoop_response_latency), 6011334Sandreas.hansson@arm.com pointOfCoherency(p->point_of_coherency) 617523SN/A{ 628851SN/A // create the ports based on the size of the master and slave 638948SN/A // vector ports, and the presence of the default port, the ports 648948SN/A // are enumerated starting from zero 658851SN/A for (int i = 0; i < p->port_master_connection_count; ++i) { 669095SN/A std::string portName = csprintf("%s.master[%d]", name(), i); 6710405Sandreas.hansson@arm.com MasterPort* bp = new CoherentXBarMasterPort(portName, *this, i); 688922SN/A masterPorts.push_back(bp); 699715SN/A 
reqLayers.push_back(new ReqLayer(*bp, *this, 709715SN/A csprintf(".reqLayer%d", i))); 7110713Sandreas.hansson@arm.com snoopLayers.push_back(new SnoopRespLayer(*bp, *this, 7210713Sandreas.hansson@arm.com csprintf(".snoopLayer%d", i))); 738851SN/A } 748851SN/A 758948SN/A // see if we have a default slave device connected and if so add 768948SN/A // our corresponding master port 778915SN/A if (p->port_default_connection_count) { 789031SN/A defaultPortID = masterPorts.size(); 799095SN/A std::string portName = name() + ".default"; 8010405Sandreas.hansson@arm.com MasterPort* bp = new CoherentXBarMasterPort(portName, *this, 819036SN/A defaultPortID); 828922SN/A masterPorts.push_back(bp); 839715SN/A reqLayers.push_back(new ReqLayer(*bp, *this, csprintf(".reqLayer%d", 849715SN/A defaultPortID))); 8510713Sandreas.hansson@arm.com snoopLayers.push_back(new SnoopRespLayer(*bp, *this, 8610713Sandreas.hansson@arm.com csprintf(".snoopLayer%d", 8710713Sandreas.hansson@arm.com defaultPortID))); 888915SN/A } 898915SN/A 908948SN/A // create the slave ports, once again starting at zero 918851SN/A for (int i = 0; i < p->port_slave_connection_count; ++i) { 929095SN/A std::string portName = csprintf("%s.slave[%d]", name(), i); 9310888Sandreas.hansson@arm.com QueuedSlavePort* bp = new CoherentXBarSlavePort(portName, *this, i); 948922SN/A slavePorts.push_back(bp); 959715SN/A respLayers.push_back(new RespLayer(*bp, *this, 969715SN/A csprintf(".respLayer%d", i))); 979716SN/A snoopRespPorts.push_back(new SnoopRespPort(*bp, *this)); 988851SN/A } 998851SN/A 1007523SN/A clearPortCache(); 1017523SN/A} 1027523SN/A 10310405Sandreas.hansson@arm.comCoherentXBar::~CoherentXBar() 1049715SN/A{ 10510405Sandreas.hansson@arm.com for (auto l: reqLayers) 10610405Sandreas.hansson@arm.com delete l; 10710405Sandreas.hansson@arm.com for (auto l: respLayers) 10810405Sandreas.hansson@arm.com delete l; 10910405Sandreas.hansson@arm.com for (auto l: snoopLayers) 11010405Sandreas.hansson@arm.com delete l; 
11110405Sandreas.hansson@arm.com for (auto p: snoopRespPorts) 11210405Sandreas.hansson@arm.com delete p; 1139715SN/A} 1149715SN/A 1152568SN/Avoid 11610405Sandreas.hansson@arm.comCoherentXBar::init() 1172568SN/A{ 1189278SN/A // the base class is responsible for determining the block size 11910405Sandreas.hansson@arm.com BaseXBar::init(); 1209278SN/A 1218948SN/A // iterate over our slave ports and determine which of our 1228948SN/A // neighbouring master ports are snooping and add them as snoopers 12310405Sandreas.hansson@arm.com for (const auto& p: slavePorts) { 1249088SN/A // check if the connected master port is snooping 12510405Sandreas.hansson@arm.com if (p->isSnooping()) { 12610405Sandreas.hansson@arm.com DPRINTF(AddrRanges, "Adding snooping master %s\n", 12710405Sandreas.hansson@arm.com p->getMasterPort().name()); 12810405Sandreas.hansson@arm.com snoopPorts.push_back(p); 1298711SN/A } 1308711SN/A } 1312568SN/A 1329036SN/A if (snoopPorts.empty()) 13310405Sandreas.hansson@arm.com warn("CoherentXBar %s has no snooping ports attached!\n", name()); 13411133Sandreas.hansson@arm.com 13511133Sandreas.hansson@arm.com // inform the snoop filter about the slave ports so it can create 13611133Sandreas.hansson@arm.com // its own internal representation 13711133Sandreas.hansson@arm.com if (snoopFilter) 13811133Sandreas.hansson@arm.com snoopFilter->setSlavePorts(slavePorts); 1393244SN/A} 1403244SN/A 1418948SN/Abool 14210405Sandreas.hansson@arm.comCoherentXBar::recvTimingReq(PacketPtr pkt, PortID slave_port_id) 1433244SN/A{ 1448975SN/A // determine the source port based on the id 1459032SN/A SlavePort *src_port = slavePorts[slave_port_id]; 1463244SN/A 1479091SN/A // remember if the packet is an express snoop 1489091SN/A bool is_express_snoop = pkt->isExpressSnoop(); 14911284Sandreas.hansson@arm.com bool cache_responding = pkt->cacheResponding(); 15010656Sandreas.hansson@arm.com // for normal requests, going downstream, the express snoop flag 15111284Sandreas.hansson@arm.com 
// and the cache responding flag should always be the same 15211284Sandreas.hansson@arm.com assert(is_express_snoop == cache_responding); 1539091SN/A 1549612SN/A // determine the destination based on the address 1559712SN/A PortID master_port_id = findPort(pkt->getAddr()); 1569612SN/A 15710405Sandreas.hansson@arm.com // test if the crossbar should be considered occupied for the current 1589033SN/A // port, and exclude express snoops from the check 1599715SN/A if (!is_express_snoop && !reqLayers[master_port_id]->tryTiming(src_port)) { 16010405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingReq: src %s %s 0x%x BUSY\n", 1618949SN/A src_port->name(), pkt->cmdString(), pkt->getAddr()); 1623244SN/A return false; 1633244SN/A } 1643244SN/A 16510405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingReq: src %s %s expr %d 0x%x\n", 1669091SN/A src_port->name(), pkt->cmdString(), is_express_snoop, 1679091SN/A pkt->getAddr()); 1685197SN/A 1699712SN/A // store size and command as they might be modified when 1709712SN/A // forwarding the packet 1719712SN/A unsigned int pkt_size = pkt->hasData() ? 
pkt->getSize() : 0; 1729712SN/A unsigned int pkt_cmd = pkt->cmdToIndex(); 1739712SN/A 17410719SMarco.Balboni@ARM.com // store the old header delay so we can restore it if needed 17510719SMarco.Balboni@ARM.com Tick old_header_delay = pkt->headerDelay; 17610719SMarco.Balboni@ARM.com 17710719SMarco.Balboni@ARM.com // a request sees the frontend and forward latency 17810719SMarco.Balboni@ARM.com Tick xbar_delay = (frontendLatency + forwardLatency) * clockPeriod(); 17910719SMarco.Balboni@ARM.com 18010719SMarco.Balboni@ARM.com // set the packet header and payload delay 18110719SMarco.Balboni@ARM.com calcPacketTiming(pkt, xbar_delay); 18210719SMarco.Balboni@ARM.com 18310719SMarco.Balboni@ARM.com // determine how long to be crossbar layer is busy 18410719SMarco.Balboni@ARM.com Tick packetFinishTime = clockEdge(Cycles(1)) + pkt->payloadDelay; 1854912SN/A 18610821Sandreas.hansson@arm.com if (!system->bypassCaches()) { 18711127Sandreas.hansson@arm.com assert(pkt->snoopDelay == 0); 18811127Sandreas.hansson@arm.com 1898979SN/A // the packet is a memory-mapped request and should be 1908979SN/A // broadcasted to our snoopers but the source 19110402SN/A if (snoopFilter) { 19210402SN/A // check with the snoop filter where to forward this packet 19310402SN/A auto sf_res = snoopFilter->lookupRequest(pkt, *src_port); 19411126Sandreas.hansson@arm.com // the time required by a packet to be delivered through 19511126Sandreas.hansson@arm.com // the xbar has to be charged also with to lookup latency 19611126Sandreas.hansson@arm.com // of the snoop filter 19710719SMarco.Balboni@ARM.com pkt->headerDelay += sf_res.second * clockPeriod(); 19810405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingReq: src %s %s 0x%x"\ 19910402SN/A " SF size: %i lat: %i\n", src_port->name(), 20010402SN/A pkt->cmdString(), pkt->getAddr(), sf_res.first.size(), 20110402SN/A sf_res.second); 20211196Sali.jafri@arm.com 20311199Sandreas.hansson@arm.com if (pkt->isEviction()) { 20411196Sali.jafri@arm.com // for 
block-evicting packets, i.e. writebacks and 20511196Sali.jafri@arm.com // clean evictions, there is no need to snoop up, as 20611196Sali.jafri@arm.com // all we do is determine if the block is cached or 20711196Sali.jafri@arm.com // not, instead just set it here based on the snoop 20811196Sali.jafri@arm.com // filter result 20911196Sali.jafri@arm.com if (!sf_res.first.empty()) 21011196Sali.jafri@arm.com pkt->setBlockCached(); 21111196Sali.jafri@arm.com } else { 21211196Sali.jafri@arm.com forwardTiming(pkt, slave_port_id, sf_res.first); 21311196Sali.jafri@arm.com } 21410402SN/A } else { 21510402SN/A forwardTiming(pkt, slave_port_id); 21610402SN/A } 21711127Sandreas.hansson@arm.com 21811127Sandreas.hansson@arm.com // add the snoop delay to our header delay, and then reset it 21911127Sandreas.hansson@arm.com pkt->headerDelay += pkt->snoopDelay; 22011127Sandreas.hansson@arm.com pkt->snoopDelay = 0; 2218979SN/A } 2228948SN/A 22311334Sandreas.hansson@arm.com // set up a sensible starting point 22411334Sandreas.hansson@arm.com bool success = true; 22510883Sali.jafri@arm.com 22611284Sandreas.hansson@arm.com // remember if the packet will generate a snoop response by 22711284Sandreas.hansson@arm.com // checking if a cache set the cacheResponding flag during the 22811284Sandreas.hansson@arm.com // snooping above 22911284Sandreas.hansson@arm.com const bool expect_snoop_resp = !cache_responding && pkt->cacheResponding(); 23011334Sandreas.hansson@arm.com bool expect_response = pkt->needsResponse() && !pkt->cacheResponding(); 2318915SN/A 23211334Sandreas.hansson@arm.com const bool sink_packet = sinkPacket(pkt); 23311334Sandreas.hansson@arm.com 23411334Sandreas.hansson@arm.com // in certain cases the crossbar is responsible for responding 23511334Sandreas.hansson@arm.com bool respond_directly = false; 23611334Sandreas.hansson@arm.com 23711334Sandreas.hansson@arm.com if (sink_packet) { 23811334Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "Not forwarding %s to %#llx\n", 
23911334Sandreas.hansson@arm.com pkt->cmdString(), pkt->getAddr()); 24011334Sandreas.hansson@arm.com } else { 24111334Sandreas.hansson@arm.com // determine if we are forwarding the packet, or responding to 24211334Sandreas.hansson@arm.com // it 24311334Sandreas.hansson@arm.com if (!pointOfCoherency || pkt->isRead() || pkt->isWrite()) { 24411334Sandreas.hansson@arm.com // if we are passing on, rather than sinking, a packet to 24511334Sandreas.hansson@arm.com // which an upstream cache has committed to responding, 24611334Sandreas.hansson@arm.com // the line was needs writable, and the responding only 24711334Sandreas.hansson@arm.com // had an Owned copy, so we need to immidiately let the 24811334Sandreas.hansson@arm.com // downstream caches know, bypass any flow control 24911334Sandreas.hansson@arm.com if (pkt->cacheResponding()) { 25011334Sandreas.hansson@arm.com pkt->setExpressSnoop(); 25111334Sandreas.hansson@arm.com } 25211334Sandreas.hansson@arm.com 25311334Sandreas.hansson@arm.com // since it is a normal request, attempt to send the packet 25411334Sandreas.hansson@arm.com success = masterPorts[master_port_id]->sendTimingReq(pkt); 25511334Sandreas.hansson@arm.com } else { 25611334Sandreas.hansson@arm.com // no need to forward, turn this packet around and respond 25711334Sandreas.hansson@arm.com // directly 25811334Sandreas.hansson@arm.com assert(pkt->needsResponse()); 25911334Sandreas.hansson@arm.com 26011334Sandreas.hansson@arm.com respond_directly = true; 26111334Sandreas.hansson@arm.com assert(!expect_snoop_resp); 26211334Sandreas.hansson@arm.com expect_response = false; 26311334Sandreas.hansson@arm.com } 26411334Sandreas.hansson@arm.com } 2658948SN/A 26610821Sandreas.hansson@arm.com if (snoopFilter && !system->bypassCaches()) { 26710402SN/A // Let the snoop filter know about the success of the send operation 26811131Sandreas.hansson@arm.com snoopFilter->finishRequest(!success, pkt); 26910402SN/A } 27010402SN/A 27110656Sandreas.hansson@arm.com // check if we 
were successful in sending the packet onwards 27210656Sandreas.hansson@arm.com if (!success) { 27311284Sandreas.hansson@arm.com // express snoops should never be forced to retry 27410656Sandreas.hansson@arm.com assert(!is_express_snoop); 27510656Sandreas.hansson@arm.com 27610719SMarco.Balboni@ARM.com // restore the header delay 27710719SMarco.Balboni@ARM.com pkt->headerDelay = old_header_delay; 27810656Sandreas.hansson@arm.com 27910656Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingReq: src %s %s 0x%x RETRY\n", 28010656Sandreas.hansson@arm.com src_port->name(), pkt->cmdString(), pkt->getAddr()); 28110656Sandreas.hansson@arm.com 28210656Sandreas.hansson@arm.com // update the layer state and schedule an idle event 28310656Sandreas.hansson@arm.com reqLayers[master_port_id]->failedTiming(src_port, 28410719SMarco.Balboni@ARM.com clockEdge(Cycles(1))); 2859091SN/A } else { 28610656Sandreas.hansson@arm.com // express snoops currently bypass the crossbar state entirely 28710656Sandreas.hansson@arm.com if (!is_express_snoop) { 28810656Sandreas.hansson@arm.com // if this particular request will generate a snoop 28910656Sandreas.hansson@arm.com // response 29010656Sandreas.hansson@arm.com if (expect_snoop_resp) { 29110656Sandreas.hansson@arm.com // we should never have an exsiting request outstanding 29210656Sandreas.hansson@arm.com assert(outstandingSnoop.find(pkt->req) == 29310656Sandreas.hansson@arm.com outstandingSnoop.end()); 29410656Sandreas.hansson@arm.com outstandingSnoop.insert(pkt->req); 2958948SN/A 29610656Sandreas.hansson@arm.com // basic sanity check on the outstanding snoops 29710656Sandreas.hansson@arm.com panic_if(outstandingSnoop.size() > 512, 29810656Sandreas.hansson@arm.com "Outstanding snoop requests exceeded 512\n"); 29910656Sandreas.hansson@arm.com } 3008948SN/A 30110656Sandreas.hansson@arm.com // remember where to route the normal response to 30210656Sandreas.hansson@arm.com if (expect_response || expect_snoop_resp) { 
30310656Sandreas.hansson@arm.com assert(routeTo.find(pkt->req) == routeTo.end()); 30410656Sandreas.hansson@arm.com routeTo[pkt->req] = slave_port_id; 3059549SN/A 30610656Sandreas.hansson@arm.com panic_if(routeTo.size() > 512, 30710656Sandreas.hansson@arm.com "Routing table exceeds 512 packets\n"); 30810656Sandreas.hansson@arm.com } 3098948SN/A 31010405Sandreas.hansson@arm.com // update the layer state and schedule an idle event 3119715SN/A reqLayers[master_port_id]->succeededTiming(packetFinishTime); 3129091SN/A } 3138975SN/A 31410656Sandreas.hansson@arm.com // stats updates only consider packets that were successfully sent 3159712SN/A pktCount[slave_port_id][master_port_id]++; 31610405Sandreas.hansson@arm.com pktSize[slave_port_id][master_port_id] += pkt_size; 3179712SN/A transDist[pkt_cmd]++; 31810656Sandreas.hansson@arm.com 31910656Sandreas.hansson@arm.com if (is_express_snoop) 32010656Sandreas.hansson@arm.com snoops++; 3219712SN/A } 3229712SN/A 32311334Sandreas.hansson@arm.com if (sink_packet) 32411334Sandreas.hansson@arm.com // queue the packet for deletion 32511334Sandreas.hansson@arm.com pendingDelete.reset(pkt); 32611334Sandreas.hansson@arm.com 32711334Sandreas.hansson@arm.com if (respond_directly) { 32811334Sandreas.hansson@arm.com assert(pkt->needsResponse()); 32911334Sandreas.hansson@arm.com assert(success); 33011334Sandreas.hansson@arm.com 33111334Sandreas.hansson@arm.com pkt->makeResponse(); 33211334Sandreas.hansson@arm.com 33311334Sandreas.hansson@arm.com if (snoopFilter && !system->bypassCaches()) { 33411334Sandreas.hansson@arm.com // let the snoop filter inspect the response and update its state 33511334Sandreas.hansson@arm.com snoopFilter->updateResponse(pkt, *slavePorts[slave_port_id]); 33611334Sandreas.hansson@arm.com } 33711334Sandreas.hansson@arm.com 33811334Sandreas.hansson@arm.com Tick response_time = clockEdge() + pkt->headerDelay; 33911334Sandreas.hansson@arm.com pkt->headerDelay = 0; 34011334Sandreas.hansson@arm.com 
34111334Sandreas.hansson@arm.com slavePorts[slave_port_id]->schedTimingResp(pkt, response_time); 34211334Sandreas.hansson@arm.com } 34311334Sandreas.hansson@arm.com 3449091SN/A return success; 3458975SN/A} 3468975SN/A 3478975SN/Abool 34810405Sandreas.hansson@arm.comCoherentXBar::recvTimingResp(PacketPtr pkt, PortID master_port_id) 3498975SN/A{ 3508975SN/A // determine the source port based on the id 3519032SN/A MasterPort *src_port = masterPorts[master_port_id]; 3528975SN/A 35310656Sandreas.hansson@arm.com // determine the destination 35410656Sandreas.hansson@arm.com const auto route_lookup = routeTo.find(pkt->req); 35510656Sandreas.hansson@arm.com assert(route_lookup != routeTo.end()); 35610656Sandreas.hansson@arm.com const PortID slave_port_id = route_lookup->second; 35710572Sandreas.hansson@arm.com assert(slave_port_id != InvalidPortID); 35810572Sandreas.hansson@arm.com assert(slave_port_id < respLayers.size()); 3599713SN/A 36010405Sandreas.hansson@arm.com // test if the crossbar should be considered occupied for the 36110405Sandreas.hansson@arm.com // current port 3629715SN/A if (!respLayers[slave_port_id]->tryTiming(src_port)) { 36310405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingResp: src %s %s 0x%x BUSY\n", 3648975SN/A src_port->name(), pkt->cmdString(), pkt->getAddr()); 3658975SN/A return false; 3668975SN/A } 3678975SN/A 36810405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingResp: src %s %s 0x%x\n", 3698975SN/A src_port->name(), pkt->cmdString(), pkt->getAddr()); 3708975SN/A 3719712SN/A // store size and command as they might be modified when 3729712SN/A // forwarding the packet 3739712SN/A unsigned int pkt_size = pkt->hasData() ? 
pkt->getSize() : 0; 3749712SN/A unsigned int pkt_cmd = pkt->cmdToIndex(); 3759712SN/A 37610719SMarco.Balboni@ARM.com // a response sees the response latency 37710719SMarco.Balboni@ARM.com Tick xbar_delay = responseLatency * clockPeriod(); 37810719SMarco.Balboni@ARM.com 37910719SMarco.Balboni@ARM.com // set the packet header and payload delay 38010719SMarco.Balboni@ARM.com calcPacketTiming(pkt, xbar_delay); 38110719SMarco.Balboni@ARM.com 38210719SMarco.Balboni@ARM.com // determine how long to be crossbar layer is busy 38310719SMarco.Balboni@ARM.com Tick packetFinishTime = clockEdge(Cycles(1)) + pkt->payloadDelay; 3848975SN/A 38510821Sandreas.hansson@arm.com if (snoopFilter && !system->bypassCaches()) { 38610402SN/A // let the snoop filter inspect the response and update its state 38710402SN/A snoopFilter->updateResponse(pkt, *slavePorts[slave_port_id]); 38810402SN/A } 38910402SN/A 39010888Sandreas.hansson@arm.com // send the packet through the destination slave port and pay for 39110888Sandreas.hansson@arm.com // any outstanding header delay 39210888Sandreas.hansson@arm.com Tick latency = pkt->headerDelay; 39310888Sandreas.hansson@arm.com pkt->headerDelay = 0; 39410888Sandreas.hansson@arm.com slavePorts[slave_port_id]->schedTimingResp(pkt, curTick() + latency); 3958975SN/A 39610656Sandreas.hansson@arm.com // remove the request from the routing table 39710656Sandreas.hansson@arm.com routeTo.erase(route_lookup); 39810656Sandreas.hansson@arm.com 3999715SN/A respLayers[slave_port_id]->succeededTiming(packetFinishTime); 4008975SN/A 4019712SN/A // stats updates 4029712SN/A pktCount[slave_port_id][master_port_id]++; 40310405Sandreas.hansson@arm.com pktSize[slave_port_id][master_port_id] += pkt_size; 4049712SN/A transDist[pkt_cmd]++; 4059712SN/A 4068975SN/A return true; 4078975SN/A} 4088975SN/A 4098975SN/Avoid 41010405Sandreas.hansson@arm.comCoherentXBar::recvTimingSnoopReq(PacketPtr pkt, PortID master_port_id) 4118975SN/A{ 41210405Sandreas.hansson@arm.com 
DPRINTF(CoherentXBar, "recvTimingSnoopReq: src %s %s 0x%x\n", 4139032SN/A masterPorts[master_port_id]->name(), pkt->cmdString(), 4148975SN/A pkt->getAddr()); 4158975SN/A 4169712SN/A // update stats here as we know the forwarding will succeed 4179712SN/A transDist[pkt->cmdToIndex()]++; 41810405Sandreas.hansson@arm.com snoops++; 4199712SN/A 4208975SN/A // we should only see express snoops from caches 4218975SN/A assert(pkt->isExpressSnoop()); 4228975SN/A 42311127Sandreas.hansson@arm.com // set the packet header and payload delay, for now use forward latency 42411127Sandreas.hansson@arm.com // @todo Assess the choice of latency further 42511127Sandreas.hansson@arm.com calcPacketTiming(pkt, forwardLatency * clockPeriod()); 42611127Sandreas.hansson@arm.com 42711284Sandreas.hansson@arm.com // remember if a cache has already committed to responding so we 42811284Sandreas.hansson@arm.com // can see if it changes during the snooping 42911284Sandreas.hansson@arm.com const bool cache_responding = pkt->cacheResponding(); 4309032SN/A 43111127Sandreas.hansson@arm.com assert(pkt->snoopDelay == 0); 43211127Sandreas.hansson@arm.com 43310402SN/A if (snoopFilter) { 43410402SN/A // let the Snoop Filter work its magic and guide probing 43510402SN/A auto sf_res = snoopFilter->lookupSnoop(pkt); 43611126Sandreas.hansson@arm.com // the time required by a packet to be delivered through 43711126Sandreas.hansson@arm.com // the xbar has to be charged also with to lookup latency 43811126Sandreas.hansson@arm.com // of the snoop filter 43911126Sandreas.hansson@arm.com pkt->headerDelay += sf_res.second * clockPeriod(); 44010405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingSnoopReq: src %s %s 0x%x"\ 44110402SN/A " SF size: %i lat: %i\n", masterPorts[master_port_id]->name(), 44210402SN/A pkt->cmdString(), pkt->getAddr(), sf_res.first.size(), 44310402SN/A sf_res.second); 44410402SN/A 44510402SN/A // forward to all snoopers 44610402SN/A forwardTiming(pkt, InvalidPortID, sf_res.first); 
44710402SN/A } else { 44810402SN/A forwardTiming(pkt, InvalidPortID); 44910402SN/A } 4508975SN/A 45111127Sandreas.hansson@arm.com // add the snoop delay to our header delay, and then reset it 45211127Sandreas.hansson@arm.com pkt->headerDelay += pkt->snoopDelay; 45311127Sandreas.hansson@arm.com pkt->snoopDelay = 0; 45411127Sandreas.hansson@arm.com 45510656Sandreas.hansson@arm.com // if we can expect a response, remember how to route it 45611284Sandreas.hansson@arm.com if (!cache_responding && pkt->cacheResponding()) { 45710656Sandreas.hansson@arm.com assert(routeTo.find(pkt->req) == routeTo.end()); 45810656Sandreas.hansson@arm.com routeTo[pkt->req] = master_port_id; 45910656Sandreas.hansson@arm.com } 46010656Sandreas.hansson@arm.com 4618975SN/A // a snoop request came from a connected slave device (one of 4628975SN/A // our master ports), and if it is not coming from the slave 4638975SN/A // device responsible for the address range something is 4648975SN/A // wrong, hence there is nothing further to do as the packet 4658975SN/A // would be going back to where it came from 4669032SN/A assert(master_port_id == findPort(pkt->getAddr())); 4678975SN/A} 4688975SN/A 4698975SN/Abool 47010405Sandreas.hansson@arm.comCoherentXBar::recvTimingSnoopResp(PacketPtr pkt, PortID slave_port_id) 4718975SN/A{ 4728975SN/A // determine the source port based on the id 4739032SN/A SlavePort* src_port = slavePorts[slave_port_id]; 4748975SN/A 47510656Sandreas.hansson@arm.com // get the destination 47610656Sandreas.hansson@arm.com const auto route_lookup = routeTo.find(pkt->req); 47710656Sandreas.hansson@arm.com assert(route_lookup != routeTo.end()); 47810656Sandreas.hansson@arm.com const PortID dest_port_id = route_lookup->second; 47910572Sandreas.hansson@arm.com assert(dest_port_id != InvalidPortID); 4809714SN/A 4819714SN/A // determine if the response is from a snoop request we 4829714SN/A // created as the result of a normal request (in which case it 48310656Sandreas.hansson@arm.com // 
should be in the outstandingSnoop), or if we merely forwarded 4849714SN/A // someone else's snoop request 48510656Sandreas.hansson@arm.com const bool forwardAsSnoop = outstandingSnoop.find(pkt->req) == 48610656Sandreas.hansson@arm.com outstandingSnoop.end(); 4879714SN/A 48810405Sandreas.hansson@arm.com // test if the crossbar should be considered occupied for the 48910405Sandreas.hansson@arm.com // current port, note that the check is bypassed if the response 49010405Sandreas.hansson@arm.com // is being passed on as a normal response since this is occupying 49110405Sandreas.hansson@arm.com // the response layer rather than the snoop response layer 4929715SN/A if (forwardAsSnoop) { 49310572Sandreas.hansson@arm.com assert(dest_port_id < snoopLayers.size()); 4949715SN/A if (!snoopLayers[dest_port_id]->tryTiming(src_port)) { 49510405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingSnoopResp: src %s %s 0x%x BUSY\n", 4969715SN/A src_port->name(), pkt->cmdString(), pkt->getAddr()); 4979715SN/A return false; 4989715SN/A } 4999716SN/A } else { 5009716SN/A // get the master port that mirrors this slave port internally 5019716SN/A MasterPort* snoop_port = snoopRespPorts[slave_port_id]; 50210572Sandreas.hansson@arm.com assert(dest_port_id < respLayers.size()); 5039716SN/A if (!respLayers[dest_port_id]->tryTiming(snoop_port)) { 50410405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingSnoopResp: src %s %s 0x%x BUSY\n", 5059716SN/A snoop_port->name(), pkt->cmdString(), pkt->getAddr()); 5069716SN/A return false; 5079716SN/A } 5088975SN/A } 5098975SN/A 51010405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingSnoopResp: src %s %s 0x%x\n", 5118975SN/A src_port->name(), pkt->cmdString(), pkt->getAddr()); 5128975SN/A 5139712SN/A // store size and command as they might be modified when 5149712SN/A // forwarding the packet 5159712SN/A unsigned int pkt_size = pkt->hasData() ? 
pkt->getSize() : 0; 5169712SN/A unsigned int pkt_cmd = pkt->cmdToIndex(); 5179712SN/A 5188975SN/A // responses are never express snoops 5198975SN/A assert(!pkt->isExpressSnoop()); 5208975SN/A 52110719SMarco.Balboni@ARM.com // a snoop response sees the snoop response latency, and if it is 52210719SMarco.Balboni@ARM.com // forwarded as a normal response, the response latency 52310719SMarco.Balboni@ARM.com Tick xbar_delay = 52410719SMarco.Balboni@ARM.com (forwardAsSnoop ? snoopResponseLatency : responseLatency) * 52510719SMarco.Balboni@ARM.com clockPeriod(); 52610719SMarco.Balboni@ARM.com 52710719SMarco.Balboni@ARM.com // set the packet header and payload delay 52810719SMarco.Balboni@ARM.com calcPacketTiming(pkt, xbar_delay); 52910719SMarco.Balboni@ARM.com 53010719SMarco.Balboni@ARM.com // determine how long to be crossbar layer is busy 53110719SMarco.Balboni@ARM.com Tick packetFinishTime = clockEdge(Cycles(1)) + pkt->payloadDelay; 5328975SN/A 5339714SN/A // forward it either as a snoop response or a normal response 5349714SN/A if (forwardAsSnoop) { 5359714SN/A // this is a snoop response to a snoop request we forwarded, 5369714SN/A // e.g. 
coming from the L1 and going to the L2, and it should 5379714SN/A // be forwarded as a snoop response 53810402SN/A 53910402SN/A if (snoopFilter) { 54010402SN/A // update the probe filter so that it can properly track the line 54110402SN/A snoopFilter->updateSnoopForward(pkt, *slavePorts[slave_port_id], 54210402SN/A *masterPorts[dest_port_id]); 54310402SN/A } 54410402SN/A 5459712SN/A bool success M5_VAR_USED = 5469712SN/A masterPorts[dest_port_id]->sendTimingSnoopResp(pkt); 5479712SN/A pktCount[slave_port_id][dest_port_id]++; 54810405Sandreas.hansson@arm.com pktSize[slave_port_id][dest_port_id] += pkt_size; 5498975SN/A assert(success); 5509714SN/A 5519715SN/A snoopLayers[dest_port_id]->succeededTiming(packetFinishTime); 5523244SN/A } else { 5538975SN/A // we got a snoop response on one of our slave ports, 55410405Sandreas.hansson@arm.com // i.e. from a coherent master connected to the crossbar, and 55510405Sandreas.hansson@arm.com // since we created the snoop request as part of recvTiming, 55610405Sandreas.hansson@arm.com // this should now be a normal response again 55710656Sandreas.hansson@arm.com outstandingSnoop.erase(pkt->req); 5588948SN/A 55910656Sandreas.hansson@arm.com // this is a snoop response from a coherent master, hence it 56010656Sandreas.hansson@arm.com // should never go back to where the snoop response came from, 56110656Sandreas.hansson@arm.com // but instead to where the original request came from 5629712SN/A assert(slave_port_id != dest_port_id); 5638948SN/A 56410402SN/A if (snoopFilter) { 56510402SN/A // update the probe filter so that it can properly track the line 56610402SN/A snoopFilter->updateSnoopResponse(pkt, *slavePorts[slave_port_id], 56710402SN/A *slavePorts[dest_port_id]); 56810402SN/A } 56910402SN/A 57010405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvTimingSnoopResp: src %s %s 0x%x"\ 57110402SN/A " FWD RESP\n", src_port->name(), pkt->cmdString(), 57210402SN/A pkt->getAddr()); 57310402SN/A 5749714SN/A // as a normal 
response, it should go back to a master through 57510888Sandreas.hansson@arm.com // one of our slave ports, we also pay for any outstanding 57610888Sandreas.hansson@arm.com // header latency 57710888Sandreas.hansson@arm.com Tick latency = pkt->headerDelay; 57810888Sandreas.hansson@arm.com pkt->headerDelay = 0; 57910888Sandreas.hansson@arm.com slavePorts[dest_port_id]->schedTimingResp(pkt, curTick() + latency); 5809716SN/A 5819716SN/A respLayers[dest_port_id]->succeededTiming(packetFinishTime); 5823244SN/A } 5833244SN/A 58410656Sandreas.hansson@arm.com // remove the request from the routing table 58510656Sandreas.hansson@arm.com routeTo.erase(route_lookup); 58610656Sandreas.hansson@arm.com 5879712SN/A // stats updates 5889712SN/A transDist[pkt_cmd]++; 58910405Sandreas.hansson@arm.com snoops++; 5909712SN/A 5918948SN/A return true; 5928948SN/A} 5938948SN/A 5943210SN/A 5958948SN/Avoid 59610405Sandreas.hansson@arm.comCoherentXBar::forwardTiming(PacketPtr pkt, PortID exclude_slave_port_id, 59710888Sandreas.hansson@arm.com const std::vector<QueuedSlavePort*>& dests) 5988948SN/A{ 59910405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "%s for %s address %x size %d\n", __func__, 6009663SN/A pkt->cmdString(), pkt->getAddr(), pkt->getSize()); 6019663SN/A 6029524SN/A // snoops should only happen if the system isn't bypassing caches 6039524SN/A assert(!system->bypassCaches()); 6049524SN/A 60510401SN/A unsigned fanout = 0; 60610401SN/A 60710405Sandreas.hansson@arm.com for (const auto& p: dests) { 6088948SN/A // we could have gotten this request from a snooping master 6098948SN/A // (corresponding to our own slave port that is also in 6108948SN/A // snoopPorts) and should not send it back to where it came 6118948SN/A // from 6129031SN/A if (exclude_slave_port_id == InvalidPortID || 6138948SN/A p->getId() != exclude_slave_port_id) { 6148948SN/A // cache is not allowed to refuse snoop 6158975SN/A p->sendTimingSnoopReq(pkt); 61610401SN/A fanout++; 6178948SN/A } 6188948SN/A } 
61910401SN/A 62010401SN/A // Stats for fanout of this forward operation 62110401SN/A snoopFanout.sample(fanout); 6222497SN/A} 6232497SN/A 6249092SN/Avoid 62510713Sandreas.hansson@arm.comCoherentXBar::recvReqRetry(PortID master_port_id) 6269092SN/A{ 6279093SN/A // responses and snoop responses never block on forwarding them, 6289093SN/A // so the retry will always be coming from a port to which we 6299093SN/A // tried to forward a request 6309715SN/A reqLayers[master_port_id]->recvRetry(); 6319092SN/A} 6329092SN/A 6339036SN/ATick 63410405Sandreas.hansson@arm.comCoherentXBar::recvAtomic(PacketPtr pkt, PortID slave_port_id) 6352657SN/A{ 63610405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvAtomic: packet src %s addr 0x%x cmd %s\n", 6379032SN/A slavePorts[slave_port_id]->name(), pkt->getAddr(), 6388949SN/A pkt->cmdString()); 6398915SN/A 64010405Sandreas.hansson@arm.com unsigned int pkt_size = pkt->hasData() ? pkt->getSize() : 0; 64110405Sandreas.hansson@arm.com unsigned int pkt_cmd = pkt->cmdToIndex(); 6429712SN/A 6438979SN/A MemCmd snoop_response_cmd = MemCmd::InvalidCmd; 6448979SN/A Tick snoop_response_latency = 0; 6458979SN/A 64610821Sandreas.hansson@arm.com if (!system->bypassCaches()) { 6478979SN/A // forward to all snoopers but the source 64810402SN/A std::pair<MemCmd, Tick> snoop_result; 64910402SN/A if (snoopFilter) { 65010402SN/A // check with the snoop filter where to forward this packet 65110402SN/A auto sf_res = 65210402SN/A snoopFilter->lookupRequest(pkt, *slavePorts[slave_port_id]); 65310402SN/A snoop_response_latency += sf_res.second * clockPeriod(); 65410405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "%s: src %s %s 0x%x"\ 65510402SN/A " SF size: %i lat: %i\n", __func__, 65610402SN/A slavePorts[slave_port_id]->name(), pkt->cmdString(), 65710402SN/A pkt->getAddr(), sf_res.first.size(), sf_res.second); 65811130Sali.jafri@arm.com 65911130Sali.jafri@arm.com // let the snoop filter know about the success of the send 66011130Sali.jafri@arm.com // 
operation, and do it even before sending it onwards to 66111130Sali.jafri@arm.com // avoid situations where atomic upward snoops sneak in 66211130Sali.jafri@arm.com // between and change the filter state 66311131Sandreas.hansson@arm.com snoopFilter->finishRequest(false, pkt); 66411130Sali.jafri@arm.com 66510402SN/A snoop_result = forwardAtomic(pkt, slave_port_id, InvalidPortID, 66610402SN/A sf_res.first); 66710402SN/A } else { 66810402SN/A snoop_result = forwardAtomic(pkt, slave_port_id); 66910402SN/A } 6708979SN/A snoop_response_cmd = snoop_result.first; 67110402SN/A snoop_response_latency += snoop_result.second; 6728979SN/A } 6738915SN/A 67411334Sandreas.hansson@arm.com // set up a sensible default value 67511334Sandreas.hansson@arm.com Tick response_latency = 0; 67611334Sandreas.hansson@arm.com 67711334Sandreas.hansson@arm.com const bool sink_packet = sinkPacket(pkt); 67811130Sali.jafri@arm.com 6798948SN/A // even if we had a snoop response, we must continue and also 6808948SN/A // perform the actual request at the destination 68110405Sandreas.hansson@arm.com PortID master_port_id = findPort(pkt->getAddr()); 68210405Sandreas.hansson@arm.com 68311334Sandreas.hansson@arm.com if (sink_packet) { 68411334Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "Not forwarding %s to %#llx\n", 68511334Sandreas.hansson@arm.com pkt->cmdString(), pkt->getAddr()); 68611334Sandreas.hansson@arm.com } else { 68711334Sandreas.hansson@arm.com if (!pointOfCoherency || pkt->isRead() || pkt->isWrite()) { 68811334Sandreas.hansson@arm.com // forward the request to the appropriate destination 68911334Sandreas.hansson@arm.com response_latency = masterPorts[master_port_id]->sendAtomic(pkt); 69011334Sandreas.hansson@arm.com } else { 69111334Sandreas.hansson@arm.com // if it does not need a response we sink the packet above 69211334Sandreas.hansson@arm.com assert(pkt->needsResponse()); 69311334Sandreas.hansson@arm.com 69411334Sandreas.hansson@arm.com pkt->makeResponse(); 
69511334Sandreas.hansson@arm.com } 69611334Sandreas.hansson@arm.com } 69711334Sandreas.hansson@arm.com 69810405Sandreas.hansson@arm.com // stats updates for the request 69910405Sandreas.hansson@arm.com pktCount[slave_port_id][master_port_id]++; 70010405Sandreas.hansson@arm.com pktSize[slave_port_id][master_port_id] += pkt_size; 70110405Sandreas.hansson@arm.com transDist[pkt_cmd]++; 7028948SN/A 7038948SN/A 70411130Sali.jafri@arm.com // if lower levels have replied, tell the snoop filter 70511130Sali.jafri@arm.com if (!system->bypassCaches() && snoopFilter && pkt->isResponse()) { 70610402SN/A snoopFilter->updateResponse(pkt, *slavePorts[slave_port_id]); 70710402SN/A } 70810402SN/A 7098948SN/A // if we got a response from a snooper, restore it here 7108948SN/A if (snoop_response_cmd != MemCmd::InvalidCmd) { 7118948SN/A // no one else should have responded 7128948SN/A assert(!pkt->isResponse()); 7138948SN/A pkt->cmd = snoop_response_cmd; 7148948SN/A response_latency = snoop_response_latency; 7158948SN/A } 7168948SN/A 7179712SN/A // add the response data 71810405Sandreas.hansson@arm.com if (pkt->isResponse()) { 71910405Sandreas.hansson@arm.com pkt_size = pkt->hasData() ? 
pkt->getSize() : 0; 72010405Sandreas.hansson@arm.com pkt_cmd = pkt->cmdToIndex(); 72110405Sandreas.hansson@arm.com 72210405Sandreas.hansson@arm.com // stats updates 72310405Sandreas.hansson@arm.com pktCount[slave_port_id][master_port_id]++; 72410405Sandreas.hansson@arm.com pktSize[slave_port_id][master_port_id] += pkt_size; 72510405Sandreas.hansson@arm.com transDist[pkt_cmd]++; 72610405Sandreas.hansson@arm.com } 7279712SN/A 72810694SMarco.Balboni@ARM.com // @todo: Not setting header time 72910694SMarco.Balboni@ARM.com pkt->payloadDelay = response_latency; 7308948SN/A return response_latency; 7318948SN/A} 7328948SN/A 7338948SN/ATick 73410405Sandreas.hansson@arm.comCoherentXBar::recvAtomicSnoop(PacketPtr pkt, PortID master_port_id) 7358948SN/A{ 73610405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "recvAtomicSnoop: packet src %s addr 0x%x cmd %s\n", 7379032SN/A masterPorts[master_port_id]->name(), pkt->getAddr(), 7388949SN/A pkt->cmdString()); 7398948SN/A 7409712SN/A // add the request snoop data 74110405Sandreas.hansson@arm.com snoops++; 7429712SN/A 7438948SN/A // forward to all snoopers 74410402SN/A std::pair<MemCmd, Tick> snoop_result; 74510402SN/A Tick snoop_response_latency = 0; 74610402SN/A if (snoopFilter) { 74710402SN/A auto sf_res = snoopFilter->lookupSnoop(pkt); 74810402SN/A snoop_response_latency += sf_res.second * clockPeriod(); 74910405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, "%s: src %s %s 0x%x SF size: %i lat: %i\n", 75010402SN/A __func__, masterPorts[master_port_id]->name(), pkt->cmdString(), 75110402SN/A pkt->getAddr(), sf_res.first.size(), sf_res.second); 75210402SN/A snoop_result = forwardAtomic(pkt, InvalidPortID, master_port_id, 75310402SN/A sf_res.first); 75410402SN/A } else { 75510402SN/A snoop_result = forwardAtomic(pkt, InvalidPortID); 75610402SN/A } 7578948SN/A MemCmd snoop_response_cmd = snoop_result.first; 75810402SN/A snoop_response_latency += snoop_result.second; 7598948SN/A 7608948SN/A if (snoop_response_cmd != 
MemCmd::InvalidCmd) 7618948SN/A pkt->cmd = snoop_response_cmd; 7628948SN/A 7639712SN/A // add the response snoop data 76410401SN/A if (pkt->isResponse()) { 76510405Sandreas.hansson@arm.com snoops++; 76610401SN/A } 7679712SN/A 76810694SMarco.Balboni@ARM.com // @todo: Not setting header time 76910694SMarco.Balboni@ARM.com pkt->payloadDelay = snoop_response_latency; 7708948SN/A return snoop_response_latency; 7718948SN/A} 7728948SN/A 7738948SN/Astd::pair<MemCmd, Tick> 77410405Sandreas.hansson@arm.comCoherentXBar::forwardAtomic(PacketPtr pkt, PortID exclude_slave_port_id, 77510402SN/A PortID source_master_port_id, 77610888Sandreas.hansson@arm.com const std::vector<QueuedSlavePort*>& dests) 7778948SN/A{ 7789032SN/A // the packet may be changed on snoops, record the original 7799032SN/A // command to enable us to restore it between snoops so that 7808948SN/A // additional snoops can take place properly 7814626SN/A MemCmd orig_cmd = pkt->cmd; 7824879SN/A MemCmd snoop_response_cmd = MemCmd::InvalidCmd; 7834879SN/A Tick snoop_response_latency = 0; 7843662SN/A 7859524SN/A // snoops should only happen if the system isn't bypassing caches 7869524SN/A assert(!system->bypassCaches()); 7879524SN/A 78810401SN/A unsigned fanout = 0; 78910401SN/A 79010405Sandreas.hansson@arm.com for (const auto& p: dests) { 7918915SN/A // we could have gotten this request from a snooping master 7928915SN/A // (corresponding to our own slave port that is also in 7938915SN/A // snoopPorts) and should not send it back to where it came 7948915SN/A // from 79510402SN/A if (exclude_slave_port_id != InvalidPortID && 79610402SN/A p->getId() == exclude_slave_port_id) 79710402SN/A continue; 79810401SN/A 79910402SN/A Tick latency = p->sendAtomicSnoop(pkt); 80010402SN/A fanout++; 80110402SN/A 80210402SN/A // in contrast to a functional access, we have to keep on 80310402SN/A // going as all snoopers must be updated even if we get a 80410402SN/A // response 80510402SN/A if (!pkt->isResponse()) 80610402SN/A 
continue; 80710402SN/A 80810402SN/A // response from snoop agent 80910402SN/A assert(pkt->cmd != orig_cmd); 81011284Sandreas.hansson@arm.com assert(pkt->cacheResponding()); 81110402SN/A // should only happen once 81210402SN/A assert(snoop_response_cmd == MemCmd::InvalidCmd); 81310402SN/A // save response state 81410402SN/A snoop_response_cmd = pkt->cmd; 81510402SN/A snoop_response_latency = latency; 81610402SN/A 81710402SN/A if (snoopFilter) { 81810402SN/A // Handle responses by the snoopers and differentiate between 81910402SN/A // responses to requests from above and snoops from below 82010402SN/A if (source_master_port_id != InvalidPortID) { 82110402SN/A // Getting a response for a snoop from below 82210402SN/A assert(exclude_slave_port_id == InvalidPortID); 82310402SN/A snoopFilter->updateSnoopForward(pkt, *p, 82410402SN/A *masterPorts[source_master_port_id]); 82510402SN/A } else { 82610402SN/A // Getting a response for a request from above 82710402SN/A assert(source_master_port_id == InvalidPortID); 82810402SN/A snoopFilter->updateSnoopResponse(pkt, *p, 82910402SN/A *slavePorts[exclude_slave_port_id]); 8304626SN/A } 8314626SN/A } 83210402SN/A // restore original packet state for remaining snoopers 83310402SN/A pkt->cmd = orig_cmd; 8344626SN/A } 8354626SN/A 83610401SN/A // Stats for fanout 83710401SN/A snoopFanout.sample(fanout); 83810401SN/A 8398948SN/A // the packet is restored as part of the loop and any potential 8408948SN/A // snoop response is part of the returned pair 8418948SN/A return std::make_pair(snoop_response_cmd, snoop_response_latency); 8422497SN/A} 8432497SN/A 8442497SN/Avoid 84510405Sandreas.hansson@arm.comCoherentXBar::recvFunctional(PacketPtr pkt, PortID slave_port_id) 8462497SN/A{ 8478663SN/A if (!pkt->isPrint()) { 8488663SN/A // don't do DPRINTFs on PrintReq as it clutters up the output 84910405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, 8508949SN/A "recvFunctional: packet src %s addr 0x%x cmd %s\n", 8519032SN/A 
slavePorts[slave_port_id]->name(), pkt->getAddr(), 8528663SN/A pkt->cmdString()); 8538663SN/A } 8548663SN/A 85510821Sandreas.hansson@arm.com if (!system->bypassCaches()) { 8568979SN/A // forward to all snoopers but the source 8579032SN/A forwardFunctional(pkt, slave_port_id); 8588979SN/A } 8594912SN/A 8608948SN/A // there is no need to continue if the snooping has found what we 8618948SN/A // were looking for and the packet is already a response 8628948SN/A if (!pkt->isResponse()) { 86310888Sandreas.hansson@arm.com // since our slave ports are queued ports we need to check them as well 86410888Sandreas.hansson@arm.com for (const auto& p : slavePorts) { 86510888Sandreas.hansson@arm.com // if we find a response that has the data, then the 86610888Sandreas.hansson@arm.com // downstream caches/memories may be out of date, so simply stop 86710888Sandreas.hansson@arm.com // here 86810888Sandreas.hansson@arm.com if (p->checkFunctional(pkt)) { 86910888Sandreas.hansson@arm.com if (pkt->needsResponse()) 87010888Sandreas.hansson@arm.com pkt->makeResponse(); 87110888Sandreas.hansson@arm.com return; 87210888Sandreas.hansson@arm.com } 87310888Sandreas.hansson@arm.com } 87410888Sandreas.hansson@arm.com 8759031SN/A PortID dest_id = findPort(pkt->getAddr()); 8768948SN/A 8778948SN/A masterPorts[dest_id]->sendFunctional(pkt); 8788948SN/A } 8798948SN/A} 8808948SN/A 8818948SN/Avoid 88210405Sandreas.hansson@arm.comCoherentXBar::recvFunctionalSnoop(PacketPtr pkt, PortID master_port_id) 8838948SN/A{ 8848948SN/A if (!pkt->isPrint()) { 8858948SN/A // don't do DPRINTFs on PrintReq as it clutters up the output 88610405Sandreas.hansson@arm.com DPRINTF(CoherentXBar, 8878949SN/A "recvFunctionalSnoop: packet src %s addr 0x%x cmd %s\n", 8889032SN/A masterPorts[master_port_id]->name(), pkt->getAddr(), 8898948SN/A pkt->cmdString()); 8908948SN/A } 8918948SN/A 89211188Sandreas.sandberg@arm.com for (const auto& p : slavePorts) { 89311188Sandreas.sandberg@arm.com if (p->checkFunctional(pkt)) { 
89411188Sandreas.sandberg@arm.com if (pkt->needsResponse()) 89511188Sandreas.sandberg@arm.com pkt->makeResponse(); 89611188Sandreas.sandberg@arm.com return; 89711188Sandreas.sandberg@arm.com } 89811188Sandreas.sandberg@arm.com } 89911188Sandreas.sandberg@arm.com 9008948SN/A // forward to all snoopers 9019031SN/A forwardFunctional(pkt, InvalidPortID); 9028948SN/A} 9038948SN/A 9048948SN/Avoid 90510405Sandreas.hansson@arm.comCoherentXBar::forwardFunctional(PacketPtr pkt, PortID exclude_slave_port_id) 9068948SN/A{ 9079524SN/A // snoops should only happen if the system isn't bypassing caches 9089524SN/A assert(!system->bypassCaches()); 9099524SN/A 91010405Sandreas.hansson@arm.com for (const auto& p: snoopPorts) { 9118915SN/A // we could have gotten this request from a snooping master 9128915SN/A // (corresponding to our own slave port that is also in 9138915SN/A // snoopPorts) and should not send it back to where it came 9148915SN/A // from 9159031SN/A if (exclude_slave_port_id == InvalidPortID || 9168948SN/A p->getId() != exclude_slave_port_id) 9178948SN/A p->sendFunctionalSnoop(pkt); 9188915SN/A 9198948SN/A // if we get a response we are done 9208948SN/A if (pkt->isResponse()) { 9218948SN/A break; 9228915SN/A } 9233650SN/A } 9242497SN/A} 9252497SN/A 92611334Sandreas.hansson@arm.combool 92711334Sandreas.hansson@arm.comCoherentXBar::sinkPacket(const PacketPtr pkt) const 92811334Sandreas.hansson@arm.com{ 92911334Sandreas.hansson@arm.com // we can sink the packet if: 93011334Sandreas.hansson@arm.com // 1) the crossbar is the point of coherency, and a cache is 93111334Sandreas.hansson@arm.com // responding after being snooped 93211334Sandreas.hansson@arm.com // 2) the crossbar is the point of coherency, and the packet is a 93311334Sandreas.hansson@arm.com // coherency packet (not a read or a write) that does not 93411334Sandreas.hansson@arm.com // require a response 93511334Sandreas.hansson@arm.com // 3) this is a clean evict or clean writeback, but the packet is 
93611334Sandreas.hansson@arm.com // found in a cache above this crossbar 93711334Sandreas.hansson@arm.com // 4) a cache is responding after being snooped, and the packet 93811334Sandreas.hansson@arm.com // either does not need the block to be writable, or the cache 93911334Sandreas.hansson@arm.com // that has promised to respond (setting the cache responding 94011334Sandreas.hansson@arm.com // flag) is providing writable and thus had a Modified block, 94111334Sandreas.hansson@arm.com // and no further action is needed 94211334Sandreas.hansson@arm.com return (pointOfCoherency && pkt->cacheResponding()) || 94311334Sandreas.hansson@arm.com (pointOfCoherency && !(pkt->isRead() || pkt->isWrite()) && 94411334Sandreas.hansson@arm.com !pkt->needsResponse()) || 94511334Sandreas.hansson@arm.com (pkt->isCleanEviction() && pkt->isBlockCached()) || 94611334Sandreas.hansson@arm.com (pkt->cacheResponding() && 94711334Sandreas.hansson@arm.com (!pkt->needsWritable() || pkt->responderHadWritable())); 94811334Sandreas.hansson@arm.com} 94911334Sandreas.hansson@arm.com 9509712SN/Avoid 95110405Sandreas.hansson@arm.comCoherentXBar::regStats() 9529712SN/A{ 95310405Sandreas.hansson@arm.com // register the stats of the base class and our layers 95410405Sandreas.hansson@arm.com BaseXBar::regStats(); 95510405Sandreas.hansson@arm.com for (auto l: reqLayers) 95610405Sandreas.hansson@arm.com l->regStats(); 95710405Sandreas.hansson@arm.com for (auto l: respLayers) 95810405Sandreas.hansson@arm.com l->regStats(); 95910405Sandreas.hansson@arm.com for (auto l: snoopLayers) 96010405Sandreas.hansson@arm.com l->regStats(); 9619712SN/A 96210405Sandreas.hansson@arm.com snoops 96310405Sandreas.hansson@arm.com .name(name() + ".snoops") 96410401SN/A .desc("Total snoops (count)") 96510401SN/A ; 96610401SN/A 96710401SN/A snoopFanout 96810401SN/A .init(0, snoopPorts.size(), 1) 96910401SN/A .name(name() + ".snoop_fanout") 97010401SN/A .desc("Request fanout histogram") 97110401SN/A ; 9729712SN/A} 9739712SN/A 
97410405Sandreas.hansson@arm.comCoherentXBar * 97510405Sandreas.hansson@arm.comCoherentXBarParams::create() 9762497SN/A{ 97710405Sandreas.hansson@arm.com return new CoherentXBar(this); 9782497SN/A} 979