Sequencer.cc (11793:ef606668d247 → 12051:4cc27e53748d)
1/*
2 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are
7 * met: redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer;
9 * redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution;
12 * neither the name of the copyright holders nor the names of its
13 * contributors may be used to endorse or promote products derived from
14 * this software without specific prior written permission.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 */
28
29#include "mem/ruby/system/Sequencer.hh"
30
31#include "arch/x86/ldstflags.hh"
32#include "base/misc.hh"
33#include "base/str.hh"
34#include "cpu/testers/rubytest/RubyTester.hh"
35#include "debug/MemoryAccess.hh"
36#include "debug/ProtocolTrace.hh"
37#include "debug/RubySequencer.hh"
38#include "debug/RubyStats.hh"
39#include "mem/packet.hh"
40#include "mem/protocol/PrefetchBit.hh"
41#include "mem/protocol/RubyAccessMode.hh"
42#include "mem/ruby/profiler/Profiler.hh"
43#include "mem/ruby/slicc_interface/RubyRequest.hh"
44#include "mem/ruby/system/RubySystem.hh"
45#include "sim/system.hh"
46
47using namespace std;
48
49Sequencer *
50RubySequencerParams::create()
51{
52 return new Sequencer(this);
53}
54
55Sequencer::Sequencer(const Params *p)
56 : RubyPort(p), m_IncompleteTimes(MachineType_NUM), deadlockCheckEvent(this)
57{
58 m_outstanding_count = 0;
59
60 m_instCache_ptr = p->icache;
61 m_dataCache_ptr = p->dcache;
62 m_data_cache_hit_latency = p->dcache_hit_latency;
63 m_inst_cache_hit_latency = p->icache_hit_latency;
64 m_max_outstanding_requests = p->max_outstanding_requests;
65 m_deadlock_threshold = p->deadlock_threshold;
66
67 m_coreId = p->coreid; // for tracking the two CorePair sequencers
68 assert(m_max_outstanding_requests > 0);
69 assert(m_deadlock_threshold > 0);
70 assert(m_instCache_ptr != NULL);
71 assert(m_dataCache_ptr != NULL);
72 assert(m_data_cache_hit_latency > 0);
73 assert(m_inst_cache_hit_latency > 0);
74
75 m_runningGarnetStandalone = p->garnet_standalone;
76}
77
78Sequencer::~Sequencer()
79{
80}
81
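// Deadlock-check event handler. Scans both request tables and panics if
// any request has been outstanding for at least m_deadlock_threshold
// cycles; otherwise the check is rescheduled while requests remain.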
82void
83Sequencer::wakeup()
84{
85 assert(drainState() != DrainState::Draining);
86
87 // Check for deadlock of any of the requests
88 Cycles current_time = curCycle();
89
90 // Check across all outstanding requests
91 int total_outstanding = 0;
92
93 RequestTable::iterator read = m_readRequestTable.begin();
94 RequestTable::iterator read_end = m_readRequestTable.end();
95 for (; read != read_end; ++read) {
96 SequencerRequest* request = read->second;
97 if (current_time - request->issue_time < m_deadlock_threshold)
98 continue;
99
100 panic("Possible Deadlock detected. Aborting!\n"
101 "version: %d request.paddr: 0x%x m_readRequestTable: %d "
102 "current time: %u issue_time: %d difference: %d\n", m_version,
103 request->pkt->getAddr(), m_readRequestTable.size(),
104 current_time * clockPeriod(), request->issue_time * clockPeriod(),
105 (current_time * clockPeriod()) - (request->issue_time * clockPeriod()));
106 }
107
108 RequestTable::iterator write = m_writeRequestTable.begin();
109 RequestTable::iterator write_end = m_writeRequestTable.end();
110 for (; write != write_end; ++write) {
111 SequencerRequest* request = write->second;
112 if (current_time - request->issue_time < m_deadlock_threshold)
113 continue;
114
115 panic("Possible Deadlock detected. Aborting!\n"
116 "version: %d request.paddr: 0x%x m_writeRequestTable: %d "
117 "current time: %u issue_time: %d difference: %d\n", m_version,
118 request->pkt->getAddr(), m_writeRequestTable.size(),
119 current_time * clockPeriod(), request->issue_time * clockPeriod(),
120 (current_time * clockPeriod()) - (request->issue_time * clockPeriod()));
121 }
122
123 total_outstanding += m_writeRequestTable.size();
124 total_outstanding += m_readRequestTable.size();
125
126 assert(m_outstanding_count == total_outstanding);
127
128 if (m_outstanding_count > 0) {
129 // If there are still outstanding requests, keep checking
130 schedule(deadlockCheckEvent, clockEdge(m_deadlock_threshold));
131 }
132}
133
134void Sequencer::resetStats()
135{
136 m_latencyHist.reset();
137 m_hitLatencyHist.reset();
138 m_missLatencyHist.reset();
139 for (int i = 0; i < RubyRequestType_NUM; i++) {
140 m_typeLatencyHist[i]->reset();
141 m_hitTypeLatencyHist[i]->reset();
142 m_missTypeLatencyHist[i]->reset();
143 for (int j = 0; j < MachineType_NUM; j++) {
144 m_hitTypeMachLatencyHist[i][j]->reset();
145 m_missTypeMachLatencyHist[i][j]->reset();
146 }
147 }
148
149 for (int i = 0; i < MachineType_NUM; i++) {
150 m_missMachLatencyHist[i]->reset();
151 m_hitMachLatencyHist[i]->reset();
152
153 m_IssueToInitialDelayHist[i]->reset();
154 m_InitialToForwardDelayHist[i]->reset();
155 m_ForwardToFirstResponseDelayHist[i]->reset();
156 m_FirstResponseToCompletionDelayHist[i]->reset();
157
158 m_IncompleteTimes[i] = 0;
159 }
160}
161
 162// Insert the request into the appropriate request table. Return
 163// RequestStatus_Aliased if the line already has an outstanding request.
164RequestStatus
165Sequencer::insertRequest(PacketPtr pkt, RubyRequestType request_type)
166{
167 assert(m_outstanding_count ==
168 (m_writeRequestTable.size() + m_readRequestTable.size()));
169
170 // See if we should schedule a deadlock check
171 if (!deadlockCheckEvent.scheduled() &&
172 drainState() != DrainState::Draining) {
173 schedule(deadlockCheckEvent, clockEdge(m_deadlock_threshold));
174 }
175
176 Addr line_addr = makeLineAddress(pkt->getAddr());
177
178 // Check if the line is blocked for a Locked_RMW
179 if (m_controller->isBlocked(line_addr) &&
180 (request_type != RubyRequestType_Locked_RMW_Write)) {
181 // Return that this request's cache line address aliases with
182 // a prior request that locked the cache line. The request cannot
183 // proceed until the cache line is unlocked by a Locked_RMW_Write
184 return RequestStatus_Aliased;
185 }
186
187 // Create a default entry, mapping the address to NULL, the cast is
188 // there to make gcc 4.4 happy
189 RequestTable::value_type default_entry(line_addr,
190 (SequencerRequest*) NULL);
191
192 if ((request_type == RubyRequestType_ST) ||
193 (request_type == RubyRequestType_RMW_Read) ||
194 (request_type == RubyRequestType_RMW_Write) ||
195 (request_type == RubyRequestType_Load_Linked) ||
196 (request_type == RubyRequestType_Store_Conditional) ||
197 (request_type == RubyRequestType_Locked_RMW_Read) ||
198 (request_type == RubyRequestType_Locked_RMW_Write) ||
199 (request_type == RubyRequestType_FLUSH)) {
200
201 // Check if there is any outstanding read request for the same
202 // cache line.
203 if (m_readRequestTable.count(line_addr) > 0) {
204 m_store_waiting_on_load++;
205 return RequestStatus_Aliased;
206 }
207
208 pair<RequestTable::iterator, bool> r =
209 m_writeRequestTable.insert(default_entry);
210 if (r.second) {
211 RequestTable::iterator i = r.first;
212 i->second = new SequencerRequest(pkt, request_type, curCycle());
213 m_outstanding_count++;
214 } else {
215 // There is an outstanding write request for the cache line
216 m_store_waiting_on_store++;
217 return RequestStatus_Aliased;
218 }
219 } else {
220 // Check if there is any outstanding write request for the same
221 // cache line.
222 if (m_writeRequestTable.count(line_addr) > 0) {
223 m_load_waiting_on_store++;
224 return RequestStatus_Aliased;
225 }
226
227 pair<RequestTable::iterator, bool> r =
228 m_readRequestTable.insert(default_entry);
229
230 if (r.second) {
231 RequestTable::iterator i = r.first;
232 i->second = new SequencerRequest(pkt, request_type, curCycle());
233 m_outstanding_count++;
234 } else {
235 // There is an outstanding read request for the cache line
236 m_load_waiting_on_load++;
237 return RequestStatus_Aliased;
238 }
239 }
240
241 m_outstandReqHist.sample(m_outstanding_count);
242 assert(m_outstanding_count ==
243 (m_writeRequestTable.size() + m_readRequestTable.size()));
244
245 return RequestStatus_Ready;
246}
247
248void
249Sequencer::markRemoved()
250{
251 m_outstanding_count--;
252 assert(m_outstanding_count ==
253 m_writeRequestTable.size() + m_readRequestTable.size());
254}
255
256void
257Sequencer::invalidateSC(Addr address)
258{
259 AbstractCacheEntry *e = m_dataCache_ptr->lookup(address);
260 // The controller has lost the coherence permissions, hence the lock
261 // on the cache line maintained by the cache should be cleared.
262 if (e && e->isLocked(m_version)) {
263 e->clearLocked();
264 }
265}
266
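// Resolve LL/SC state for the line when a write-class request completes.
// Returns false only for a Store_Conditional that finds the line no longer
// locked; Load_Linked sets the lock, and ordinary writes clear it.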
267bool
268Sequencer::handleLlsc(Addr address, SequencerRequest* request)
269{
270 AbstractCacheEntry *e = m_dataCache_ptr->lookup(address);
271 if (!e)
272 return true;
273
274 // The success flag indicates whether the LLSC operation was successful.
275 // LL ops will always succeed, but SC may fail if the cache line is no
276 // longer locked.
277 bool success = true;
278 if (request->m_type == RubyRequestType_Store_Conditional) {
279 if (!e->isLocked(m_version)) {
280 //
281 // For failed SC requests, indicate the failure to the cpu by
282 // setting the extra data to zero.
283 //
284 request->pkt->req->setExtraData(0);
285 success = false;
286 } else {
287 //
288 // For successful SC requests, indicate the success to the cpu by
289 // setting the extra data to one.
290 //
291 request->pkt->req->setExtraData(1);
292 }
293 //
294 // Independent of success, all SC operations must clear the lock
295 //
296 e->clearLocked();
297 } else if (request->m_type == RubyRequestType_Load_Linked) {
298 //
299 // Note: To fully follow Alpha LLSC semantics, should the LL clear any
300 // previously locked cache lines?
301 //
302 e->setLocked(m_version);
303 } else if (e->isLocked(m_version)) {
304 //
305 // Normal writes should clear the locked address
306 //
307 e->clearLocked();
308 }
309 return success;
310}
311
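// Despite the name, this samples latency histograms for every demand
// access: overall and per request type, split into hit (local) and miss
// (external) buckets, further broken down by responding machine and by
// the per-hop delay components when the timestamps are consistent.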
312void
313Sequencer::recordMissLatency(const Cycles cycles, const RubyRequestType type,
314 const MachineType respondingMach,
315 bool isExternalHit, Cycles issuedTime,
316 Cycles initialRequestTime,
317 Cycles forwardRequestTime,
318 Cycles firstResponseTime, Cycles completionTime)
319{
320 m_latencyHist.sample(cycles);
321 m_typeLatencyHist[type]->sample(cycles);
322
323 if (isExternalHit) {
324 m_missLatencyHist.sample(cycles);
325 m_missTypeLatencyHist[type]->sample(cycles);
326
327 if (respondingMach != MachineType_NUM) {
328 m_missMachLatencyHist[respondingMach]->sample(cycles);
329 m_missTypeMachLatencyHist[type][respondingMach]->sample(cycles);
330
331 if ((issuedTime <= initialRequestTime) &&
332 (initialRequestTime <= forwardRequestTime) &&
333 (forwardRequestTime <= firstResponseTime) &&
334 (firstResponseTime <= completionTime)) {
335
336 m_IssueToInitialDelayHist[respondingMach]->sample(
337 initialRequestTime - issuedTime);
338 m_InitialToForwardDelayHist[respondingMach]->sample(
339 forwardRequestTime - initialRequestTime);
340 m_ForwardToFirstResponseDelayHist[respondingMach]->sample(
341 firstResponseTime - forwardRequestTime);
342 m_FirstResponseToCompletionDelayHist[respondingMach]->sample(
343 completionTime - firstResponseTime);
344 } else {
345 m_IncompleteTimes[respondingMach]++;
346 }
347 }
348 } else {
349 m_hitLatencyHist.sample(cycles);
350 m_hitTypeLatencyHist[type]->sample(cycles);
351
352 if (respondingMach != MachineType_NUM) {
353 m_hitMachLatencyHist[respondingMach]->sample(cycles);
354 m_hitTypeMachLatencyHist[type][respondingMach]->sample(cycles);
355 }
356 }
357}
358
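// Completion callback for write-class requests. Removes the entry from
// the write request table, resolves LL/SC state (except in Garnet
// standalone mode), manages the SLICC block/unblock protocol around
// Locked_RMW pairs, and finally hands the result to hitCallback.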
359void
360Sequencer::writeCallback(Addr address, DataBlock& data,
361 const bool externalHit, const MachineType mach,
362 const Cycles initialRequestTime,
363 const Cycles forwardRequestTime,
364 const Cycles firstResponseTime)
365{
366 assert(address == makeLineAddress(address));
367 assert(m_writeRequestTable.count(makeLineAddress(address)));
368
369 RequestTable::iterator i = m_writeRequestTable.find(address);
370 assert(i != m_writeRequestTable.end());
371 SequencerRequest* request = i->second;
372
373 m_writeRequestTable.erase(i);
374 markRemoved();
375
376 assert((request->m_type == RubyRequestType_ST) ||
377 (request->m_type == RubyRequestType_ATOMIC) ||
378 (request->m_type == RubyRequestType_RMW_Read) ||
379 (request->m_type == RubyRequestType_RMW_Write) ||
380 (request->m_type == RubyRequestType_Load_Linked) ||
381 (request->m_type == RubyRequestType_Store_Conditional) ||
382 (request->m_type == RubyRequestType_Locked_RMW_Read) ||
383 (request->m_type == RubyRequestType_Locked_RMW_Write) ||
384 (request->m_type == RubyRequestType_FLUSH));
385
386 //
387 // For Alpha, properly handle LL, SC, and write requests with respect to
388 // locked cache blocks.
389 //
 390 // Not valid for the Garnet_standalone protocol
391 //
392 bool success = true;
393 if (!m_runningGarnetStandalone)
394 success = handleLlsc(address, request);
395
396 // Handle SLICC block_on behavior for Locked_RMW accesses. NOTE: the
397 // address variable here is assumed to be a line address, so when
398 // blocking buffers, must check line addresses.
399 if (request->m_type == RubyRequestType_Locked_RMW_Read) {
400 // blockOnQueue blocks all first-level cache controller queues
401 // waiting on memory accesses for the specified address that go to
402 // the specified queue. In this case, a Locked_RMW_Write must go to
403 // the mandatory_q before unblocking the first-level controller.
404 // This will block standard loads, stores, ifetches, etc.
405 m_controller->blockOnQueue(address, m_mandatory_q_ptr);
406 } else if (request->m_type == RubyRequestType_Locked_RMW_Write) {
407 m_controller->unblock(address);
408 }
409
410 hitCallback(request, data, success, mach, externalHit,
411 initialRequestTime, forwardRequestTime, firstResponseTime);
412}
413
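// Completion callback for LD and IFETCH requests; mirrors writeCallback
// without the LL/SC and Locked_RMW handling.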
414void
415Sequencer::readCallback(Addr address, DataBlock& data,
416 bool externalHit, const MachineType mach,
417 Cycles initialRequestTime,
418 Cycles forwardRequestTime,
419 Cycles firstResponseTime)
420{
421 assert(address == makeLineAddress(address));
422 assert(m_readRequestTable.count(makeLineAddress(address)));
423
424 RequestTable::iterator i = m_readRequestTable.find(address);
425 assert(i != m_readRequestTable.end());
426 SequencerRequest* request = i->second;
427
428 m_readRequestTable.erase(i);
429 markRemoved();
430
431 assert((request->m_type == RubyRequestType_LD) ||
432 (request->m_type == RubyRequestType_IFETCH));
433
434 hitCallback(request, data, true, mach, externalHit,
435 initialRequestTime, forwardRequestTime, firstResponseTime);
436}
437
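// Common completion path for reads and writes: records latency, copies
// data between the DataBlock and the packet (the direction depends on the
// request type), updates the RubyTester's sender state if present, and,
// during cache warmup/cooldown, deletes the packet and triggers the cache
// recorder's next request; otherwise it completes the access through
// ruby_hit_callback.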
438void
439Sequencer::hitCallback(SequencerRequest* srequest, DataBlock& data,
440 bool llscSuccess,
441 const MachineType mach, const bool externalHit,
442 const Cycles initialRequestTime,
443 const Cycles forwardRequestTime,
444 const Cycles firstResponseTime)
445{
446 warn_once("Replacement policy updates recently became the responsibility "
447 "of SLICC state machines. Make sure to setMRU() near callbacks "
448 "in .sm files!");
449
450 PacketPtr pkt = srequest->pkt;
451 Addr request_address(pkt->getAddr());
452 RubyRequestType type = srequest->m_type;
453 Cycles issued_time = srequest->issue_time;
454
455 assert(curCycle() >= issued_time);
456 Cycles total_latency = curCycle() - issued_time;
457
458 // Profile the latency for all demand accesses.
459 recordMissLatency(total_latency, type, mach, externalHit, issued_time,
460 initialRequestTime, forwardRequestTime,
461 firstResponseTime, curCycle());
462
463 DPRINTFR(ProtocolTrace, "%15s %3s %10s%20s %6s>%-6s %#x %d cycles\n",
464 curTick(), m_version, "Seq",
465 llscSuccess ? "Done" : "SC_Failed", "", "",
466 printAddress(request_address), total_latency);
467
468 // update the data unless it is a non-data-carrying flush
469 if (RubySystem::getWarmupEnabled()) {
470 data.setData(pkt->getConstPtr<uint8_t>(),
471 getOffset(request_address), pkt->getSize());
472 } else if (!pkt->isFlush()) {
473 if ((type == RubyRequestType_LD) ||
474 (type == RubyRequestType_IFETCH) ||
475 (type == RubyRequestType_RMW_Read) ||
476 (type == RubyRequestType_Locked_RMW_Read) ||
477 (type == RubyRequestType_Load_Linked)) {
478 memcpy(pkt->getPtr<uint8_t>(),
479 data.getData(getOffset(request_address), pkt->getSize()),
480 pkt->getSize());
481 DPRINTF(RubySequencer, "read data %s\n", data);
482 } else if (pkt->req->isSwap()) {
483 std::vector<uint8_t> overwrite_val(pkt->getSize());
484 memcpy(&overwrite_val[0], pkt->getConstPtr<uint8_t>(),
485 pkt->getSize());
486 memcpy(pkt->getPtr<uint8_t>(),
487 data.getData(getOffset(request_address), pkt->getSize()),
488 pkt->getSize());
489 data.setData(&overwrite_val[0],
490 getOffset(request_address), pkt->getSize());
491 DPRINTF(RubySequencer, "swap data %s\n", data);
492 } else if (type != RubyRequestType_Store_Conditional || llscSuccess) {
493 // Types of stores set the actual data here, apart from
494 // failed Store Conditional requests
495 data.setData(pkt->getConstPtr<uint8_t>(),
496 getOffset(request_address), pkt->getSize());
497 DPRINTF(RubySequencer, "set data %s\n", data);
498 }
499 }
500
501 // If using the RubyTester, update the RubyTester sender state's
 502 // subBlock with the received data. The tester will later access
503 // this state.
504 if (m_usingRubyTester) {
505 DPRINTF(RubySequencer, "hitCallback %s 0x%x using RubyTester\n",
506 pkt->cmdString(), pkt->getAddr());
507 RubyTester::SenderState* testerSenderState =
508 pkt->findNextSenderState<RubyTester::SenderState>();
509 assert(testerSenderState);
510 testerSenderState->subBlock.mergeFrom(data);
511 }
512
513 delete srequest;
514
515 RubySystem *rs = m_ruby_system;
516 if (RubySystem::getWarmupEnabled()) {
517 assert(pkt->req);
518 delete pkt->req;
519 delete pkt;
520 rs->m_cache_recorder->enqueueNextFetchRequest();
521 } else if (RubySystem::getCooldownEnabled()) {
522 delete pkt;
523 rs->m_cache_recorder->enqueueNextFlushRequest();
524 } else {
525 ruby_hit_callback(pkt);
526 testDrainComplete();
527 }
528}
529
530bool
531Sequencer::empty() const
532{
533 return m_writeRequestTable.empty() && m_readRequestTable.empty();
534}
535
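// Entry point used by RubyPort. Rejects the packet if the sequencer is
// already at m_max_outstanding_requests, classifies it into primary and
// secondary RubyRequestTypes, inserts it into a request table, and, if
// that succeeds, issues it to the cache controller.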
536RequestStatus
537Sequencer::makeRequest(PacketPtr pkt)
538{
539 if (m_outstanding_count >= m_max_outstanding_requests) {
540 return RequestStatus_BufferFull;
541 }
542
543 RubyRequestType primary_type = RubyRequestType_NULL;
544 RubyRequestType secondary_type = RubyRequestType_NULL;
545
546 if (pkt->isLLSC()) {
547 //
548 // Alpha LL/SC instructions need to be handled carefully by the cache
549 // coherence protocol to ensure they follow the proper semantics. In
550 // particular, by identifying the operations as atomic, the protocol
551 // should understand that migratory sharing optimizations should not
552 // be performed (i.e. a load between the LL and SC should not steal
553 // away exclusive permission).
554 //
555 if (pkt->isWrite()) {
556 DPRINTF(RubySequencer, "Issuing SC\n");
557 primary_type = RubyRequestType_Store_Conditional;
558 } else {
559 DPRINTF(RubySequencer, "Issuing LL\n");
560 assert(pkt->isRead());
561 primary_type = RubyRequestType_Load_Linked;
562 }
563 secondary_type = RubyRequestType_ATOMIC;
564 } else if (pkt->req->isLockedRMW()) {
565 //
566 // x86 locked instructions are translated to store cache coherence
567 // requests because these requests should always be treated as read
568 // exclusive operations and should leverage any migratory sharing
569 // optimization built into the protocol.
570 //
571 if (pkt->isWrite()) {
572 DPRINTF(RubySequencer, "Issuing Locked RMW Write\n");
573 primary_type = RubyRequestType_Locked_RMW_Write;
574 } else {
575 DPRINTF(RubySequencer, "Issuing Locked RMW Read\n");
576 assert(pkt->isRead());
577 primary_type = RubyRequestType_Locked_RMW_Read;
578 }
579 secondary_type = RubyRequestType_ST;
580 } else {
581 //
582 // To support SwapReq, we need to check isWrite() first: a SwapReq
583 // should always be treated like a write, but since a SwapReq implies
584 // both isWrite() and isRead() are true, check isWrite() first here.
585 //
586 if (pkt->isWrite()) {
587 //
588 // Note: M5 packets do not differentiate ST from RMW_Write
589 //
590 primary_type = secondary_type = RubyRequestType_ST;
591 } else if (pkt->isRead()) {
592 if (pkt->req->isInstFetch()) {
593 primary_type = secondary_type = RubyRequestType_IFETCH;
594 } else {
595 bool storeCheck = false;
 596 // Only x86 needs the store check
597 if (system->getArch() == Arch::X86ISA) {
598 uint32_t flags = pkt->req->getFlags();
599 storeCheck = flags &
600 (X86ISA::StoreCheck << X86ISA::FlagShift);
601 }
602 if (storeCheck) {
603 primary_type = RubyRequestType_RMW_Read;
604 secondary_type = RubyRequestType_ST;
605 } else {
606 primary_type = secondary_type = RubyRequestType_LD;
607 }
608 }
609 } else if (pkt->isFlush()) {
610 primary_type = secondary_type = RubyRequestType_FLUSH;
611 } else {
612 panic("Unsupported ruby packet type\n");
613 }
614 }
615
616 RequestStatus status = insertRequest(pkt, primary_type);
617 if (status != RequestStatus_Ready)
618 return status;
619
620 issueRequest(pkt, secondary_type);
621
622 // TODO: issue hardware prefetches here
623 return RequestStatus_Issued;
624}
625
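// Build a RubyRequest message for the packet and enqueue it on the
// mandatory queue, charging the modeled L1 instruction- or data-cache
// hit latency up front.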
626void
627Sequencer::issueRequest(PacketPtr pkt, RubyRequestType secondary_type)
628{
629 assert(pkt != NULL);
630 ContextID proc_id = pkt->req->hasContextId() ?
631 pkt->req->contextId() : InvalidContextID;
632
633 ContextID core_id = coreId();
634
635 // If valid, copy the pc to the ruby request
636 Addr pc = 0;
637 if (pkt->req->hasPC()) {
638 pc = pkt->req->getPC();
639 }
640
 641 // Check if the packet has data; prefetch and flush requests, for
 642 // example, do not carry any.
643 std::shared_ptr<RubyRequest> msg =
644 std::make_shared<RubyRequest>(clockEdge(), pkt->getAddr(),
645 pkt->isFlush() ?
646 nullptr : pkt->getPtr<uint8_t>(),
647 pkt->getSize(), pc, secondary_type,
648 RubyAccessMode_Supervisor, pkt,
649 PrefetchBit_No, proc_id, core_id);
650
651 DPRINTFR(ProtocolTrace, "%15s %3s %10s%20s %6s>%-6s %#x %s\n",
652 curTick(), m_version, "Seq", "Begin", "", "",
653 printAddress(msg->getPhysicalAddress()),
654 RubyRequestType_to_string(secondary_type));
655
656 // The Sequencer currently assesses instruction and data cache hit latency
657 // for the top-level caches at the beginning of a memory access.
658 // TODO: Eventually, this latency should be moved to represent the actual
659 // cache access latency portion of the memory access. This will require
660 // changing cache controller protocol files to assess the latency on the
661 // access response path.
662 Cycles latency(0); // Initialize to zero to catch misconfigured latency
663 if (secondary_type == RubyRequestType_IFETCH)
664 latency = m_inst_cache_hit_latency;
665 else
666 latency = m_data_cache_hit_latency;
667
668 // Send the message to the cache controller
669 assert(latency > 0);
670
671 assert(m_mandatory_q_ptr != NULL);
672 m_mandatory_q_ptr->enqueue(msg, clockEdge(), cyclesToTicks(latency));
673}
674
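// Debug helper used by print(): writes an unordered_map (here, a request
// table) as "[ key=value ... ]".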
675template <class KEY, class VALUE>
676std::ostream &
677operator<<(ostream &out, const std::unordered_map<KEY, VALUE> &map)
678{
679 auto i = map.begin();
680 auto end = map.end();
681
682 out << "[";
683 for (; i != end; ++i)
684 out << " " << i->first << "=" << i->second;
685 out << " ]";
686
687 return out;
688}
689
690void
691Sequencer::print(ostream& out) const
692{
693 out << "[Sequencer: " << m_version
694 << ", outstanding requests: " << m_outstanding_count
695 << ", read request table: " << m_readRequestTable
696 << ", write request table: " << m_writeRequestTable
697 << "]";
698}
699
 700 // This can be called from setState whenever coherence permissions are
 701 // upgraded; when invoked, coherence violations will be checked for the
 702 // given block.
703void
704Sequencer::checkCoherence(Addr addr)
705{
706#ifdef CHECK_COHERENCE
707 m_ruby_system->checkGlobalCoherenceInvariant(addr);
708#endif
709}
710
711void
712Sequencer::recordRequestType(SequencerRequestType requestType) {
713 DPRINTF(RubyStats, "Recorded statistic: %s\n",
714 SequencerRequestType_to_string(requestType));
715}
716
717
718void
719Sequencer::evictionCallback(Addr address)
720{
721 ruby_eviction_callback(address);
722}
723
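// Register statistics and allocate the per-type and per-machine latency
// histograms that recordMissLatency samples.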
724void
725Sequencer::regStats()
726{
727 RubyPort::regStats();
728
729 m_store_waiting_on_load
730 .name(name() + ".store_waiting_on_load")
731 .desc("Number of times a store aliased with a pending load")
732 .flags(Stats::nozero);
733 m_store_waiting_on_store
734 .name(name() + ".store_waiting_on_store")
735 .desc("Number of times a store aliased with a pending store")
736 .flags(Stats::nozero);
737 m_load_waiting_on_load
738 .name(name() + ".load_waiting_on_load")
739 .desc("Number of times a load aliased with a pending load")
740 .flags(Stats::nozero);
741 m_load_waiting_on_store
742 .name(name() + ".load_waiting_on_store")
743 .desc("Number of times a load aliased with a pending store")
744 .flags(Stats::nozero);
745
746 // These statistical variables are not for display.
747 // The profiler will collate these across different
748 // sequencers and display those collated statistics.
749 m_outstandReqHist.init(10);
750 m_latencyHist.init(10);
751 m_hitLatencyHist.init(10);
752 m_missLatencyHist.init(10);
753
754 for (int i = 0; i < RubyRequestType_NUM; i++) {
755 m_typeLatencyHist.push_back(new Stats::Histogram());
756 m_typeLatencyHist[i]->init(10);
757
758 m_hitTypeLatencyHist.push_back(new Stats::Histogram());
759 m_hitTypeLatencyHist[i]->init(10);
760
761 m_missTypeLatencyHist.push_back(new Stats::Histogram());
762 m_missTypeLatencyHist[i]->init(10);
763 }
764
765 for (int i = 0; i < MachineType_NUM; i++) {
766 m_hitMachLatencyHist.push_back(new Stats::Histogram());
767 m_hitMachLatencyHist[i]->init(10);
768
769 m_missMachLatencyHist.push_back(new Stats::Histogram());
770 m_missMachLatencyHist[i]->init(10);
771
772 m_IssueToInitialDelayHist.push_back(new Stats::Histogram());
773 m_IssueToInitialDelayHist[i]->init(10);
774
775 m_InitialToForwardDelayHist.push_back(new Stats::Histogram());
776 m_InitialToForwardDelayHist[i]->init(10);
777
778 m_ForwardToFirstResponseDelayHist.push_back(new Stats::Histogram());
779 m_ForwardToFirstResponseDelayHist[i]->init(10);
780
781 m_FirstResponseToCompletionDelayHist.push_back(new Stats::Histogram());
782 m_FirstResponseToCompletionDelayHist[i]->init(10);
783 }
784
785 for (int i = 0; i < RubyRequestType_NUM; i++) {
786 m_hitTypeMachLatencyHist.push_back(std::vector<Stats::Histogram *>());
787 m_missTypeMachLatencyHist.push_back(std::vector<Stats::Histogram *>());
788
789 for (int j = 0; j < MachineType_NUM; j++) {
790 m_hitTypeMachLatencyHist[i].push_back(new Stats::Histogram());
791 m_hitTypeMachLatencyHist[i][j]->init(10);
792
793 m_missTypeMachLatencyHist[i].push_back(new Stats::Histogram());
794 m_missTypeMachLatencyHist[i][j]->init(10);
795 }
796 }
797}