Cross Reference: /gem5/src/mem/ruby/system/Sequencer.cc

Deleted Added

sdiff udiff text old ( 6151:bc6b84108443 ) new ( 6152:705b277e1141 )

full compact

Sequencer.cc (6151:bc6b84108443)	Sequencer.cc (6152:705b277e1141)
1 2/* 3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 4 * All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions are 8 * met: redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer; 10 * redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution; 13 * neither the name of the copyright holders nor the names of its 14 * contributors may be used to endorse or promote products derived from 15 * this software without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 28 / 29 30/ 31 * $Id: Sequencer.C 1.131 2006/11/06 17:41:01-06:00 bobba@gratiano.cs.wisc.edu $ 32 * 33 */ 34 35#include "Global.hh" 36#include "Sequencer.hh" 37#include "System.hh" 38#include "Protocol.hh" 39#include "Profiler.hh" 40#include "CacheMemory.hh" 41#include "RubyConfig.hh" 42//#include "Tracer.hh" 43#include "AbstractChip.hh" 44#include "Chip.hh" 45#include "Tester.hh" 46#include "SubBlock.hh" 47#include "Protocol.hh" 48#include "Map.hh" 49#include "interface.hh"	1 2/* 3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 4 * All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions are 8 * met: redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer; 10 * redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution; 13 * neither the name of the copyright holders nor the names of its 14 * contributors may be used to endorse or promote products derived from 15 * this software without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 28 / 29 30/ 31 * $Id: Sequencer.C 1.131 2006/11/06 17:41:01-06:00 bobba@gratiano.cs.wisc.edu $ 32 * 33 */ 34 35#include "Global.hh" 36#include "Sequencer.hh" 37#include "System.hh" 38#include "Protocol.hh" 39#include "Profiler.hh" 40#include "CacheMemory.hh" 41#include "RubyConfig.hh" 42//#include "Tracer.hh" 43#include "AbstractChip.hh" 44#include "Chip.hh" 45#include "Tester.hh" 46#include "SubBlock.hh" 47#include "Protocol.hh" 48#include "Map.hh" 49#include "interface.hh"
50//#include "XactCommitArbiter.hh" 51// #include "TransactionInterfaceManager.hh" 52//#include "TransactionVersionManager.hh" 53//#include "LazyTransactionVersionManager.hh"
54	50
55//#define XACT_MGR g_system_ptr->getChip(m_chip_ptr->getID())->getTransactionInterfaceManager(m_version) 56
57Sequencer::Sequencer(AbstractChip* chip_ptr, int version) { 58 m_chip_ptr = chip_ptr; 59 m_version = version; 60 61 m_deadlock_check_scheduled = false; 62 m_outstanding_count = 0; 63 64 int smt_threads = RubyConfig::numberofSMTThreads(); 65 m_writeRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 66 m_readRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 67 68 for(int p=0; p < smt_threads; ++p){ 69 m_writeRequestTable_ptr[p] = new Map<Address, CacheMsg>; 70 m_readRequestTable_ptr[p] = new Map<Address, CacheMsg>; 71 } 72 73} 74 75Sequencer::~Sequencer() { 76 int smt_threads = RubyConfig::numberofSMTThreads(); 77 for(int i=0; i < smt_threads; ++i){ 78 if(m_writeRequestTable_ptr[i]){ 79 delete m_writeRequestTable_ptr[i]; 80 } 81 if(m_readRequestTable_ptr[i]){ 82 delete m_readRequestTable_ptr[i]; 83 } 84 } 85 if(m_writeRequestTable_ptr){ 86 delete [] m_writeRequestTable_ptr; 87 } 88 if(m_readRequestTable_ptr){ 89 delete [] m_readRequestTable_ptr; 90 } 91} 92 93void Sequencer::wakeup() { 94 // Check for deadlock of any of the requests 95 Time current_time = g_eventQueue_ptr->getTime(); 96 bool deadlock = false; 97 98 // Check across all outstanding requests 99 int smt_threads = RubyConfig::numberofSMTThreads(); 100 int total_outstanding = 0; 101 for(int p=0; p < smt_threads; ++p){ 102 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 103 for (int i=0; i<keys.size(); i++) { 104 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 105 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 106 WARN_MSG("Possible Deadlock detected"); 107 WARN_EXPR(request); 108 WARN_EXPR(m_chip_ptr->getID()); 109 WARN_EXPR(m_version); 110 WARN_EXPR(keys.size()); 111 WARN_EXPR(current_time); 112 WARN_EXPR(request.getTime()); 113 WARN_EXPR(current_time - request.getTime()); 114 WARN_EXPR(m_readRequestTable_ptr[p]); 115* ERROR_MSG("Aborting"); 116 deadlock = true; 117 } 118 } 119 120 keys = m_writeRequestTable_ptr[p]->keys(); 121 for (int i=0; i<keys.size(); i++) { 122 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 123 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 124 WARN_MSG("Possible Deadlock detected"); 125 WARN_EXPR(request); 126 WARN_EXPR(m_chip_ptr->getID()); 127 WARN_EXPR(m_version); 128 WARN_EXPR(current_time); 129 WARN_EXPR(request.getTime()); 130 WARN_EXPR(current_time - request.getTime()); 131 WARN_EXPR(keys.size()); 132 WARN_EXPR(m_writeRequestTable_ptr[p]); 133* ERROR_MSG("Aborting"); 134 deadlock = true; 135 } 136 } 137 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 138 } // across all request tables 139 assert(m_outstanding_count == total_outstanding); 140 141 if (m_outstanding_count > 0) { // If there are still outstanding requests, keep checking 142 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 143 } else { 144 m_deadlock_check_scheduled = false; 145 } 146} 147 148//returns the total number of requests 149int Sequencer::getNumberOutstanding(){ 150 return m_outstanding_count; 151} 152 153// returns the total number of demand requests 154int Sequencer::getNumberOutstandingDemand(){ 155 int smt_threads = RubyConfig::numberofSMTThreads(); 156 int total_demand = 0; 157 for(int p=0; p < smt_threads; ++p){ 158 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 159 for (int i=0; i< keys.size(); i++) { 160 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]);	51Sequencer::Sequencer(AbstractChip* chip_ptr, int version) { 52 m_chip_ptr = chip_ptr; 53 m_version = version; 54 55 m_deadlock_check_scheduled = false; 56 m_outstanding_count = 0; 57 58 int smt_threads = RubyConfig::numberofSMTThreads(); 59 m_writeRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 60 m_readRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 61 62 for(int p=0; p < smt_threads; ++p){ 63 m_writeRequestTable_ptr[p] = new Map<Address, CacheMsg>; 64 m_readRequestTable_ptr[p] = new Map<Address, CacheMsg>; 65 } 66 67} 68 69Sequencer::~Sequencer() { 70 int smt_threads = RubyConfig::numberofSMTThreads(); 71 for(int i=0; i < smt_threads; ++i){ 72 if(m_writeRequestTable_ptr[i]){ 73 delete m_writeRequestTable_ptr[i]; 74 } 75 if(m_readRequestTable_ptr[i]){ 76 delete m_readRequestTable_ptr[i]; 77 } 78 } 79 if(m_writeRequestTable_ptr){ 80 delete [] m_writeRequestTable_ptr; 81 } 82 if(m_readRequestTable_ptr){ 83 delete [] m_readRequestTable_ptr; 84 } 85} 86 87void Sequencer::wakeup() { 88 // Check for deadlock of any of the requests 89 Time current_time = g_eventQueue_ptr->getTime(); 90 bool deadlock = false; 91 92 // Check across all outstanding requests 93 int smt_threads = RubyConfig::numberofSMTThreads(); 94 int total_outstanding = 0; 95 for(int p=0; p < smt_threads; ++p){ 96 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 97 for (int i=0; i<keys.size(); i++) { 98 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 99 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 100 WARN_MSG("Possible Deadlock detected"); 101 WARN_EXPR(request); 102 WARN_EXPR(m_chip_ptr->getID()); 103 WARN_EXPR(m_version); 104 WARN_EXPR(keys.size()); 105 WARN_EXPR(current_time); 106 WARN_EXPR(request.getTime()); 107 WARN_EXPR(current_time - request.getTime()); 108 WARN_EXPR(m_readRequestTable_ptr[p]); 109* ERROR_MSG("Aborting"); 110 deadlock = true; 111 } 112 } 113 114 keys = m_writeRequestTable_ptr[p]->keys(); 115 for (int i=0; i<keys.size(); i++) { 116 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 117 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 118 WARN_MSG("Possible Deadlock detected"); 119 WARN_EXPR(request); 120 WARN_EXPR(m_chip_ptr->getID()); 121 WARN_EXPR(m_version); 122 WARN_EXPR(current_time); 123 WARN_EXPR(request.getTime()); 124 WARN_EXPR(current_time - request.getTime()); 125 WARN_EXPR(keys.size()); 126 WARN_EXPR(m_writeRequestTable_ptr[p]); 127* ERROR_MSG("Aborting"); 128 deadlock = true; 129 } 130 } 131 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 132 } // across all request tables 133 assert(m_outstanding_count == total_outstanding); 134 135 if (m_outstanding_count > 0) { // If there are still outstanding requests, keep checking 136 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 137 } else { 138 m_deadlock_check_scheduled = false; 139 } 140} 141 142//returns the total number of requests 143int Sequencer::getNumberOutstanding(){ 144 return m_outstanding_count; 145} 146 147// returns the total number of demand requests 148int Sequencer::getNumberOutstandingDemand(){ 149 int smt_threads = RubyConfig::numberofSMTThreads(); 150 int total_demand = 0; 151 for(int p=0; p < smt_threads; ++p){ 152 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 153 for (int i=0; i< keys.size(); i++) { 154 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]);
161 // don't count transactional begin/commit requests 162 if(request.getType() != CacheRequestType_BEGIN_XACT && request.getType() != CacheRequestType_COMMIT_XACT){ 163 if(request.getPrefetch() == PrefetchBit_No){ 164 total_demand++; 165 }	155 if(request.getPrefetch() == PrefetchBit_No){ 156 total_demand++;
166 } 167 } 168 169 keys = m_writeRequestTable_ptr[p]->keys(); 170 for (int i=0; i< keys.size(); i++) { 171 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 172 if(request.getPrefetch() == PrefetchBit_No){ 173 total_demand++; 174 } 175 } 176 } 177 178 return total_demand; 179} 180 181int Sequencer::getNumberOutstandingPrefetch(){ 182 int smt_threads = RubyConfig::numberofSMTThreads(); 183 int total_prefetch = 0; 184 for(int p=0; p < smt_threads; ++p){ 185 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 186 for (int i=0; i< keys.size(); i++) { 187 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 188 if(request.getPrefetch() == PrefetchBit_Yes){ 189 total_prefetch++; 190 } 191 } 192 193 keys = m_writeRequestTable_ptr[p]->keys(); 194 for (int i=0; i< keys.size(); i++) { 195 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 196 if(request.getPrefetch() == PrefetchBit_Yes){ 197 total_prefetch++; 198 } 199 } 200 } 201 202 return total_prefetch; 203} 204 205bool Sequencer::isPrefetchRequest(const Address & lineaddr){ 206 int smt_threads = RubyConfig::numberofSMTThreads(); 207 for(int p=0; p < smt_threads; ++p){ 208 // check load requests 209 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 210 for (int i=0; i< keys.size(); i++) { 211 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 212 if(line_address(request.getAddress()) == lineaddr){ 213 if(request.getPrefetch() == PrefetchBit_Yes){ 214 return true; 215 } 216 else{ 217 return false; 218 } 219 } 220 } 221 222 // check store requests 223 keys = m_writeRequestTable_ptr[p]->keys(); 224 for (int i=0; i< keys.size(); i++) { 225 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 226 if(line_address(request.getAddress()) == lineaddr){ 227 if(request.getPrefetch() == PrefetchBit_Yes){ 228 return true; 229 } 230 else{ 231 return false; 232 } 233 } 234 } 235 } 236 // we should've found a matching request 237 cout << "isRequestPrefetch() ERROR request NOT FOUND : " << lineaddr << endl; 238 printProgress(cout); 239 assert(0); 240} 241 242AccessModeType Sequencer::getAccessModeOfRequest(Address addr, int thread){ 243 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 244 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 245 return request.getAccessMode(); 246 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 247 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 248 return request.getAccessMode(); 249 } else { 250 printProgress(cout); 251 ERROR_MSG("Request not found in RequestTables"); 252 } 253} 254 255Address Sequencer::getLogicalAddressOfRequest(Address addr, int thread){ 256 assert(thread >= 0); 257 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 258 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 259 return request.getLogicalAddress(); 260 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 261 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 262 return request.getLogicalAddress(); 263 } else { 264 printProgress(cout); 265 WARN_MSG("Request not found in RequestTables"); 266 WARN_MSG(addr); 267 WARN_MSG(thread); 268 ASSERT(0); 269 } 270} 271 272// returns the ThreadID of the request 273int Sequencer::getRequestThreadID(const Address & addr){ 274 int smt_threads = RubyConfig::numberofSMTThreads(); 275 int thread = -1; 276 int num_found = 0; 277 for(int p=0; p < smt_threads; ++p){ 278 if(m_readRequestTable_ptr[p]->exist(addr)){ 279 num_found++; 280 thread = p; 281 } 282 if(m_writeRequestTable_ptr[p]->exist(addr)){ 283 num_found++; 284 thread = p; 285 } 286 } 287 if(num_found != 1){ 288 cout << "getRequestThreadID ERROR too many matching requests addr = " << addr << endl; 289 printProgress(cout); 290 } 291 ASSERT(num_found == 1); 292 ASSERT(thread != -1); 293 294 return thread; 295} 296 297// given a line address, return the request's physical address 298Address Sequencer::getRequestPhysicalAddress(const Address & lineaddr){ 299 int smt_threads = RubyConfig::numberofSMTThreads(); 300 Address physaddr; 301 int num_found = 0; 302 for(int p=0; p < smt_threads; ++p){ 303 if(m_readRequestTable_ptr[p]->exist(lineaddr)){ 304 num_found++; 305 physaddr = (m_readRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 306 } 307 if(m_writeRequestTable_ptr[p]->exist(lineaddr)){ 308 num_found++; 309 physaddr = (m_writeRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 310 } 311 } 312 if(num_found != 1){ 313 cout << "getRequestPhysicalAddress ERROR too many matching requests addr = " << lineaddr << endl; 314 printProgress(cout); 315 } 316 ASSERT(num_found == 1); 317 318 return physaddr; 319} 320 321void Sequencer::printProgress(ostream& out) const{ 322 323 int total_demand = 0; 324 out << "Sequencer Stats Version " << m_version << endl; 325 out << "Current time = " << g_eventQueue_ptr->getTime() << endl; 326 out << "---------------" << endl; 327 out << "outstanding requests" << endl; 328 329 int smt_threads = RubyConfig::numberofSMTThreads(); 330 for(int p=0; p < smt_threads; ++p){ 331 Vector<Address> rkeys = m_readRequestTable_ptr[p]->keys(); 332 int read_size = rkeys.size(); 333 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Read Requests = " << read_size << endl; 334 // print the request table 335 for(int i=0; i < read_size; ++i){ 336 CacheMsg & request = m_readRequestTable_ptr[p]->lookup(rkeys[i]); 337 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << rkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 338 if( request.getPrefetch() == PrefetchBit_No ){ 339 total_demand++; 340 } 341 } 342 343 Vector<Address> wkeys = m_writeRequestTable_ptr[p]->keys(); 344 int write_size = wkeys.size(); 345 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Write Requests = " << write_size << endl; 346 // print the request table 347 for(int i=0; i < write_size; ++i){ 348 CacheMsg & request = m_writeRequestTable_ptr[p]->lookup(wkeys[i]); 349 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << wkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 350 if( request.getPrefetch() == PrefetchBit_No ){ 351 total_demand++; 352 } 353 } 354 355 out << endl; 356 } 357 out << "Total Number Outstanding: " << m_outstanding_count << endl; 358 out << "Total Number Demand : " << total_demand << endl; 359 out << "Total Number Prefetches : " << m_outstanding_count - total_demand << endl; 360 out << endl; 361 out << endl; 362 363} 364 365void Sequencer::printConfig(ostream& out) { 366 if (TSO) { 367 out << "sequencer: Sequencer - TSO" << endl; 368 } else { 369 out << "sequencer: Sequencer - SC" << endl; 370 } 371 out << " max_outstanding_requests: " << g_SEQUENCER_OUTSTANDING_REQUESTS << endl; 372} 373 374bool Sequencer::empty() const { 375 return m_outstanding_count == 0; 376} 377 378// Insert the request on the correct request table. Return true if 379// the entry was already present. 380bool Sequencer::insertRequest(const CacheMsg& request) { 381 int thread = request.getThreadID(); 382 assert(thread >= 0); 383 int total_outstanding = 0; 384 int smt_threads = RubyConfig::numberofSMTThreads(); 385 for(int p=0; p < smt_threads; ++p){ 386 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 387 } 388 assert(m_outstanding_count == total_outstanding); 389 390 // See if we should schedule a deadlock check 391 if (m_deadlock_check_scheduled == false) { 392 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 393 m_deadlock_check_scheduled = true; 394 } 395 396 if ((request.getType() == CacheRequestType_ST) \|\|	157 } 158 } 159 160 keys = m_writeRequestTable_ptr[p]->keys(); 161 for (int i=0; i< keys.size(); i++) { 162 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 163 if(request.getPrefetch() == PrefetchBit_No){ 164 total_demand++; 165 } 166 } 167 } 168 169 return total_demand; 170} 171 172int Sequencer::getNumberOutstandingPrefetch(){ 173 int smt_threads = RubyConfig::numberofSMTThreads(); 174 int total_prefetch = 0; 175 for(int p=0; p < smt_threads; ++p){ 176 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 177 for (int i=0; i< keys.size(); i++) { 178 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 179 if(request.getPrefetch() == PrefetchBit_Yes){ 180 total_prefetch++; 181 } 182 } 183 184 keys = m_writeRequestTable_ptr[p]->keys(); 185 for (int i=0; i< keys.size(); i++) { 186 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 187 if(request.getPrefetch() == PrefetchBit_Yes){ 188 total_prefetch++; 189 } 190 } 191 } 192 193 return total_prefetch; 194} 195 196bool Sequencer::isPrefetchRequest(const Address & lineaddr){ 197 int smt_threads = RubyConfig::numberofSMTThreads(); 198 for(int p=0; p < smt_threads; ++p){ 199 // check load requests 200 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 201 for (int i=0; i< keys.size(); i++) { 202 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 203 if(line_address(request.getAddress()) == lineaddr){ 204 if(request.getPrefetch() == PrefetchBit_Yes){ 205 return true; 206 } 207 else{ 208 return false; 209 } 210 } 211 } 212 213 // check store requests 214 keys = m_writeRequestTable_ptr[p]->keys(); 215 for (int i=0; i< keys.size(); i++) { 216 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 217 if(line_address(request.getAddress()) == lineaddr){ 218 if(request.getPrefetch() == PrefetchBit_Yes){ 219 return true; 220 } 221 else{ 222 return false; 223 } 224 } 225 } 226 } 227 // we should've found a matching request 228 cout << "isRequestPrefetch() ERROR request NOT FOUND : " << lineaddr << endl; 229 printProgress(cout); 230 assert(0); 231} 232 233AccessModeType Sequencer::getAccessModeOfRequest(Address addr, int thread){ 234 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 235 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 236 return request.getAccessMode(); 237 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 238 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 239 return request.getAccessMode(); 240 } else { 241 printProgress(cout); 242 ERROR_MSG("Request not found in RequestTables"); 243 } 244} 245 246Address Sequencer::getLogicalAddressOfRequest(Address addr, int thread){ 247 assert(thread >= 0); 248 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 249 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 250 return request.getLogicalAddress(); 251 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 252 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 253 return request.getLogicalAddress(); 254 } else { 255 printProgress(cout); 256 WARN_MSG("Request not found in RequestTables"); 257 WARN_MSG(addr); 258 WARN_MSG(thread); 259 ASSERT(0); 260 } 261} 262 263// returns the ThreadID of the request 264int Sequencer::getRequestThreadID(const Address & addr){ 265 int smt_threads = RubyConfig::numberofSMTThreads(); 266 int thread = -1; 267 int num_found = 0; 268 for(int p=0; p < smt_threads; ++p){ 269 if(m_readRequestTable_ptr[p]->exist(addr)){ 270 num_found++; 271 thread = p; 272 } 273 if(m_writeRequestTable_ptr[p]->exist(addr)){ 274 num_found++; 275 thread = p; 276 } 277 } 278 if(num_found != 1){ 279 cout << "getRequestThreadID ERROR too many matching requests addr = " << addr << endl; 280 printProgress(cout); 281 } 282 ASSERT(num_found == 1); 283 ASSERT(thread != -1); 284 285 return thread; 286} 287 288// given a line address, return the request's physical address 289Address Sequencer::getRequestPhysicalAddress(const Address & lineaddr){ 290 int smt_threads = RubyConfig::numberofSMTThreads(); 291 Address physaddr; 292 int num_found = 0; 293 for(int p=0; p < smt_threads; ++p){ 294 if(m_readRequestTable_ptr[p]->exist(lineaddr)){ 295 num_found++; 296 physaddr = (m_readRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 297 } 298 if(m_writeRequestTable_ptr[p]->exist(lineaddr)){ 299 num_found++; 300 physaddr = (m_writeRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 301 } 302 } 303 if(num_found != 1){ 304 cout << "getRequestPhysicalAddress ERROR too many matching requests addr = " << lineaddr << endl; 305 printProgress(cout); 306 } 307 ASSERT(num_found == 1); 308 309 return physaddr; 310} 311 312void Sequencer::printProgress(ostream& out) const{ 313 314 int total_demand = 0; 315 out << "Sequencer Stats Version " << m_version << endl; 316 out << "Current time = " << g_eventQueue_ptr->getTime() << endl; 317 out << "---------------" << endl; 318 out << "outstanding requests" << endl; 319 320 int smt_threads = RubyConfig::numberofSMTThreads(); 321 for(int p=0; p < smt_threads; ++p){ 322 Vector<Address> rkeys = m_readRequestTable_ptr[p]->keys(); 323 int read_size = rkeys.size(); 324 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Read Requests = " << read_size << endl; 325 // print the request table 326 for(int i=0; i < read_size; ++i){ 327 CacheMsg & request = m_readRequestTable_ptr[p]->lookup(rkeys[i]); 328 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << rkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 329 if( request.getPrefetch() == PrefetchBit_No ){ 330 total_demand++; 331 } 332 } 333 334 Vector<Address> wkeys = m_writeRequestTable_ptr[p]->keys(); 335 int write_size = wkeys.size(); 336 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Write Requests = " << write_size << endl; 337 // print the request table 338 for(int i=0; i < write_size; ++i){ 339 CacheMsg & request = m_writeRequestTable_ptr[p]->lookup(wkeys[i]); 340 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << wkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 341 if( request.getPrefetch() == PrefetchBit_No ){ 342 total_demand++; 343 } 344 } 345 346 out << endl; 347 } 348 out << "Total Number Outstanding: " << m_outstanding_count << endl; 349 out << "Total Number Demand : " << total_demand << endl; 350 out << "Total Number Prefetches : " << m_outstanding_count - total_demand << endl; 351 out << endl; 352 out << endl; 353 354} 355 356void Sequencer::printConfig(ostream& out) { 357 if (TSO) { 358 out << "sequencer: Sequencer - TSO" << endl; 359 } else { 360 out << "sequencer: Sequencer - SC" << endl; 361 } 362 out << " max_outstanding_requests: " << g_SEQUENCER_OUTSTANDING_REQUESTS << endl; 363} 364 365bool Sequencer::empty() const { 366 return m_outstanding_count == 0; 367} 368 369// Insert the request on the correct request table. Return true if 370// the entry was already present. 371bool Sequencer::insertRequest(const CacheMsg& request) { 372 int thread = request.getThreadID(); 373 assert(thread >= 0); 374 int total_outstanding = 0; 375 int smt_threads = RubyConfig::numberofSMTThreads(); 376 for(int p=0; p < smt_threads; ++p){ 377 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 378 } 379 assert(m_outstanding_count == total_outstanding); 380 381 // See if we should schedule a deadlock check 382 if (m_deadlock_check_scheduled == false) { 383 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 384 m_deadlock_check_scheduled = true; 385 } 386 387 if ((request.getType() == CacheRequestType_ST) \|\|
397 (request.getType() == CacheRequestType_ST_XACT) \|\| 398 (request.getType() == CacheRequestType_LDX_XACT) \|\|
399 (request.getType() == CacheRequestType_ATOMIC)) { 400 if (m_writeRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 401 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 402 return true; 403 } 404 m_writeRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 405 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 406 m_outstanding_count++; 407 } else { 408 if (m_readRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 409 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 410 return true; 411 } 412 m_readRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 413 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 414 m_outstanding_count++; 415 } 416 417 g_system_ptr->getProfiler()->sequencerRequests(m_outstanding_count); 418 419 total_outstanding = 0; 420 for(int p=0; p < smt_threads; ++p){ 421 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 422 } 423 424 assert(m_outstanding_count == total_outstanding); 425 return false; 426} 427 428void Sequencer::removeRequest(const CacheMsg& request) { 429 int thread = request.getThreadID(); 430 assert(thread >= 0); 431 int total_outstanding = 0; 432 int smt_threads = RubyConfig::numberofSMTThreads(); 433 for(int p=0; p < smt_threads; ++p){ 434 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 435 } 436 assert(m_outstanding_count == total_outstanding); 437 438 if ((request.getType() == CacheRequestType_ST) \|\|	388 (request.getType() == CacheRequestType_ATOMIC)) { 389 if (m_writeRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 390 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 391 return true; 392 } 393 m_writeRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 394 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 395 m_outstanding_count++; 396 } else { 397 if (m_readRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 398 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 399 return true; 400 } 401 m_readRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 402 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 403 m_outstanding_count++; 404 } 405 406 g_system_ptr->getProfiler()->sequencerRequests(m_outstanding_count); 407 408 total_outstanding = 0; 409 for(int p=0; p < smt_threads; ++p){ 410 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 411 } 412 413 assert(m_outstanding_count == total_outstanding); 414 return false; 415} 416 417void Sequencer::removeRequest(const CacheMsg& request) { 418 int thread = request.getThreadID(); 419 assert(thread >= 0); 420 int total_outstanding = 0; 421 int smt_threads = RubyConfig::numberofSMTThreads(); 422 for(int p=0; p < smt_threads; ++p){ 423 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 424 } 425 assert(m_outstanding_count == total_outstanding); 426 427 if ((request.getType() == CacheRequestType_ST) \|\|
439 (request.getType() == CacheRequestType_ST_XACT) \|\| 440 (request.getType() == CacheRequestType_LDX_XACT) \|\|
441 (request.getType() == CacheRequestType_ATOMIC)) { 442 m_writeRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 443 } else { 444 m_readRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 445 } 446 m_outstanding_count--; 447 448 total_outstanding = 0; 449 for(int p=0; p < smt_threads; ++p){ 450 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 451 } 452 assert(m_outstanding_count == total_outstanding); 453} 454 455void Sequencer::writeCallback(const Address& address) { 456 DataBlock data; 457 writeCallback(address, data); 458} 459 460void Sequencer::writeCallback(const Address& address, DataBlock& data) { 461 // process oldest thread first 462 int thread = -1; 463 Time oldest_time = 0; 464 int smt_threads = RubyConfig::numberofSMTThreads(); 465 for(int t=0; t < smt_threads; ++t){ 466 if(m_writeRequestTable_ptr[t]->exist(address)){ 467 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 468 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 469 thread = t; 470 oldest_time = request.getTime(); 471 } 472 } 473 } 474 // make sure we found an oldest thread 475 ASSERT(thread != -1); 476 477 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 478 479 writeCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 480} 481 482void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 483 484 assert(address == line_address(address)); 485 assert(thread >= 0); 486 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 487 488 writeCallback(address, data, respondingMach, thread); 489 490} 491 492void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 493 assert(address == line_address(address)); 494 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 495 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 496 assert( request.getThreadID() == thread); 497 removeRequest(request); 498 499 assert((request.getType() == CacheRequestType_ST) \|\|	428 (request.getType() == CacheRequestType_ATOMIC)) { 429 m_writeRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 430 } else { 431 m_readRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 432 } 433 m_outstanding_count--; 434 435 total_outstanding = 0; 436 for(int p=0; p < smt_threads; ++p){ 437 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 438 } 439 assert(m_outstanding_count == total_outstanding); 440} 441 442void Sequencer::writeCallback(const Address& address) { 443 DataBlock data; 444 writeCallback(address, data); 445} 446 447void Sequencer::writeCallback(const Address& address, DataBlock& data) { 448 // process oldest thread first 449 int thread = -1; 450 Time oldest_time = 0; 451 int smt_threads = RubyConfig::numberofSMTThreads(); 452 for(int t=0; t < smt_threads; ++t){ 453 if(m_writeRequestTable_ptr[t]->exist(address)){ 454 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 455 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 456 thread = t; 457 oldest_time = request.getTime(); 458 } 459 } 460 } 461 // make sure we found an oldest thread 462 ASSERT(thread != -1); 463 464 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 465 466 writeCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 467} 468 469void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 470 471 assert(address == line_address(address)); 472 assert(thread >= 0); 473 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 474 475 writeCallback(address, data, respondingMach, thread); 476 477} 478 479void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 480 assert(address == line_address(address)); 481 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 482 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 483 assert( request.getThreadID() == thread); 484 removeRequest(request); 485 486 assert((request.getType() == CacheRequestType_ST) \|\|
500 (request.getType() == CacheRequestType_ST_XACT) \|\| 501 (request.getType() == CacheRequestType_LDX_XACT) \|\|
502 (request.getType() == CacheRequestType_ATOMIC)); 503 504 hitCallback(request, data, respondingMach, thread); 505 506} 507 508void Sequencer::readCallback(const Address& address) { 509 DataBlock data; 510 readCallback(address, data); 511} 512 513void Sequencer::readCallback(const Address& address, DataBlock& data) { 514 // process oldest thread first 515 int thread = -1; 516 Time oldest_time = 0; 517 int smt_threads = RubyConfig::numberofSMTThreads(); 518 for(int t=0; t < smt_threads; ++t){ 519 if(m_readRequestTable_ptr[t]->exist(address)){ 520 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 521 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 522 thread = t; 523 oldest_time = request.getTime(); 524 } 525 } 526 } 527 // make sure we found an oldest thread 528 ASSERT(thread != -1); 529 530 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 531 532 readCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 533} 534 535void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 536 537 assert(address == line_address(address)); 538 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 539 540 readCallback(address, data, respondingMach, thread); 541} 542 543void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 544 assert(address == line_address(address)); 545 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 546 547 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 548 assert( request.getThreadID() == thread ); 549 removeRequest(request); 550 551 assert((request.getType() == CacheRequestType_LD) \|\|	487 (request.getType() == CacheRequestType_ATOMIC)); 488 489 hitCallback(request, data, respondingMach, thread); 490 491} 492 493void Sequencer::readCallback(const Address& address) { 494 DataBlock data; 495 readCallback(address, data); 496} 497 498void Sequencer::readCallback(const Address& address, DataBlock& data) { 499 // process oldest thread first 500 int thread = -1; 501 Time oldest_time = 0; 502 int smt_threads = RubyConfig::numberofSMTThreads(); 503 for(int t=0; t < smt_threads; ++t){ 504 if(m_readRequestTable_ptr[t]->exist(address)){ 505 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 506 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 507 thread = t; 508 oldest_time = request.getTime(); 509 } 510 } 511 } 512 // make sure we found an oldest thread 513 ASSERT(thread != -1); 514 515 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 516 517 readCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 518} 519 520void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 521 522 assert(address == line_address(address)); 523 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 524 525 readCallback(address, data, respondingMach, thread); 526} 527 528void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 529 assert(address == line_address(address)); 530 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 531 532 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 533 assert( request.getThreadID() == thread ); 534 removeRequest(request); 535 536 assert((request.getType() == CacheRequestType_LD) \|\|
552 (request.getType() == CacheRequestType_LD_XACT) \|\|
553 (request.getType() == CacheRequestType_IFETCH) 554 ); 555 556 hitCallback(request, data, respondingMach, thread); 557} 558 559void Sequencer::hitCallback(const CacheMsg& request, DataBlock& data, GenericMachineType respondingMach, int thread) { 560 int size = request.getSize(); 561 Address request_address = request.getAddress(); 562 Address request_logical_address = request.getLogicalAddress(); 563 Address request_line_address = line_address(request_address); 564 CacheRequestType type = request.getType(); 565 int threadID = request.getThreadID(); 566 Time issued_time = request.getTime(); 567 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 568 569 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 570 571 // Set this cache entry to the most recently used 572 if (type == CacheRequestType_IFETCH) { 573 if (Protocol::m_TwoLevelCache) { 574 if (m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 575 m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->setMRU(request_line_address); 576 } 577 } 578 else { 579 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 580 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 581 } 582 } 583 } else { 584 if (Protocol::m_TwoLevelCache) { 585 if (m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 586 m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->setMRU(request_line_address); 587 } 588 } 589 else { 590 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 591 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 592 } 593 } 594 } 595 596 assert(g_eventQueue_ptr->getTime() >= issued_time); 597 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 598 599 if (PROTOCOL_DEBUG_TRACE) { 600 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Done", "", 601* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 602 } 603 604 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 605 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 606 if (request.getPrefetch() == PrefetchBit_Yes) { 607 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 608 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 609 return; // Ignore the software prefetch, don't callback the driver 610 } 611 612 // Profile the miss latency for all non-zero demand misses 613 if (miss_latency != 0) { 614 g_system_ptr->getProfiler()->missLatency(miss_latency, type, respondingMach); 615 616#if 0 617 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 618 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 619 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 620 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 621 cout << "END PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl; 622#endif 623 624 } 625 626 bool write = 627 (type == CacheRequestType_ST) \|\|	537 (request.getType() == CacheRequestType_IFETCH) 538 ); 539 540 hitCallback(request, data, respondingMach, thread); 541} 542 543void Sequencer::hitCallback(const CacheMsg& request, DataBlock& data, GenericMachineType respondingMach, int thread) { 544 int size = request.getSize(); 545 Address request_address = request.getAddress(); 546 Address request_logical_address = request.getLogicalAddress(); 547 Address request_line_address = line_address(request_address); 548 CacheRequestType type = request.getType(); 549 int threadID = request.getThreadID(); 550 Time issued_time = request.getTime(); 551 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 552 553 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 554 555 // Set this cache entry to the most recently used 556 if (type == CacheRequestType_IFETCH) { 557 if (Protocol::m_TwoLevelCache) { 558 if (m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 559 m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->setMRU(request_line_address); 560 } 561 } 562 else { 563 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 564 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 565 } 566 } 567 } else { 568 if (Protocol::m_TwoLevelCache) { 569 if (m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 570 m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->setMRU(request_line_address); 571 } 572 } 573 else { 574 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 575 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 576 } 577 } 578 } 579 580 assert(g_eventQueue_ptr->getTime() >= issued_time); 581 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 582 583 if (PROTOCOL_DEBUG_TRACE) { 584 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Done", "", 585* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 586 } 587 588 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 589 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 590 if (request.getPrefetch() == PrefetchBit_Yes) { 591 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 592 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 593 return; // Ignore the software prefetch, don't callback the driver 594 } 595 596 // Profile the miss latency for all non-zero demand misses 597 if (miss_latency != 0) { 598 g_system_ptr->getProfiler()->missLatency(miss_latency, type, respondingMach); 599 600#if 0 601 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 602 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 603 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 604 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 605 cout << "END PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl; 606#endif 607 608 } 609 610 bool write = 611 (type == CacheRequestType_ST) \|\|
628 (type == CacheRequestType_ST_XACT) \|\| 629 (type == CacheRequestType_LDX_XACT) \|\|
630 (type == CacheRequestType_ATOMIC); 631 632 if (TSO && write) { 633 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->callBack(line_address(request.getAddress()), data); 634 } else { 635 636 // Copy the correct bytes out of the cache line into the subblock 637 SubBlock subblock(request_address, request_logical_address, size); 638 subblock.mergeFrom(data); // copy the correct bytes from DataBlock in the SubBlock 639 640 // Scan the store buffer to see if there are any outstanding stores we need to collect 641 if (TSO) { 642 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->updateSubBlock(subblock); 643 } 644 645 // Call into the Driver (Tester or Simics) and let it read and/or modify the sub-block 646 g_system_ptr->getDriver()->hitCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 647* 648 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 649 // (This is only triggered for the non-TSO case) 650 if (write) { 651 assert(!TSO); 652 subblock.mergeTo(data); // copy the correct bytes from SubBlock into the DataBlock 653 } 654 } 655} 656	612 (type == CacheRequestType_ATOMIC); 613 614 if (TSO && write) { 615 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->callBack(line_address(request.getAddress()), data); 616 } else { 617 618 // Copy the correct bytes out of the cache line into the subblock 619 SubBlock subblock(request_address, request_logical_address, size); 620 subblock.mergeFrom(data); // copy the correct bytes from DataBlock in the SubBlock 621 622 // Scan the store buffer to see if there are any outstanding stores we need to collect 623 if (TSO) { 624 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->updateSubBlock(subblock); 625 } 626 627 // Call into the Driver (Tester or Simics) and let it read and/or modify the sub-block 628 g_system_ptr->getDriver()->hitCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 629* 630 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 631 // (This is only triggered for the non-TSO case) 632 if (write) { 633 assert(!TSO); 634 subblock.mergeTo(data); // copy the correct bytes from SubBlock into the DataBlock 635 } 636 } 637} 638
657void Sequencer::readConflictCallback(const Address& address) { 658 // process oldest thread first 659 int thread = -1; 660 Time oldest_time = 0; 661 int smt_threads = RubyConfig::numberofSMTThreads(); 662 for(int t=0; t < smt_threads; ++t){ 663 if(m_readRequestTable_ptr[t]->exist(address)){ 664 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 665 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 666 thread = t; 667 oldest_time = request.getTime(); 668 } 669 } 670 } 671 // make sure we found an oldest thread 672 ASSERT(thread != -1); 673 674 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 675 676 readConflictCallback(address, GenericMachineType_NULL, thread); 677} 678 679void Sequencer::readConflictCallback(const Address& address, GenericMachineType respondingMach, int thread) { 680 assert(address == line_address(address)); 681 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 682 683 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 684 assert( request.getThreadID() == thread ); 685 removeRequest(request); 686 687 assert((request.getType() == CacheRequestType_LD) \|\| 688 (request.getType() == CacheRequestType_LD_XACT) \|\| 689 (request.getType() == CacheRequestType_IFETCH) 690 ); 691 692 conflictCallback(request, respondingMach, thread); 693} 694 695void Sequencer::writeConflictCallback(const Address& address) { 696 // process oldest thread first 697 int thread = -1; 698 Time oldest_time = 0; 699 int smt_threads = RubyConfig::numberofSMTThreads(); 700 for(int t=0; t < smt_threads; ++t){ 701 if(m_writeRequestTable_ptr[t]->exist(address)){ 702 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 703 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 704 thread = t; 705 oldest_time = request.getTime(); 706 } 707 } 708 } 709 // make sure we found an oldest thread 710 ASSERT(thread != -1); 711 712 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 713 714 writeConflictCallback(address, GenericMachineType_NULL, thread); 715} 716 717void Sequencer::writeConflictCallback(const Address& address, GenericMachineType respondingMach, int thread) { 718 assert(address == line_address(address)); 719 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 720 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 721 assert( request.getThreadID() == thread); 722 removeRequest(request); 723 724 assert((request.getType() == CacheRequestType_ST) \|\| 725 (request.getType() == CacheRequestType_ST_XACT) \|\| 726 (request.getType() == CacheRequestType_LDX_XACT) \|\| 727 (request.getType() == CacheRequestType_ATOMIC)); 728 729 conflictCallback(request, respondingMach, thread); 730 731} 732 733void Sequencer::conflictCallback(const CacheMsg& request, GenericMachineType respondingMach, int thread) { 734 assert(XACT_MEMORY); 735 int size = request.getSize(); 736 Address request_address = request.getAddress(); 737 Address request_logical_address = request.getLogicalAddress(); 738 Address request_line_address = line_address(request_address); 739 CacheRequestType type = request.getType(); 740 int threadID = request.getThreadID(); 741 Time issued_time = request.getTime(); 742 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 743 744 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 745 746 assert(g_eventQueue_ptr->getTime() >= issued_time); 747 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 748 749 if (PROTOCOL_DEBUG_TRACE) { 750 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Conflict", "", 751* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 752 } 753 754 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 755 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 756 if (request.getPrefetch() == PrefetchBit_Yes) { 757 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 758 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 759 return; // Ignore the software prefetch, don't callback the driver 760 } 761 762 bool write = 763 (type == CacheRequestType_ST) \|\| 764 (type == CacheRequestType_ST_XACT) \|\| 765 (type == CacheRequestType_LDX_XACT) \|\| 766 (type == CacheRequestType_ATOMIC); 767 768 // Copy the correct bytes out of the cache line into the subblock 769 SubBlock subblock(request_address, request_logical_address, size); 770 771 // Call into the Driver (Tester or Simics) 772 g_system_ptr->getDriver()->conflictCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 773* 774 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 775 // (This is only triggered for the non-TSO case) 776 if (write) { 777 assert(!TSO); 778 } 779} 780
781void Sequencer::printDebug(){ 782 //notify driver of debug 783 g_system_ptr->getDriver()->printDebug(); 784} 785 786// Returns true if the sequencer already has a load or store outstanding 787bool 788Sequencer::isReady(const Packet* pkt) const 789{ 790 791 int cpu_number = pkt->req->contextId(); 792 la_t logical_addr = pkt->req->getVaddr(); 793 pa_t physical_addr = pkt->req->getPaddr(); 794 CacheRequestType type_of_request; 795 if ( pkt->req->isInstFetch() ) { 796 type_of_request = CacheRequestType_IFETCH; 797 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 798 type_of_request = CacheRequestType_ATOMIC; 799 } else if ( pkt->isRead() ) { 800 type_of_request = CacheRequestType_LD; 801 } else if ( pkt->isWrite() ) { 802 type_of_request = CacheRequestType_ST; 803 } else { 804 assert(false); 805 } 806 int thread = pkt->req->threadId(); 807 808 CacheMsg request(Address( physical_addr ), 809 Address( physical_addr ), 810 type_of_request, 811 Address(0), 812 AccessModeType_UserMode, // User/supervisor mode 813 0, // Size in bytes of request 814 PrefetchBit_No, // Not a prefetch 815 0, // Version number 816 Address(logical_addr), // Virtual Address	639void Sequencer::printDebug(){ 640 //notify driver of debug 641 g_system_ptr->getDriver()->printDebug(); 642} 643 644// Returns true if the sequencer already has a load or store outstanding 645bool 646Sequencer::isReady(const Packet* pkt) const 647{ 648 649 int cpu_number = pkt->req->contextId(); 650 la_t logical_addr = pkt->req->getVaddr(); 651 pa_t physical_addr = pkt->req->getPaddr(); 652 CacheRequestType type_of_request; 653 if ( pkt->req->isInstFetch() ) { 654 type_of_request = CacheRequestType_IFETCH; 655 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 656 type_of_request = CacheRequestType_ATOMIC; 657 } else if ( pkt->isRead() ) { 658 type_of_request = CacheRequestType_LD; 659 } else if ( pkt->isWrite() ) { 660 type_of_request = CacheRequestType_ST; 661 } else { 662 assert(false); 663 } 664 int thread = pkt->req->threadId(); 665 666 CacheMsg request(Address( physical_addr ), 667 Address( physical_addr ), 668 type_of_request, 669 Address(0), 670 AccessModeType_UserMode, // User/supervisor mode 671 0, // Size in bytes of request 672 PrefetchBit_No, // Not a prefetch 673 0, // Version number 674 Address(logical_addr), // Virtual Address
817 thread, // SMT thread 818 0, // TM specific - timestamp of memory request 819 false // TM specific - whether request is part of escape action	675 thread // SMT thread
820 ); 821 isReady(request); 822} 823 824bool 825Sequencer::isReady(const CacheMsg& request) const 826{ 827 if (m_outstanding_count >= g_SEQUENCER_OUTSTANDING_REQUESTS) { 828 //cout << "TOO MANY OUTSTANDING: " << m_outstanding_count << " " << g_SEQUENCER_OUTSTANDING_REQUESTS << " VER " << m_version << endl; 829 //printProgress(cout); 830 return false; 831 } 832 833 // This code allows reads to be performed even when we have a write 834 // request outstanding for the line 835 bool write = 836 (request.getType() == CacheRequestType_ST) \|\|	676 ); 677 isReady(request); 678} 679 680bool 681Sequencer::isReady(const CacheMsg& request) const 682{ 683 if (m_outstanding_count >= g_SEQUENCER_OUTSTANDING_REQUESTS) { 684 //cout << "TOO MANY OUTSTANDING: " << m_outstanding_count << " " << g_SEQUENCER_OUTSTANDING_REQUESTS << " VER " << m_version << endl; 685 //printProgress(cout); 686 return false; 687 } 688 689 // This code allows reads to be performed even when we have a write 690 // request outstanding for the line 691 bool write = 692 (request.getType() == CacheRequestType_ST) \|\|
837 (request.getType() == CacheRequestType_ST_XACT) \|\| 838 (request.getType() == CacheRequestType_LDX_XACT) \|\|
839 (request.getType() == CacheRequestType_ATOMIC); 840 841 // LUKE - disallow more than one request type per address 842 // INVARIANT: at most one request type per address, per processor 843 int smt_threads = RubyConfig::numberofSMTThreads(); 844 for(int p=0; p < smt_threads; ++p){ 845 if( m_writeRequestTable_ptr[p]->exist(line_address(request.getAddress())) \|\| 846 m_readRequestTable_ptr[p]->exist(line_address(request.getAddress())) ){ 847 //cout << "OUTSTANDING REQUEST EXISTS " << p << " VER " << m_version << endl; 848 //printProgress(cout); 849 return false; 850 } 851 } 852 853 if (TSO) { 854 return m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady(); 855 } 856 return true; 857} 858 859// Called by Driver (Simics or Tester). 860void 861Sequencer::makeRequest(const Packet* pkt, void* data) 862{ 863 int cpu_number = pkt->req->contextId(); 864 la_t logical_addr = pkt->req->getVaddr(); 865 pa_t physical_addr = pkt->req->getPaddr(); 866 int request_size = pkt->getSize(); 867 CacheRequestType type_of_request; 868 if ( pkt->req->isInstFetch() ) { 869 type_of_request = CacheRequestType_IFETCH; 870 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 871 type_of_request = CacheRequestType_ATOMIC; 872 } else if ( pkt->isRead() ) { 873 type_of_request = CacheRequestType_LD; 874 } else if ( pkt->isWrite() ) { 875 type_of_request = CacheRequestType_ST; 876 } else { 877 assert(false); 878 } 879 la_t virtual_pc = pkt->req->getPC(); 880 int isPriv = false; // TODO: get permission data 881 int thread = pkt->req->threadId(); 882 883 AccessModeType access_mode = AccessModeType_UserMode; // TODO: get actual permission 884 885 CacheMsg request(Address( physical_addr ), 886 Address( physical_addr ), 887 type_of_request, 888 Address(virtual_pc), 889 access_mode, // User/supervisor mode 890 request_size, // Size in bytes of request 891 PrefetchBit_No, // Not a prefetch 892 0, // Version number 893 Address(logical_addr), // Virtual Address	693 (request.getType() == CacheRequestType_ATOMIC); 694 695 // LUKE - disallow more than one request type per address 696 // INVARIANT: at most one request type per address, per processor 697 int smt_threads = RubyConfig::numberofSMTThreads(); 698 for(int p=0; p < smt_threads; ++p){ 699 if( m_writeRequestTable_ptr[p]->exist(line_address(request.getAddress())) \|\| 700 m_readRequestTable_ptr[p]->exist(line_address(request.getAddress())) ){ 701 //cout << "OUTSTANDING REQUEST EXISTS " << p << " VER " << m_version << endl; 702 //printProgress(cout); 703 return false; 704 } 705 } 706 707 if (TSO) { 708 return m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady(); 709 } 710 return true; 711} 712 713// Called by Driver (Simics or Tester). 714void 715Sequencer::makeRequest(const Packet* pkt, void* data) 716{ 717 int cpu_number = pkt->req->contextId(); 718 la_t logical_addr = pkt->req->getVaddr(); 719 pa_t physical_addr = pkt->req->getPaddr(); 720 int request_size = pkt->getSize(); 721 CacheRequestType type_of_request; 722 if ( pkt->req->isInstFetch() ) { 723 type_of_request = CacheRequestType_IFETCH; 724 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 725 type_of_request = CacheRequestType_ATOMIC; 726 } else if ( pkt->isRead() ) { 727 type_of_request = CacheRequestType_LD; 728 } else if ( pkt->isWrite() ) { 729 type_of_request = CacheRequestType_ST; 730 } else { 731 assert(false); 732 } 733 la_t virtual_pc = pkt->req->getPC(); 734 int isPriv = false; // TODO: get permission data 735 int thread = pkt->req->threadId(); 736 737 AccessModeType access_mode = AccessModeType_UserMode; // TODO: get actual permission 738 739 CacheMsg request(Address( physical_addr ), 740 Address( physical_addr ), 741 type_of_request, 742 Address(virtual_pc), 743 access_mode, // User/supervisor mode 744 request_size, // Size in bytes of request 745 PrefetchBit_No, // Not a prefetch 746 0, // Version number 747 Address(logical_addr), // Virtual Address
894 thread, // SMT thread 895 0, // TM specific - timestamp of memory request 896 false // TM specific - whether request is part of escape action	748 thread // SMT thread
897 ); 898 makeRequest(request); 899} 900 901void 902Sequencer::makeRequest(const CacheMsg& request) 903{ 904 bool write = (request.getType() == CacheRequestType_ST) \|\|	749 ); 750 makeRequest(request); 751} 752 753void 754Sequencer::makeRequest(const CacheMsg& request) 755{ 756 bool write = (request.getType() == CacheRequestType_ST) \|\|
905 (request.getType() == CacheRequestType_ST_XACT) \|\| 906 (request.getType() == CacheRequestType_LDX_XACT) \|\|
907 (request.getType() == CacheRequestType_ATOMIC); 908 909 if (TSO && (request.getPrefetch() == PrefetchBit_No) && write) { 910 assert(m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady()); 911 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->insertStore(request); 912 return; 913 } 914 915 bool hit = doRequest(request); 916 917} 918 919bool Sequencer::doRequest(const CacheMsg& request) { 920 bool hit = false; 921 // Check the fast path 922 DataBlock* data_ptr; 923 924 int thread = request.getThreadID(); 925 926 hit = tryCacheAccess(line_address(request.getAddress()), 927 request.getType(), 928 request.getProgramCounter(), 929 request.getAccessMode(), 930 request.getSize(), 931 data_ptr); 932 933 if (hit && (request.getType() == CacheRequestType_IFETCH \|\| !REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) ) { 934 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path hit"); 935 hitCallback(request, data_ptr, GenericMachineType_L1Cache, thread); 936* return true; 937 } 938 939#if 0 940 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 941 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 942 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 943 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 944 cout << "START PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl;; 945#endif 946 947 if (TSO && (request.getType() == CacheRequestType_LD \|\| request.getType() == CacheRequestType_IFETCH)) { 948 949 // See if we can satisfy the load entirely from the store buffer 950 SubBlock subblock(line_address(request.getAddress()), request.getSize()); 951 if (m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->trySubBlock(subblock)) { 952 DataBlock dummy; 953 hitCallback(request, dummy, GenericMachineType_NULL, thread); // Call with an 'empty' datablock, since the data is in the store buffer 954 return true; 955 } 956 } 957 958 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path miss"); 959 issueRequest(request); 960 return hit; 961} 962 963void Sequencer::issueRequest(const CacheMsg& request) { 964 bool found = insertRequest(request); 965 966 if (!found) { 967 CacheMsg msg = request; 968 msg.getAddress() = line_address(request.getAddress()); // Make line address 969 970 // Fast Path L1 misses are profiled here - all non-fast path misses are profiled within the generated protocol code 971 if (!REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) { 972 g_system_ptr->getProfiler()->addPrimaryStatSample(msg, m_chip_ptr->getID()); 973 } 974 975 if (PROTOCOL_DEBUG_TRACE) { 976 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip() + m_version), -1, msg.getAddress(),"", "Begin", "", CacheRequestType_to_string(request.getType())); 977* } 978 979#if 0 980 // Commented out by nate binkert because I removed the trace stuff 981 if (g_system_ptr->getTracer()->traceEnabled()) { 982 g_system_ptr->getTracer()->traceRequest((m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), msg.getAddress(), msg.getProgramCounter(), 983* msg.getType(), g_eventQueue_ptr->getTime()); 984 } 985#endif 986 987 Time latency = 0; // initialzed to an null value 988 989 latency = SEQUENCER_TO_CONTROLLER_LATENCY; 990 991 // Send the message to the cache controller 992 assert(latency > 0); 993 m_chip_ptr->m_L1Cache_mandatoryQueue_vec[m_version]->enqueue(msg, latency); 994 995 } // !found 996} 997 998bool Sequencer::tryCacheAccess(const Address& addr, CacheRequestType type, 999 const Address& pc, AccessModeType access_mode, 1000 int size, DataBlock& data_ptr) { 1001* if (type == CacheRequestType_IFETCH) { 1002 if (Protocol::m_TwoLevelCache) { 1003 return m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1004 } 1005 else { 1006 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1007 } 1008 } else { 1009 if (Protocol::m_TwoLevelCache) { 1010 return m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1011 } 1012 else { 1013 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1014 } 1015 } 1016} 1017 1018void Sequencer::resetRequestTime(const Address& addr, int thread){ 1019 assert(thread >= 0); 1020 //reset both load and store requests, if they exist 1021 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 1022 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 1023 if( request.m_AccessMode != AccessModeType_UserMode){ 1024 cout << "resetRequestType ERROR read request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 1025 printProgress(cout); 1026 } 1027 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 1028 request.setTime(g_eventQueue_ptr->getTime()); 1029 } 1030 if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 1031 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 1032 if( request.m_AccessMode != AccessModeType_UserMode){ 1033 cout << "resetRequestType ERROR write request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 1034 printProgress(cout); 1035 } 1036 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 1037 request.setTime(g_eventQueue_ptr->getTime()); 1038 } 1039} 1040 1041// removes load request from queue 1042void Sequencer::removeLoadRequest(const Address & addr, int thread){ 1043 removeRequest(getReadRequest(addr, thread)); 1044} 1045 1046void Sequencer::removeStoreRequest(const Address & addr, int thread){ 1047 removeRequest(getWriteRequest(addr, thread)); 1048} 1049 1050// returns the read CacheMsg 1051CacheMsg & Sequencer::getReadRequest( const Address & addr, int thread ){ 1052 Address temp = addr; 1053 assert(thread >= 0); 1054 assert(temp == line_address(temp)); 1055 assert(m_readRequestTable_ptr[thread]->exist(addr)); 1056 return m_readRequestTable_ptr[thread]->lookup(addr); 1057} 1058 1059CacheMsg & Sequencer::getWriteRequest( const Address & addr, int thread){ 1060 Address temp = addr; 1061 assert(thread >= 0); 1062 assert(temp == line_address(temp)); 1063 assert(m_writeRequestTable_ptr[thread]->exist(addr)); 1064 return m_writeRequestTable_ptr[thread]->lookup(addr); 1065} 1066 1067void Sequencer::print(ostream& out) const { 1068 out << "[Sequencer: " << m_chip_ptr->getID() 1069 << ", outstanding requests: " << m_outstanding_count; 1070 1071 int smt_threads = RubyConfig::numberofSMTThreads(); 1072 for(int p=0; p < smt_threads; ++p){ 1073 out << ", read request table[ " << p << " ]: " << m_readRequestTable_ptr[p] 1074* << ", write request table[ " << p << " ]: " << m_writeRequestTable_ptr[p]; 1075* } 1076 out << "]"; 1077} 1078 1079// this can be called from setState whenever coherence permissions are upgraded 1080// when invoked, coherence violations will be checked for the given block 1081void Sequencer::checkCoherence(const Address& addr) { 1082#ifdef CHECK_COHERENCE 1083 g_system_ptr->checkGlobalCoherenceInvariant(addr); 1084#endif 1085} 1086 1087bool Sequencer::getRubyMemoryValue(const Address& addr, char* value, 1088 unsigned int size_in_bytes ) { 1089 if(g_SIMICS){ 1090 for(unsigned int i=0; i < size_in_bytes; i++) { 1091 value[i] = SIMICS_read_physical_memory( m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, 1092* addr.getAddress() + i, 1 ); 1093 } 1094 return false; // Do nothing? 1095 } else { 1096 bool found = false; 1097 const Address lineAddr = line_address(addr); 1098 DataBlock data; 1099 PhysAddress paddr(addr); 1100 DataBlock* dataPtr = &data; 1101 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1102* // LUKE - use variable names instead of macros 1103 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1104 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1105 1106 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1107 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1108 1109 if (Protocol::m_TwoLevelCache) { 1110 if(Protocol::m_CMP){ 1111 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1112 } 1113 else{ 1114 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1115 } 1116 } 1117 1118 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1119 n->m_L1Cache_L1IcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 1120 found = true; 1121 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1122 n->m_L1Cache_L1DcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 1123 found = true; 1124 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1125 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->getMemoryValue(addr, value, size_in_bytes); 1126 found = true; 1127 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)){ 1128 // ASSERT(n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)); 1129 // L1Cache_TBE tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1130 1131 // int offset = addr.getOffset(); 1132 // for(int i=0; i<size_in_bytes; ++i){ 1133 // value[i] = tbeEntry.getDataBlk().getByte(offset + i); 1134 // } 1135 1136 // found = true; 1137 } else { 1138 // Address not found 1139 //cout << " " << m_chip_ptr->getID() << " NOT IN CACHE, Value at Directory is: " << (int) value[0] << endl; 1140 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1141* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1142 for(unsigned int i=0; i<size_in_bytes; ++i){ 1143 int offset = addr.getOffset(); 1144 value[i] = n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.getByte(offset + i); 1145 } 1146 // Address not found 1147 //WARN_MSG("Couldn't find address"); 1148 //WARN_EXPR(addr); 1149 found = false; 1150 } 1151 return true; 1152 } 1153} 1154 1155bool Sequencer::setRubyMemoryValue(const Address& addr, char value, 1156* unsigned int size_in_bytes) { 1157 char test_buffer[64]; 1158 1159 if(g_SIMICS){ 1160 return false; // Do nothing? 1161 } else { 1162 // idea here is that coherent cache should find the 1163 // latest data, the update it 1164 bool found = false; 1165 const Address lineAddr = line_address(addr); 1166 PhysAddress paddr(addr); 1167 DataBlock data; 1168 DataBlock* dataPtr = &data; 1169 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1170* 1171 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1172 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1173 // LUKE - use variable names instead of macros 1174 //cout << "number of L2caches per chip = " << RubyConfig::numberOfL2CachePerChip(m_version) << endl; 1175 //cout << "L1I cache vec size = " << n->m_L1Cache_L1IcacheMemory_vec.size() << endl; 1176 //cout << "L1D cache vec size = " << n->m_L1Cache_L1DcacheMemory_vec.size() << endl; 1177 //cout << "L1cache_cachememory size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1178 //cout << "L1cache_l2cachememory size = " << n->m_L1Cache_L2cacheMemory_vec.size() << endl; 1179 // if (Protocol::m_TwoLevelCache) { 1180 // if(Protocol::m_CMP){ 1181 // cout << "CMP L2 cache vec size = " << n->m_L2Cache_L2cacheMemory_vec.size() << endl; 1182 // } 1183 // else{ 1184 // cout << "L2 cache vec size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1185 // } 1186 // } 1187 1188 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1189 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1190 if (Protocol::m_TwoLevelCache) { 1191 if(Protocol::m_CMP){ 1192 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1193 } 1194 else{ 1195 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1196 } 1197 } 1198 1199 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1200 n->m_L1Cache_L1IcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1201 found = true; 1202 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1203 n->m_L1Cache_L1DcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1204 found = true; 1205 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1206 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->setMemoryValue(addr, value, size_in_bytes); 1207 found = true; 1208 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isTagPresent(lineAddr)){ 1209 // L1Cache_TBE& tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1210 // DataBlock tmpData; 1211 // int offset = addr.getOffset(); 1212 // for(int i=0; i<size_in_bytes; ++i){ 1213 // tmpData.setByte(offset + i, value[i]); 1214 // } 1215 // tbeEntry.setDataBlk(tmpData); 1216 // tbeEntry.setDirty(true); 1217 } else { 1218 // Address not found 1219 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1220* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1221 for(unsigned int i=0; i<size_in_bytes; ++i){ 1222 int offset = addr.getOffset(); 1223 n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.setByte(offset + i, value[i]); 1224 } 1225 found = false; 1226 } 1227 1228 if (found){ 1229 found = getRubyMemoryValue(addr, test_buffer, size_in_bytes); 1230 assert(found); 1231 if(value[0] != test_buffer[0]){ 1232 WARN_EXPR((int) value[0]); 1233 WARN_EXPR((int) test_buffer[0]); 1234 ERROR_MSG("setRubyMemoryValue failed to set value."); 1235 } 1236 } 1237 1238 return true; 1239 } 1240}	757 (request.getType() == CacheRequestType_ATOMIC); 758 759 if (TSO && (request.getPrefetch() == PrefetchBit_No) && write) { 760 assert(m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady()); 761 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->insertStore(request); 762 return; 763 } 764 765 bool hit = doRequest(request); 766 767} 768 769bool Sequencer::doRequest(const CacheMsg& request) { 770 bool hit = false; 771 // Check the fast path 772 DataBlock* data_ptr; 773 774 int thread = request.getThreadID(); 775 776 hit = tryCacheAccess(line_address(request.getAddress()), 777 request.getType(), 778 request.getProgramCounter(), 779 request.getAccessMode(), 780 request.getSize(), 781 data_ptr); 782 783 if (hit && (request.getType() == CacheRequestType_IFETCH \|\| !REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) ) { 784 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path hit"); 785 hitCallback(request, data_ptr, GenericMachineType_L1Cache, thread); 786* return true; 787 } 788 789#if 0 790 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 791 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 792 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 793 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 794 cout << "START PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl;; 795#endif 796 797 if (TSO && (request.getType() == CacheRequestType_LD \|\| request.getType() == CacheRequestType_IFETCH)) { 798 799 // See if we can satisfy the load entirely from the store buffer 800 SubBlock subblock(line_address(request.getAddress()), request.getSize()); 801 if (m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->trySubBlock(subblock)) { 802 DataBlock dummy; 803 hitCallback(request, dummy, GenericMachineType_NULL, thread); // Call with an 'empty' datablock, since the data is in the store buffer 804 return true; 805 } 806 } 807 808 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path miss"); 809 issueRequest(request); 810 return hit; 811} 812 813void Sequencer::issueRequest(const CacheMsg& request) { 814 bool found = insertRequest(request); 815 816 if (!found) { 817 CacheMsg msg = request; 818 msg.getAddress() = line_address(request.getAddress()); // Make line address 819 820 // Fast Path L1 misses are profiled here - all non-fast path misses are profiled within the generated protocol code 821 if (!REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) { 822 g_system_ptr->getProfiler()->addPrimaryStatSample(msg, m_chip_ptr->getID()); 823 } 824 825 if (PROTOCOL_DEBUG_TRACE) { 826 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip() + m_version), -1, msg.getAddress(),"", "Begin", "", CacheRequestType_to_string(request.getType())); 827* } 828 829#if 0 830 // Commented out by nate binkert because I removed the trace stuff 831 if (g_system_ptr->getTracer()->traceEnabled()) { 832 g_system_ptr->getTracer()->traceRequest((m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), msg.getAddress(), msg.getProgramCounter(), 833* msg.getType(), g_eventQueue_ptr->getTime()); 834 } 835#endif 836 837 Time latency = 0; // initialzed to an null value 838 839 latency = SEQUENCER_TO_CONTROLLER_LATENCY; 840 841 // Send the message to the cache controller 842 assert(latency > 0); 843 m_chip_ptr->m_L1Cache_mandatoryQueue_vec[m_version]->enqueue(msg, latency); 844 845 } // !found 846} 847 848bool Sequencer::tryCacheAccess(const Address& addr, CacheRequestType type, 849 const Address& pc, AccessModeType access_mode, 850 int size, DataBlock& data_ptr) { 851* if (type == CacheRequestType_IFETCH) { 852 if (Protocol::m_TwoLevelCache) { 853 return m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 854 } 855 else { 856 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 857 } 858 } else { 859 if (Protocol::m_TwoLevelCache) { 860 return m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 861 } 862 else { 863 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 864 } 865 } 866} 867 868void Sequencer::resetRequestTime(const Address& addr, int thread){ 869 assert(thread >= 0); 870 //reset both load and store requests, if they exist 871 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 872 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 873 if( request.m_AccessMode != AccessModeType_UserMode){ 874 cout << "resetRequestType ERROR read request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 875 printProgress(cout); 876 } 877 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 878 request.setTime(g_eventQueue_ptr->getTime()); 879 } 880 if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 881 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 882 if( request.m_AccessMode != AccessModeType_UserMode){ 883 cout << "resetRequestType ERROR write request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 884 printProgress(cout); 885 } 886 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 887 request.setTime(g_eventQueue_ptr->getTime()); 888 } 889} 890 891// removes load request from queue 892void Sequencer::removeLoadRequest(const Address & addr, int thread){ 893 removeRequest(getReadRequest(addr, thread)); 894} 895 896void Sequencer::removeStoreRequest(const Address & addr, int thread){ 897 removeRequest(getWriteRequest(addr, thread)); 898} 899 900// returns the read CacheMsg 901CacheMsg & Sequencer::getReadRequest( const Address & addr, int thread ){ 902 Address temp = addr; 903 assert(thread >= 0); 904 assert(temp == line_address(temp)); 905 assert(m_readRequestTable_ptr[thread]->exist(addr)); 906 return m_readRequestTable_ptr[thread]->lookup(addr); 907} 908 909CacheMsg & Sequencer::getWriteRequest( const Address & addr, int thread){ 910 Address temp = addr; 911 assert(thread >= 0); 912 assert(temp == line_address(temp)); 913 assert(m_writeRequestTable_ptr[thread]->exist(addr)); 914 return m_writeRequestTable_ptr[thread]->lookup(addr); 915} 916 917void Sequencer::print(ostream& out) const { 918 out << "[Sequencer: " << m_chip_ptr->getID() 919 << ", outstanding requests: " << m_outstanding_count; 920 921 int smt_threads = RubyConfig::numberofSMTThreads(); 922 for(int p=0; p < smt_threads; ++p){ 923 out << ", read request table[ " << p << " ]: " << m_readRequestTable_ptr[p] 924* << ", write request table[ " << p << " ]: " << m_writeRequestTable_ptr[p]; 925* } 926 out << "]"; 927} 928 929// this can be called from setState whenever coherence permissions are upgraded 930// when invoked, coherence violations will be checked for the given block 931void Sequencer::checkCoherence(const Address& addr) { 932#ifdef CHECK_COHERENCE 933 g_system_ptr->checkGlobalCoherenceInvariant(addr); 934#endif 935} 936 937bool Sequencer::getRubyMemoryValue(const Address& addr, char* value, 938 unsigned int size_in_bytes ) { 939 if(g_SIMICS){ 940 for(unsigned int i=0; i < size_in_bytes; i++) { 941 value[i] = SIMICS_read_physical_memory( m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, 942* addr.getAddress() + i, 1 ); 943 } 944 return false; // Do nothing? 945 } else { 946 bool found = false; 947 const Address lineAddr = line_address(addr); 948 DataBlock data; 949 PhysAddress paddr(addr); 950 DataBlock* dataPtr = &data; 951 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 952* // LUKE - use variable names instead of macros 953 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 954 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 955 956 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 957 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 958 959 if (Protocol::m_TwoLevelCache) { 960 if(Protocol::m_CMP){ 961 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 962 } 963 else{ 964 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 965 } 966 } 967 968 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 969 n->m_L1Cache_L1IcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 970 found = true; 971 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 972 n->m_L1Cache_L1DcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 973 found = true; 974 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 975 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->getMemoryValue(addr, value, size_in_bytes); 976 found = true; 977 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)){ 978 // ASSERT(n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)); 979 // L1Cache_TBE tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 980 981 // int offset = addr.getOffset(); 982 // for(int i=0; i<size_in_bytes; ++i){ 983 // value[i] = tbeEntry.getDataBlk().getByte(offset + i); 984 // } 985 986 // found = true; 987 } else { 988 // Address not found 989 //cout << " " << m_chip_ptr->getID() << " NOT IN CACHE, Value at Directory is: " << (int) value[0] << endl; 990 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 991* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 992 for(unsigned int i=0; i<size_in_bytes; ++i){ 993 int offset = addr.getOffset(); 994 value[i] = n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.getByte(offset + i); 995 } 996 // Address not found 997 //WARN_MSG("Couldn't find address"); 998 //WARN_EXPR(addr); 999 found = false; 1000 } 1001 return true; 1002 } 1003} 1004 1005bool Sequencer::setRubyMemoryValue(const Address& addr, char value, 1006* unsigned int size_in_bytes) { 1007 char test_buffer[64]; 1008 1009 if(g_SIMICS){ 1010 return false; // Do nothing? 1011 } else { 1012 // idea here is that coherent cache should find the 1013 // latest data, the update it 1014 bool found = false; 1015 const Address lineAddr = line_address(addr); 1016 PhysAddress paddr(addr); 1017 DataBlock data; 1018 DataBlock* dataPtr = &data; 1019 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1020* 1021 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1022 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1023 // LUKE - use variable names instead of macros 1024 //cout << "number of L2caches per chip = " << RubyConfig::numberOfL2CachePerChip(m_version) << endl; 1025 //cout << "L1I cache vec size = " << n->m_L1Cache_L1IcacheMemory_vec.size() << endl; 1026 //cout << "L1D cache vec size = " << n->m_L1Cache_L1DcacheMemory_vec.size() << endl; 1027 //cout << "L1cache_cachememory size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1028 //cout << "L1cache_l2cachememory size = " << n->m_L1Cache_L2cacheMemory_vec.size() << endl; 1029 // if (Protocol::m_TwoLevelCache) { 1030 // if(Protocol::m_CMP){ 1031 // cout << "CMP L2 cache vec size = " << n->m_L2Cache_L2cacheMemory_vec.size() << endl; 1032 // } 1033 // else{ 1034 // cout << "L2 cache vec size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1035 // } 1036 // } 1037 1038 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1039 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1040 if (Protocol::m_TwoLevelCache) { 1041 if(Protocol::m_CMP){ 1042 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1043 } 1044 else{ 1045 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1046 } 1047 } 1048 1049 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1050 n->m_L1Cache_L1IcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1051 found = true; 1052 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1053 n->m_L1Cache_L1DcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1054 found = true; 1055 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1056 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->setMemoryValue(addr, value, size_in_bytes); 1057 found = true; 1058 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isTagPresent(lineAddr)){ 1059 // L1Cache_TBE& tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1060 // DataBlock tmpData; 1061 // int offset = addr.getOffset(); 1062 // for(int i=0; i<size_in_bytes; ++i){ 1063 // tmpData.setByte(offset + i, value[i]); 1064 // } 1065 // tbeEntry.setDataBlk(tmpData); 1066 // tbeEntry.setDirty(true); 1067 } else { 1068 // Address not found 1069 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1070* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1071 for(unsigned int i=0; i<size_in_bytes; ++i){ 1072 int offset = addr.getOffset(); 1073 n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.setByte(offset + i, value[i]); 1074 } 1075 found = false; 1076 } 1077 1078 if (found){ 1079 found = getRubyMemoryValue(addr, test_buffer, size_in_bytes); 1080 assert(found); 1081 if(value[0] != test_buffer[0]){ 1082 WARN_EXPR((int) value[0]); 1083 WARN_EXPR((int) test_buffer[0]); 1084 ERROR_MSG("setRubyMemoryValue failed to set value."); 1085 } 1086 } 1087 1088 return true; 1089 } 1090}

Sequencer.cc (6151:bc6b84108443)	Sequencer.cc (6152:705b277e1141)
1 2/* 3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 4 * All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions are 8 * met: redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer; 10 * redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution; 13 * neither the name of the copyright holders nor the names of its 14 * contributors may be used to endorse or promote products derived from 15 * this software without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 28 / 29 30/ 31 * $Id: Sequencer.C 1.131 2006/11/06 17:41:01-06:00 bobba@gratiano.cs.wisc.edu $ 32 * 33 */ 34 35#include "Global.hh" 36#include "Sequencer.hh" 37#include "System.hh" 38#include "Protocol.hh" 39#include "Profiler.hh" 40#include "CacheMemory.hh" 41#include "RubyConfig.hh" 42//#include "Tracer.hh" 43#include "AbstractChip.hh" 44#include "Chip.hh" 45#include "Tester.hh" 46#include "SubBlock.hh" 47#include "Protocol.hh" 48#include "Map.hh" 49#include "interface.hh"	1 2/* 3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 4 * All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions are 8 * met: redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer; 10 * redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution; 13 * neither the name of the copyright holders nor the names of its 14 * contributors may be used to endorse or promote products derived from 15 * this software without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 28 / 29 30/ 31 * $Id: Sequencer.C 1.131 2006/11/06 17:41:01-06:00 bobba@gratiano.cs.wisc.edu $ 32 * 33 */ 34 35#include "Global.hh" 36#include "Sequencer.hh" 37#include "System.hh" 38#include "Protocol.hh" 39#include "Profiler.hh" 40#include "CacheMemory.hh" 41#include "RubyConfig.hh" 42//#include "Tracer.hh" 43#include "AbstractChip.hh" 44#include "Chip.hh" 45#include "Tester.hh" 46#include "SubBlock.hh" 47#include "Protocol.hh" 48#include "Map.hh" 49#include "interface.hh"
50//#include "XactCommitArbiter.hh" 51// #include "TransactionInterfaceManager.hh" 52//#include "TransactionVersionManager.hh" 53//#include "LazyTransactionVersionManager.hh"
54	50
55//#define XACT_MGR g_system_ptr->getChip(m_chip_ptr->getID())->getTransactionInterfaceManager(m_version) 56
57Sequencer::Sequencer(AbstractChip* chip_ptr, int version) { 58 m_chip_ptr = chip_ptr; 59 m_version = version; 60 61 m_deadlock_check_scheduled = false; 62 m_outstanding_count = 0; 63 64 int smt_threads = RubyConfig::numberofSMTThreads(); 65 m_writeRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 66 m_readRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 67 68 for(int p=0; p < smt_threads; ++p){ 69 m_writeRequestTable_ptr[p] = new Map<Address, CacheMsg>; 70 m_readRequestTable_ptr[p] = new Map<Address, CacheMsg>; 71 } 72 73} 74 75Sequencer::~Sequencer() { 76 int smt_threads = RubyConfig::numberofSMTThreads(); 77 for(int i=0; i < smt_threads; ++i){ 78 if(m_writeRequestTable_ptr[i]){ 79 delete m_writeRequestTable_ptr[i]; 80 } 81 if(m_readRequestTable_ptr[i]){ 82 delete m_readRequestTable_ptr[i]; 83 } 84 } 85 if(m_writeRequestTable_ptr){ 86 delete [] m_writeRequestTable_ptr; 87 } 88 if(m_readRequestTable_ptr){ 89 delete [] m_readRequestTable_ptr; 90 } 91} 92 93void Sequencer::wakeup() { 94 // Check for deadlock of any of the requests 95 Time current_time = g_eventQueue_ptr->getTime(); 96 bool deadlock = false; 97 98 // Check across all outstanding requests 99 int smt_threads = RubyConfig::numberofSMTThreads(); 100 int total_outstanding = 0; 101 for(int p=0; p < smt_threads; ++p){ 102 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 103 for (int i=0; i<keys.size(); i++) { 104 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 105 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 106 WARN_MSG("Possible Deadlock detected"); 107 WARN_EXPR(request); 108 WARN_EXPR(m_chip_ptr->getID()); 109 WARN_EXPR(m_version); 110 WARN_EXPR(keys.size()); 111 WARN_EXPR(current_time); 112 WARN_EXPR(request.getTime()); 113 WARN_EXPR(current_time - request.getTime()); 114 WARN_EXPR(m_readRequestTable_ptr[p]); 115* ERROR_MSG("Aborting"); 116 deadlock = true; 117 } 118 } 119 120 keys = m_writeRequestTable_ptr[p]->keys(); 121 for (int i=0; i<keys.size(); i++) { 122 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 123 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 124 WARN_MSG("Possible Deadlock detected"); 125 WARN_EXPR(request); 126 WARN_EXPR(m_chip_ptr->getID()); 127 WARN_EXPR(m_version); 128 WARN_EXPR(current_time); 129 WARN_EXPR(request.getTime()); 130 WARN_EXPR(current_time - request.getTime()); 131 WARN_EXPR(keys.size()); 132 WARN_EXPR(m_writeRequestTable_ptr[p]); 133* ERROR_MSG("Aborting"); 134 deadlock = true; 135 } 136 } 137 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 138 } // across all request tables 139 assert(m_outstanding_count == total_outstanding); 140 141 if (m_outstanding_count > 0) { // If there are still outstanding requests, keep checking 142 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 143 } else { 144 m_deadlock_check_scheduled = false; 145 } 146} 147 148//returns the total number of requests 149int Sequencer::getNumberOutstanding(){ 150 return m_outstanding_count; 151} 152 153// returns the total number of demand requests 154int Sequencer::getNumberOutstandingDemand(){ 155 int smt_threads = RubyConfig::numberofSMTThreads(); 156 int total_demand = 0; 157 for(int p=0; p < smt_threads; ++p){ 158 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 159 for (int i=0; i< keys.size(); i++) { 160 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]);	51Sequencer::Sequencer(AbstractChip* chip_ptr, int version) { 52 m_chip_ptr = chip_ptr; 53 m_version = version; 54 55 m_deadlock_check_scheduled = false; 56 m_outstanding_count = 0; 57 58 int smt_threads = RubyConfig::numberofSMTThreads(); 59 m_writeRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 60 m_readRequestTable_ptr = new Map<Address, CacheMsg>[smt_threads]; 61 62 for(int p=0; p < smt_threads; ++p){ 63 m_writeRequestTable_ptr[p] = new Map<Address, CacheMsg>; 64 m_readRequestTable_ptr[p] = new Map<Address, CacheMsg>; 65 } 66 67} 68 69Sequencer::~Sequencer() { 70 int smt_threads = RubyConfig::numberofSMTThreads(); 71 for(int i=0; i < smt_threads; ++i){ 72 if(m_writeRequestTable_ptr[i]){ 73 delete m_writeRequestTable_ptr[i]; 74 } 75 if(m_readRequestTable_ptr[i]){ 76 delete m_readRequestTable_ptr[i]; 77 } 78 } 79 if(m_writeRequestTable_ptr){ 80 delete [] m_writeRequestTable_ptr; 81 } 82 if(m_readRequestTable_ptr){ 83 delete [] m_readRequestTable_ptr; 84 } 85} 86 87void Sequencer::wakeup() { 88 // Check for deadlock of any of the requests 89 Time current_time = g_eventQueue_ptr->getTime(); 90 bool deadlock = false; 91 92 // Check across all outstanding requests 93 int smt_threads = RubyConfig::numberofSMTThreads(); 94 int total_outstanding = 0; 95 for(int p=0; p < smt_threads; ++p){ 96 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 97 for (int i=0; i<keys.size(); i++) { 98 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 99 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 100 WARN_MSG("Possible Deadlock detected"); 101 WARN_EXPR(request); 102 WARN_EXPR(m_chip_ptr->getID()); 103 WARN_EXPR(m_version); 104 WARN_EXPR(keys.size()); 105 WARN_EXPR(current_time); 106 WARN_EXPR(request.getTime()); 107 WARN_EXPR(current_time - request.getTime()); 108 WARN_EXPR(m_readRequestTable_ptr[p]); 109* ERROR_MSG("Aborting"); 110 deadlock = true; 111 } 112 } 113 114 keys = m_writeRequestTable_ptr[p]->keys(); 115 for (int i=0; i<keys.size(); i++) { 116 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 117 if (current_time - request.getTime() >= g_DEADLOCK_THRESHOLD) { 118 WARN_MSG("Possible Deadlock detected"); 119 WARN_EXPR(request); 120 WARN_EXPR(m_chip_ptr->getID()); 121 WARN_EXPR(m_version); 122 WARN_EXPR(current_time); 123 WARN_EXPR(request.getTime()); 124 WARN_EXPR(current_time - request.getTime()); 125 WARN_EXPR(keys.size()); 126 WARN_EXPR(m_writeRequestTable_ptr[p]); 127* ERROR_MSG("Aborting"); 128 deadlock = true; 129 } 130 } 131 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 132 } // across all request tables 133 assert(m_outstanding_count == total_outstanding); 134 135 if (m_outstanding_count > 0) { // If there are still outstanding requests, keep checking 136 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 137 } else { 138 m_deadlock_check_scheduled = false; 139 } 140} 141 142//returns the total number of requests 143int Sequencer::getNumberOutstanding(){ 144 return m_outstanding_count; 145} 146 147// returns the total number of demand requests 148int Sequencer::getNumberOutstandingDemand(){ 149 int smt_threads = RubyConfig::numberofSMTThreads(); 150 int total_demand = 0; 151 for(int p=0; p < smt_threads; ++p){ 152 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 153 for (int i=0; i< keys.size(); i++) { 154 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]);
161 // don't count transactional begin/commit requests 162 if(request.getType() != CacheRequestType_BEGIN_XACT && request.getType() != CacheRequestType_COMMIT_XACT){ 163 if(request.getPrefetch() == PrefetchBit_No){ 164 total_demand++; 165 }	155 if(request.getPrefetch() == PrefetchBit_No){ 156 total_demand++;
166 } 167 } 168 169 keys = m_writeRequestTable_ptr[p]->keys(); 170 for (int i=0; i< keys.size(); i++) { 171 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 172 if(request.getPrefetch() == PrefetchBit_No){ 173 total_demand++; 174 } 175 } 176 } 177 178 return total_demand; 179} 180 181int Sequencer::getNumberOutstandingPrefetch(){ 182 int smt_threads = RubyConfig::numberofSMTThreads(); 183 int total_prefetch = 0; 184 for(int p=0; p < smt_threads; ++p){ 185 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 186 for (int i=0; i< keys.size(); i++) { 187 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 188 if(request.getPrefetch() == PrefetchBit_Yes){ 189 total_prefetch++; 190 } 191 } 192 193 keys = m_writeRequestTable_ptr[p]->keys(); 194 for (int i=0; i< keys.size(); i++) { 195 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 196 if(request.getPrefetch() == PrefetchBit_Yes){ 197 total_prefetch++; 198 } 199 } 200 } 201 202 return total_prefetch; 203} 204 205bool Sequencer::isPrefetchRequest(const Address & lineaddr){ 206 int smt_threads = RubyConfig::numberofSMTThreads(); 207 for(int p=0; p < smt_threads; ++p){ 208 // check load requests 209 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 210 for (int i=0; i< keys.size(); i++) { 211 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 212 if(line_address(request.getAddress()) == lineaddr){ 213 if(request.getPrefetch() == PrefetchBit_Yes){ 214 return true; 215 } 216 else{ 217 return false; 218 } 219 } 220 } 221 222 // check store requests 223 keys = m_writeRequestTable_ptr[p]->keys(); 224 for (int i=0; i< keys.size(); i++) { 225 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 226 if(line_address(request.getAddress()) == lineaddr){ 227 if(request.getPrefetch() == PrefetchBit_Yes){ 228 return true; 229 } 230 else{ 231 return false; 232 } 233 } 234 } 235 } 236 // we should've found a matching request 237 cout << "isRequestPrefetch() ERROR request NOT FOUND : " << lineaddr << endl; 238 printProgress(cout); 239 assert(0); 240} 241 242AccessModeType Sequencer::getAccessModeOfRequest(Address addr, int thread){ 243 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 244 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 245 return request.getAccessMode(); 246 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 247 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 248 return request.getAccessMode(); 249 } else { 250 printProgress(cout); 251 ERROR_MSG("Request not found in RequestTables"); 252 } 253} 254 255Address Sequencer::getLogicalAddressOfRequest(Address addr, int thread){ 256 assert(thread >= 0); 257 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 258 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 259 return request.getLogicalAddress(); 260 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 261 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 262 return request.getLogicalAddress(); 263 } else { 264 printProgress(cout); 265 WARN_MSG("Request not found in RequestTables"); 266 WARN_MSG(addr); 267 WARN_MSG(thread); 268 ASSERT(0); 269 } 270} 271 272// returns the ThreadID of the request 273int Sequencer::getRequestThreadID(const Address & addr){ 274 int smt_threads = RubyConfig::numberofSMTThreads(); 275 int thread = -1; 276 int num_found = 0; 277 for(int p=0; p < smt_threads; ++p){ 278 if(m_readRequestTable_ptr[p]->exist(addr)){ 279 num_found++; 280 thread = p; 281 } 282 if(m_writeRequestTable_ptr[p]->exist(addr)){ 283 num_found++; 284 thread = p; 285 } 286 } 287 if(num_found != 1){ 288 cout << "getRequestThreadID ERROR too many matching requests addr = " << addr << endl; 289 printProgress(cout); 290 } 291 ASSERT(num_found == 1); 292 ASSERT(thread != -1); 293 294 return thread; 295} 296 297// given a line address, return the request's physical address 298Address Sequencer::getRequestPhysicalAddress(const Address & lineaddr){ 299 int smt_threads = RubyConfig::numberofSMTThreads(); 300 Address physaddr; 301 int num_found = 0; 302 for(int p=0; p < smt_threads; ++p){ 303 if(m_readRequestTable_ptr[p]->exist(lineaddr)){ 304 num_found++; 305 physaddr = (m_readRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 306 } 307 if(m_writeRequestTable_ptr[p]->exist(lineaddr)){ 308 num_found++; 309 physaddr = (m_writeRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 310 } 311 } 312 if(num_found != 1){ 313 cout << "getRequestPhysicalAddress ERROR too many matching requests addr = " << lineaddr << endl; 314 printProgress(cout); 315 } 316 ASSERT(num_found == 1); 317 318 return physaddr; 319} 320 321void Sequencer::printProgress(ostream& out) const{ 322 323 int total_demand = 0; 324 out << "Sequencer Stats Version " << m_version << endl; 325 out << "Current time = " << g_eventQueue_ptr->getTime() << endl; 326 out << "---------------" << endl; 327 out << "outstanding requests" << endl; 328 329 int smt_threads = RubyConfig::numberofSMTThreads(); 330 for(int p=0; p < smt_threads; ++p){ 331 Vector<Address> rkeys = m_readRequestTable_ptr[p]->keys(); 332 int read_size = rkeys.size(); 333 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Read Requests = " << read_size << endl; 334 // print the request table 335 for(int i=0; i < read_size; ++i){ 336 CacheMsg & request = m_readRequestTable_ptr[p]->lookup(rkeys[i]); 337 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << rkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 338 if( request.getPrefetch() == PrefetchBit_No ){ 339 total_demand++; 340 } 341 } 342 343 Vector<Address> wkeys = m_writeRequestTable_ptr[p]->keys(); 344 int write_size = wkeys.size(); 345 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Write Requests = " << write_size << endl; 346 // print the request table 347 for(int i=0; i < write_size; ++i){ 348 CacheMsg & request = m_writeRequestTable_ptr[p]->lookup(wkeys[i]); 349 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << wkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 350 if( request.getPrefetch() == PrefetchBit_No ){ 351 total_demand++; 352 } 353 } 354 355 out << endl; 356 } 357 out << "Total Number Outstanding: " << m_outstanding_count << endl; 358 out << "Total Number Demand : " << total_demand << endl; 359 out << "Total Number Prefetches : " << m_outstanding_count - total_demand << endl; 360 out << endl; 361 out << endl; 362 363} 364 365void Sequencer::printConfig(ostream& out) { 366 if (TSO) { 367 out << "sequencer: Sequencer - TSO" << endl; 368 } else { 369 out << "sequencer: Sequencer - SC" << endl; 370 } 371 out << " max_outstanding_requests: " << g_SEQUENCER_OUTSTANDING_REQUESTS << endl; 372} 373 374bool Sequencer::empty() const { 375 return m_outstanding_count == 0; 376} 377 378// Insert the request on the correct request table. Return true if 379// the entry was already present. 380bool Sequencer::insertRequest(const CacheMsg& request) { 381 int thread = request.getThreadID(); 382 assert(thread >= 0); 383 int total_outstanding = 0; 384 int smt_threads = RubyConfig::numberofSMTThreads(); 385 for(int p=0; p < smt_threads; ++p){ 386 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 387 } 388 assert(m_outstanding_count == total_outstanding); 389 390 // See if we should schedule a deadlock check 391 if (m_deadlock_check_scheduled == false) { 392 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 393 m_deadlock_check_scheduled = true; 394 } 395 396 if ((request.getType() == CacheRequestType_ST) \|\|	157 } 158 } 159 160 keys = m_writeRequestTable_ptr[p]->keys(); 161 for (int i=0; i< keys.size(); i++) { 162 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 163 if(request.getPrefetch() == PrefetchBit_No){ 164 total_demand++; 165 } 166 } 167 } 168 169 return total_demand; 170} 171 172int Sequencer::getNumberOutstandingPrefetch(){ 173 int smt_threads = RubyConfig::numberofSMTThreads(); 174 int total_prefetch = 0; 175 for(int p=0; p < smt_threads; ++p){ 176 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 177 for (int i=0; i< keys.size(); i++) { 178 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 179 if(request.getPrefetch() == PrefetchBit_Yes){ 180 total_prefetch++; 181 } 182 } 183 184 keys = m_writeRequestTable_ptr[p]->keys(); 185 for (int i=0; i< keys.size(); i++) { 186 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 187 if(request.getPrefetch() == PrefetchBit_Yes){ 188 total_prefetch++; 189 } 190 } 191 } 192 193 return total_prefetch; 194} 195 196bool Sequencer::isPrefetchRequest(const Address & lineaddr){ 197 int smt_threads = RubyConfig::numberofSMTThreads(); 198 for(int p=0; p < smt_threads; ++p){ 199 // check load requests 200 Vector<Address> keys = m_readRequestTable_ptr[p]->keys(); 201 for (int i=0; i< keys.size(); i++) { 202 CacheMsg& request = m_readRequestTable_ptr[p]->lookup(keys[i]); 203 if(line_address(request.getAddress()) == lineaddr){ 204 if(request.getPrefetch() == PrefetchBit_Yes){ 205 return true; 206 } 207 else{ 208 return false; 209 } 210 } 211 } 212 213 // check store requests 214 keys = m_writeRequestTable_ptr[p]->keys(); 215 for (int i=0; i< keys.size(); i++) { 216 CacheMsg& request = m_writeRequestTable_ptr[p]->lookup(keys[i]); 217 if(line_address(request.getAddress()) == lineaddr){ 218 if(request.getPrefetch() == PrefetchBit_Yes){ 219 return true; 220 } 221 else{ 222 return false; 223 } 224 } 225 } 226 } 227 // we should've found a matching request 228 cout << "isRequestPrefetch() ERROR request NOT FOUND : " << lineaddr << endl; 229 printProgress(cout); 230 assert(0); 231} 232 233AccessModeType Sequencer::getAccessModeOfRequest(Address addr, int thread){ 234 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 235 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 236 return request.getAccessMode(); 237 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 238 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 239 return request.getAccessMode(); 240 } else { 241 printProgress(cout); 242 ERROR_MSG("Request not found in RequestTables"); 243 } 244} 245 246Address Sequencer::getLogicalAddressOfRequest(Address addr, int thread){ 247 assert(thread >= 0); 248 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 249 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 250 return request.getLogicalAddress(); 251 } else if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 252 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 253 return request.getLogicalAddress(); 254 } else { 255 printProgress(cout); 256 WARN_MSG("Request not found in RequestTables"); 257 WARN_MSG(addr); 258 WARN_MSG(thread); 259 ASSERT(0); 260 } 261} 262 263// returns the ThreadID of the request 264int Sequencer::getRequestThreadID(const Address & addr){ 265 int smt_threads = RubyConfig::numberofSMTThreads(); 266 int thread = -1; 267 int num_found = 0; 268 for(int p=0; p < smt_threads; ++p){ 269 if(m_readRequestTable_ptr[p]->exist(addr)){ 270 num_found++; 271 thread = p; 272 } 273 if(m_writeRequestTable_ptr[p]->exist(addr)){ 274 num_found++; 275 thread = p; 276 } 277 } 278 if(num_found != 1){ 279 cout << "getRequestThreadID ERROR too many matching requests addr = " << addr << endl; 280 printProgress(cout); 281 } 282 ASSERT(num_found == 1); 283 ASSERT(thread != -1); 284 285 return thread; 286} 287 288// given a line address, return the request's physical address 289Address Sequencer::getRequestPhysicalAddress(const Address & lineaddr){ 290 int smt_threads = RubyConfig::numberofSMTThreads(); 291 Address physaddr; 292 int num_found = 0; 293 for(int p=0; p < smt_threads; ++p){ 294 if(m_readRequestTable_ptr[p]->exist(lineaddr)){ 295 num_found++; 296 physaddr = (m_readRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 297 } 298 if(m_writeRequestTable_ptr[p]->exist(lineaddr)){ 299 num_found++; 300 physaddr = (m_writeRequestTable_ptr[p]->lookup(lineaddr)).getAddress(); 301 } 302 } 303 if(num_found != 1){ 304 cout << "getRequestPhysicalAddress ERROR too many matching requests addr = " << lineaddr << endl; 305 printProgress(cout); 306 } 307 ASSERT(num_found == 1); 308 309 return physaddr; 310} 311 312void Sequencer::printProgress(ostream& out) const{ 313 314 int total_demand = 0; 315 out << "Sequencer Stats Version " << m_version << endl; 316 out << "Current time = " << g_eventQueue_ptr->getTime() << endl; 317 out << "---------------" << endl; 318 out << "outstanding requests" << endl; 319 320 int smt_threads = RubyConfig::numberofSMTThreads(); 321 for(int p=0; p < smt_threads; ++p){ 322 Vector<Address> rkeys = m_readRequestTable_ptr[p]->keys(); 323 int read_size = rkeys.size(); 324 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Read Requests = " << read_size << endl; 325 // print the request table 326 for(int i=0; i < read_size; ++i){ 327 CacheMsg & request = m_readRequestTable_ptr[p]->lookup(rkeys[i]); 328 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << rkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 329 if( request.getPrefetch() == PrefetchBit_No ){ 330 total_demand++; 331 } 332 } 333 334 Vector<Address> wkeys = m_writeRequestTable_ptr[p]->keys(); 335 int write_size = wkeys.size(); 336 out << "proc " << m_chip_ptr->getID() << " thread " << p << " Write Requests = " << write_size << endl; 337 // print the request table 338 for(int i=0; i < write_size; ++i){ 339 CacheMsg & request = m_writeRequestTable_ptr[p]->lookup(wkeys[i]); 340 out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << wkeys[i] << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl; 341 if( request.getPrefetch() == PrefetchBit_No ){ 342 total_demand++; 343 } 344 } 345 346 out << endl; 347 } 348 out << "Total Number Outstanding: " << m_outstanding_count << endl; 349 out << "Total Number Demand : " << total_demand << endl; 350 out << "Total Number Prefetches : " << m_outstanding_count - total_demand << endl; 351 out << endl; 352 out << endl; 353 354} 355 356void Sequencer::printConfig(ostream& out) { 357 if (TSO) { 358 out << "sequencer: Sequencer - TSO" << endl; 359 } else { 360 out << "sequencer: Sequencer - SC" << endl; 361 } 362 out << " max_outstanding_requests: " << g_SEQUENCER_OUTSTANDING_REQUESTS << endl; 363} 364 365bool Sequencer::empty() const { 366 return m_outstanding_count == 0; 367} 368 369// Insert the request on the correct request table. Return true if 370// the entry was already present. 371bool Sequencer::insertRequest(const CacheMsg& request) { 372 int thread = request.getThreadID(); 373 assert(thread >= 0); 374 int total_outstanding = 0; 375 int smt_threads = RubyConfig::numberofSMTThreads(); 376 for(int p=0; p < smt_threads; ++p){ 377 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 378 } 379 assert(m_outstanding_count == total_outstanding); 380 381 // See if we should schedule a deadlock check 382 if (m_deadlock_check_scheduled == false) { 383 g_eventQueue_ptr->scheduleEvent(this, g_DEADLOCK_THRESHOLD); 384 m_deadlock_check_scheduled = true; 385 } 386 387 if ((request.getType() == CacheRequestType_ST) \|\|
397 (request.getType() == CacheRequestType_ST_XACT) \|\| 398 (request.getType() == CacheRequestType_LDX_XACT) \|\|
399 (request.getType() == CacheRequestType_ATOMIC)) { 400 if (m_writeRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 401 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 402 return true; 403 } 404 m_writeRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 405 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 406 m_outstanding_count++; 407 } else { 408 if (m_readRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 409 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 410 return true; 411 } 412 m_readRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 413 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 414 m_outstanding_count++; 415 } 416 417 g_system_ptr->getProfiler()->sequencerRequests(m_outstanding_count); 418 419 total_outstanding = 0; 420 for(int p=0; p < smt_threads; ++p){ 421 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 422 } 423 424 assert(m_outstanding_count == total_outstanding); 425 return false; 426} 427 428void Sequencer::removeRequest(const CacheMsg& request) { 429 int thread = request.getThreadID(); 430 assert(thread >= 0); 431 int total_outstanding = 0; 432 int smt_threads = RubyConfig::numberofSMTThreads(); 433 for(int p=0; p < smt_threads; ++p){ 434 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 435 } 436 assert(m_outstanding_count == total_outstanding); 437 438 if ((request.getType() == CacheRequestType_ST) \|\|	388 (request.getType() == CacheRequestType_ATOMIC)) { 389 if (m_writeRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 390 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 391 return true; 392 } 393 m_writeRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 394 m_writeRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 395 m_outstanding_count++; 396 } else { 397 if (m_readRequestTable_ptr[thread]->exist(line_address(request.getAddress()))) { 398 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 399 return true; 400 } 401 m_readRequestTable_ptr[thread]->allocate(line_address(request.getAddress())); 402 m_readRequestTable_ptr[thread]->lookup(line_address(request.getAddress())) = request; 403 m_outstanding_count++; 404 } 405 406 g_system_ptr->getProfiler()->sequencerRequests(m_outstanding_count); 407 408 total_outstanding = 0; 409 for(int p=0; p < smt_threads; ++p){ 410 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 411 } 412 413 assert(m_outstanding_count == total_outstanding); 414 return false; 415} 416 417void Sequencer::removeRequest(const CacheMsg& request) { 418 int thread = request.getThreadID(); 419 assert(thread >= 0); 420 int total_outstanding = 0; 421 int smt_threads = RubyConfig::numberofSMTThreads(); 422 for(int p=0; p < smt_threads; ++p){ 423 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 424 } 425 assert(m_outstanding_count == total_outstanding); 426 427 if ((request.getType() == CacheRequestType_ST) \|\|
439 (request.getType() == CacheRequestType_ST_XACT) \|\| 440 (request.getType() == CacheRequestType_LDX_XACT) \|\|
441 (request.getType() == CacheRequestType_ATOMIC)) { 442 m_writeRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 443 } else { 444 m_readRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 445 } 446 m_outstanding_count--; 447 448 total_outstanding = 0; 449 for(int p=0; p < smt_threads; ++p){ 450 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 451 } 452 assert(m_outstanding_count == total_outstanding); 453} 454 455void Sequencer::writeCallback(const Address& address) { 456 DataBlock data; 457 writeCallback(address, data); 458} 459 460void Sequencer::writeCallback(const Address& address, DataBlock& data) { 461 // process oldest thread first 462 int thread = -1; 463 Time oldest_time = 0; 464 int smt_threads = RubyConfig::numberofSMTThreads(); 465 for(int t=0; t < smt_threads; ++t){ 466 if(m_writeRequestTable_ptr[t]->exist(address)){ 467 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 468 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 469 thread = t; 470 oldest_time = request.getTime(); 471 } 472 } 473 } 474 // make sure we found an oldest thread 475 ASSERT(thread != -1); 476 477 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 478 479 writeCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 480} 481 482void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 483 484 assert(address == line_address(address)); 485 assert(thread >= 0); 486 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 487 488 writeCallback(address, data, respondingMach, thread); 489 490} 491 492void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 493 assert(address == line_address(address)); 494 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 495 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 496 assert( request.getThreadID() == thread); 497 removeRequest(request); 498 499 assert((request.getType() == CacheRequestType_ST) \|\|	428 (request.getType() == CacheRequestType_ATOMIC)) { 429 m_writeRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 430 } else { 431 m_readRequestTable_ptr[thread]->deallocate(line_address(request.getAddress())); 432 } 433 m_outstanding_count--; 434 435 total_outstanding = 0; 436 for(int p=0; p < smt_threads; ++p){ 437 total_outstanding += m_writeRequestTable_ptr[p]->size() + m_readRequestTable_ptr[p]->size(); 438 } 439 assert(m_outstanding_count == total_outstanding); 440} 441 442void Sequencer::writeCallback(const Address& address) { 443 DataBlock data; 444 writeCallback(address, data); 445} 446 447void Sequencer::writeCallback(const Address& address, DataBlock& data) { 448 // process oldest thread first 449 int thread = -1; 450 Time oldest_time = 0; 451 int smt_threads = RubyConfig::numberofSMTThreads(); 452 for(int t=0; t < smt_threads; ++t){ 453 if(m_writeRequestTable_ptr[t]->exist(address)){ 454 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 455 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 456 thread = t; 457 oldest_time = request.getTime(); 458 } 459 } 460 } 461 // make sure we found an oldest thread 462 ASSERT(thread != -1); 463 464 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 465 466 writeCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 467} 468 469void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 470 471 assert(address == line_address(address)); 472 assert(thread >= 0); 473 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 474 475 writeCallback(address, data, respondingMach, thread); 476 477} 478 479void Sequencer::writeCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 480 assert(address == line_address(address)); 481 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 482 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 483 assert( request.getThreadID() == thread); 484 removeRequest(request); 485 486 assert((request.getType() == CacheRequestType_ST) \|\|
500 (request.getType() == CacheRequestType_ST_XACT) \|\| 501 (request.getType() == CacheRequestType_LDX_XACT) \|\|
502 (request.getType() == CacheRequestType_ATOMIC)); 503 504 hitCallback(request, data, respondingMach, thread); 505 506} 507 508void Sequencer::readCallback(const Address& address) { 509 DataBlock data; 510 readCallback(address, data); 511} 512 513void Sequencer::readCallback(const Address& address, DataBlock& data) { 514 // process oldest thread first 515 int thread = -1; 516 Time oldest_time = 0; 517 int smt_threads = RubyConfig::numberofSMTThreads(); 518 for(int t=0; t < smt_threads; ++t){ 519 if(m_readRequestTable_ptr[t]->exist(address)){ 520 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 521 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 522 thread = t; 523 oldest_time = request.getTime(); 524 } 525 } 526 } 527 // make sure we found an oldest thread 528 ASSERT(thread != -1); 529 530 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 531 532 readCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 533} 534 535void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 536 537 assert(address == line_address(address)); 538 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 539 540 readCallback(address, data, respondingMach, thread); 541} 542 543void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 544 assert(address == line_address(address)); 545 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 546 547 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 548 assert( request.getThreadID() == thread ); 549 removeRequest(request); 550 551 assert((request.getType() == CacheRequestType_LD) \|\|	487 (request.getType() == CacheRequestType_ATOMIC)); 488 489 hitCallback(request, data, respondingMach, thread); 490 491} 492 493void Sequencer::readCallback(const Address& address) { 494 DataBlock data; 495 readCallback(address, data); 496} 497 498void Sequencer::readCallback(const Address& address, DataBlock& data) { 499 // process oldest thread first 500 int thread = -1; 501 Time oldest_time = 0; 502 int smt_threads = RubyConfig::numberofSMTThreads(); 503 for(int t=0; t < smt_threads; ++t){ 504 if(m_readRequestTable_ptr[t]->exist(address)){ 505 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 506 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 507 thread = t; 508 oldest_time = request.getTime(); 509 } 510 } 511 } 512 // make sure we found an oldest thread 513 ASSERT(thread != -1); 514 515 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 516 517 readCallback(address, data, GenericMachineType_NULL, PrefetchBit_No, thread); 518} 519 520void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, PrefetchBit pf, int thread) { 521 522 assert(address == line_address(address)); 523 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 524 525 readCallback(address, data, respondingMach, thread); 526} 527 528void Sequencer::readCallback(const Address& address, DataBlock& data, GenericMachineType respondingMach, int thread) { 529 assert(address == line_address(address)); 530 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 531 532 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 533 assert( request.getThreadID() == thread ); 534 removeRequest(request); 535 536 assert((request.getType() == CacheRequestType_LD) \|\|
552 (request.getType() == CacheRequestType_LD_XACT) \|\|
553 (request.getType() == CacheRequestType_IFETCH) 554 ); 555 556 hitCallback(request, data, respondingMach, thread); 557} 558 559void Sequencer::hitCallback(const CacheMsg& request, DataBlock& data, GenericMachineType respondingMach, int thread) { 560 int size = request.getSize(); 561 Address request_address = request.getAddress(); 562 Address request_logical_address = request.getLogicalAddress(); 563 Address request_line_address = line_address(request_address); 564 CacheRequestType type = request.getType(); 565 int threadID = request.getThreadID(); 566 Time issued_time = request.getTime(); 567 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 568 569 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 570 571 // Set this cache entry to the most recently used 572 if (type == CacheRequestType_IFETCH) { 573 if (Protocol::m_TwoLevelCache) { 574 if (m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 575 m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->setMRU(request_line_address); 576 } 577 } 578 else { 579 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 580 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 581 } 582 } 583 } else { 584 if (Protocol::m_TwoLevelCache) { 585 if (m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 586 m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->setMRU(request_line_address); 587 } 588 } 589 else { 590 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 591 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 592 } 593 } 594 } 595 596 assert(g_eventQueue_ptr->getTime() >= issued_time); 597 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 598 599 if (PROTOCOL_DEBUG_TRACE) { 600 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Done", "", 601* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 602 } 603 604 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 605 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 606 if (request.getPrefetch() == PrefetchBit_Yes) { 607 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 608 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 609 return; // Ignore the software prefetch, don't callback the driver 610 } 611 612 // Profile the miss latency for all non-zero demand misses 613 if (miss_latency != 0) { 614 g_system_ptr->getProfiler()->missLatency(miss_latency, type, respondingMach); 615 616#if 0 617 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 618 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 619 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 620 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 621 cout << "END PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl; 622#endif 623 624 } 625 626 bool write = 627 (type == CacheRequestType_ST) \|\|	537 (request.getType() == CacheRequestType_IFETCH) 538 ); 539 540 hitCallback(request, data, respondingMach, thread); 541} 542 543void Sequencer::hitCallback(const CacheMsg& request, DataBlock& data, GenericMachineType respondingMach, int thread) { 544 int size = request.getSize(); 545 Address request_address = request.getAddress(); 546 Address request_logical_address = request.getLogicalAddress(); 547 Address request_line_address = line_address(request_address); 548 CacheRequestType type = request.getType(); 549 int threadID = request.getThreadID(); 550 Time issued_time = request.getTime(); 551 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 552 553 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 554 555 // Set this cache entry to the most recently used 556 if (type == CacheRequestType_IFETCH) { 557 if (Protocol::m_TwoLevelCache) { 558 if (m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 559 m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->setMRU(request_line_address); 560 } 561 } 562 else { 563 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 564 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 565 } 566 } 567 } else { 568 if (Protocol::m_TwoLevelCache) { 569 if (m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 570 m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->setMRU(request_line_address); 571 } 572 } 573 else { 574 if (m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->isTagPresent(request_line_address)) { 575 m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->setMRU(request_line_address); 576 } 577 } 578 } 579 580 assert(g_eventQueue_ptr->getTime() >= issued_time); 581 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 582 583 if (PROTOCOL_DEBUG_TRACE) { 584 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Done", "", 585* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 586 } 587 588 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 589 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 590 if (request.getPrefetch() == PrefetchBit_Yes) { 591 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 592 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 593 return; // Ignore the software prefetch, don't callback the driver 594 } 595 596 // Profile the miss latency for all non-zero demand misses 597 if (miss_latency != 0) { 598 g_system_ptr->getProfiler()->missLatency(miss_latency, type, respondingMach); 599 600#if 0 601 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 602 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 603 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 604 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 605 cout << "END PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl; 606#endif 607 608 } 609 610 bool write = 611 (type == CacheRequestType_ST) \|\|
628 (type == CacheRequestType_ST_XACT) \|\| 629 (type == CacheRequestType_LDX_XACT) \|\|
630 (type == CacheRequestType_ATOMIC); 631 632 if (TSO && write) { 633 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->callBack(line_address(request.getAddress()), data); 634 } else { 635 636 // Copy the correct bytes out of the cache line into the subblock 637 SubBlock subblock(request_address, request_logical_address, size); 638 subblock.mergeFrom(data); // copy the correct bytes from DataBlock in the SubBlock 639 640 // Scan the store buffer to see if there are any outstanding stores we need to collect 641 if (TSO) { 642 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->updateSubBlock(subblock); 643 } 644 645 // Call into the Driver (Tester or Simics) and let it read and/or modify the sub-block 646 g_system_ptr->getDriver()->hitCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 647* 648 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 649 // (This is only triggered for the non-TSO case) 650 if (write) { 651 assert(!TSO); 652 subblock.mergeTo(data); // copy the correct bytes from SubBlock into the DataBlock 653 } 654 } 655} 656	612 (type == CacheRequestType_ATOMIC); 613 614 if (TSO && write) { 615 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->callBack(line_address(request.getAddress()), data); 616 } else { 617 618 // Copy the correct bytes out of the cache line into the subblock 619 SubBlock subblock(request_address, request_logical_address, size); 620 subblock.mergeFrom(data); // copy the correct bytes from DataBlock in the SubBlock 621 622 // Scan the store buffer to see if there are any outstanding stores we need to collect 623 if (TSO) { 624 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->updateSubBlock(subblock); 625 } 626 627 // Call into the Driver (Tester or Simics) and let it read and/or modify the sub-block 628 g_system_ptr->getDriver()->hitCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 629* 630 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 631 // (This is only triggered for the non-TSO case) 632 if (write) { 633 assert(!TSO); 634 subblock.mergeTo(data); // copy the correct bytes from SubBlock into the DataBlock 635 } 636 } 637} 638
657void Sequencer::readConflictCallback(const Address& address) { 658 // process oldest thread first 659 int thread = -1; 660 Time oldest_time = 0; 661 int smt_threads = RubyConfig::numberofSMTThreads(); 662 for(int t=0; t < smt_threads; ++t){ 663 if(m_readRequestTable_ptr[t]->exist(address)){ 664 CacheMsg & request = m_readRequestTable_ptr[t]->lookup(address); 665 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 666 thread = t; 667 oldest_time = request.getTime(); 668 } 669 } 670 } 671 // make sure we found an oldest thread 672 ASSERT(thread != -1); 673 674 CacheMsg & request = m_readRequestTable_ptr[thread]->lookup(address); 675 676 readConflictCallback(address, GenericMachineType_NULL, thread); 677} 678 679void Sequencer::readConflictCallback(const Address& address, GenericMachineType respondingMach, int thread) { 680 assert(address == line_address(address)); 681 assert(m_readRequestTable_ptr[thread]->exist(line_address(address))); 682 683 CacheMsg request = m_readRequestTable_ptr[thread]->lookup(address); 684 assert( request.getThreadID() == thread ); 685 removeRequest(request); 686 687 assert((request.getType() == CacheRequestType_LD) \|\| 688 (request.getType() == CacheRequestType_LD_XACT) \|\| 689 (request.getType() == CacheRequestType_IFETCH) 690 ); 691 692 conflictCallback(request, respondingMach, thread); 693} 694 695void Sequencer::writeConflictCallback(const Address& address) { 696 // process oldest thread first 697 int thread = -1; 698 Time oldest_time = 0; 699 int smt_threads = RubyConfig::numberofSMTThreads(); 700 for(int t=0; t < smt_threads; ++t){ 701 if(m_writeRequestTable_ptr[t]->exist(address)){ 702 CacheMsg & request = m_writeRequestTable_ptr[t]->lookup(address); 703 if(thread == -1 \|\| (request.getTime() < oldest_time) ){ 704 thread = t; 705 oldest_time = request.getTime(); 706 } 707 } 708 } 709 // make sure we found an oldest thread 710 ASSERT(thread != -1); 711 712 CacheMsg & request = m_writeRequestTable_ptr[thread]->lookup(address); 713 714 writeConflictCallback(address, GenericMachineType_NULL, thread); 715} 716 717void Sequencer::writeConflictCallback(const Address& address, GenericMachineType respondingMach, int thread) { 718 assert(address == line_address(address)); 719 assert(m_writeRequestTable_ptr[thread]->exist(line_address(address))); 720 CacheMsg request = m_writeRequestTable_ptr[thread]->lookup(address); 721 assert( request.getThreadID() == thread); 722 removeRequest(request); 723 724 assert((request.getType() == CacheRequestType_ST) \|\| 725 (request.getType() == CacheRequestType_ST_XACT) \|\| 726 (request.getType() == CacheRequestType_LDX_XACT) \|\| 727 (request.getType() == CacheRequestType_ATOMIC)); 728 729 conflictCallback(request, respondingMach, thread); 730 731} 732 733void Sequencer::conflictCallback(const CacheMsg& request, GenericMachineType respondingMach, int thread) { 734 assert(XACT_MEMORY); 735 int size = request.getSize(); 736 Address request_address = request.getAddress(); 737 Address request_logical_address = request.getLogicalAddress(); 738 Address request_line_address = line_address(request_address); 739 CacheRequestType type = request.getType(); 740 int threadID = request.getThreadID(); 741 Time issued_time = request.getTime(); 742 int logical_proc_no = ((m_chip_ptr->getID() * RubyConfig::numberOfProcsPerChip()) + m_version) * RubyConfig::numberofSMTThreads() + threadID; 743 744 DEBUG_MSG(SEQUENCER_COMP, MedPrio, size); 745 746 assert(g_eventQueue_ptr->getTime() >= issued_time); 747 Time miss_latency = g_eventQueue_ptr->getTime() - issued_time; 748 749 if (PROTOCOL_DEBUG_TRACE) { 750 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), -1, request.getAddress(), "", "Conflict", "", 751* int_to_string(miss_latency)+" cycles "+GenericMachineType_to_string(respondingMach)+" "+CacheRequestType_to_string(request.getType())+" "+PrefetchBit_to_string(request.getPrefetch())); 752 } 753 754 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request_address); 755 DEBUG_MSG(SEQUENCER_COMP, MedPrio, request.getPrefetch()); 756 if (request.getPrefetch() == PrefetchBit_Yes) { 757 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "return"); 758 g_system_ptr->getProfiler()->swPrefetchLatency(miss_latency, type, respondingMach); 759 return; // Ignore the software prefetch, don't callback the driver 760 } 761 762 bool write = 763 (type == CacheRequestType_ST) \|\| 764 (type == CacheRequestType_ST_XACT) \|\| 765 (type == CacheRequestType_LDX_XACT) \|\| 766 (type == CacheRequestType_ATOMIC); 767 768 // Copy the correct bytes out of the cache line into the subblock 769 SubBlock subblock(request_address, request_logical_address, size); 770 771 // Call into the Driver (Tester or Simics) 772 g_system_ptr->getDriver()->conflictCallback(m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, subblock, type, threadID); 773* 774 // If the request was a Store or Atomic, apply the changes in the SubBlock to the DataBlock 775 // (This is only triggered for the non-TSO case) 776 if (write) { 777 assert(!TSO); 778 } 779} 780
781void Sequencer::printDebug(){ 782 //notify driver of debug 783 g_system_ptr->getDriver()->printDebug(); 784} 785 786// Returns true if the sequencer already has a load or store outstanding 787bool 788Sequencer::isReady(const Packet* pkt) const 789{ 790 791 int cpu_number = pkt->req->contextId(); 792 la_t logical_addr = pkt->req->getVaddr(); 793 pa_t physical_addr = pkt->req->getPaddr(); 794 CacheRequestType type_of_request; 795 if ( pkt->req->isInstFetch() ) { 796 type_of_request = CacheRequestType_IFETCH; 797 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 798 type_of_request = CacheRequestType_ATOMIC; 799 } else if ( pkt->isRead() ) { 800 type_of_request = CacheRequestType_LD; 801 } else if ( pkt->isWrite() ) { 802 type_of_request = CacheRequestType_ST; 803 } else { 804 assert(false); 805 } 806 int thread = pkt->req->threadId(); 807 808 CacheMsg request(Address( physical_addr ), 809 Address( physical_addr ), 810 type_of_request, 811 Address(0), 812 AccessModeType_UserMode, // User/supervisor mode 813 0, // Size in bytes of request 814 PrefetchBit_No, // Not a prefetch 815 0, // Version number 816 Address(logical_addr), // Virtual Address	639void Sequencer::printDebug(){ 640 //notify driver of debug 641 g_system_ptr->getDriver()->printDebug(); 642} 643 644// Returns true if the sequencer already has a load or store outstanding 645bool 646Sequencer::isReady(const Packet* pkt) const 647{ 648 649 int cpu_number = pkt->req->contextId(); 650 la_t logical_addr = pkt->req->getVaddr(); 651 pa_t physical_addr = pkt->req->getPaddr(); 652 CacheRequestType type_of_request; 653 if ( pkt->req->isInstFetch() ) { 654 type_of_request = CacheRequestType_IFETCH; 655 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 656 type_of_request = CacheRequestType_ATOMIC; 657 } else if ( pkt->isRead() ) { 658 type_of_request = CacheRequestType_LD; 659 } else if ( pkt->isWrite() ) { 660 type_of_request = CacheRequestType_ST; 661 } else { 662 assert(false); 663 } 664 int thread = pkt->req->threadId(); 665 666 CacheMsg request(Address( physical_addr ), 667 Address( physical_addr ), 668 type_of_request, 669 Address(0), 670 AccessModeType_UserMode, // User/supervisor mode 671 0, // Size in bytes of request 672 PrefetchBit_No, // Not a prefetch 673 0, // Version number 674 Address(logical_addr), // Virtual Address
817 thread, // SMT thread 818 0, // TM specific - timestamp of memory request 819 false // TM specific - whether request is part of escape action	675 thread // SMT thread
820 ); 821 isReady(request); 822} 823 824bool 825Sequencer::isReady(const CacheMsg& request) const 826{ 827 if (m_outstanding_count >= g_SEQUENCER_OUTSTANDING_REQUESTS) { 828 //cout << "TOO MANY OUTSTANDING: " << m_outstanding_count << " " << g_SEQUENCER_OUTSTANDING_REQUESTS << " VER " << m_version << endl; 829 //printProgress(cout); 830 return false; 831 } 832 833 // This code allows reads to be performed even when we have a write 834 // request outstanding for the line 835 bool write = 836 (request.getType() == CacheRequestType_ST) \|\|	676 ); 677 isReady(request); 678} 679 680bool 681Sequencer::isReady(const CacheMsg& request) const 682{ 683 if (m_outstanding_count >= g_SEQUENCER_OUTSTANDING_REQUESTS) { 684 //cout << "TOO MANY OUTSTANDING: " << m_outstanding_count << " " << g_SEQUENCER_OUTSTANDING_REQUESTS << " VER " << m_version << endl; 685 //printProgress(cout); 686 return false; 687 } 688 689 // This code allows reads to be performed even when we have a write 690 // request outstanding for the line 691 bool write = 692 (request.getType() == CacheRequestType_ST) \|\|
837 (request.getType() == CacheRequestType_ST_XACT) \|\| 838 (request.getType() == CacheRequestType_LDX_XACT) \|\|
839 (request.getType() == CacheRequestType_ATOMIC); 840 841 // LUKE - disallow more than one request type per address 842 // INVARIANT: at most one request type per address, per processor 843 int smt_threads = RubyConfig::numberofSMTThreads(); 844 for(int p=0; p < smt_threads; ++p){ 845 if( m_writeRequestTable_ptr[p]->exist(line_address(request.getAddress())) \|\| 846 m_readRequestTable_ptr[p]->exist(line_address(request.getAddress())) ){ 847 //cout << "OUTSTANDING REQUEST EXISTS " << p << " VER " << m_version << endl; 848 //printProgress(cout); 849 return false; 850 } 851 } 852 853 if (TSO) { 854 return m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady(); 855 } 856 return true; 857} 858 859// Called by Driver (Simics or Tester). 860void 861Sequencer::makeRequest(const Packet* pkt, void* data) 862{ 863 int cpu_number = pkt->req->contextId(); 864 la_t logical_addr = pkt->req->getVaddr(); 865 pa_t physical_addr = pkt->req->getPaddr(); 866 int request_size = pkt->getSize(); 867 CacheRequestType type_of_request; 868 if ( pkt->req->isInstFetch() ) { 869 type_of_request = CacheRequestType_IFETCH; 870 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 871 type_of_request = CacheRequestType_ATOMIC; 872 } else if ( pkt->isRead() ) { 873 type_of_request = CacheRequestType_LD; 874 } else if ( pkt->isWrite() ) { 875 type_of_request = CacheRequestType_ST; 876 } else { 877 assert(false); 878 } 879 la_t virtual_pc = pkt->req->getPC(); 880 int isPriv = false; // TODO: get permission data 881 int thread = pkt->req->threadId(); 882 883 AccessModeType access_mode = AccessModeType_UserMode; // TODO: get actual permission 884 885 CacheMsg request(Address( physical_addr ), 886 Address( physical_addr ), 887 type_of_request, 888 Address(virtual_pc), 889 access_mode, // User/supervisor mode 890 request_size, // Size in bytes of request 891 PrefetchBit_No, // Not a prefetch 892 0, // Version number 893 Address(logical_addr), // Virtual Address	693 (request.getType() == CacheRequestType_ATOMIC); 694 695 // LUKE - disallow more than one request type per address 696 // INVARIANT: at most one request type per address, per processor 697 int smt_threads = RubyConfig::numberofSMTThreads(); 698 for(int p=0; p < smt_threads; ++p){ 699 if( m_writeRequestTable_ptr[p]->exist(line_address(request.getAddress())) \|\| 700 m_readRequestTable_ptr[p]->exist(line_address(request.getAddress())) ){ 701 //cout << "OUTSTANDING REQUEST EXISTS " << p << " VER " << m_version << endl; 702 //printProgress(cout); 703 return false; 704 } 705 } 706 707 if (TSO) { 708 return m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady(); 709 } 710 return true; 711} 712 713// Called by Driver (Simics or Tester). 714void 715Sequencer::makeRequest(const Packet* pkt, void* data) 716{ 717 int cpu_number = pkt->req->contextId(); 718 la_t logical_addr = pkt->req->getVaddr(); 719 pa_t physical_addr = pkt->req->getPaddr(); 720 int request_size = pkt->getSize(); 721 CacheRequestType type_of_request; 722 if ( pkt->req->isInstFetch() ) { 723 type_of_request = CacheRequestType_IFETCH; 724 } else if ( pkt->req->isLocked() \|\| pkt->req->isSwap() ) { 725 type_of_request = CacheRequestType_ATOMIC; 726 } else if ( pkt->isRead() ) { 727 type_of_request = CacheRequestType_LD; 728 } else if ( pkt->isWrite() ) { 729 type_of_request = CacheRequestType_ST; 730 } else { 731 assert(false); 732 } 733 la_t virtual_pc = pkt->req->getPC(); 734 int isPriv = false; // TODO: get permission data 735 int thread = pkt->req->threadId(); 736 737 AccessModeType access_mode = AccessModeType_UserMode; // TODO: get actual permission 738 739 CacheMsg request(Address( physical_addr ), 740 Address( physical_addr ), 741 type_of_request, 742 Address(virtual_pc), 743 access_mode, // User/supervisor mode 744 request_size, // Size in bytes of request 745 PrefetchBit_No, // Not a prefetch 746 0, // Version number 747 Address(logical_addr), // Virtual Address
894 thread, // SMT thread 895 0, // TM specific - timestamp of memory request 896 false // TM specific - whether request is part of escape action	748 thread // SMT thread
897 ); 898 makeRequest(request); 899} 900 901void 902Sequencer::makeRequest(const CacheMsg& request) 903{ 904 bool write = (request.getType() == CacheRequestType_ST) \|\|	749 ); 750 makeRequest(request); 751} 752 753void 754Sequencer::makeRequest(const CacheMsg& request) 755{ 756 bool write = (request.getType() == CacheRequestType_ST) \|\|
905 (request.getType() == CacheRequestType_ST_XACT) \|\| 906 (request.getType() == CacheRequestType_LDX_XACT) \|\|
907 (request.getType() == CacheRequestType_ATOMIC); 908 909 if (TSO && (request.getPrefetch() == PrefetchBit_No) && write) { 910 assert(m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady()); 911 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->insertStore(request); 912 return; 913 } 914 915 bool hit = doRequest(request); 916 917} 918 919bool Sequencer::doRequest(const CacheMsg& request) { 920 bool hit = false; 921 // Check the fast path 922 DataBlock* data_ptr; 923 924 int thread = request.getThreadID(); 925 926 hit = tryCacheAccess(line_address(request.getAddress()), 927 request.getType(), 928 request.getProgramCounter(), 929 request.getAccessMode(), 930 request.getSize(), 931 data_ptr); 932 933 if (hit && (request.getType() == CacheRequestType_IFETCH \|\| !REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) ) { 934 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path hit"); 935 hitCallback(request, data_ptr, GenericMachineType_L1Cache, thread); 936* return true; 937 } 938 939#if 0 940 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 941 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 942 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 943 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 944 cout << "START PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl;; 945#endif 946 947 if (TSO && (request.getType() == CacheRequestType_LD \|\| request.getType() == CacheRequestType_IFETCH)) { 948 949 // See if we can satisfy the load entirely from the store buffer 950 SubBlock subblock(line_address(request.getAddress()), request.getSize()); 951 if (m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->trySubBlock(subblock)) { 952 DataBlock dummy; 953 hitCallback(request, dummy, GenericMachineType_NULL, thread); // Call with an 'empty' datablock, since the data is in the store buffer 954 return true; 955 } 956 } 957 958 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path miss"); 959 issueRequest(request); 960 return hit; 961} 962 963void Sequencer::issueRequest(const CacheMsg& request) { 964 bool found = insertRequest(request); 965 966 if (!found) { 967 CacheMsg msg = request; 968 msg.getAddress() = line_address(request.getAddress()); // Make line address 969 970 // Fast Path L1 misses are profiled here - all non-fast path misses are profiled within the generated protocol code 971 if (!REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) { 972 g_system_ptr->getProfiler()->addPrimaryStatSample(msg, m_chip_ptr->getID()); 973 } 974 975 if (PROTOCOL_DEBUG_TRACE) { 976 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip() + m_version), -1, msg.getAddress(),"", "Begin", "", CacheRequestType_to_string(request.getType())); 977* } 978 979#if 0 980 // Commented out by nate binkert because I removed the trace stuff 981 if (g_system_ptr->getTracer()->traceEnabled()) { 982 g_system_ptr->getTracer()->traceRequest((m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), msg.getAddress(), msg.getProgramCounter(), 983* msg.getType(), g_eventQueue_ptr->getTime()); 984 } 985#endif 986 987 Time latency = 0; // initialzed to an null value 988 989 latency = SEQUENCER_TO_CONTROLLER_LATENCY; 990 991 // Send the message to the cache controller 992 assert(latency > 0); 993 m_chip_ptr->m_L1Cache_mandatoryQueue_vec[m_version]->enqueue(msg, latency); 994 995 } // !found 996} 997 998bool Sequencer::tryCacheAccess(const Address& addr, CacheRequestType type, 999 const Address& pc, AccessModeType access_mode, 1000 int size, DataBlock& data_ptr) { 1001* if (type == CacheRequestType_IFETCH) { 1002 if (Protocol::m_TwoLevelCache) { 1003 return m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1004 } 1005 else { 1006 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1007 } 1008 } else { 1009 if (Protocol::m_TwoLevelCache) { 1010 return m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1011 } 1012 else { 1013 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 1014 } 1015 } 1016} 1017 1018void Sequencer::resetRequestTime(const Address& addr, int thread){ 1019 assert(thread >= 0); 1020 //reset both load and store requests, if they exist 1021 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 1022 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 1023 if( request.m_AccessMode != AccessModeType_UserMode){ 1024 cout << "resetRequestType ERROR read request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 1025 printProgress(cout); 1026 } 1027 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 1028 request.setTime(g_eventQueue_ptr->getTime()); 1029 } 1030 if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 1031 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 1032 if( request.m_AccessMode != AccessModeType_UserMode){ 1033 cout << "resetRequestType ERROR write request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 1034 printProgress(cout); 1035 } 1036 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 1037 request.setTime(g_eventQueue_ptr->getTime()); 1038 } 1039} 1040 1041// removes load request from queue 1042void Sequencer::removeLoadRequest(const Address & addr, int thread){ 1043 removeRequest(getReadRequest(addr, thread)); 1044} 1045 1046void Sequencer::removeStoreRequest(const Address & addr, int thread){ 1047 removeRequest(getWriteRequest(addr, thread)); 1048} 1049 1050// returns the read CacheMsg 1051CacheMsg & Sequencer::getReadRequest( const Address & addr, int thread ){ 1052 Address temp = addr; 1053 assert(thread >= 0); 1054 assert(temp == line_address(temp)); 1055 assert(m_readRequestTable_ptr[thread]->exist(addr)); 1056 return m_readRequestTable_ptr[thread]->lookup(addr); 1057} 1058 1059CacheMsg & Sequencer::getWriteRequest( const Address & addr, int thread){ 1060 Address temp = addr; 1061 assert(thread >= 0); 1062 assert(temp == line_address(temp)); 1063 assert(m_writeRequestTable_ptr[thread]->exist(addr)); 1064 return m_writeRequestTable_ptr[thread]->lookup(addr); 1065} 1066 1067void Sequencer::print(ostream& out) const { 1068 out << "[Sequencer: " << m_chip_ptr->getID() 1069 << ", outstanding requests: " << m_outstanding_count; 1070 1071 int smt_threads = RubyConfig::numberofSMTThreads(); 1072 for(int p=0; p < smt_threads; ++p){ 1073 out << ", read request table[ " << p << " ]: " << m_readRequestTable_ptr[p] 1074* << ", write request table[ " << p << " ]: " << m_writeRequestTable_ptr[p]; 1075* } 1076 out << "]"; 1077} 1078 1079// this can be called from setState whenever coherence permissions are upgraded 1080// when invoked, coherence violations will be checked for the given block 1081void Sequencer::checkCoherence(const Address& addr) { 1082#ifdef CHECK_COHERENCE 1083 g_system_ptr->checkGlobalCoherenceInvariant(addr); 1084#endif 1085} 1086 1087bool Sequencer::getRubyMemoryValue(const Address& addr, char* value, 1088 unsigned int size_in_bytes ) { 1089 if(g_SIMICS){ 1090 for(unsigned int i=0; i < size_in_bytes; i++) { 1091 value[i] = SIMICS_read_physical_memory( m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, 1092* addr.getAddress() + i, 1 ); 1093 } 1094 return false; // Do nothing? 1095 } else { 1096 bool found = false; 1097 const Address lineAddr = line_address(addr); 1098 DataBlock data; 1099 PhysAddress paddr(addr); 1100 DataBlock* dataPtr = &data; 1101 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1102* // LUKE - use variable names instead of macros 1103 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1104 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1105 1106 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1107 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1108 1109 if (Protocol::m_TwoLevelCache) { 1110 if(Protocol::m_CMP){ 1111 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1112 } 1113 else{ 1114 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1115 } 1116 } 1117 1118 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1119 n->m_L1Cache_L1IcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 1120 found = true; 1121 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1122 n->m_L1Cache_L1DcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 1123 found = true; 1124 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1125 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->getMemoryValue(addr, value, size_in_bytes); 1126 found = true; 1127 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)){ 1128 // ASSERT(n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)); 1129 // L1Cache_TBE tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1130 1131 // int offset = addr.getOffset(); 1132 // for(int i=0; i<size_in_bytes; ++i){ 1133 // value[i] = tbeEntry.getDataBlk().getByte(offset + i); 1134 // } 1135 1136 // found = true; 1137 } else { 1138 // Address not found 1139 //cout << " " << m_chip_ptr->getID() << " NOT IN CACHE, Value at Directory is: " << (int) value[0] << endl; 1140 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1141* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1142 for(unsigned int i=0; i<size_in_bytes; ++i){ 1143 int offset = addr.getOffset(); 1144 value[i] = n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.getByte(offset + i); 1145 } 1146 // Address not found 1147 //WARN_MSG("Couldn't find address"); 1148 //WARN_EXPR(addr); 1149 found = false; 1150 } 1151 return true; 1152 } 1153} 1154 1155bool Sequencer::setRubyMemoryValue(const Address& addr, char value, 1156* unsigned int size_in_bytes) { 1157 char test_buffer[64]; 1158 1159 if(g_SIMICS){ 1160 return false; // Do nothing? 1161 } else { 1162 // idea here is that coherent cache should find the 1163 // latest data, the update it 1164 bool found = false; 1165 const Address lineAddr = line_address(addr); 1166 PhysAddress paddr(addr); 1167 DataBlock data; 1168 DataBlock* dataPtr = &data; 1169 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1170* 1171 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1172 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1173 // LUKE - use variable names instead of macros 1174 //cout << "number of L2caches per chip = " << RubyConfig::numberOfL2CachePerChip(m_version) << endl; 1175 //cout << "L1I cache vec size = " << n->m_L1Cache_L1IcacheMemory_vec.size() << endl; 1176 //cout << "L1D cache vec size = " << n->m_L1Cache_L1DcacheMemory_vec.size() << endl; 1177 //cout << "L1cache_cachememory size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1178 //cout << "L1cache_l2cachememory size = " << n->m_L1Cache_L2cacheMemory_vec.size() << endl; 1179 // if (Protocol::m_TwoLevelCache) { 1180 // if(Protocol::m_CMP){ 1181 // cout << "CMP L2 cache vec size = " << n->m_L2Cache_L2cacheMemory_vec.size() << endl; 1182 // } 1183 // else{ 1184 // cout << "L2 cache vec size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1185 // } 1186 // } 1187 1188 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1189 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1190 if (Protocol::m_TwoLevelCache) { 1191 if(Protocol::m_CMP){ 1192 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1193 } 1194 else{ 1195 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1196 } 1197 } 1198 1199 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1200 n->m_L1Cache_L1IcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1201 found = true; 1202 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1203 n->m_L1Cache_L1DcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1204 found = true; 1205 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1206 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->setMemoryValue(addr, value, size_in_bytes); 1207 found = true; 1208 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isTagPresent(lineAddr)){ 1209 // L1Cache_TBE& tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1210 // DataBlock tmpData; 1211 // int offset = addr.getOffset(); 1212 // for(int i=0; i<size_in_bytes; ++i){ 1213 // tmpData.setByte(offset + i, value[i]); 1214 // } 1215 // tbeEntry.setDataBlk(tmpData); 1216 // tbeEntry.setDirty(true); 1217 } else { 1218 // Address not found 1219 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1220* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1221 for(unsigned int i=0; i<size_in_bytes; ++i){ 1222 int offset = addr.getOffset(); 1223 n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.setByte(offset + i, value[i]); 1224 } 1225 found = false; 1226 } 1227 1228 if (found){ 1229 found = getRubyMemoryValue(addr, test_buffer, size_in_bytes); 1230 assert(found); 1231 if(value[0] != test_buffer[0]){ 1232 WARN_EXPR((int) value[0]); 1233 WARN_EXPR((int) test_buffer[0]); 1234 ERROR_MSG("setRubyMemoryValue failed to set value."); 1235 } 1236 } 1237 1238 return true; 1239 } 1240}	757 (request.getType() == CacheRequestType_ATOMIC); 758 759 if (TSO && (request.getPrefetch() == PrefetchBit_No) && write) { 760 assert(m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->isReady()); 761 m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->insertStore(request); 762 return; 763 } 764 765 bool hit = doRequest(request); 766 767} 768 769bool Sequencer::doRequest(const CacheMsg& request) { 770 bool hit = false; 771 // Check the fast path 772 DataBlock* data_ptr; 773 774 int thread = request.getThreadID(); 775 776 hit = tryCacheAccess(line_address(request.getAddress()), 777 request.getType(), 778 request.getProgramCounter(), 779 request.getAccessMode(), 780 request.getSize(), 781 data_ptr); 782 783 if (hit && (request.getType() == CacheRequestType_IFETCH \|\| !REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) ) { 784 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path hit"); 785 hitCallback(request, data_ptr, GenericMachineType_L1Cache, thread); 786* return true; 787 } 788 789#if 0 790 uinteger_t tick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick")); 791 uinteger_t tick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "tick_cmpr")); 792 uinteger_t stick = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick")); 793 uinteger_t stick_cmpr = SIMICS_read_control_register(m_version, SIMICS_get_register_number(m_version, "stick_cmpr")); 794 cout << "START PROC " << m_version << hex << " tick = " << tick << " tick_cmpr = " << tick_cmpr << " stick = " << stick << " stick_cmpr = " << stick_cmpr << " cycle = "<< g_eventQueue_ptr->getTime() << dec << endl;; 795#endif 796 797 if (TSO && (request.getType() == CacheRequestType_LD \|\| request.getType() == CacheRequestType_IFETCH)) { 798 799 // See if we can satisfy the load entirely from the store buffer 800 SubBlock subblock(line_address(request.getAddress()), request.getSize()); 801 if (m_chip_ptr->m_L1Cache_storeBuffer_vec[m_version]->trySubBlock(subblock)) { 802 DataBlock dummy; 803 hitCallback(request, dummy, GenericMachineType_NULL, thread); // Call with an 'empty' datablock, since the data is in the store buffer 804 return true; 805 } 806 } 807 808 DEBUG_MSG(SEQUENCER_COMP, MedPrio, "Fast path miss"); 809 issueRequest(request); 810 return hit; 811} 812 813void Sequencer::issueRequest(const CacheMsg& request) { 814 bool found = insertRequest(request); 815 816 if (!found) { 817 CacheMsg msg = request; 818 msg.getAddress() = line_address(request.getAddress()); // Make line address 819 820 // Fast Path L1 misses are profiled here - all non-fast path misses are profiled within the generated protocol code 821 if (!REMOVE_SINGLE_CYCLE_DCACHE_FAST_PATH) { 822 g_system_ptr->getProfiler()->addPrimaryStatSample(msg, m_chip_ptr->getID()); 823 } 824 825 if (PROTOCOL_DEBUG_TRACE) { 826 g_system_ptr->getProfiler()->profileTransition("Seq", (m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip() + m_version), -1, msg.getAddress(),"", "Begin", "", CacheRequestType_to_string(request.getType())); 827* } 828 829#if 0 830 // Commented out by nate binkert because I removed the trace stuff 831 if (g_system_ptr->getTracer()->traceEnabled()) { 832 g_system_ptr->getTracer()->traceRequest((m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version), msg.getAddress(), msg.getProgramCounter(), 833* msg.getType(), g_eventQueue_ptr->getTime()); 834 } 835#endif 836 837 Time latency = 0; // initialzed to an null value 838 839 latency = SEQUENCER_TO_CONTROLLER_LATENCY; 840 841 // Send the message to the cache controller 842 assert(latency > 0); 843 m_chip_ptr->m_L1Cache_mandatoryQueue_vec[m_version]->enqueue(msg, latency); 844 845 } // !found 846} 847 848bool Sequencer::tryCacheAccess(const Address& addr, CacheRequestType type, 849 const Address& pc, AccessModeType access_mode, 850 int size, DataBlock& data_ptr) { 851* if (type == CacheRequestType_IFETCH) { 852 if (Protocol::m_TwoLevelCache) { 853 return m_chip_ptr->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 854 } 855 else { 856 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 857 } 858 } else { 859 if (Protocol::m_TwoLevelCache) { 860 return m_chip_ptr->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 861 } 862 else { 863 return m_chip_ptr->m_L1Cache_cacheMemory_vec[m_version]->tryCacheAccess(line_address(addr), type, data_ptr); 864 } 865 } 866} 867 868void Sequencer::resetRequestTime(const Address& addr, int thread){ 869 assert(thread >= 0); 870 //reset both load and store requests, if they exist 871 if(m_readRequestTable_ptr[thread]->exist(line_address(addr))){ 872 CacheMsg& request = m_readRequestTable_ptr[thread]->lookup(addr); 873 if( request.m_AccessMode != AccessModeType_UserMode){ 874 cout << "resetRequestType ERROR read request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 875 printProgress(cout); 876 } 877 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 878 request.setTime(g_eventQueue_ptr->getTime()); 879 } 880 if(m_writeRequestTable_ptr[thread]->exist(line_address(addr))){ 881 CacheMsg& request = m_writeRequestTable_ptr[thread]->lookup(addr); 882 if( request.m_AccessMode != AccessModeType_UserMode){ 883 cout << "resetRequestType ERROR write request addr = " << addr << " thread = "<< thread << " is SUPERVISOR MODE" << endl; 884 printProgress(cout); 885 } 886 //ASSERT(request.m_AccessMode == AccessModeType_UserMode); 887 request.setTime(g_eventQueue_ptr->getTime()); 888 } 889} 890 891// removes load request from queue 892void Sequencer::removeLoadRequest(const Address & addr, int thread){ 893 removeRequest(getReadRequest(addr, thread)); 894} 895 896void Sequencer::removeStoreRequest(const Address & addr, int thread){ 897 removeRequest(getWriteRequest(addr, thread)); 898} 899 900// returns the read CacheMsg 901CacheMsg & Sequencer::getReadRequest( const Address & addr, int thread ){ 902 Address temp = addr; 903 assert(thread >= 0); 904 assert(temp == line_address(temp)); 905 assert(m_readRequestTable_ptr[thread]->exist(addr)); 906 return m_readRequestTable_ptr[thread]->lookup(addr); 907} 908 909CacheMsg & Sequencer::getWriteRequest( const Address & addr, int thread){ 910 Address temp = addr; 911 assert(thread >= 0); 912 assert(temp == line_address(temp)); 913 assert(m_writeRequestTable_ptr[thread]->exist(addr)); 914 return m_writeRequestTable_ptr[thread]->lookup(addr); 915} 916 917void Sequencer::print(ostream& out) const { 918 out << "[Sequencer: " << m_chip_ptr->getID() 919 << ", outstanding requests: " << m_outstanding_count; 920 921 int smt_threads = RubyConfig::numberofSMTThreads(); 922 for(int p=0; p < smt_threads; ++p){ 923 out << ", read request table[ " << p << " ]: " << m_readRequestTable_ptr[p] 924* << ", write request table[ " << p << " ]: " << m_writeRequestTable_ptr[p]; 925* } 926 out << "]"; 927} 928 929// this can be called from setState whenever coherence permissions are upgraded 930// when invoked, coherence violations will be checked for the given block 931void Sequencer::checkCoherence(const Address& addr) { 932#ifdef CHECK_COHERENCE 933 g_system_ptr->checkGlobalCoherenceInvariant(addr); 934#endif 935} 936 937bool Sequencer::getRubyMemoryValue(const Address& addr, char* value, 938 unsigned int size_in_bytes ) { 939 if(g_SIMICS){ 940 for(unsigned int i=0; i < size_in_bytes; i++) { 941 value[i] = SIMICS_read_physical_memory( m_chip_ptr->getID()RubyConfig::numberOfProcsPerChip()+m_version, 942* addr.getAddress() + i, 1 ); 943 } 944 return false; // Do nothing? 945 } else { 946 bool found = false; 947 const Address lineAddr = line_address(addr); 948 DataBlock data; 949 PhysAddress paddr(addr); 950 DataBlock* dataPtr = &data; 951 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 952* // LUKE - use variable names instead of macros 953 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 954 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 955 956 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 957 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 958 959 if (Protocol::m_TwoLevelCache) { 960 if(Protocol::m_CMP){ 961 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 962 } 963 else{ 964 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 965 } 966 } 967 968 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 969 n->m_L1Cache_L1IcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 970 found = true; 971 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 972 n->m_L1Cache_L1DcacheMemory_vec[m_version]->getMemoryValue(addr, value, size_in_bytes); 973 found = true; 974 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 975 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->getMemoryValue(addr, value, size_in_bytes); 976 found = true; 977 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)){ 978 // ASSERT(n->TBE_TABLE_MEMBER_VARIABLE->isPresent(lineAddr)); 979 // L1Cache_TBE tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 980 981 // int offset = addr.getOffset(); 982 // for(int i=0; i<size_in_bytes; ++i){ 983 // value[i] = tbeEntry.getDataBlk().getByte(offset + i); 984 // } 985 986 // found = true; 987 } else { 988 // Address not found 989 //cout << " " << m_chip_ptr->getID() << " NOT IN CACHE, Value at Directory is: " << (int) value[0] << endl; 990 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 991* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 992 for(unsigned int i=0; i<size_in_bytes; ++i){ 993 int offset = addr.getOffset(); 994 value[i] = n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.getByte(offset + i); 995 } 996 // Address not found 997 //WARN_MSG("Couldn't find address"); 998 //WARN_EXPR(addr); 999 found = false; 1000 } 1001 return true; 1002 } 1003} 1004 1005bool Sequencer::setRubyMemoryValue(const Address& addr, char value, 1006* unsigned int size_in_bytes) { 1007 char test_buffer[64]; 1008 1009 if(g_SIMICS){ 1010 return false; // Do nothing? 1011 } else { 1012 // idea here is that coherent cache should find the 1013 // latest data, the update it 1014 bool found = false; 1015 const Address lineAddr = line_address(addr); 1016 PhysAddress paddr(addr); 1017 DataBlock data; 1018 DataBlock* dataPtr = &data; 1019 Chip* n = dynamic_cast<Chip>(m_chip_ptr); 1020* 1021 MachineID l2_mach = map_L2ChipId_to_L2Cache(addr, m_chip_ptr->getID() ); 1022 int l2_ver = l2_mach.num%RubyConfig::numberOfL2CachePerChip(); 1023 // LUKE - use variable names instead of macros 1024 //cout << "number of L2caches per chip = " << RubyConfig::numberOfL2CachePerChip(m_version) << endl; 1025 //cout << "L1I cache vec size = " << n->m_L1Cache_L1IcacheMemory_vec.size() << endl; 1026 //cout << "L1D cache vec size = " << n->m_L1Cache_L1DcacheMemory_vec.size() << endl; 1027 //cout << "L1cache_cachememory size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1028 //cout << "L1cache_l2cachememory size = " << n->m_L1Cache_L2cacheMemory_vec.size() << endl; 1029 // if (Protocol::m_TwoLevelCache) { 1030 // if(Protocol::m_CMP){ 1031 // cout << "CMP L2 cache vec size = " << n->m_L2Cache_L2cacheMemory_vec.size() << endl; 1032 // } 1033 // else{ 1034 // cout << "L2 cache vec size = " << n->m_L1Cache_cacheMemory_vec.size() << endl; 1035 // } 1036 // } 1037 1038 assert(n->m_L1Cache_L1IcacheMemory_vec[m_version] != NULL); 1039 assert(n->m_L1Cache_L1DcacheMemory_vec[m_version] != NULL); 1040 if (Protocol::m_TwoLevelCache) { 1041 if(Protocol::m_CMP){ 1042 assert(n->m_L2Cache_L2cacheMemory_vec[l2_ver] != NULL); 1043 } 1044 else{ 1045 assert(n->m_L1Cache_cacheMemory_vec[m_version] != NULL); 1046 } 1047 } 1048 1049 if (n->m_L1Cache_L1IcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_IFETCH, dataPtr)){ 1050 n->m_L1Cache_L1IcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1051 found = true; 1052 } else if (n->m_L1Cache_L1DcacheMemory_vec[m_version]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1053 n->m_L1Cache_L1DcacheMemory_vec[m_version]->setMemoryValue(addr, value, size_in_bytes); 1054 found = true; 1055 } else if (Protocol::m_CMP && n->m_L2Cache_L2cacheMemory_vec[l2_ver]->tryCacheAccess(lineAddr, CacheRequestType_LD, dataPtr)){ 1056 n->m_L2Cache_L2cacheMemory_vec[l2_ver]->setMemoryValue(addr, value, size_in_bytes); 1057 found = true; 1058 // } else if (n->TBE_TABLE_MEMBER_VARIABLE->isTagPresent(lineAddr)){ 1059 // L1Cache_TBE& tbeEntry = n->TBE_TABLE_MEMBER_VARIABLE->lookup(lineAddr); 1060 // DataBlock tmpData; 1061 // int offset = addr.getOffset(); 1062 // for(int i=0; i<size_in_bytes; ++i){ 1063 // tmpData.setByte(offset + i, value[i]); 1064 // } 1065 // tbeEntry.setDataBlk(tmpData); 1066 // tbeEntry.setDirty(true); 1067 } else { 1068 // Address not found 1069 n = dynamic_cast<Chip>(g_system_ptr->getChip(map_Address_to_DirectoryNode(addr)/RubyConfig::numberOfDirectoryPerChip())); 1070* int dir_version = map_Address_to_DirectoryNode(addr)%RubyConfig::numberOfDirectoryPerChip(); 1071 for(unsigned int i=0; i<size_in_bytes; ++i){ 1072 int offset = addr.getOffset(); 1073 n->m_Directory_directory_vec[dir_version]->lookup(lineAddr).m_DataBlk.setByte(offset + i, value[i]); 1074 } 1075 found = false; 1076 } 1077 1078 if (found){ 1079 found = getRubyMemoryValue(addr, test_buffer, size_in_bytes); 1080 assert(found); 1081 if(value[0] != test_buffer[0]){ 1082 WARN_EXPR((int) value[0]); 1083 WARN_EXPR((int) test_buffer[0]); 1084 ERROR_MSG("setRubyMemoryValue failed to set value."); 1085 } 1086 } 1087 1088 return true; 1089 } 1090}