Sequencer.cc revision 6763:5a879a3513dc
/*
 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "mem/ruby/common/Global.hh"
#include "mem/ruby/system/Sequencer.hh"
#include "mem/ruby/system/System.hh"
#include "mem/protocol/Protocol.hh"
#include "mem/ruby/profiler/Profiler.hh"
#include "mem/ruby/system/CacheMemory.hh"
#include "mem/protocol/CacheMsg.hh"
#include "mem/ruby/recorder/Tracer.hh"
#include "mem/ruby/common/SubBlock.hh"
#include "mem/gems_common/Map.hh"
#include "mem/ruby/buffers/MessageBuffer.hh"
#include "mem/ruby/slicc_interface/AbstractController.hh"

//Sequencer::Sequencer(int core_id, MessageBuffer* mandatory_q)

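// LLSC_FAIL is returned by makeRequest() when a Locked_Write (store-conditional)
// finds that its line is no longer locked for this sequencer's version.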
#define LLSC_FAIL -2
ostream& operator<<(std::ostream& out, const SequencerRequest& obj) {
  out << obj.ruby_request << flush;
  return out;
}

Sequencer::Sequencer(const string & name)
  :RubyPort(name)
{
}

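// init() consumes the configuration vector as "parameter value" pairs and wires
// the sequencer to its cache controller, instruction cache, and data cache.
// Every required parameter must be supplied; the asserts at the end enforce this.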
void Sequencer::init(const vector<string> & argv)
{
  m_deadlock_check_scheduled = false;
  m_outstanding_count = 0;

  m_max_outstanding_requests = 0;
  m_deadlock_threshold = 0;
  m_version = -1;
  m_instCache_ptr = NULL;
  m_dataCache_ptr = NULL;
  m_controller = NULL;
  m_servicing_atomic = -1;
  m_atomics_counter = 0;
  for (size_t i=0; i<argv.size(); i+=2) {
    if ( argv[i] == "controller") {
      m_controller = RubySystem::getController(argv[i+1]); // args[i] = "L1Cache"
      m_mandatory_q_ptr = m_controller->getMandatoryQueue();
    } else if ( argv[i] == "icache")
      m_instCache_ptr = RubySystem::getCache(argv[i+1]);
    else if ( argv[i] == "dcache")
      m_dataCache_ptr = RubySystem::getCache(argv[i+1]);
    else if ( argv[i] == "version")
      m_version = atoi(argv[i+1].c_str());
    else if ( argv[i] == "max_outstanding_requests")
      m_max_outstanding_requests = atoi(argv[i+1].c_str());
    else if ( argv[i] == "deadlock_threshold")
      m_deadlock_threshold = atoi(argv[i+1].c_str());
    else {
      cerr << "WARNING: Sequencer: Unknown configuration parameter: " << argv[i] << endl;
      assert(false);
    }
  }
  assert(m_max_outstanding_requests > 0);
  assert(m_deadlock_threshold > 0);
  assert(m_version > -1);
  assert(m_instCache_ptr != NULL);
  assert(m_dataCache_ptr != NULL);
  assert(m_controller != NULL);
}

Sequencer::~Sequencer() {

}

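// wakeup() is the deadlock watchdog: it is scheduled whenever requests are
// outstanding, scans both request tables, and aborts the simulation if any
// request has been waiting longer than m_deadlock_threshold cycles.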
void Sequencer::wakeup() {
  // Check for deadlock of any of the requests
  Time current_time = g_eventQueue_ptr->getTime();

  // Check across all outstanding requests
  int total_outstanding = 0;

  Vector<Address> keys = m_readRequestTable.keys();
  for (int i=0; i<keys.size(); i++) {
    SequencerRequest* request = m_readRequestTable.lookup(keys[i]);
    if (current_time - request->issue_time >= m_deadlock_threshold) {
      WARN_MSG("Possible Deadlock detected");
      WARN_EXPR(request->ruby_request);
      WARN_EXPR(m_version);
      WARN_EXPR(keys.size());
      WARN_EXPR(current_time);
      WARN_EXPR(request->issue_time);
      WARN_EXPR(current_time - request->issue_time);
      ERROR_MSG("Aborting");
    }
  }

  keys = m_writeRequestTable.keys();
  for (int i=0; i<keys.size(); i++) {
    SequencerRequest* request = m_writeRequestTable.lookup(keys[i]);
    if (current_time - request->issue_time >= m_deadlock_threshold) {
      WARN_MSG("Possible Deadlock detected");
      WARN_EXPR(request->ruby_request);
      WARN_EXPR(m_version);
      WARN_EXPR(current_time);
      WARN_EXPR(request->issue_time);
      WARN_EXPR(current_time - request->issue_time);
      WARN_EXPR(keys.size());
      ERROR_MSG("Aborting");
    }
  }
  total_outstanding += m_writeRequestTable.size() + m_readRequestTable.size();

  assert(m_outstanding_count == total_outstanding);

  if (m_outstanding_count > 0) { // If there are still outstanding requests, keep checking
    g_eventQueue_ptr->scheduleEvent(this, m_deadlock_threshold);
  } else {
    m_deadlock_check_scheduled = false;
  }
}

void Sequencer::printProgress(ostream& out) const{
  /*
  int total_demand = 0;
  out << "Sequencer Stats Version " << m_version << endl;
  out << "Current time = " << g_eventQueue_ptr->getTime() << endl;
  out << "---------------" << endl;
  out << "outstanding requests" << endl;

  Vector<Address> rkeys = m_readRequestTable.keys();
  int read_size = rkeys.size();
  out << "proc " << m_version << " Read Requests = " << read_size << endl;
  // print the request table
  for(int i=0; i < read_size; ++i){
    SequencerRequest * request = m_readRequestTable.lookup(rkeys[i]);
    out << "\tRequest[ " << i << " ] = " << request->type << " Address " << rkeys[i]  << " Posted " << request->issue_time << " PF " << PrefetchBit_No << endl;
    total_demand++;
  }

  Vector<Address> wkeys = m_writeRequestTable.keys();
  int write_size = wkeys.size();
  out << "proc " << m_version << " Write Requests = " << write_size << endl;
  // print the request table
  for(int i=0; i < write_size; ++i){
      CacheMsg & request = m_writeRequestTable.lookup(wkeys[i]);
      out << "\tRequest[ " << i << " ] = " << request.getType() << " Address " << wkeys[i]  << " Posted " << request.getTime() << " PF " << request.getPrefetch() << endl;
      if( request.getPrefetch() == PrefetchBit_No ){
        total_demand++;
      }
  }

  out << endl;

  out << "Total Number Outstanding: " << m_outstanding_count << endl;
  out << "Total Number Demand     : " << total_demand << endl;
  out << "Total Number Prefetches : " << m_outstanding_count - total_demand << endl;
  out << endl;
  out << endl;
  */
}

void Sequencer::printConfig(ostream& out) const {
  out << "Sequencer config: " << m_name << endl;
  out << "  controller: " << m_controller->getName() << endl;
  out << "  version: " << m_version << endl;
  out << "  max_outstanding_requests: " << m_max_outstanding_requests << endl;
  out << "  deadlock_threshold: " << m_deadlock_threshold << endl;
}

// Insert the request into the read or write request table, keyed by line
// address.  Intended to return true if an entry was already present, but a
// duplicate currently trips an assert, so the function always returns false.
bool Sequencer::insertRequest(SequencerRequest* request) {
  int total_outstanding = m_writeRequestTable.size() + m_readRequestTable.size();

  assert(m_outstanding_count == total_outstanding);

  // See if we should schedule a deadlock check
  if (m_deadlock_check_scheduled == false) {
    g_eventQueue_ptr->scheduleEvent(this, m_deadlock_threshold);
    m_deadlock_check_scheduled = true;
  }

  Address line_addr(request->ruby_request.paddr);
  line_addr.makeLineAddress();
  if ((request->ruby_request.type == RubyRequestType_ST) ||
      (request->ruby_request.type == RubyRequestType_RMW_Read) ||
      (request->ruby_request.type == RubyRequestType_RMW_Write) ||
      (request->ruby_request.type == RubyRequestType_Locked_Read) ||
      (request->ruby_request.type == RubyRequestType_Locked_Write)) {
    if (m_writeRequestTable.exist(line_addr)) {
      m_writeRequestTable.lookup(line_addr) = request;
      //      return true;
      assert(0); // drh5: isn't this an error?  do you lose the initial request?
    }
    m_writeRequestTable.allocate(line_addr);
    m_writeRequestTable.lookup(line_addr) = request;
    m_outstanding_count++;
  } else {
    if (m_readRequestTable.exist(line_addr)) {
      m_readRequestTable.lookup(line_addr) = request;
      //      return true;
      assert(0); // drh5: isn't this an error?  do you lose the initial request?
    }
    m_readRequestTable.allocate(line_addr);
    m_readRequestTable.lookup(line_addr) = request;
    m_outstanding_count++;
  }

  g_system_ptr->getProfiler()->sequencerRequests(m_outstanding_count);

  total_outstanding = m_writeRequestTable.size() + m_readRequestTable.size();
  assert(m_outstanding_count == total_outstanding);

  return false;
}

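// removeRequest() retires a completed request from whichever table holds it
// and decrements the outstanding-request count.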
void Sequencer::removeRequest(SequencerRequest* srequest) {

  assert(m_outstanding_count == m_writeRequestTable.size() + m_readRequestTable.size());

  const RubyRequest & ruby_request = srequest->ruby_request;
  Address line_addr(ruby_request.paddr);
  line_addr.makeLineAddress();
  if ((ruby_request.type == RubyRequestType_ST) ||
      (ruby_request.type == RubyRequestType_RMW_Read) ||
      (ruby_request.type == RubyRequestType_RMW_Write) ||
      (ruby_request.type == RubyRequestType_Locked_Read) ||
      (ruby_request.type == RubyRequestType_Locked_Write)) {
    m_writeRequestTable.deallocate(line_addr);
  } else {
    m_readRequestTable.deallocate(line_addr);
  }
  m_outstanding_count--;

  assert(m_outstanding_count == m_writeRequestTable.size() + m_readRequestTable.size());
}

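// writeCallback() is invoked by the cache controller when a store, locked
// access, or atomic completes.  It also sets the LL/SC lock for Locked_Read
// and brackets an RMW sequence by setting/clearing the controller's atomic state.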
void Sequencer::writeCallback(const Address& address, DataBlock& data) {

  assert(address == line_address(address));
  assert(m_writeRequestTable.exist(line_address(address)));

  SequencerRequest* request = m_writeRequestTable.lookup(address);
  removeRequest(request);

  assert((request->ruby_request.type == RubyRequestType_ST) ||
         (request->ruby_request.type == RubyRequestType_RMW_Read) ||
         (request->ruby_request.type == RubyRequestType_RMW_Write) ||
         (request->ruby_request.type == RubyRequestType_Locked_Read) ||
         (request->ruby_request.type == RubyRequestType_Locked_Write));
  // POLINA: the assumption is that atomics are only on data cache and not instruction cache
  if (request->ruby_request.type == RubyRequestType_Locked_Read) {
    m_dataCache_ptr->setLocked(address, m_version);
  }
  else if (request->ruby_request.type == RubyRequestType_RMW_Read) {
    m_controller->set_atomic(address);
  }
  else if (request->ruby_request.type == RubyRequestType_RMW_Write) {
    m_controller->clear_atomic();
  }

  hitCallback(request, data);
}

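// readCallback() is the controller's completion path for loads and ifetches.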
void Sequencer::readCallback(const Address& address, DataBlock& data) {

  assert(address == line_address(address));
  assert(m_readRequestTable.exist(line_address(address)));

  SequencerRequest* request = m_readRequestTable.lookup(address);
  removeRequest(request);

  assert((request->ruby_request.type == RubyRequestType_LD) ||
         (request->ruby_request.type == RubyRequestType_RMW_Read) ||
         (request->ruby_request.type == RubyRequestType_IFETCH));

  hitCallback(request, data);
}

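// hitCallback() finishes a request on either completion path: it touches the
// MRU state of the relevant cache, profiles the miss latency, copies data
// between the DataBlock and the requestor's buffer (direction depends on the
// request type), notifies the requestor via m_hit_callback, and frees the
// SequencerRequest.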
void Sequencer::hitCallback(SequencerRequest* srequest, DataBlock& data) {
  const RubyRequest & ruby_request = srequest->ruby_request;
  Address request_address(ruby_request.paddr);
  Address request_line_address(ruby_request.paddr);
  request_line_address.makeLineAddress();
  RubyRequestType type = ruby_request.type;
  Time issued_time = srequest->issue_time;

  // Set this cache entry to the most recently used
  if (type == RubyRequestType_IFETCH) {
    if (m_instCache_ptr->isTagPresent(request_line_address) )
      m_instCache_ptr->setMRU(request_line_address);
  } else {
    if (m_dataCache_ptr->isTagPresent(request_line_address) )
      m_dataCache_ptr->setMRU(request_line_address);
  }

  assert(g_eventQueue_ptr->getTime() >= issued_time);
  Time miss_latency = g_eventQueue_ptr->getTime() - issued_time;

  // Profile the miss latency for all non-zero demand misses
  if (miss_latency != 0) {
    g_system_ptr->getProfiler()->missLatency(miss_latency, type);

    if (Debug::getProtocolTrace()) {
      g_system_ptr->getProfiler()->profileTransition("Seq", m_version, Address(ruby_request.paddr),
                                                     "", "Done", "", int_to_string(miss_latency)+" cycles");
    }
  }
  /*
  if (request.getPrefetch() == PrefetchBit_Yes) {
    return; // Ignore the prefetch
  }
  */

  // update the data
  if (ruby_request.data != NULL) {
    if ((type == RubyRequestType_LD) ||
        (type == RubyRequestType_IFETCH) ||
        (type == RubyRequestType_RMW_Read)) {
      memcpy(ruby_request.data, data.getData(request_address.getOffset(), ruby_request.len), ruby_request.len);
    } else {
      data.setData(ruby_request.data, request_address.getOffset(), ruby_request.len);
    }
  }

  m_hit_callback(srequest->id);
  delete srequest;
}

// Returns true if the sequencer can accept this request now: it must be below
// its outstanding-request limit, have no request outstanding for the same
// cache line, and not be servicing another processor's atomic (RMW) sequence.
bool Sequencer::isReady(const RubyRequest& request) {
  // POLINA: if we are currently flushing the write buffer, Ruby should report
  // itself as not ready, to simulate stalling of the front-end.
  // Do we stall all the sequencers? For an atomic instruction - yes!
  if (m_outstanding_count >= m_max_outstanding_requests) {
    return false;
  }

  if( m_writeRequestTable.exist(line_address(Address(request.paddr))) ||
      m_readRequestTable.exist(line_address(Address(request.paddr))) ){
    //cout << "OUTSTANDING REQUEST EXISTS " << p << " VER " << m_version << endl;
    //printProgress(cout);
    return false;
  }

  if (m_servicing_atomic != -1 && m_servicing_atomic != (int)request.proc_id) {
    assert(m_atomics_counter > 0);
    return false;
  }
  else {
    if (request.type == RubyRequestType_RMW_Read) {
      if (m_servicing_atomic == -1) {
        assert(m_atomics_counter == 0);
        m_servicing_atomic = (int)request.proc_id;
      }
      else {
        assert(m_servicing_atomic == (int)request.proc_id);
      }
      m_atomics_counter++;
    }
    else if (request.type == RubyRequestType_RMW_Write) {
      assert(m_servicing_atomic == (int)request.proc_id);
      assert(m_atomics_counter > 0);
      m_atomics_counter--;
      if (m_atomics_counter == 0) {
        m_servicing_atomic = -1;
      }
    }
  }

  return true;
}

bool Sequencer::empty() const {
  return (m_writeRequestTable.size() == 0) && (m_readRequestTable.size() == 0);
}

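// makeRequest() is the CPU-facing entry point.  If the sequencer is ready it
// records the request, performs the store-conditional check for Locked_Write,
// enqueues the request to the cache controller, and returns a unique request
// id; it returns LLSC_FAIL for a failed store-conditional and -1 when the
// sequencer cannot accept the request.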
int64_t Sequencer::makeRequest(const RubyRequest & request)
{
  assert(Address(request.paddr).getOffset() + request.len <= RubySystem::getBlockSizeBytes());
  if (isReady(request)) {
    int64_t id = makeUniqueRequestID();
    SequencerRequest *srequest = new SequencerRequest(request, id, g_eventQueue_ptr->getTime());
    bool found = insertRequest(srequest);
    if (!found) {
      if (request.type == RubyRequestType_Locked_Write) {
        // NOTE: it is OK to check the locked flag here as the mandatory queue will be checked first
        // ensuring that nothing comes between checking the flag and servicing the store
        if (!m_dataCache_ptr->isLocked(line_address(Address(request.paddr)), m_version)) {
          return LLSC_FAIL;
        }
        else {
          m_dataCache_ptr->clearLocked(line_address(Address(request.paddr)));
        }
      }
      if (request.type == RubyRequestType_RMW_Write) {
        m_controller->started_writes();
      }
      issueRequest(request);
    }

    // TODO: issue hardware prefetches here
    return id;
  }
  else {
    return -1;
  }
}

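// issueRequest() translates the RubyRequest into the protocol's CacheMsg,
// optionally emits protocol-trace and tracer records, and enqueues the message
// on the controller's mandatory queue after the appropriate L1 cache latency.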
void Sequencer::issueRequest(const RubyRequest& request) {

  // TODO: get rid of CacheMsg, CacheRequestType, and AccessModeType, & have SLICC use RubyRequest and subtypes natively
  CacheRequestType ctype;
  switch(request.type) {
  case RubyRequestType_IFETCH:
    ctype = CacheRequestType_IFETCH;
    break;
  case RubyRequestType_LD:
    ctype = CacheRequestType_LD;
    break;
  case RubyRequestType_ST:
    ctype = CacheRequestType_ST;
    break;
  case RubyRequestType_Locked_Read:
    ctype = CacheRequestType_ST;
    break;
  case RubyRequestType_Locked_Write:
    ctype = CacheRequestType_ST;
    break;
  case RubyRequestType_RMW_Read:
    ctype = CacheRequestType_ATOMIC;
    break;
  case RubyRequestType_RMW_Write:
    ctype = CacheRequestType_ATOMIC;
    break;
  default:
    assert(0);
  }
  AccessModeType amtype;
  switch(request.access_mode){
  case RubyAccessMode_User:
    amtype = AccessModeType_UserMode;
    break;
  case RubyAccessMode_Supervisor:
    amtype = AccessModeType_SupervisorMode;
    break;
  case RubyAccessMode_Device:
    amtype = AccessModeType_UserMode;
    break;
  default:
    assert(0);
  }
  Address line_addr(request.paddr);
  line_addr.makeLineAddress();
  CacheMsg msg(line_addr, Address(request.paddr), ctype, Address(request.pc), amtype, request.len, PrefetchBit_No, request.proc_id);

  if (Debug::getProtocolTrace()) {
    g_system_ptr->getProfiler()->profileTransition("Seq", m_version, Address(request.paddr),
                                                   "", "Begin", "", RubyRequestType_to_string(request.type));
  }

  if (g_system_ptr->getTracer()->traceEnabled()) {
    g_system_ptr->getTracer()->traceRequest(m_name, line_addr, Address(request.pc),
                                            request.type, g_eventQueue_ptr->getTime());
  }

  Time latency = 0;  // initialized to an invalid value; set from the cache latency below

  if (request.type == RubyRequestType_IFETCH)
    latency = m_instCache_ptr->getLatency();
  else
    latency = m_dataCache_ptr->getLatency();

  // Send the message to the cache controller
  assert(latency > 0);


  m_mandatory_q_ptr->enqueue(msg, latency);
}
/*
bool Sequencer::tryCacheAccess(const Address& addr, CacheRequestType type,
                               AccessModeType access_mode,
                               int size, DataBlock*& data_ptr) {
  if (type == CacheRequestType_IFETCH) {
    return m_instCache_ptr->tryCacheAccess(line_address(addr), type, data_ptr);
  } else {
    return m_dataCache_ptr->tryCacheAccess(line_address(addr), type, data_ptr);
  }
}
*/

void Sequencer::print(ostream& out) const {
  out << "[Sequencer: " << m_version
      << ", outstanding requests: " << m_outstanding_count;

  out << ", read request table: " << m_readRequestTable
      << ", write request table: " << m_writeRequestTable;
  out << "]";
}

// this can be called from setState whenever coherence permissions are upgraded
// when invoked, coherence violations will be checked for the given block
void Sequencer::checkCoherence(const Address& addr) {
#ifdef CHECK_COHERENCE
  g_system_ptr->checkGlobalCoherenceInvariant(addr);
#endif
}