Deleted Added
sdiff udiff text old ( 8532:8f27cf8971fe ) new ( 8615:e66a566f2cfa )
full compact
1/*
2 * Copyright (c) 2009 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are
7 * met: redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer;
9 * redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution;
12 * neither the name of the copyright holders nor the names of its
13 * contributors may be used to endorse or promote products derived from
14 * this software without specific prior written permission.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 */
28
29#include "cpu/testers/rubytest/RubyTester.hh"
30#include "debug/Ruby.hh"
31#include "mem/protocol/AccessPermission.hh"
32#include "mem/ruby/slicc_interface/AbstractController.hh"
33#include "mem/ruby/system/RubyPort.hh"
34#include "mem/physical.hh"
35
36RubyPort::RubyPort(const Params *p)
37 : MemObject(p)
38{
39 m_version = p->version;
40 assert(m_version != -1);
41
42 physmem = p->physmem;
43
44 m_controller = NULL;
45 m_mandatory_q_ptr = NULL;
46
47 m_request_cnt = 0;
48 pio_port = NULL;
49 physMemPort = NULL;
50
51 m_usingRubyTester = p->using_ruby_tester;
52 access_phys_mem = p->access_phys_mem;
53
54 ruby_system = p->ruby_system;
55 waitingOnSequencer = false;
56}
57
58void
59RubyPort::init()
60{
61 assert(m_controller != NULL);
62 m_mandatory_q_ptr = m_controller->getMandatoryQueue();
63}
64
65Port *
66RubyPort::getPort(const std::string &if_name, int idx)
67{
68 if (if_name == "port") {
69 return new M5Port(csprintf("%s-port%d", name(), idx), this,
70 ruby_system, access_phys_mem);
71 }
72
73 if (if_name == "pio_port") {
74 // ensure there is only one pio port
75 assert(pio_port == NULL);
76
77 pio_port = new PioPort(csprintf("%s-pio-port%d", name(), idx), this);
78
79 return pio_port;
80 }
81
82 if (if_name == "physMemPort") {
83 // RubyPort should only have one port to physical memory
84 assert (physMemPort == NULL);
85
86 physMemPort = new M5Port(csprintf("%s-physMemPort", name()), this,
87 ruby_system, access_phys_mem);
88
89 return physMemPort;
90 }
91
92 if (if_name == "functional") {
93 // Calls for the functional port only want to access
94 // functional memory. Therefore, directly pass these calls
95 // ports to physmem.
96 assert(physmem != NULL);
97 return physmem->getPort(if_name, idx);
98 }
99
100 return NULL;
101}
102
103RubyPort::PioPort::PioPort(const std::string &_name,
104 RubyPort *_port)
105 : SimpleTimingPort(_name, _port)
106{
107 DPRINTF(RubyPort, "creating port to ruby sequencer to cpu %s\n", _name);
108 ruby_port = _port;
109}
110
111RubyPort::M5Port::M5Port(const std::string &_name, RubyPort *_port,
112 RubySystem *_system, bool _access_phys_mem)
113 : SimpleTimingPort(_name, _port)
114{
115 DPRINTF(RubyPort, "creating port from ruby sequcner to cpu %s\n", _name);
116 ruby_port = _port;
117 ruby_system = _system;
118 _onRetryList = false;
119 access_phys_mem = _access_phys_mem;
120}
121
122Tick
123RubyPort::PioPort::recvAtomic(PacketPtr pkt)
124{
125 panic("RubyPort::PioPort::recvAtomic() not implemented!\n");
126 return 0;
127}
128
129Tick
130RubyPort::M5Port::recvAtomic(PacketPtr pkt)
131{
132 panic("RubyPort::M5Port::recvAtomic() not implemented!\n");
133 return 0;
134}
135
136
137bool
138RubyPort::PioPort::recvTiming(PacketPtr pkt)
139{
140 // In FS mode, ruby memory will receive pio responses from devices
141 // and it must forward these responses back to the particular CPU.
142 DPRINTF(RubyPort, "Pio response for address %#x\n", pkt->getAddr());
143
144 assert(pkt->isResponse());
145
146 // First we must retrieve the request port from the sender State
147 RubyPort::SenderState *senderState =
148 safe_cast<RubyPort::SenderState *>(pkt->senderState);
149 M5Port *port = senderState->port;
150 assert(port != NULL);
151
152 // pop the sender state from the packet
153 pkt->senderState = senderState->saved;
154 delete senderState;
155
156 port->sendTiming(pkt);
157
158 return true;
159}
160
161bool
162RubyPort::M5Port::recvTiming(PacketPtr pkt)
163{
164 DPRINTF(RubyPort,
165 "Timing access caught for address %#x\n", pkt->getAddr());
166
167 //dsm: based on SimpleTimingPort::recvTiming(pkt);
168
169 // The received packets should only be M5 requests, which should never
170 // get nacked. There used to be code to hanldle nacks here, but
171 // I'm pretty sure it didn't work correctly with the drain code,
172 // so that would need to be fixed if we ever added it back.
173 assert(pkt->isRequest());
174
175 if (pkt->memInhibitAsserted()) {
176 warn("memInhibitAsserted???");
177 // snooper will supply based on copy of packet
178 // still target's responsibility to delete packet
179 delete pkt;
180 return true;
181 }
182
183 // Save the port in the sender state object to be used later to
184 // route the response
185 pkt->senderState = new SenderState(this, pkt->senderState);
186
187 // Check for pio requests and directly send them to the dedicated
188 // pio port.
189 if (!isPhysMemAddress(pkt->getAddr())) {
190 assert(ruby_port->pio_port != NULL);
191 DPRINTF(RubyPort,
192 "Request for address 0x%#x is assumed to be a pio request\n",
193 pkt->getAddr());
194
195 return ruby_port->pio_port->sendTiming(pkt);
196 }
197
198 assert(Address(pkt->getAddr()).getOffset() + pkt->getSize() <=
199 RubySystem::getBlockSizeBytes());
200
201 // Submit the ruby request
202 RequestStatus requestStatus = ruby_port->makeRequest(pkt);
203
204 // If the request successfully issued then we should return true.
205 // Otherwise, we need to delete the senderStatus we just created and return
206 // false.
207 if (requestStatus == RequestStatus_Issued) {
208 DPRINTF(RubyPort, "Request %#x issued\n", pkt->getAddr());
209 return true;
210 }
211
212 //
213 // Unless one is using the ruby tester, record the stalled M5 port for
214 // later retry when the sequencer becomes free.
215 //
216 if (!ruby_port->m_usingRubyTester) {
217 ruby_port->addToRetryList(this);
218 }
219
220 DPRINTF(RubyPort,
221 "Request for address %#x did not issue because %s\n",
222 pkt->getAddr(), RequestStatus_to_string(requestStatus));
223
224 SenderState* senderState = safe_cast<SenderState*>(pkt->senderState);
225 pkt->senderState = senderState->saved;
226 delete senderState;
227 return false;
228}
229
230bool
231RubyPort::M5Port::doFunctionalRead(PacketPtr pkt)
232{
233 Address address(pkt->getAddr());
234 Address line_address(address);
235 line_address.makeLineAddress();
236
237 AccessPermission access_perm = AccessPermission_NotPresent;
238 int num_controllers = ruby_system->m_abs_cntrl_vec.size();
239
240 DPRINTF(RubyPort, "Functional Read request for %s\n",address);
241
242 unsigned int num_ro = 0;
243 unsigned int num_rw = 0;
244 unsigned int num_busy = 0;
245 unsigned int num_backing_store = 0;
246 unsigned int num_invalid = 0;
247
248 // In this loop we count the number of controllers that have the given
249 // address in read only, read write and busy states.
250 for (int i = 0; i < num_controllers; ++i) {
251 access_perm = ruby_system->m_abs_cntrl_vec[i]->
252 getAccessPermission(line_address);
253 if (access_perm == AccessPermission_Read_Only)
254 num_ro++;
255 else if (access_perm == AccessPermission_Read_Write)
256 num_rw++;
257 else if (access_perm == AccessPermission_Busy)
258 num_busy++;
259 else if (access_perm == AccessPermission_Backing_Store)
260 // See RubySlicc_Exports.sm for details, but Backing_Store is meant
261 // to represent blocks in memory *for Broadcast/Snooping protocols*,
262 // where memory has no idea whether it has an exclusive copy of data
263 // or not.
264 num_backing_store++;
265 else if (access_perm == AccessPermission_Invalid ||
266 access_perm == AccessPermission_NotPresent)
267 num_invalid++;
268 }
269 assert(num_rw <= 1);
270
271 uint8* data = pkt->getPtr<uint8_t>(true);
272 unsigned int size_in_bytes = pkt->getSize();
273 unsigned startByte = address.getAddress() - line_address.getAddress();
274
275 // This if case is meant to capture what happens in a Broadcast/Snoop
276 // protocol where the block does not exist in the cache hierarchy. You
277 // only want to read from the Backing_Store memory if there is no copy in
278 // the cache hierarchy, otherwise you want to try to read the RO or RW
279 // copies existing in the cache hierarchy (covered by the else statement).
280 // The reason is because the Backing_Store memory could easily be stale, if
281 // there are copies floating around the cache hierarchy, so you want to read
282 // it only if it's not in the cache hierarchy at all.
283 if (num_invalid == (num_controllers - 1) &&
284 num_backing_store == 1)
285 {
286 DPRINTF(RubyPort, "only copy in Backing_Store memory, read from it\n");
287 for (int i = 0; i < num_controllers; ++i) {
288 access_perm = ruby_system->m_abs_cntrl_vec[i]
289 ->getAccessPermission(line_address);
290 if (access_perm == AccessPermission_Backing_Store) {
291 DataBlock& block = ruby_system->m_abs_cntrl_vec[i]
292 ->getDataBlock(line_address);
293
294 DPRINTF(RubyPort, "reading from %s block %s\n",
295 ruby_system->m_abs_cntrl_vec[i]->name(), block);
296 for (unsigned i = 0; i < size_in_bytes; ++i) {
297 data[i] = block.getByte(i + startByte);
298 }
299 return true;
300 }
301 }
302 } else {
303 // In Broadcast/Snoop protocols, this covers if you know the block
304 // exists somewhere in the caching hierarchy, then you want to read any
305 // valid RO or RW block. In directory protocols, same thing, you want
306 // to read any valid readable copy of the block.
307 DPRINTF(RubyPort, "num_busy = %d, num_ro = %d, num_rw = %d\n",
308 num_busy, num_ro, num_rw);
309 // In this loop, we try to figure which controller has a read only or
310 // a read write copy of the given address. Any valid copy would suffice
311 // for a functional read.
312 for(int i = 0;i < num_controllers;++i) {
313 access_perm = ruby_system->m_abs_cntrl_vec[i]
314 ->getAccessPermission(line_address);
315 if(access_perm == AccessPermission_Read_Only ||
316 access_perm == AccessPermission_Read_Write)
317 {
318 DataBlock& block = ruby_system->m_abs_cntrl_vec[i]
319 ->getDataBlock(line_address);
320
321 DPRINTF(RubyPort, "reading from %s block %s\n",
322 ruby_system->m_abs_cntrl_vec[i]->name(), block);
323 for (unsigned i = 0; i < size_in_bytes; ++i) {
324 data[i] = block.getByte(i + startByte);
325 }
326 return true;
327 }
328 }
329 }
330 return false;
331}
332
333bool
334RubyPort::M5Port::doFunctionalWrite(PacketPtr pkt)
335{
336 Address addr(pkt->getAddr());
337 Address line_addr = line_address(addr);
338 AccessPermission access_perm = AccessPermission_NotPresent;
339 int num_controllers = ruby_system->m_abs_cntrl_vec.size();
340
341 DPRINTF(RubyPort, "Functional Write request for %s\n",addr);
342
343 unsigned int num_ro = 0;
344 unsigned int num_rw = 0;
345 unsigned int num_busy = 0;
346 unsigned int num_backing_store = 0;
347 unsigned int num_invalid = 0;
348
349 // In this loop we count the number of controllers that have the given
350 // address in read only, read write and busy states.
351 for(int i = 0;i < num_controllers;++i) {
352 access_perm = ruby_system->m_abs_cntrl_vec[i]->
353 getAccessPermission(line_addr);
354 if (access_perm == AccessPermission_Read_Only)
355 num_ro++;
356 else if (access_perm == AccessPermission_Read_Write)
357 num_rw++;
358 else if (access_perm == AccessPermission_Busy)
359 num_busy++;
360 else if (access_perm == AccessPermission_Backing_Store)
361 // See RubySlicc_Exports.sm for details, but Backing_Store is meant
362 // to represent blocks in memory *for Broadcast/Snooping protocols*,
363 // where memory has no idea whether it has an exclusive copy of data
364 // or not.
365 num_backing_store++;
366 else if (access_perm == AccessPermission_Invalid ||
367 access_perm == AccessPermission_NotPresent)
368 num_invalid++;
369 }
370
371 // If the number of read write copies is more than 1, then there is bug in
372 // coherence protocol. Otherwise, if all copies are in stable states, i.e.
373 // num_busy == 0, we update all the copies. If there is at least one copy
374 // in busy state, then we check if there is read write copy. If yes, then
375 // also we let the access go through. Or, if there is no copy in the cache
376 // hierarchy at all, we still want to do the write to the memory
377 // (Backing_Store) instead of failing.
378
379 DPRINTF(RubyPort, "num_busy = %d, num_ro = %d, num_rw = %d\n",
380 num_busy, num_ro, num_rw);
381 assert(num_rw <= 1);
382
383 uint8* data = pkt->getPtr<uint8_t>(true);
384 unsigned int size_in_bytes = pkt->getSize();
385 unsigned startByte = addr.getAddress() - line_addr.getAddress();
386
387 if ((num_busy == 0 && num_ro > 0) || num_rw == 1 ||
388 (num_invalid == (num_controllers - 1) && num_backing_store == 1))
389 {
390 for(int i = 0; i < num_controllers;++i) {
391 access_perm = ruby_system->m_abs_cntrl_vec[i]->
392 getAccessPermission(line_addr);
393 if(access_perm == AccessPermission_Read_Only ||
394 access_perm == AccessPermission_Read_Write||
395 access_perm == AccessPermission_Maybe_Stale ||
396 access_perm == AccessPermission_Backing_Store)
397 {
398 DataBlock& block = ruby_system->m_abs_cntrl_vec[i]
399 ->getDataBlock(line_addr);
400
401 DPRINTF(RubyPort, "%s\n",block);
402 for (unsigned i = 0; i < size_in_bytes; ++i) {
403 block.setByte(i + startByte, data[i]);
404 }
405 DPRINTF(RubyPort, "%s\n",block);
406 }
407 }
408 return true;
409 }
410 return false;
411}
412
413void
414RubyPort::M5Port::recvFunctional(PacketPtr pkt)
415{
416 DPRINTF(RubyPort, "Functional access caught for address %#x\n",
417 pkt->getAddr());
418
419 // Check for pio requests and directly send them to the dedicated
420 // pio port.
421 if (!isPhysMemAddress(pkt->getAddr())) {
422 assert(ruby_port->pio_port != NULL);
423 DPRINTF(RubyPort, "Request for address 0x%#x is a pio request\n",
424 pkt->getAddr());
425 panic("RubyPort::PioPort::recvFunctional() not implemented!\n");
426 }
427
428 assert(pkt->getAddr() + pkt->getSize() <=
429 line_address(Address(pkt->getAddr())).getAddress() +
430 RubySystem::getBlockSizeBytes());
431
432 bool accessSucceeded = false;
433 bool needsResponse = pkt->needsResponse();
434
435 // Do the functional access on ruby memory
436 if (pkt->isRead()) {
437 accessSucceeded = doFunctionalRead(pkt);
438 } else if (pkt->isWrite()) {
439 accessSucceeded = doFunctionalWrite(pkt);
440 } else {
441 panic("RubyPort: unsupported functional command %s\n",
442 pkt->cmdString());
443 }
444
445 // Unless the requester explicitly said otherwise, generate an error if
446 // the functional request failed
447 if (!accessSucceeded && !pkt->suppressFuncError()) {
448 fatal("Ruby functional %s failed for address %#x\n",
449 pkt->isWrite() ? "write" : "read", pkt->getAddr());
450 }
451
452 if (access_phys_mem) {
453 // The attached physmem contains the official version of data.
454 // The following command performs the real functional access.
455 // This line should be removed once Ruby supplies the official version
456 // of data.
457 ruby_port->physMemPort->sendFunctional(pkt);
458 }
459
460 // turn packet around to go back to requester if response expected
461 if (needsResponse) {
462 pkt->setFunctionalResponseStatus(accessSucceeded);
463 DPRINTF(RubyPort, "Sending packet back over port\n");
464 sendFunctional(pkt);
465 }
466 DPRINTF(RubyPort, "Functional access %s!\n",
467 accessSucceeded ? "successful":"failed");
468}
469
470void
471RubyPort::ruby_hit_callback(PacketPtr pkt)
472{
473 // Retrieve the request port from the sender State
474 RubyPort::SenderState *senderState =
475 safe_cast<RubyPort::SenderState *>(pkt->senderState);
476 M5Port *port = senderState->port;
477 assert(port != NULL);
478
479 // pop the sender state from the packet
480 pkt->senderState = senderState->saved;
481 delete senderState;
482
483 port->hitCallback(pkt);
484
485 //
486 // If we had to stall the M5Ports, wake them up because the sequencer
487 // likely has free resources now.
488 //
489 if (waitingOnSequencer) {
490 //
491 // Record the current list of ports to retry on a temporary list before
492 // calling sendRetry on those ports. sendRetry will cause an
493 // immediate retry, which may result in the ports being put back on the
494 // list. Therefore we want to clear the retryList before calling
495 // sendRetry.
496 //
497 std::list<M5Port*> curRetryList(retryList);
498
499 retryList.clear();
500 waitingOnSequencer = false;
501
502 for (std::list<M5Port*>::iterator i = curRetryList.begin();
503 i != curRetryList.end(); ++i) {
504 DPRINTF(RubyPort,
505 "Sequencer may now be free. SendRetry to port %s\n",
506 (*i)->name());
507 (*i)->onRetryList(false);
508 (*i)->sendRetry();
509 }
510 }
511}
512
513void
514RubyPort::M5Port::hitCallback(PacketPtr pkt)
515{
516 bool needsResponse = pkt->needsResponse();
517
518 //
519 // Unless specified at configuraiton, all responses except failed SC
520 // and Flush operations access M5 physical memory.
521 //
522 bool accessPhysMem = access_phys_mem;
523
524 if (pkt->isLLSC()) {
525 if (pkt->isWrite()) {
526 if (pkt->req->getExtraData() != 0) {
527 //
528 // Successful SC packets convert to normal writes
529 //
530 pkt->convertScToWrite();
531 } else {
532 //
533 // Failed SC packets don't access physical memory and thus
534 // the RubyPort itself must convert it to a response.
535 //
536 accessPhysMem = false;
537 }
538 } else {
539 //
540 // All LL packets convert to normal loads so that M5 PhysMem does
541 // not lock the blocks.
542 //
543 pkt->convertLlToRead();
544 }
545 }
546
547 //
548 // Flush requests don't access physical memory
549 //
550 if (pkt->isFlush()) {
551 accessPhysMem = false;
552 }
553
554 DPRINTF(RubyPort, "Hit callback needs response %d\n", needsResponse);
555
556 if (accessPhysMem) {
557 ruby_port->physMemPort->sendAtomic(pkt);
558 } else if (needsResponse) {
559 pkt->makeResponse();
560 }
561
562 // turn packet around to go back to requester if response expected
563 if (needsResponse) {
564 DPRINTF(RubyPort, "Sending packet back over port\n");
565 sendTiming(pkt);
566 } else {
567 delete pkt;
568 }
569 DPRINTF(RubyPort, "Hit callback done!\n");
570}
571
572bool
573RubyPort::M5Port::sendTiming(PacketPtr pkt)
574{
575 //minimum latency, must be > 0
576 schedSendTiming(pkt, curTick() + (1 * g_eventQueue_ptr->getClock()));
577 return true;
578}
579
580bool
581RubyPort::PioPort::sendTiming(PacketPtr pkt)
582{
583 //minimum latency, must be > 0
584 schedSendTiming(pkt, curTick() + (1 * g_eventQueue_ptr->getClock()));
585 return true;
586}
587
588bool
589RubyPort::M5Port::isPhysMemAddress(Addr addr)
590{
591 AddrRangeList physMemAddrList;
592 bool snoop = false;
593 ruby_port->physMemPort->getPeerAddressRanges(physMemAddrList, snoop);
594 for (AddrRangeIter iter = physMemAddrList.begin();
595 iter != physMemAddrList.end();
596 iter++) {
597 if (addr >= iter->start && addr <= iter->end) {
598 DPRINTF(RubyPort, "Request found in %#llx - %#llx range\n",
599 iter->start, iter->end);
600 return true;
601 }
602 }
603 return false;
604}
605
606unsigned
607RubyPort::M5Port::deviceBlockSize() const
608{
609 return (unsigned) RubySystem::getBlockSizeBytes();
610}