Deleted Added
sdiff udiff text old ( 3177:3a2bc3fbae6e ) new ( 3184:8edaf4539e05 )
full compact
1/*
2 * Copyright (c) 2002-2005 The Regents of The University of Michigan
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are
7 * met: redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer;
9 * redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution;
12 * neither the name of the copyright holders nor the names of its
13 * contributors may be used to endorse or promote products derived from
14 * this software without specific prior written permission.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 *
28 * Authors: Steve Reinhardt
29 */
30
31#include "arch/locked_mem.hh"
32#include "arch/utility.hh"
33#include "cpu/exetrace.hh"
34#include "cpu/simple/atomic.hh"
35#include "mem/packet_impl.hh"
36#include "sim/builder.hh"
37#include "sim/system.hh"
38
39using namespace std;
40using namespace TheISA;
41
42AtomicSimpleCPU::TickEvent::TickEvent(AtomicSimpleCPU *c)
43 : Event(&mainEventQueue, CPU_Tick_Pri), cpu(c)
44{
45}
46
47
48void
49AtomicSimpleCPU::TickEvent::process()
50{
51 cpu->tick();
52}
53
54const char *
55AtomicSimpleCPU::TickEvent::description()
56{
57 return "AtomicSimpleCPU tick event";
58}
59
60Port *
61AtomicSimpleCPU::getPort(const std::string &if_name, int idx)
62{
63 if (if_name == "dcache_port")
64 return &dcachePort;
65 else if (if_name == "icache_port")
66 return &icachePort;
67 else
68 panic("No Such Port\n");
69}
70
71void
72AtomicSimpleCPU::init()
73{
74 //Create Memory Ports (conect them up)
75// Port *mem_dport = mem->getPort("");
76// dcachePort.setPeer(mem_dport);
77// mem_dport->setPeer(&dcachePort);
78
79// Port *mem_iport = mem->getPort("");
80// icachePort.setPeer(mem_iport);
81// mem_iport->setPeer(&icachePort);
82
83 BaseCPU::init();
84#if FULL_SYSTEM
85 for (int i = 0; i < threadContexts.size(); ++i) {
86 ThreadContext *tc = threadContexts[i];
87
88 // initialize CPU, including PC
89 TheISA::initCPU(tc, tc->readCpuId());
90 }
91#endif
92}
93
94bool
95AtomicSimpleCPU::CpuPort::recvTiming(Packet *pkt)
96{
97 panic("AtomicSimpleCPU doesn't expect recvAtomic callback!");
98 return true;
99}
100
101Tick
102AtomicSimpleCPU::CpuPort::recvAtomic(Packet *pkt)
103{
104 panic("AtomicSimpleCPU doesn't expect recvAtomic callback!");
105 return curTick;
106}
107
108void
109AtomicSimpleCPU::CpuPort::recvFunctional(Packet *pkt)
110{
111 panic("AtomicSimpleCPU doesn't expect recvFunctional callback!");
112}
113
114void
115AtomicSimpleCPU::CpuPort::recvStatusChange(Status status)
116{
117 if (status == RangeChange)
118 return;
119
120 panic("AtomicSimpleCPU doesn't expect recvStatusChange callback!");
121}
122
123void
124AtomicSimpleCPU::CpuPort::recvRetry()
125{
126 panic("AtomicSimpleCPU doesn't expect recvRetry callback!");
127}
128
129
130AtomicSimpleCPU::AtomicSimpleCPU(Params *p)
131 : BaseSimpleCPU(p), tickEvent(this),
132 width(p->width), simulate_stalls(p->simulate_stalls),
133 icachePort(name() + "-iport", this), dcachePort(name() + "-iport", this)
134{
135 _status = Idle;
136
137 ifetch_req = new Request();
138 ifetch_req->setThreadContext(p->cpu_id, 0); // Add thread ID if we add MT
139 ifetch_pkt = new Packet(ifetch_req, Packet::ReadReq, Packet::Broadcast);
140 ifetch_pkt->dataStatic(&inst);
141
142 data_read_req = new Request();
143 data_read_req->setThreadContext(p->cpu_id, 0); // Add thread ID here too
144 data_read_pkt = new Packet(data_read_req, Packet::ReadReq,
145 Packet::Broadcast);
146 data_read_pkt->dataStatic(&dataReg);
147
148 data_write_req = new Request();
149 data_write_req->setThreadContext(p->cpu_id, 0); // Add thread ID here too
150 data_write_pkt = new Packet(data_write_req, Packet::WriteReq,
151 Packet::Broadcast);
152}
153
154
155AtomicSimpleCPU::~AtomicSimpleCPU()
156{
157}
158
159void
160AtomicSimpleCPU::serialize(ostream &os)
161{
162 SimObject::State so_state = SimObject::getState();
163 SERIALIZE_ENUM(so_state);
164 Status _status = status();
165 SERIALIZE_ENUM(_status);
166 BaseSimpleCPU::serialize(os);
167 nameOut(os, csprintf("%s.tickEvent", name()));
168 tickEvent.serialize(os);
169}
170
171void
172AtomicSimpleCPU::unserialize(Checkpoint *cp, const string &section)
173{
174 SimObject::State so_state;
175 UNSERIALIZE_ENUM(so_state);
176 UNSERIALIZE_ENUM(_status);
177 BaseSimpleCPU::unserialize(cp, section);
178 tickEvent.unserialize(cp, csprintf("%s.tickEvent", section));
179}
180
181void
182AtomicSimpleCPU::resume()
183{
184 assert(system->getMemoryMode() == System::Atomic);
185 changeState(SimObject::Running);
186 if (thread->status() == ThreadContext::Active) {
187 if (!tickEvent.scheduled())
188 tickEvent.schedule(curTick);
189 }
190}
191
192void
193AtomicSimpleCPU::switchOut()
194{
195 assert(status() == Running || status() == Idle);
196 _status = SwitchedOut;
197
198 tickEvent.squash();
199}
200
201
202void
203AtomicSimpleCPU::takeOverFrom(BaseCPU *oldCPU)
204{
205 BaseCPU::takeOverFrom(oldCPU);
206
207 assert(!tickEvent.scheduled());
208
209 // if any of this CPU's ThreadContexts are active, mark the CPU as
210 // running and schedule its tick event.
211 for (int i = 0; i < threadContexts.size(); ++i) {
212 ThreadContext *tc = threadContexts[i];
213 if (tc->status() == ThreadContext::Active && _status != Running) {
214 _status = Running;
215 tickEvent.schedule(curTick);
216 break;
217 }
218 }
219}
220
221
222void
223AtomicSimpleCPU::activateContext(int thread_num, int delay)
224{
225 assert(thread_num == 0);
226 assert(thread);
227
228 assert(_status == Idle);
229 assert(!tickEvent.scheduled());
230
231 notIdleFraction++;
232 tickEvent.schedule(curTick + cycles(delay));
233 _status = Running;
234}
235
236
237void
238AtomicSimpleCPU::suspendContext(int thread_num)
239{
240 assert(thread_num == 0);
241 assert(thread);
242
243 assert(_status == Running);
244
245 // tick event may not be scheduled if this gets called from inside
246 // an instruction's execution, e.g. "quiesce"
247 if (tickEvent.scheduled())
248 tickEvent.deschedule();
249
250 notIdleFraction--;
251 _status = Idle;
252}
253
254
255template <class T>
256Fault
257AtomicSimpleCPU::read(Addr addr, T &data, unsigned flags)
258{
259 // use the CPU's statically allocated read request and packet objects
260 Request *req = data_read_req;
261 Packet *pkt = data_read_pkt;
262
263 req->setVirt(0, addr, sizeof(T), flags, thread->readPC());
264
265 if (traceData) {
266 traceData->setAddr(addr);
267 }
268
269 // translate to physical address
270 Fault fault = thread->translateDataReadReq(req);
271
272 // Now do the access.
273 if (fault == NoFault) {
274 pkt->reinitFromRequest();
275
276 dcache_latency = dcachePort.sendAtomic(pkt);
277 dcache_access = true;
278
279 assert(pkt->result == Packet::Success);
280 data = pkt->get<T>();
281
282 if (req->isLocked()) {
283 TheISA::handleLockedRead(thread, req);
284 }
285 }
286
287 // This will need a new way to tell if it has a dcache attached.
288 if (req->isUncacheable())
289 recordEvent("Uncached Read");
290
291 return fault;
292}
293
294#ifndef DOXYGEN_SHOULD_SKIP_THIS
295
296template
297Fault
298AtomicSimpleCPU::read(Addr addr, uint64_t &data, unsigned flags);
299
300template
301Fault
302AtomicSimpleCPU::read(Addr addr, uint32_t &data, unsigned flags);
303
304template
305Fault
306AtomicSimpleCPU::read(Addr addr, uint16_t &data, unsigned flags);
307
308template
309Fault
310AtomicSimpleCPU::read(Addr addr, uint8_t &data, unsigned flags);
311
312#endif //DOXYGEN_SHOULD_SKIP_THIS
313
314template<>
315Fault
316AtomicSimpleCPU::read(Addr addr, double &data, unsigned flags)
317{
318 return read(addr, *(uint64_t*)&data, flags);
319}
320
321template<>
322Fault
323AtomicSimpleCPU::read(Addr addr, float &data, unsigned flags)
324{
325 return read(addr, *(uint32_t*)&data, flags);
326}
327
328
329template<>
330Fault
331AtomicSimpleCPU::read(Addr addr, int32_t &data, unsigned flags)
332{
333 return read(addr, (uint32_t&)data, flags);
334}
335
336
337template <class T>
338Fault
339AtomicSimpleCPU::write(T data, Addr addr, unsigned flags, uint64_t *res)
340{
341 // use the CPU's statically allocated write request and packet objects
342 Request *req = data_write_req;
343 Packet *pkt = data_write_pkt;
344
345 req->setVirt(0, addr, sizeof(T), flags, thread->readPC());
346
347 if (traceData) {
348 traceData->setAddr(addr);
349 }
350
351 // translate to physical address
352 Fault fault = thread->translateDataWriteReq(req);
353
354 // Now do the access.
355 if (fault == NoFault) {
356 bool do_access = true; // flag to suppress cache access
357
358 if (req->isLocked()) {
359 do_access = TheISA::handleLockedWrite(thread, req);
360 }
361
362 if (do_access) {
363 data = htog(data);
364 pkt->reinitFromRequest();
365 pkt->dataStatic(&data);
366
367 dcache_latency = dcachePort.sendAtomic(pkt);
368 dcache_access = true;
369
370 assert(pkt->result == Packet::Success);
371 }
372
373 if (req->isLocked()) {
374 uint64_t scResult = req->getScResult();
375 if (scResult != 0) {
376 // clear failure counter
377 thread->setStCondFailures(0);
378 }
379 if (res) {
380 *res = req->getScResult();
381 }
382 }
383 }
384
385 // This will need a new way to tell if it's hooked up to a cache or not.
386 if (req->isUncacheable())
387 recordEvent("Uncached Write");
388
389 // If the write needs to have a fault on the access, consider calling
390 // changeStatus() and changing it to "bad addr write" or something.
391 return fault;
392}
393
394
395#ifndef DOXYGEN_SHOULD_SKIP_THIS
396template
397Fault
398AtomicSimpleCPU::write(uint64_t data, Addr addr,
399 unsigned flags, uint64_t *res);
400
401template
402Fault
403AtomicSimpleCPU::write(uint32_t data, Addr addr,
404 unsigned flags, uint64_t *res);
405
406template
407Fault
408AtomicSimpleCPU::write(uint16_t data, Addr addr,
409 unsigned flags, uint64_t *res);
410
411template
412Fault
413AtomicSimpleCPU::write(uint8_t data, Addr addr,
414 unsigned flags, uint64_t *res);
415
416#endif //DOXYGEN_SHOULD_SKIP_THIS
417
418template<>
419Fault
420AtomicSimpleCPU::write(double data, Addr addr, unsigned flags, uint64_t *res)
421{
422 return write(*(uint64_t*)&data, addr, flags, res);
423}
424
425template<>
426Fault
427AtomicSimpleCPU::write(float data, Addr addr, unsigned flags, uint64_t *res)
428{
429 return write(*(uint32_t*)&data, addr, flags, res);
430}
431
432
433template<>
434Fault
435AtomicSimpleCPU::write(int32_t data, Addr addr, unsigned flags, uint64_t *res)
436{
437 return write((uint32_t)data, addr, flags, res);
438}
439
440
441void
442AtomicSimpleCPU::tick()
443{
444 Tick latency = cycles(1); // instruction takes one cycle by default
445
446 for (int i = 0; i < width; ++i) {
447 numCycles++;
448
449 checkForInterrupts();
450
451 Fault fault = setupFetchRequest(ifetch_req);
452
453 if (fault == NoFault) {
454 ifetch_pkt->reinitFromRequest();
455
456 Tick icache_latency = icachePort.sendAtomic(ifetch_pkt);
457 // ifetch_req is initialized to read the instruction directly
458 // into the CPU object's inst field.
459
460 dcache_access = false; // assume no dcache access
461 preExecute();
462 fault = curStaticInst->execute(this, traceData);
463 postExecute();
464
465 if (simulate_stalls) {
466 Tick icache_stall = icache_latency - cycles(1);
467 Tick dcache_stall =
468 dcache_access ? dcache_latency - cycles(1) : 0;
469 Tick stall_cycles = (icache_stall + dcache_stall) / cycles(1);
470 if (cycles(stall_cycles) < (icache_stall + dcache_stall))
471 latency += cycles(stall_cycles+1);
472 else
473 latency += cycles(stall_cycles);
474 }
475
476 }
477
478 advancePC(fault);
479 }
480
481 if (_status != Idle)
482 tickEvent.schedule(curTick + latency);
483}
484
485
486////////////////////////////////////////////////////////////////////////
487//
488// AtomicSimpleCPU Simulation Object
489//
490BEGIN_DECLARE_SIM_OBJECT_PARAMS(AtomicSimpleCPU)
491
492 Param<Counter> max_insts_any_thread;
493 Param<Counter> max_insts_all_threads;
494 Param<Counter> max_loads_any_thread;
495 Param<Counter> max_loads_all_threads;
496 Param<Tick> progress_interval;
497 SimObjectParam<MemObject *> mem;
498 SimObjectParam<System *> system;
499 Param<int> cpu_id;
500
501#if FULL_SYSTEM
502 SimObjectParam<AlphaITB *> itb;
503 SimObjectParam<AlphaDTB *> dtb;
504 Param<Tick> profile;
505#else
506 SimObjectParam<Process *> workload;
507#endif // FULL_SYSTEM
508
509 Param<int> clock;
510
511 Param<bool> defer_registration;
512 Param<int> width;
513 Param<bool> function_trace;
514 Param<Tick> function_trace_start;
515 Param<bool> simulate_stalls;
516
517END_DECLARE_SIM_OBJECT_PARAMS(AtomicSimpleCPU)
518
519BEGIN_INIT_SIM_OBJECT_PARAMS(AtomicSimpleCPU)
520
521 INIT_PARAM(max_insts_any_thread,
522 "terminate when any thread reaches this inst count"),
523 INIT_PARAM(max_insts_all_threads,
524 "terminate when all threads have reached this inst count"),
525 INIT_PARAM(max_loads_any_thread,
526 "terminate when any thread reaches this load count"),
527 INIT_PARAM(max_loads_all_threads,
528 "terminate when all threads have reached this load count"),
529 INIT_PARAM(progress_interval, "Progress interval"),
530 INIT_PARAM(mem, "memory"),
531 INIT_PARAM(system, "system object"),
532 INIT_PARAM(cpu_id, "processor ID"),
533
534#if FULL_SYSTEM
535 INIT_PARAM(itb, "Instruction TLB"),
536 INIT_PARAM(dtb, "Data TLB"),
537 INIT_PARAM(profile, ""),
538#else
539 INIT_PARAM(workload, "processes to run"),
540#endif // FULL_SYSTEM
541
542 INIT_PARAM(clock, "clock speed"),
543 INIT_PARAM(defer_registration, "defer system registration (for sampling)"),
544 INIT_PARAM(width, "cpu width"),
545 INIT_PARAM(function_trace, "Enable function trace"),
546 INIT_PARAM(function_trace_start, "Cycle to start function trace"),
547 INIT_PARAM(simulate_stalls, "Simulate cache stall cycles")
548
549END_INIT_SIM_OBJECT_PARAMS(AtomicSimpleCPU)
550
551
552CREATE_SIM_OBJECT(AtomicSimpleCPU)
553{
554 AtomicSimpleCPU::Params *params = new AtomicSimpleCPU::Params();
555 params->name = getInstanceName();
556 params->numberOfThreads = 1;
557 params->max_insts_any_thread = max_insts_any_thread;
558 params->max_insts_all_threads = max_insts_all_threads;
559 params->max_loads_any_thread = max_loads_any_thread;
560 params->max_loads_all_threads = max_loads_all_threads;
561 params->progress_interval = progress_interval;
562 params->deferRegistration = defer_registration;
563 params->clock = clock;
564 params->functionTrace = function_trace;
565 params->functionTraceStart = function_trace_start;
566 params->width = width;
567 params->simulate_stalls = simulate_stalls;
568 params->mem = mem;
569 params->system = system;
570 params->cpu_id = cpu_id;
571
572#if FULL_SYSTEM
573 params->itb = itb;
574 params->dtb = dtb;
575 params->profile = profile;
576#else
577 params->process = workload;
578#endif
579
580 AtomicSimpleCPU *cpu = new AtomicSimpleCPU(params);
581 return cpu;
582}
583
584REGISTER_SIM_OBJECT("AtomicSimpleCPU", AtomicSimpleCPU)
585