1/*
2 * Copyright (c) 2010-2012 ARM Limited
3 * Copyright (c) 2013 Advanced Micro Devices, Inc.
4 * All rights reserved
5 *
6 * The license below extends only to copyright in the software and shall
7 * not be construed as granting a license to any other intellectual
8 * property including but not limited to intellectual property relating
9 * to a hardware implementation of the functionality of the software
10 * licensed hereunder. You may use the software subject to the license
11 * terms below provided that you ensure that this notice is replicated
12 * unmodified and in its entirety in all distributions of the software,
13 * modified or unmodified, in source code or in binary form.
14 *
15 * Copyright (c) 2002-2005 The Regents of The University of Michigan
16 * All rights reserved.
17 *
18 * Redistribution and use in source and binary forms, with or without
19 * modification, are permitted provided that the following conditions are
20 * met: redistributions of source code must retain the above copyright
21 * notice, this list of conditions and the following disclaimer;
22 * redistributions in binary form must reproduce the above copyright
23 * notice, this list of conditions and the following disclaimer in the
24 * documentation and/or other materials provided with the distribution;
25 * neither the name of the copyright holders nor the names of its
26 * contributors may be used to endorse or promote products derived from
27 * this software without specific prior written permission.
28 *
29 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
30 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
31 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
32 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
33 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
34 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
35 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
36 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
37 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
38 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
39 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
40 *
41 * Authors: Steve Reinhardt
42 */
43
44#include "arch/kernel_stats.hh"
45#include "arch/stacktrace.hh"
46#include "arch/tlb.hh"
47#include "arch/utility.hh"
48#include "arch/vtophys.hh"
49#include "base/loader/symtab.hh"
50#include "base/cp_annotate.hh"
51#include "base/cprintf.hh"
52#include "base/inifile.hh"
53#include "base/misc.hh"
54#include "base/pollevent.hh"
55#include "base/trace.hh"
56#include "base/types.hh"
57#include "config/the_isa.hh"
58#include "cpu/simple/base.hh"
59#include "cpu/base.hh"
60#include "cpu/checker/cpu.hh"
61#include "cpu/checker/thread_context.hh"
62#include "cpu/exetrace.hh"
63#include "cpu/pred/bpred_unit.hh"
64#include "cpu/profile.hh"
65#include "cpu/simple_thread.hh"
66#include "cpu/smt.hh"
67#include "cpu/static_inst.hh"
68#include "cpu/thread_context.hh"
69#include "debug/Decode.hh"
70#include "debug/Fetch.hh"
71#include "debug/Quiesce.hh"
72#include "mem/mem_object.hh"
73#include "mem/packet.hh"
74#include "mem/request.hh"
75#include "params/BaseSimpleCPU.hh"
76#include "sim/byteswap.hh"
77#include "sim/debug.hh"
78#include "sim/faults.hh"
79#include "sim/full_system.hh"
80#include "sim/sim_events.hh"
81#include "sim/sim_object.hh"
82#include "sim/stats.hh"
83#include "sim/system.hh"
84
85using namespace std;
86using namespace TheISA;
87
88BaseSimpleCPU::BaseSimpleCPU(BaseSimpleCPUParams *p)
89 : BaseCPU(p),
90 branchPred(p->branchPred),
91 traceData(NULL), thread(NULL)
91 traceData(NULL), thread(NULL), _status(Idle), interval_stats(false),
92 inst()
93{
94 if (FullSystem)
95 thread = new SimpleThread(this, 0, p->system, p->itb, p->dtb,
96 p->isa[0]);
97 else
98 thread = new SimpleThread(this, /* thread_num */ 0, p->system,
99 p->workload[0], p->itb, p->dtb, p->isa[0]);
100
101 thread->setStatus(ThreadContext::Halted);
102
103 tc = thread->getTC();
104
105 if (p->checker) {
106 BaseCPU *temp_checker = p->checker;
107 checker = dynamic_cast<CheckerCPU *>(temp_checker);
108 checker->setSystem(p->system);
109 // Manipulate thread context
110 ThreadContext *cpu_tc = tc;
111 tc = new CheckerThreadContext<ThreadContext>(cpu_tc, this->checker);
112 } else {
113 checker = NULL;
114 }
115
116 numInst = 0;
117 startNumInst = 0;
118 numOp = 0;
119 startNumOp = 0;
120 numLoad = 0;
121 startNumLoad = 0;
122 lastIcacheStall = 0;
123 lastDcacheStall = 0;
124
125 threadContexts.push_back(tc);
126
127
128 fetchOffset = 0;
129 stayAtPC = false;
130}
131
132BaseSimpleCPU::~BaseSimpleCPU()
133{
134}
135
136void
137BaseSimpleCPU::haltContext(ThreadID thread_num)
138{
139 // for now, these are equivalent
140 suspendContext(thread_num);
141}
142
143
144void
145BaseSimpleCPU::regStats()
146{
147 using namespace Stats;
148
149 BaseCPU::regStats();
150
151 numInsts
152 .name(name() + ".committedInsts")
153 .desc("Number of instructions committed")
154 ;
155
156 numOps
157 .name(name() + ".committedOps")
158 .desc("Number of ops (including micro ops) committed")
159 ;
160
161 numIntAluAccesses
162 .name(name() + ".num_int_alu_accesses")
163 .desc("Number of integer alu accesses")
164 ;
165
166 numFpAluAccesses
167 .name(name() + ".num_fp_alu_accesses")
168 .desc("Number of float alu accesses")
169 ;
170
171 numCallsReturns
172 .name(name() + ".num_func_calls")
173 .desc("number of times a function call or return occured")
174 ;
175
176 numCondCtrlInsts
177 .name(name() + ".num_conditional_control_insts")
178 .desc("number of instructions that are conditional controls")
179 ;
180
181 numIntInsts
182 .name(name() + ".num_int_insts")
183 .desc("number of integer instructions")
184 ;
185
186 numFpInsts
187 .name(name() + ".num_fp_insts")
188 .desc("number of float instructions")
189 ;
190
191 numIntRegReads
192 .name(name() + ".num_int_register_reads")
193 .desc("number of times the integer registers were read")
194 ;
195
196 numIntRegWrites
197 .name(name() + ".num_int_register_writes")
198 .desc("number of times the integer registers were written")
199 ;
200
201 numFpRegReads
202 .name(name() + ".num_fp_register_reads")
203 .desc("number of times the floating registers were read")
204 ;
205
206 numFpRegWrites
207 .name(name() + ".num_fp_register_writes")
208 .desc("number of times the floating registers were written")
209 ;
210
211 numCCRegReads
212 .name(name() + ".num_cc_register_reads")
213 .desc("number of times the CC registers were read")
214 .flags(nozero)
215 ;
216
217 numCCRegWrites
218 .name(name() + ".num_cc_register_writes")
219 .desc("number of times the CC registers were written")
220 .flags(nozero)
221 ;
222
223 numMemRefs
224 .name(name()+".num_mem_refs")
225 .desc("number of memory refs")
226 ;
227
228 numStoreInsts
229 .name(name() + ".num_store_insts")
230 .desc("Number of store instructions")
231 ;
232
233 numLoadInsts
234 .name(name() + ".num_load_insts")
235 .desc("Number of load instructions")
236 ;
237
238 notIdleFraction
239 .name(name() + ".not_idle_fraction")
240 .desc("Percentage of non-idle cycles")
241 ;
242
243 idleFraction
244 .name(name() + ".idle_fraction")
245 .desc("Percentage of idle cycles")
246 ;
247
248 numBusyCycles
249 .name(name() + ".num_busy_cycles")
250 .desc("Number of busy cycles")
251 ;
252
253 numIdleCycles
254 .name(name()+".num_idle_cycles")
255 .desc("Number of idle cycles")
256 ;
257
258 icacheStallCycles
259 .name(name() + ".icache_stall_cycles")
260 .desc("ICache total stall cycles")
261 .prereq(icacheStallCycles)
262 ;
263
264 dcacheStallCycles
265 .name(name() + ".dcache_stall_cycles")
266 .desc("DCache total stall cycles")
267 .prereq(dcacheStallCycles)
268 ;
269
269 icacheRetryCycles
270 .name(name() + ".icache_retry_cycles")
271 .desc("ICache total retry cycles")
272 .prereq(icacheRetryCycles)
273 ;
274
275 dcacheRetryCycles
276 .name(name() + ".dcache_retry_cycles")
277 .desc("DCache total retry cycles")
278 .prereq(dcacheRetryCycles)
279 ;
280
270 statExecutedInstType
271 .init(Enums::Num_OpClass)
272 .name(name() + ".op_class")
273 .desc("Class of executed instruction")
274 .flags(total | pdf | dist)
275 ;
276 for (unsigned i = 0; i < Num_OpClasses; ++i) {
277 statExecutedInstType.subname(i, Enums::OpClassStrings[i]);
278 }
279
280 idleFraction = constant(1.0) - notIdleFraction;
281 numIdleCycles = idleFraction * numCycles;
282 numBusyCycles = (notIdleFraction)*numCycles;
283
284 numBranches
285 .name(name() + ".Branches")
286 .desc("Number of branches fetched")
287 .prereq(numBranches);
288
289 numPredictedBranches
290 .name(name() + ".predictedBranches")
291 .desc("Number of branches predicted as taken")
292 .prereq(numPredictedBranches);
293
294 numBranchMispred
295 .name(name() + ".BranchMispred")
296 .desc("Number of branch mispredictions")
297 .prereq(numBranchMispred);
298}
299
300void
301BaseSimpleCPU::resetStats()
302{
303// startNumInst = numInst;
304 notIdleFraction = (_status != Idle);
305}
306
307void
308BaseSimpleCPU::serializeThread(ostream &os, ThreadID tid)
309{
310 assert(_status == Idle || _status == Running);
311 assert(tid == 0);
312
313 thread->serialize(os);
314}
315
316void
317BaseSimpleCPU::unserializeThread(Checkpoint *cp, const string &section,
318 ThreadID tid)
319{
320 if (tid != 0)
321 fatal("Trying to load more than one thread into a SimpleCPU\n");
322 thread->unserialize(cp, section);
323}
324
325void
326change_thread_state(ThreadID tid, int activate, int priority)
327{
328}
329
330Addr
331BaseSimpleCPU::dbg_vtophys(Addr addr)
332{
333 return vtophys(tc, addr);
334}
335
336void
337BaseSimpleCPU::wakeup()
338{
339 getAddrMonitor()->gotWakeup = true;
340
341 if (thread->status() != ThreadContext::Suspended)
342 return;
343
344 DPRINTF(Quiesce,"Suspended Processor awoke\n");
345 thread->activate();
346}
347
348void
349BaseSimpleCPU::checkForInterrupts()
350{
351 if (checkInterrupts(tc)) {
352 Fault interrupt = interrupts->getInterrupt(tc);
353
354 if (interrupt != NoFault) {
355 fetchOffset = 0;
356 interrupts->updateIntrInfo(tc);
357 interrupt->invoke(tc);
358 thread->decoder.reset();
359 }
360 }
361}
362
363
364void
365BaseSimpleCPU::setupFetchRequest(Request *req)
366{
367 Addr instAddr = thread->instAddr();
368
369 // set up memory request for instruction fetch
370 DPRINTF(Fetch, "Fetch: PC:%08p\n", instAddr);
371
372 Addr fetchPC = (instAddr & PCMask) + fetchOffset;
373 req->setVirt(0, fetchPC, sizeof(MachInst), Request::INST_FETCH, instMasterId(),
374 instAddr);
375}
376
377
378void
379BaseSimpleCPU::preExecute()
380{
381 // maintain $r0 semantics
382 thread->setIntReg(ZeroReg, 0);
383#if THE_ISA == ALPHA_ISA
384 thread->setFloatReg(ZeroReg, 0.0);
385#endif // ALPHA_ISA
386
387 // check for instruction-count-based events
388 comInstEventQueue[0]->serviceEvents(numInst);
389 system->instEventQueue.serviceEvents(system->totalNumInsts);
390
391 // decode the instruction
392 inst = gtoh(inst);
393
394 TheISA::PCState pcState = thread->pcState();
395
396 if (isRomMicroPC(pcState.microPC())) {
397 stayAtPC = false;
398 curStaticInst = microcodeRom.fetchMicroop(pcState.microPC(),
399 curMacroStaticInst);
400 } else if (!curMacroStaticInst) {
401 //We're not in the middle of a macro instruction
402 StaticInstPtr instPtr = NULL;
403
404 TheISA::Decoder *decoder = &(thread->decoder);
405
406 //Predecode, ie bundle up an ExtMachInst
407 //If more fetch data is needed, pass it in.
408 Addr fetchPC = (pcState.instAddr() & PCMask) + fetchOffset;
409 //if(decoder->needMoreBytes())
410 decoder->moreBytes(pcState, fetchPC, inst);
411 //else
412 // decoder->process();
413
414 //Decode an instruction if one is ready. Otherwise, we'll have to
415 //fetch beyond the MachInst at the current pc.
416 instPtr = decoder->decode(pcState);
417 if (instPtr) {
418 stayAtPC = false;
419 thread->pcState(pcState);
420 } else {
421 stayAtPC = true;
422 fetchOffset += sizeof(MachInst);
423 }
424
425 //If we decoded an instruction and it's microcoded, start pulling
426 //out micro ops
427 if (instPtr && instPtr->isMacroop()) {
428 curMacroStaticInst = instPtr;
429 curStaticInst = curMacroStaticInst->fetchMicroop(pcState.microPC());
430 } else {
431 curStaticInst = instPtr;
432 }
433 } else {
434 //Read the next micro op from the macro op
435 curStaticInst = curMacroStaticInst->fetchMicroop(pcState.microPC());
436 }
437
438 //If we decoded an instruction this "tick", record information about it.
439 if (curStaticInst) {
440#if TRACING_ON
441 traceData = tracer->getInstRecord(curTick(), tc,
442 curStaticInst, thread->pcState(), curMacroStaticInst);
443
444 DPRINTF(Decode,"Decode: Decoded %s instruction: %#x\n",
445 curStaticInst->getName(), curStaticInst->machInst);
446#endif // TRACING_ON
447 }
448
449 if (branchPred && curStaticInst && curStaticInst->isControl()) {
450 // Use a fake sequence number since we only have one
451 // instruction in flight at the same time.
452 const InstSeqNum cur_sn(0);
453 const ThreadID tid(0);
454 pred_pc = thread->pcState();
455 const bool predict_taken(
456 branchPred->predict(curStaticInst, cur_sn, pred_pc, tid));
457
458 if (predict_taken)
459 ++numPredictedBranches;
460 }
461}
462
463void
464BaseSimpleCPU::postExecute()
465{
466 assert(curStaticInst);
467
468 TheISA::PCState pc = tc->pcState();
469 Addr instAddr = pc.instAddr();
470 if (FullSystem && thread->profile) {
471 bool usermode = TheISA::inUserMode(tc);
472 thread->profilePC = usermode ? 1 : instAddr;
473 ProfileNode *node = thread->profile->consume(tc, curStaticInst);
474 if (node)
475 thread->profileNode = node;
476 }
477
478 if (curStaticInst->isMemRef()) {
479 numMemRefs++;
480 }
481
482 if (curStaticInst->isLoad()) {
483 ++numLoad;
484 comLoadEventQueue[0]->serviceEvents(numLoad);
485 }
486
487 if (CPA::available()) {
488 CPA::cpa()->swAutoBegin(tc, pc.nextInstAddr());
489 }
490
491 if (curStaticInst->isControl()) {
492 ++numBranches;
493 }
494
495 /* Power model statistics */
496 //integer alu accesses
497 if (curStaticInst->isInteger()){
498 numIntAluAccesses++;
499 numIntInsts++;
500 }
501
502 //float alu accesses
503 if (curStaticInst->isFloating()){
504 numFpAluAccesses++;
505 numFpInsts++;
506 }
507
508 //number of function calls/returns to get window accesses
509 if (curStaticInst->isCall() || curStaticInst->isReturn()){
510 numCallsReturns++;
511 }
512
513 //the number of branch predictions that will be made
514 if (curStaticInst->isCondCtrl()){
515 numCondCtrlInsts++;
516 }
517
518 //result bus acceses
519 if (curStaticInst->isLoad()){
520 numLoadInsts++;
521 }
522
523 if (curStaticInst->isStore()){
524 numStoreInsts++;
525 }
526 /* End power model statistics */
527
528 statExecutedInstType[curStaticInst->opClass()]++;
529
530 if (FullSystem)
531 traceFunctions(instAddr);
532
533 if (traceData) {
534 traceData->dump();
535 delete traceData;
536 traceData = NULL;
537 }
538
539 // Call CPU instruction commit probes
540 probeInstCommit(curStaticInst);
541}
542
543void
544BaseSimpleCPU::advancePC(const Fault &fault)
545{
546 const bool branching(thread->pcState().branching());
547
548 //Since we're moving to a new pc, zero out the offset
549 fetchOffset = 0;
550 if (fault != NoFault) {
551 curMacroStaticInst = StaticInst::nullStaticInstPtr;
552 fault->invoke(tc, curStaticInst);
553 thread->decoder.reset();
554 } else {
555 if (curStaticInst) {
556 if (curStaticInst->isLastMicroop())
557 curMacroStaticInst = StaticInst::nullStaticInstPtr;
558 TheISA::PCState pcState = thread->pcState();
559 TheISA::advancePC(pcState, curStaticInst);
560 thread->pcState(pcState);
561 }
562 }
563
564 if (branchPred && curStaticInst && curStaticInst->isControl()) {
565 // Use a fake sequence number since we only have one
566 // instruction in flight at the same time.
567 const InstSeqNum cur_sn(0);
568 const ThreadID tid(0);
569
570 if (pred_pc == thread->pcState()) {
571 // Correctly predicted branch
572 branchPred->update(cur_sn, tid);
573 } else {
574 // Mis-predicted branch
575 branchPred->squash(cur_sn, pcState(),
576 branching, tid);
577 ++numBranchMispred;
578 }
579 }
580}
581
582void
583BaseSimpleCPU::startup()
584{
585 BaseCPU::startup();
586 thread->startup();
587}