/* * Copyright (c) 2004-2005 The Regents of The University of Michigan * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are * met: redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer; * redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution; * neither the name of the copyright holders nor the names of its * contributors may be used to endorse or promote products derived from * this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * Authors: Kevin Lim */ #include #include #include #include #include "base/cprintf.hh" #include "base/trace.hh" #include "arch/faults.hh" #include "cpu/exetrace.hh" #include "mem/request.hh" #include "cpu/base_dyn_inst.hh" #include "cpu/o3/alpha_impl.hh" #include "cpu/o3/alpha_cpu.hh" //#include "cpu/ozone/simple_impl.hh" //#include "cpu/ozone/ozone_impl.hh" using namespace std; using namespace TheISA; #define NOHASH #ifndef NOHASH #include "base/hashmap.hh" unsigned int MyHashFunc(const BaseDynInst *addr) { unsigned a = (unsigned)addr; unsigned hash = (((a >> 14) ^ ((a >> 2) & 0xffff))) & 0x7FFFFFFF; return hash; } typedef m5::hash_map my_hash_t; my_hash_t thishash; #endif template BaseDynInst::BaseDynInst(ExtMachInst machInst, Addr inst_PC, Addr pred_PC, InstSeqNum seq_num, FullCPU *cpu) : staticInst(machInst), traceData(NULL), cpu(cpu)/*, xc(cpu->xcBase())*/ { seqNum = seq_num; PC = inst_PC; nextPC = PC + sizeof(MachInst); predPC = pred_PC; initVars(); } template BaseDynInst::BaseDynInst(StaticInstPtr &_staticInst) : staticInst(_staticInst), traceData(NULL) { seqNum = 0; initVars(); } template void BaseDynInst::initVars() { req = NULL; memData = NULL; effAddr = 0; physEffAddr = 0; storeSize = 0; readyRegs = 0; // May want to turn this into a bit vector or something. completed = false; resultReady = false; canIssue = false; issued = false; executed = false; canCommit = false; committed = false; squashed = false; squashedInIQ = false; squashedInLSQ = false; squashedInROB = false; eaCalcDone = false; memOpDone = false; lqIdx = -1; sqIdx = -1; reachedCommit = false; blockingInst = false; recoverInst = false; iqEntry = false; robEntry = false; serializeBefore = false; serializeAfter = false; serializeHandled = false; // Eventually make this a parameter. threadNumber = 0; // Also make this a parameter, or perhaps get it from xc or cpu. asid = 0; // Initialize the fault to be unimplemented opcode. // fault = new UnimplementedOpcodeFault; fault = NoFault; ++instcount; if (instcount > 1500) { cpu->dumpInsts(); #ifdef DEBUG dumpSNList(); #endif assert(instcount <= 1500); } DPRINTF(DynInst, "DynInst: [sn:%lli] Instruction created. Instcount=%i\n", seqNum, instcount); #ifdef DEBUG cpu->snList.insert(seqNum); #endif } template BaseDynInst::~BaseDynInst() { if (req) { delete req; } if (memData) { delete [] memData; } if (traceData) { delete traceData; } fault = NoFault; --instcount; DPRINTF(DynInst, "DynInst: [sn:%lli] Instruction destroyed. Instcount=%i\n", seqNum, instcount); #ifdef DEBUG cpu->snList.erase(seqNum); #endif } #ifdef DEBUG template void BaseDynInst::dumpSNList() { std::set::iterator sn_it = cpu->snList.begin(); int count = 0; while (sn_it != cpu->snList.end()) { cprintf("%i: [sn:%lli] not destroyed\n", count, (*sn_it)); count++; sn_it++; } } #endif template void BaseDynInst::prefetch(Addr addr, unsigned flags) { // This is the "functional" implementation of prefetch. Not much // happens here since prefetches don't affect the architectural // state. /* // Generate a MemReq so we can translate the effective address. MemReqPtr req = new MemReq(addr, thread->getXCProxy(), 1, flags); req->asid = asid; // Prefetches never cause faults. fault = NoFault; // note this is a local, not BaseDynInst::fault Fault trans_fault = cpu->translateDataReadReq(req); if (trans_fault == NoFault && !(req->flags & UNCACHEABLE)) { // It's a valid address to cacheable space. Record key MemReq // parameters so we can generate another one just like it for // the timing access without calling translate() again (which // might mess up the TLB). effAddr = req->vaddr; physEffAddr = req->paddr; memReqFlags = req->flags; } else { // Bogus address (invalid or uncacheable space). Mark it by // setting the eff_addr to InvalidAddr. effAddr = physEffAddr = MemReq::inval_addr; } if (traceData) { traceData->setAddr(addr); } */ } template void BaseDynInst::writeHint(Addr addr, int size, unsigned flags) { // Need to create a MemReq here so we can do a translation. This // will casue a TLB miss trap if necessary... not sure whether // that's the best thing to do or not. We don't really need the // MemReq otherwise, since wh64 has no functional effect. /* MemReqPtr req = new MemReq(addr, thread->getXCProxy(), size, flags); req->asid = asid; fault = cpu->translateDataWriteReq(req); if (fault == NoFault && !(req->flags & UNCACHEABLE)) { // Record key MemReq parameters so we can generate another one // just like it for the timing access without calling translate() // again (which might mess up the TLB). effAddr = req->vaddr; physEffAddr = req->paddr; memReqFlags = req->flags; } else { // ignore faults & accesses to uncacheable space... treat as no-op effAddr = physEffAddr = MemReq::inval_addr; } storeSize = size; storeData = 0; */ } /** * @todo Need to find a way to get the cache block size here. */ template Fault BaseDynInst::copySrcTranslate(Addr src) { /* MemReqPtr req = new MemReq(src, thread->getXCProxy(), 64); req->asid = asid; // translate to physical address Fault fault = cpu->translateDataReadReq(req); if (fault == NoFault) { thread->copySrcAddr = src; thread->copySrcPhysAddr = req->paddr; } else { thread->copySrcAddr = 0; thread->copySrcPhysAddr = 0; } return fault; */ return NoFault; } /** * @todo Need to find a way to get the cache block size here. */ template Fault BaseDynInst::copy(Addr dest) { /* uint8_t data[64]; FunctionalMemory *mem = thread->mem; assert(thread->copySrcPhysAddr); MemReqPtr req = new MemReq(dest, thread->getXCProxy(), 64); req->asid = asid; // translate to physical address Fault fault = cpu->translateDataWriteReq(req); if (fault == NoFault) { Addr dest_addr = req->paddr; // Need to read straight from memory since we have more than 8 bytes. req->paddr = thread->copySrcPhysAddr; mem->read(req, data); req->paddr = dest_addr; mem->write(req, data); } return fault; */ return NoFault; } template void BaseDynInst::dump() { cprintf("T%d : %#08d `", threadNumber, PC); cout << staticInst->disassemble(PC); cprintf("'\n"); } template void BaseDynInst::dump(std::string &outstring) { std::ostringstream s; s << "T" << threadNumber << " : 0x" << PC << " " << staticInst->disassemble(PC); outstring = s.str(); } #if 0 template Fault BaseDynInst::mem_access(mem_cmd cmd, Addr addr, void *p, int nbytes) { Fault fault; // check alignments, even speculative this test should always pass if ((nbytes & nbytes - 1) != 0 || (addr & nbytes - 1) != 0) { for (int i = 0; i < nbytes; i++) ((char *) p)[i] = 0; // I added the following because according to the comment above, // we should never get here. The comment lies #if 0 panic("unaligned access. Cycle = %n", curTick); #endif return NoFault; } MemReqPtr req = new MemReq(addr, thread, nbytes); switch(cmd) { case Read: fault = spec_mem->read(req, (uint8_t *)p); break; case Write: fault = spec_mem->write(req, (uint8_t *)p); if (fault != NoFault) break; specMemWrite = true; storeSize = nbytes; switch(nbytes) { case sizeof(uint8_t): *(uint8_t)&storeData = (uint8_t *)p; break; case sizeof(uint16_t): *(uint16_t)&storeData = (uint16_t *)p; break; case sizeof(uint32_t): *(uint32_t)&storeData = (uint32_t *)p; break; case sizeof(uint64_t): *(uint64_t)&storeData = (uint64_t *)p; break; } break; default: fault = genMachineCheckFault(); break; } trace_mem(fault, cmd, addr, p, nbytes); return fault; } #endif template void BaseDynInst::markSrcRegReady() { if (++readyRegs == numSrcRegs()) { canIssue = true; } } template void BaseDynInst::markSrcRegReady(RegIndex src_idx) { ++readyRegs; _readySrcRegIdx[src_idx] = true; if (readyRegs == numSrcRegs()) { canIssue = true; } } template bool BaseDynInst::eaSrcsReady() { // For now I am assuming that src registers 1..n-1 are the ones that the // EA calc depends on. (i.e. src reg 0 is the source of the data to be // stored) for (int i = 1; i < numSrcRegs(); ++i) { if (!_readySrcRegIdx[i]) return false; } return true; } // Forward declaration template class BaseDynInst; template <> int BaseDynInst::instcount = 0; /* // Forward declaration template class BaseDynInst; template <> int BaseDynInst::instcount = 0; // Forward declaration template class BaseDynInst; template <> int BaseDynInst::instcount = 0; */