cpu/simple/atomic.cc

/*
 * Copyright 2014 Google, Inc.
 * Copyright (c) 2012-2013,2015 ARM Limited
 * All rights reserved.
 *
 * The license below extends only to copyright in the software and shall
 * not be construed as granting a license to any other intellectual
 * property including but not limited to intellectual property relating
 * to a hardware implementation of the functionality of the software
 * licensed hereunder.  You may use the software subject to the license
 * terms below provided that you ensure that this notice is replicated
 * unmodified and in its entirety in all distributions of the software,
 * modified or unmodified, in source code or in binary form.
 *
 * Copyright (c) 2002-2005 The Regents of The University of Michigan
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * Authors: Steve Reinhardt
 */
2SN/A
#include "cpu/simple/atomic.hh"

#include <algorithm>
#include <cstring>

#include "arch/locked_mem.hh"
#include "arch/mmapped_ipr.hh"
#include "arch/utility.hh"
#include "base/bigint.hh"
#include "base/output.hh"
#include "config/the_isa.hh"
#include "cpu/exetrace.hh"
#include "debug/Drain.hh"
#include "debug/ExecFaulting.hh"
#include "debug/SimpleCPU.hh"
#include "mem/packet.hh"
#include "mem/packet_access.hh"
#include "mem/physical.hh"
#include "params/AtomicSimpleCPU.hh"
#include "sim/faults.hh"
#include "sim/full_system.hh"
#include "sim/system.hh"

using namespace std;
using namespace TheISA;
2680Sktlim@umich.edu
2680Sktlim@umich.eduAtomicSimpleCPU::TickEvent::TickEvent(AtomicSimpleCPU *c)
2680Sktlim@umich.edu    : Event(CPU_Tick_Pri), cpu(c)
2680Sktlim@umich.edu{
2680Sktlim@umich.edu}
2682Sktlim@umich.edu
2680Sktlim@umich.edu
2680Sktlim@umich.eduvoid
2680Sktlim@umich.eduAtomicSimpleCPU::TickEvent::process()
2680Sktlim@umich.edu{
2680Sktlim@umich.edu    cpu->tick();
2SN/A}
2107SN/A
2107SN/Aconst char *
2107SN/AAtomicSimpleCPU::TickEvent::description() const
2190SN/A{
2455SN/A    return "AtomicSimpleCPU tick";
2455SN/A}
2107SN/A
2159SN/Avoid
2SN/AAtomicSimpleCPU::init()
246SN/A{
246SN/A    BaseSimpleCPU::init();
246SN/A
246SN/A    int cid = threadContexts[0]->contextId();
246SN/A    ifetch_req.setContext(cid);
246SN/A    data_read_req.setContext(cid);
246SN/A    data_write_req.setContext(cid);
246SN/A}
246SN/A
246SN/AAtomicSimpleCPU::AtomicSimpleCPU(AtomicSimpleCPUParams *p)
246SN/A    : BaseSimpleCPU(p), tickEvent(this), width(p->width), locked(false),
246SN/A      simulate_data_stalls(p->simulate_data_stalls),
246SN/A      simulate_inst_stalls(p->simulate_inst_stalls),
2190SN/A      icachePort(name() + ".icache_port", this),
246SN/A      dcachePort(name() + ".dcache_port", this),
246SN/A      fastmem(p->fastmem), dcache_access(false), dcache_latency(0),
246SN/A      ppCommit(nullptr)
246SN/A{
246SN/A    _status = Idle;
246SN/A}
246SN/A
2SN/A
2680Sktlim@umich.eduAtomicSimpleCPU::~AtomicSimpleCPU()
2423SN/A{
2190SN/A    if (tickEvent.scheduled()) {
180SN/A        deschedule(tickEvent);
2190SN/A    }
2190SN/A}
2190SN/A
2190SN/ADrainState
2190SN/AAtomicSimpleCPU::drain()
2190SN/A{
2190SN/A    if (switchedOut())
2190SN/A        return DrainState::Drained;
2190SN/A
2190SN/A    if (!isDrained()) {
2521SN/A        DPRINTF(Drain, "Requesting drain.\n");
2330SN/A        return DrainState::Draining;
2654SN/A    } else {
2521SN/A        if (tickEvent.scheduled())
2521SN/A            deschedule(tickEvent);
2680Sktlim@umich.edu
2521SN/A        activeThreads.clear();
2521SN/A        DPRINTF(Drain, "Not executing microcode, no need to drain.\n");
2190SN/A        return DrainState::Drained;
2518SN/A    }
2518SN/A}
2190SN/A
2190SN/Avoid
2190SN/AAtomicSimpleCPU::threadSnoop(PacketPtr pkt, ThreadID sender)
2190SN/A{
2159SN/A    DPRINTF(SimpleCPU, "received snoop pkt for addr:%#x %s\n", pkt->getAddr(),
2235SN/A            pkt->cmdString());
2103SN/A
393SN/A    for (ThreadID tid = 0; tid < numThreads; tid++) {
393SN/A        if (tid != sender) {
2190SN/A            if (getCpuAddrMonitor(tid)->doMonitor(pkt)) {
393SN/A                wakeup(tid);
393SN/A            }
2190SN/A
393SN/A            TheISA::handleLockedSnoop(threadInfo[tid]->thread,
393SN/A                                      pkt, dcachePort.cacheBlockMask);
2875Sksewell@umich.edu        }
393SN/A    }
393SN/A}
2190SN/A
2159SN/Avoid
2159SN/AAtomicSimpleCPU::drainResume()
2190SN/A{
2159SN/A    assert(!tickEvent.scheduled());
2159SN/A    if (switchedOut())
2680Sktlim@umich.edu        return;
2159SN/A
2190SN/A    DPRINTF(SimpleCPU, "Resume\n");
2159SN/A    verifyMemoryMode();
2190SN/A
2190SN/A    assert(!threadContexts.empty());
2159SN/A
2235SN/A    _status = BaseSimpleCPU::Idle;
2313SN/A
2235SN/A    for (ThreadID tid = 0; tid < numThreads; tid++) {
2235SN/A        if (threadInfo[tid]->thread->status() == ThreadContext::Active) {
2235SN/A            threadInfo[tid]->notIdleFraction = 1;
2235SN/A            activeThreads.push_back(tid);
2235SN/A            _status = BaseSimpleCPU::Running;
2254SN/A
2254SN/A            // Tick if any threads active
2254SN/A            if (!tickEvent.scheduled()) {
2235SN/A                schedule(tickEvent, nextCycle());
2235SN/A            }
2190SN/A        } else {
2159SN/A            threadInfo[tid]->notIdleFraction = 0;
2235SN/A        }
2254SN/A    }
2190SN/A}
2159SN/A
2680Sktlim@umich.edubool
2159SN/AAtomicSimpleCPU::tryCompleteDrain()
2190SN/A{
2159SN/A    if (drainState() != DrainState::Draining)
2159SN/A        return false;
2159SN/A
2159SN/A    DPRINTF(Drain, "tryCompleteDrain.\n");
2190SN/A    if (!isDrained())
2159SN/A        return false;
2455SN/A
2159SN/A    DPRINTF(Drain, "CPU done draining, processing drain event\n");
2455SN/A    signalDrainDone();
2159SN/A
2455SN/A    return true;
2455SN/A}
2455SN/A
2159SN/A
2190SN/Avoid
2159SN/AAtomicSimpleCPU::switchOut()
2455SN/A{
2159SN/A    BaseSimpleCPU::switchOut();
2455SN/A
2159SN/A    assert(!tickEvent.scheduled());
2455SN/A    assert(_status == BaseSimpleCPU::Running || _status == Idle);
2455SN/A    assert(isDrained());
2455SN/A}
2159SN/A
2190SN/A
2159SN/Avoid
2190SN/AAtomicSimpleCPU::takeOverFrom(BaseCPU *oldCPU)
2159SN/A{
2190SN/A    BaseSimpleCPU::takeOverFrom(oldCPU);
2159SN/A
2190SN/A    // The tick event should have been descheduled by drain()
2159SN/A    assert(!tickEvent.scheduled());
2447SN/A}
2447SN/A
2447SN/Avoid
2447SN/AAtomicSimpleCPU::verifyMemoryMode() const
2190SN/A{
2159SN/A    if (!system->isAtomicMode()) {
2190SN/A        fatal("The atomic CPU requires the memory system to be in "
2190SN/A              "'atomic' mode.\n");
2190SN/A    }
2190SN/A}
2190SN/A
2190SN/Avoid
2235SN/AAtomicSimpleCPU::activateContext(ThreadID thread_num)
2235SN/A{
2190SN/A    DPRINTF(SimpleCPU, "ActivateContext %d\n", thread_num);
2190SN/A
2190SN/A    assert(thread_num < numThreads);
2159SN/A
2159SN/A    threadInfo[thread_num]->notIdleFraction = 1;
2190SN/A    Cycles delta = ticksToCycles(threadInfo[thread_num]->thread->lastActivate -
2159SN/A                                 threadInfo[thread_num]->thread->lastSuspend);
2159SN/A    numCycles += delta;
2235SN/A    ppCycles->notify(delta);
2190SN/A
2190SN/A    if (!tickEvent.scheduled()) {
2159SN/A        //Make sure ticks are still on multiples of cycles
2190SN/A        schedule(tickEvent, clockEdge(Cycles(0)));
2159SN/A    }
2159SN/A    _status = BaseSimpleCPU::Running;
2190SN/A    if (std::find(activeThreads.begin(), activeThreads.end(), thread_num)
2159SN/A        == activeThreads.end()) {
2190SN/A        activeThreads.push_back(thread_num);
2159SN/A    }
2235SN/A
2190SN/A    BaseCPU::activateContext(thread_num);
2834Sksewell@umich.edu}
2834Sksewell@umich.edu
2834Sksewell@umich.edu
2834Sksewell@umich.eduvoid
2834Sksewell@umich.eduAtomicSimpleCPU::suspendContext(ThreadID thread_num)
2159SN/A{
2525SN/A    DPRINTF(SimpleCPU, "SuspendContext %d\n", thread_num);
2972Sgblack@eecs.umich.edu
2972Sgblack@eecs.umich.edu    assert(thread_num < numThreads);
2159SN/A    activeThreads.remove(thread_num);
2159SN/A
2682Sktlim@umich.edu    if (_status == Idle)
2682Sktlim@umich.edu        return;
2682Sktlim@umich.edu
2682Sktlim@umich.edu    assert(_status == BaseSimpleCPU::Running);
2682Sktlim@umich.edu
2682Sktlim@umich.edu    threadInfo[thread_num]->notIdleFraction = 0;
2682Sktlim@umich.edu
2682Sktlim@umich.edu    if (activeThreads.empty()) {
2682Sktlim@umich.edu        _status = Idle;
2682Sktlim@umich.edu
2680Sktlim@umich.edu        if (tickEvent.scheduled()) {
2680Sktlim@umich.edu            deschedule(tickEvent);
2190SN/A        }
2190SN/A    }
2680Sktlim@umich.edu
2680Sktlim@umich.edu    BaseCPU::suspendContext(thread_num);
2159SN/A}
2190SN/A
2680Sktlim@umich.edu
2SN/ATick
2SN/AAtomicSimpleCPU::AtomicCPUDPort::recvAtomicSnoop(PacketPtr pkt)
2SN/A{
2680Sktlim@umich.edu    DPRINTF(SimpleCPU, "received snoop pkt for addr:%#x %s\n", pkt->getAddr(),
2SN/A            pkt->cmdString());
2680Sktlim@umich.edu
716SN/A    // X86 ISA: Snooping an invalidation for monitor/mwait
2680Sktlim@umich.edu    AtomicSimpleCPU *cpu = (AtomicSimpleCPU *)(&owner);
2SN/A
1858SN/A    for (ThreadID tid = 0; tid < cpu->numThreads; tid++) {
2680Sktlim@umich.edu        if (cpu->getCpuAddrMonitor(tid)->doMonitor(pkt)) {
2SN/A            cpu->wakeup(tid);
2680Sktlim@umich.edu        }
1917SN/A    }
2680Sktlim@umich.edu
2521SN/A    // if snoop invalidates, release any associated locks
2680Sktlim@umich.edu    // When run without caches, Invalidation packets will not be received
2654SN/A    // hence we must check if the incoming packets are writes and wakeup
2680Sktlim@umich.edu    // the processor accordingly
2521SN/A    if (pkt->isInvalidate() || pkt->isWrite()) {
2680Sktlim@umich.edu        DPRINTF(SimpleCPU, "received invalidation for addr:%#x\n",
2521SN/A                pkt->getAddr());
2680Sktlim@umich.edu        for (auto &t_info : cpu->threadInfo) {
2SN/A            TheISA::handleLockedSnoop(t_info->thread, pkt, cacheBlockMask);
2680Sktlim@umich.edu        }
2518SN/A    }
2680Sktlim@umich.edu
2SN/A    return 0;
2SN/A}
2680Sktlim@umich.edu
595SN/Avoid
2680Sktlim@umich.eduAtomicSimpleCPU::AtomicCPUDPort::recvFunctionalSnoop(PacketPtr pkt)
2SN/A{
2190SN/A    DPRINTF(SimpleCPU, "received snoop pkt for addr:%#x %s\n", pkt->getAddr(),
2190SN/A            pkt->cmdString());
2680Sktlim@umich.edu
2SN/A    // X86 ISA: Snooping an invalidation for monitor/mwait
2190SN/A    AtomicSimpleCPU *cpu = (AtomicSimpleCPU *)(&owner);
2680Sktlim@umich.edu    for (ThreadID tid = 0; tid < cpu->numThreads; tid++) {
2SN/A        if (cpu->getCpuAddrMonitor(tid)->doMonitor(pkt)) {
2190SN/A            cpu->wakeup(tid);
2875Sksewell@umich.edu        }
2SN/A    }
2190SN/A
2680Sktlim@umich.edu    // if snoop invalidates, release any associated locks
217SN/A    if (pkt->isInvalidate()) {
1858SN/A        DPRINTF(SimpleCPU, "received invalidation for addr:%#x\n",
2680Sktlim@umich.edu                pkt->getAddr());
2190SN/A        for (auto &t_info : cpu->threadInfo) {
2190SN/A            TheISA::handleLockedSnoop(t_info->thread, pkt, cacheBlockMask);
2680Sktlim@umich.edu        }
2680Sktlim@umich.edu    }
2190SN/A}
2680Sktlim@umich.edu
2190SN/AFault
2680Sktlim@umich.eduAtomicSimpleCPU::readMem(Addr addr, uint8_t * data, unsigned size,
2190SN/A                         Request::Flags flags)
2680Sktlim@umich.edu{
2190SN/A    SimpleExecContext& t_info = *threadInfo[curThread];
2235SN/A    SimpleThread* thread = t_info.thread;
2680Sktlim@umich.edu
2235SN/A    // use the CPU's statically allocated read request and packet objects
2680Sktlim@umich.edu    Request *req = &data_read_req;
2680Sktlim@umich.edu
2254SN/A    if (traceData)
2680Sktlim@umich.edu        traceData->setMem(addr, size, flags);
2680Sktlim@umich.edu
2235SN/A    //The size of the data we're trying to read.
2235SN/A    int fullSize = size;
2680Sktlim@umich.edu
2190SN/A    //The address of the second part of this access if it needs to be split
2190SN/A    //across a cache line boundary.
2680Sktlim@umich.edu    Addr secondAddr = roundDown(addr + size - 1, cacheLineSize());
2SN/A
2190SN/A    if (secondAddr > addr)
2680Sktlim@umich.edu        size = secondAddr - addr;
2SN/A
2680Sktlim@umich.edu    dcache_latency = 0;
716SN/A
2SN/A    req->taskId(taskId());
2SN/A    while (1) {
2SN/A        req->setVirt(0, addr, size, flags, dataMasterId(), thread->pcState().instAddr());
2SN/A
2680Sktlim@umich.edu        // translate to physical address
2SN/A        Fault fault = thread->dtb->translateAtomic(req, thread->getTC(),
2455SN/A                                                          BaseTLB::Read);
2680Sktlim@umich.edu
2SN/A        // Now do the access.
2455SN/A        if (fault == NoFault && !req->getFlags().isSet(Request::NO_ACCESS)) {
2680Sktlim@umich.edu            Packet pkt(req, Packet::makeReadCmd(req));
2SN/A            pkt.dataStatic(data);
2455SN/A
2680Sktlim@umich.edu            if (req->isMmappedIpr())
2455SN/A                dcache_latency += TheISA::handleIprRead(thread->getTC(), &pkt);
2455SN/A            else {
2680Sktlim@umich.edu                if (fastmem && system->isMemAddr(pkt.getAddr()))
2SN/A                    system->getPhysMem().access(&pkt);
2SN/A                else
2680Sktlim@umich.edu                    dcache_latency += dcachePort.sendAtomic(&pkt);
2SN/A            }
2455SN/A            dcache_access = true;
2680Sktlim@umich.edu
2SN/A            assert(!pkt.isError());
2455SN/A
2680Sktlim@umich.edu            if (req->isLLSC()) {
2SN/A                TheISA::handleLockedRead(thread, req);
2455SN/A            }
2680Sktlim@umich.edu        }
2455SN/A
2455SN/A        //If there's a fault, return it
2680Sktlim@umich.edu        if (fault != NoFault) {
2SN/A            if (req->isPrefetch()) {
2680Sktlim@umich.edu                return NoFault;
2SN/A            } else {
2680Sktlim@umich.edu                return fault;
2206SN/A            }
2680Sktlim@umich.edu        }
2252SN/A
2680Sktlim@umich.edu        //If we don't need to access a second cache line, stop now.
2SN/A        if (secondAddr <= addr)
2680Sktlim@umich.edu        {
2447SN/A            if (req->isLockedRMW() && fault == NoFault) {
2680Sktlim@umich.edu                assert(!locked);
2447SN/A                locked = true;
2159SN/A            }
2680Sktlim@umich.edu
2SN/A            return fault;
2159SN/A        }
2680Sktlim@umich.edu
2SN/A        /*
2159SN/A         * Set up for accessing the second cache line.
2680Sktlim@umich.edu         */
2SN/A
2159SN/A        //Move the pointer we're reading into to the correct location.
2680Sktlim@umich.edu        data += size;
2190SN/A        //Adjust the size to get the remaining bytes.
2190SN/A        size = addr + fullSize - secondAddr;
2680Sktlim@umich.edu        //And access the right address.
2190SN/A        addr = secondAddr;
2190SN/A    }
2680Sktlim@umich.edu}
1858SN/A
2680Sktlim@umich.eduFault
2SN/AAtomicSimpleCPU::initiateMemRead(Addr addr, unsigned size,
2SN/A                                 Request::Flags flags)
2190SN/A{
2680Sktlim@umich.edu    panic("initiateMemRead() is for timing accesses, and should "
2190SN/A          "never be called on AtomicSimpleCPU.\n");
1858SN/A}
2680Sktlim@umich.edu
360SN/AFault
360SN/AAtomicSimpleCPU::writeMem(uint8_t *data, unsigned size, Addr addr,
2190SN/A                          Request::Flags flags, uint64_t *res)
2680Sktlim@umich.edu{
360SN/A    SimpleExecContext& t_info = *threadInfo[curThread];
1450SN/A    SimpleThread* thread = t_info.thread;
2680Sktlim@umich.edu    static uint8_t zero_array[64] = {};
360SN/A
2680Sktlim@umich.edu    if (data == NULL) {
2SN/A        assert(size <= 64);
2525SN/A        assert(flags & Request::CACHE_BLOCK_ZERO);
2972Sgblack@eecs.umich.edu        // This must be a cache block cleaning request
2972Sgblack@eecs.umich.edu        data = zero_array;
2525SN/A    }
2680Sktlim@umich.edu
2525SN/A    // use the CPU's statically allocated write request and packet objects
2SN/A    Request *req = &data_write_req;
2SN/A
2190SN/A    if (traceData)
        traceData->setMem(addr, size, flags);

    //The size of the data we're trying to read.
    int fullSize = size;

    //The address of the second part of this access if it needs to be split
    //across a cache line boundary.
    Addr secondAddr = roundDown(addr + size - 1, cacheLineSize());

    if (secondAddr > addr)
        size = secondAddr - addr;

    dcache_latency = 0;

    req->taskId(taskId());
    while (1) {
        req->setVirt(0, addr, size, flags, dataMasterId(), thread->pcState().instAddr());

        // translate to physical address
        Fault fault = thread->dtb->translateAtomic(req, thread->getTC(), BaseTLB::Write);

        // Now do the access.
        if (fault == NoFault) {
            MemCmd cmd = MemCmd::WriteReq; // default
            bool do_access = true;  // flag to suppress cache access

            if (req->isLLSC()) {
                cmd = MemCmd::StoreCondReq;
                do_access = TheISA::handleLockedWrite(thread, req, dcachePort.cacheBlockMask);
            } else if (req->isSwap()) {
                cmd = MemCmd::SwapReq;
                if (req->isCondSwap()) {
                    assert(res);
                    req->setExtraData(*res);
                }
            }

            if (do_access && !req->getFlags().isSet(Request::NO_ACCESS)) {
                Packet pkt = Packet(req, cmd);
                pkt.dataStatic(data);

                if (req->isMmappedIpr()) {
                    dcache_latency +=
                        TheISA::handleIprWrite(thread->getTC(), &pkt);
                } else {
                    if (fastmem && system->isMemAddr(pkt.getAddr()))
                        system->getPhysMem().access(&pkt);
                    else
                        dcache_latency += dcachePort.sendAtomic(&pkt);

                    // Notify other threads on this CPU of write
                    threadSnoop(&pkt, curThread);
                }
                dcache_access = true;
                assert(!pkt.isError());

                if (req->isSwap()) {
                    assert(res);
                    memcpy(res, pkt.getConstPtr<uint8_t>(), fullSize);
                }
            }

            if (res && !req->isSwap()) {
                *res = req->getExtraData();
            }
        }

        //If there's a fault or we don't need to access a second cache line,
        //stop now.
        if (fault != NoFault || secondAddr <= addr)
        {
            if (req->isLockedRMW() && fault == NoFault) {
                assert(locked);
                locked = false;
            }


            if (fault != NoFault && req->isPrefetch()) {
                return NoFault;
            } else {
                return fault;
            }
        }

        /*
         * Set up for accessing the second cache line.
         */

        //Move the pointer we're reading into to the correct location.
        data += size;
        //Adjust the size to get the remaining bytes.
        size = addr + fullSize - secondAddr;
        //And access the right address.
        addr = secondAddr;
    }
}


/**
 * Main execution step, invoked by the tick event.
 *
 * Selects the thread to run, then executes up to `width` instructions
 * (continuing past `width` for as long as `locked` is set). For each
 * instruction it checks interrupts and PC events, fetches if needed,
 * executes, and accumulates instruction/data stall latency when the
 * corresponding simulate_*_stalls option is enabled. Afterwards it either
 * completes a pending drain or reschedules the tick event at least one
 * clock period ahead.
 */
void
AtomicSimpleCPU::tick()
{
    DPRINTF(SimpleCPU, "Tick\n");

    // Change thread if multi-threaded
    swapActiveThread();

    // Set memory request ids to current thread
    if (numThreads > 1) {
        ContextID cid = threadContexts[curThread]->contextId();

        ifetch_req.setContext(cid);
        data_read_req.setContext(cid);
        data_write_req.setContext(cid);
    }

    SimpleExecContext& t_info = *threadInfo[curThread];
    SimpleThread* thread = t_info.thread;

    // Total stall time (in ticks) accumulated over this call.
    Tick latency = 0;

    // Keep going past `width` while a locked RMW (set in readMem(),
    // cleared in writeMem()) is still open.
    for (int i = 0; i < width || locked; ++i) {
        numCycles++;
        ppCycles->notify(1);

        // Skip interrupt/PC-event checks while the previous instruction
        // is flagged delayed-commit.
        if (!curStaticInst || !curStaticInst->isDelayedCommit()) {
            checkForInterrupts();
            checkPcEventQueue();
        }

        // We must have just got suspended by a PC event
        if (_status == Idle) {
            tryCompleteDrain();
            return;
        }

        Fault fault = NoFault;

        TheISA::PCState pcState = thread->pcState();

        // No fetch is needed when running from the microcode ROM or in
        // the middle of a macro-op.
        bool needToFetch = !isRomMicroPC(pcState.microPC()) &&
                           !curMacroStaticInst;
        if (needToFetch) {
            ifetch_req.taskId(taskId());
            setupFetchRequest(&ifetch_req);
            fault = thread->itb->translateAtomic(&ifetch_req, thread->getTC(),
                                                 BaseTLB::Execute);
        }

        if (fault == NoFault) {
            Tick icache_latency = 0;
            bool icache_access = false;
            dcache_access = false; // assume no dcache access

            if (needToFetch) {
                // This is commented out because the decoder would act like
                // a tiny cache otherwise. It wouldn't be flushed when needed
                // like the I cache. It should be flushed, and when that works
                // this code should be uncommented.
                //Fetch more instruction memory if necessary
                //if (decoder.needMoreBytes())
                //{
                    icache_access = true;
                    Packet ifetch_pkt = Packet(&ifetch_req, MemCmd::ReadReq);
                    ifetch_pkt.dataStatic(&inst);

                    if (fastmem && system->isMemAddr(ifetch_pkt.getAddr()))
                        system->getPhysMem().access(&ifetch_pkt);
                    else
                        icache_latency = icachePort.sendAtomic(&ifetch_pkt);

                    assert(!ifetch_pkt.isError());

                    // ifetch_req is initialized to read the instruction directly
                    // into the CPU object's inst field.
                //}
            }

            preExecute();

            if (curStaticInst) {
                fault = curStaticInst->execute(&t_info, traceData);

                // keep an instruction count
                if (fault == NoFault) {
                    countInst();
                    ppCommit->notify(std::make_pair(thread, curStaticInst));
                }
                // Drop the trace record of a faulting instruction unless
                // the ExecFaulting debug flag is on.
                else if (traceData && !DTRACE(ExecFaulting)) {
                    delete traceData;
                    traceData = NULL;
                }

                postExecute();
            }

            // @todo remove me after debugging with legion done
            if (curStaticInst && (!curStaticInst->isMicroop() ||
                        curStaticInst->isFirstMicroop()))
                instCnt++;

            Tick stall_ticks = 0;
            if (simulate_inst_stalls && icache_access)
                stall_ticks += icache_latency;

            if (simulate_data_stalls && dcache_access)
                stall_ticks += dcache_latency;

            if (stall_ticks) {
                // the atomic cpu does its accounting in ticks, so
                // keep counting in ticks but round to the clock
                // period
                latency += divCeil(stall_ticks, clockPeriod()) *
                    clockPeriod();
            }

        }
        if (fault != NoFault || !t_info.stayAtPC)
            advancePC(fault);
    }

    // If a drain was pending and is now complete, do not reschedule.
    if (tryCompleteDrain())
        return;

    // instruction takes at least one cycle
    if (latency < clockPeriod())
        latency = clockPeriod();

    if (_status != Idle)
        reschedule(tickEvent, curTick() + latency, true);
}

void
AtomicSimpleCPU::regProbePoints()
{
    BaseCPU::regProbePoints();

    ppCommit = new ProbePointArg<pair<SimpleThread*, const StaticInstPtr>>
                                (getProbeManager(), "Commit");
}

/**
 * Forward an address to the data port's printAddr().
 *
 * @param a Address to print.
 */
void
AtomicSimpleCPU::printAddr(Addr a)
{
    dcachePort.printAddr(a);
}

////////////////////////////////////////////////////////////////////////
//
//  AtomicSimpleCPU Simulation Object
//
/**
 * Parameter-object factory hook.
 *
 * @return A newly allocated AtomicSimpleCPU constructed from this
 *         parameter object.
 */
AtomicSimpleCPU *
AtomicSimpleCPUParams::create()
{
    return new AtomicSimpleCPU(this);
}