base.cc revision 6122
12810SN/A/*
22810SN/A * Copyright (c) 2003-2005 The Regents of The University of Michigan
32810SN/A * All rights reserved.
42810SN/A *
52810SN/A * Redistribution and use in source and binary forms, with or without
62810SN/A * modification, are permitted provided that the following conditions are
72810SN/A * met: redistributions of source code must retain the above copyright
82810SN/A * notice, this list of conditions and the following disclaimer;
92810SN/A * redistributions in binary form must reproduce the above copyright
102810SN/A * notice, this list of conditions and the following disclaimer in the
112810SN/A * documentation and/or other materials provided with the distribution;
122810SN/A * neither the name of the copyright holders nor the names of its
132810SN/A * contributors may be used to endorse or promote products derived from
142810SN/A * this software without specific prior written permission.
152810SN/A *
162810SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
172810SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
182810SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
192810SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
202810SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
212810SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
222810SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
232810SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
242810SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
252810SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
262810SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
272810SN/A *
282810SN/A * Authors: Erik Hallnor
292810SN/A */
302810SN/A
312810SN/A/**
322810SN/A * @file
332810SN/A * Definition of BaseCache functions.
342810SN/A */
352810SN/A
363348SN/A#include "cpu/base.hh"
373348SN/A#include "cpu/smt.hh"
385338Sstever@gmail.com#include "mem/cache/base.hh"
395338Sstever@gmail.com#include "mem/cache/mshr.hh"
402810SN/A
412810SN/Ausing namespace std;
422810SN/A
434965SN/ABaseCache::CachePort::CachePort(const std::string &_name, BaseCache *_cache,
446122SSteve.Reinhardt@amd.com                                const std::string &_label)
455314SN/A    : SimpleTimingPort(_name, _cache), cache(_cache),
465314SN/A      label(_label), otherPort(NULL),
476122SSteve.Reinhardt@amd.com      blocked(false), mustSendRetry(false)
482810SN/A{
494475SN/A}
504475SN/A
514475SN/A
525034SN/ABaseCache::BaseCache(const Params *p)
535034SN/A    : MemObject(p),
545314SN/A      mshrQueue("MSHRs", p->mshrs, 4, MSHRQueue_MSHRs),
555314SN/A      writeBuffer("write buffer", p->write_buffers, p->mshrs+1000,
564628SN/A                  MSHRQueue_WriteBuffer),
575034SN/A      blkSize(p->block_size),
585034SN/A      hitLatency(p->latency),
595034SN/A      numTarget(p->tgts_per_mshr),
606122SSteve.Reinhardt@amd.com      forwardSnoops(p->forward_snoops),
614626SN/A      blocked(0),
624626SN/A      noTargetMSHR(NULL),
635034SN/A      missCount(p->max_miss_count),
646122SSteve.Reinhardt@amd.com      drainEvent(NULL),
656122SSteve.Reinhardt@amd.com      addrRange(p->addr_range)
664458SN/A{
672810SN/A}
682810SN/A
692811SN/Avoid
702810SN/ABaseCache::CachePort::recvStatusChange(Port::Status status)
712810SN/A{
724458SN/A    if (status == Port::RangeChange) {
734458SN/A        otherPort->sendStatusChange(Port::RangeChange);
744458SN/A    }
752810SN/A}
762810SN/A
775314SN/A
785314SN/Abool
795314SN/ABaseCache::CachePort::checkFunctional(PacketPtr pkt)
805314SN/A{
815314SN/A    pkt->pushLabel(label);
825314SN/A    bool done = SimpleTimingPort::checkFunctional(pkt);
835314SN/A    pkt->popLabel();
845314SN/A    return done;
855314SN/A}
865314SN/A
875314SN/A
882810SN/Aint
892810SN/ABaseCache::CachePort::deviceBlockSize()
902810SN/A{
912810SN/A    return cache->getBlockSize();
922810SN/A}
932810SN/A
943606SN/A
954458SN/Abool
964458SN/ABaseCache::CachePort::recvRetryCommon()
973013SN/A{
983236SN/A    assert(waitingOnRetry);
994458SN/A    waitingOnRetry = false;
1004458SN/A    return false;
1014458SN/A}
1023246SN/A
1033309SN/A
1043013SN/Avoid
1052810SN/ABaseCache::CachePort::setBlocked()
1062810SN/A{
1073013SN/A    assert(!blocked);
1083013SN/A    DPRINTF(Cache, "Cache Blocking\n");
1092810SN/A    blocked = true;
1103013SN/A    //Clear the retry flag
1113013SN/A    mustSendRetry = false;
1122810SN/A}
1132810SN/A
1142810SN/Avoid
1152810SN/ABaseCache::CachePort::clearBlocked()
1162810SN/A{
1173013SN/A    assert(blocked);
1183013SN/A    DPRINTF(Cache, "Cache Unblocking\n");
1193013SN/A    blocked = false;
1202897SN/A    if (mustSendRetry)
1212897SN/A    {
1223013SN/A        DPRINTF(Cache, "Cache Sending Retry\n");
1232897SN/A        mustSendRetry = false;
1244666SN/A        SendRetryEvent *ev = new SendRetryEvent(this, true);
1254666SN/A        // @TODO: need to find a better time (next bus cycle?)
1265606Snate@binkert.org        schedule(ev, curTick + 1);
1272897SN/A    }
1282810SN/A}
1292810SN/A
1302844SN/A
1312810SN/Avoid
1322858SN/ABaseCache::init()
1332858SN/A{
1342858SN/A    if (!cpuSidePort || !memSidePort)
1352858SN/A        panic("Cache not hooked up on both sides\n");
1362858SN/A    cpuSidePort->sendStatusChange(Port::RangeChange);
1372858SN/A}
1382858SN/A
1394628SN/A
1402858SN/Avoid
1412810SN/ABaseCache::regStats()
1422810SN/A{
1432810SN/A    using namespace Stats;
1442810SN/A
1452810SN/A    // Hit statistics
1464022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
1474022SN/A        MemCmd cmd(access_idx);
1484022SN/A        const string &cstr = cmd.toString();
1492810SN/A
1502810SN/A        hits[access_idx]
1512810SN/A            .init(maxThreadsPerCPU)
1522810SN/A            .name(name() + "." + cstr + "_hits")
1532810SN/A            .desc("number of " + cstr + " hits")
1542810SN/A            .flags(total | nozero | nonan)
1552810SN/A            ;
1562810SN/A    }
1572810SN/A
1584871SN/A// These macros make it easier to sum the right subset of commands and
1594871SN/A// to change the subset of commands that are considered "demand" vs
1604871SN/A// "non-demand"
1614871SN/A#define SUM_DEMAND(s) \
1624871SN/A    (s[MemCmd::ReadReq] + s[MemCmd::WriteReq] + s[MemCmd::ReadExReq])
1634871SN/A
1644871SN/A// should writebacks be included here?  prior code was inconsistent...
1654871SN/A#define SUM_NON_DEMAND(s) \
1664871SN/A    (s[MemCmd::SoftPFReq] + s[MemCmd::HardPFReq])
1674871SN/A
1682810SN/A    demandHits
1692810SN/A        .name(name() + ".demand_hits")
1702810SN/A        .desc("number of demand (read+write) hits")
1712810SN/A        .flags(total)
1722810SN/A        ;
1734871SN/A    demandHits = SUM_DEMAND(hits);
1742810SN/A
1752810SN/A    overallHits
1762810SN/A        .name(name() + ".overall_hits")
1772810SN/A        .desc("number of overall hits")
1782810SN/A        .flags(total)
1792810SN/A        ;
1804871SN/A    overallHits = demandHits + SUM_NON_DEMAND(hits);
1812810SN/A
1822810SN/A    // Miss statistics
1834022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
1844022SN/A        MemCmd cmd(access_idx);
1854022SN/A        const string &cstr = cmd.toString();
1862810SN/A
1872810SN/A        misses[access_idx]
1882810SN/A            .init(maxThreadsPerCPU)
1892810SN/A            .name(name() + "." + cstr + "_misses")
1902810SN/A            .desc("number of " + cstr + " misses")
1912810SN/A            .flags(total | nozero | nonan)
1922810SN/A            ;
1932810SN/A    }
1942810SN/A
1952810SN/A    demandMisses
1962810SN/A        .name(name() + ".demand_misses")
1972810SN/A        .desc("number of demand (read+write) misses")
1982810SN/A        .flags(total)
1992810SN/A        ;
2004871SN/A    demandMisses = SUM_DEMAND(misses);
2012810SN/A
2022810SN/A    overallMisses
2032810SN/A        .name(name() + ".overall_misses")
2042810SN/A        .desc("number of overall misses")
2052810SN/A        .flags(total)
2062810SN/A        ;
2074871SN/A    overallMisses = demandMisses + SUM_NON_DEMAND(misses);
2082810SN/A
2092810SN/A    // Miss latency statistics
2104022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
2114022SN/A        MemCmd cmd(access_idx);
2124022SN/A        const string &cstr = cmd.toString();
2132810SN/A
2142810SN/A        missLatency[access_idx]
2152810SN/A            .init(maxThreadsPerCPU)
2162810SN/A            .name(name() + "." + cstr + "_miss_latency")
2172810SN/A            .desc("number of " + cstr + " miss cycles")
2182810SN/A            .flags(total | nozero | nonan)
2192810SN/A            ;
2202810SN/A    }
2212810SN/A
2222810SN/A    demandMissLatency
2232810SN/A        .name(name() + ".demand_miss_latency")
2242810SN/A        .desc("number of demand (read+write) miss cycles")
2252810SN/A        .flags(total)
2262810SN/A        ;
2274871SN/A    demandMissLatency = SUM_DEMAND(missLatency);
2282810SN/A
2292810SN/A    overallMissLatency
2302810SN/A        .name(name() + ".overall_miss_latency")
2312810SN/A        .desc("number of overall miss cycles")
2322810SN/A        .flags(total)
2332810SN/A        ;
2344871SN/A    overallMissLatency = demandMissLatency + SUM_NON_DEMAND(missLatency);
2352810SN/A
2362810SN/A    // access formulas
2374022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
2384022SN/A        MemCmd cmd(access_idx);
2394022SN/A        const string &cstr = cmd.toString();
2402810SN/A
2412810SN/A        accesses[access_idx]
2422810SN/A            .name(name() + "." + cstr + "_accesses")
2432810SN/A            .desc("number of " + cstr + " accesses(hits+misses)")
2442810SN/A            .flags(total | nozero | nonan)
2452810SN/A            ;
2462810SN/A
2472810SN/A        accesses[access_idx] = hits[access_idx] + misses[access_idx];
2482810SN/A    }
2492810SN/A
2502810SN/A    demandAccesses
2512810SN/A        .name(name() + ".demand_accesses")
2522810SN/A        .desc("number of demand (read+write) accesses")
2532810SN/A        .flags(total)
2542810SN/A        ;
2552810SN/A    demandAccesses = demandHits + demandMisses;
2562810SN/A
2572810SN/A    overallAccesses
2582810SN/A        .name(name() + ".overall_accesses")
2592810SN/A        .desc("number of overall (read+write) accesses")
2602810SN/A        .flags(total)
2612810SN/A        ;
2622810SN/A    overallAccesses = overallHits + overallMisses;
2632810SN/A
2642810SN/A    // miss rate formulas
2654022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
2664022SN/A        MemCmd cmd(access_idx);
2674022SN/A        const string &cstr = cmd.toString();
2682810SN/A
2692810SN/A        missRate[access_idx]
2702810SN/A            .name(name() + "." + cstr + "_miss_rate")
2712810SN/A            .desc("miss rate for " + cstr + " accesses")
2722810SN/A            .flags(total | nozero | nonan)
2732810SN/A            ;
2742810SN/A
2752810SN/A        missRate[access_idx] = misses[access_idx] / accesses[access_idx];
2762810SN/A    }
2772810SN/A
2782810SN/A    demandMissRate
2792810SN/A        .name(name() + ".demand_miss_rate")
2802810SN/A        .desc("miss rate for demand accesses")
2812810SN/A        .flags(total)
2822810SN/A        ;
2832810SN/A    demandMissRate = demandMisses / demandAccesses;
2842810SN/A
2852810SN/A    overallMissRate
2862810SN/A        .name(name() + ".overall_miss_rate")
2872810SN/A        .desc("miss rate for overall accesses")
2882810SN/A        .flags(total)
2892810SN/A        ;
2902810SN/A    overallMissRate = overallMisses / overallAccesses;
2912810SN/A
2922810SN/A    // miss latency formulas
2934022SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
2944022SN/A        MemCmd cmd(access_idx);
2954022SN/A        const string &cstr = cmd.toString();
2962810SN/A
2972810SN/A        avgMissLatency[access_idx]
2982810SN/A            .name(name() + "." + cstr + "_avg_miss_latency")
2992810SN/A            .desc("average " + cstr + " miss latency")
3002810SN/A            .flags(total | nozero | nonan)
3012810SN/A            ;
3022810SN/A
3032810SN/A        avgMissLatency[access_idx] =
3042810SN/A            missLatency[access_idx] / misses[access_idx];
3052810SN/A    }
3062810SN/A
3072810SN/A    demandAvgMissLatency
3082810SN/A        .name(name() + ".demand_avg_miss_latency")
3092810SN/A        .desc("average overall miss latency")
3102810SN/A        .flags(total)
3112810SN/A        ;
3122810SN/A    demandAvgMissLatency = demandMissLatency / demandMisses;
3132810SN/A
3142810SN/A    overallAvgMissLatency
3152810SN/A        .name(name() + ".overall_avg_miss_latency")
3162810SN/A        .desc("average overall miss latency")
3172810SN/A        .flags(total)
3182810SN/A        ;
3192810SN/A    overallAvgMissLatency = overallMissLatency / overallMisses;
3202810SN/A
3212810SN/A    blocked_cycles.init(NUM_BLOCKED_CAUSES);
3222810SN/A    blocked_cycles
3232810SN/A        .name(name() + ".blocked_cycles")
3242810SN/A        .desc("number of cycles access was blocked")
3252810SN/A        .subname(Blocked_NoMSHRs, "no_mshrs")
3262810SN/A        .subname(Blocked_NoTargets, "no_targets")
3272810SN/A        ;
3282810SN/A
3292810SN/A
3302810SN/A    blocked_causes.init(NUM_BLOCKED_CAUSES);
3312810SN/A    blocked_causes
3322810SN/A        .name(name() + ".blocked")
3332810SN/A        .desc("number of cycles access was blocked")
3342810SN/A        .subname(Blocked_NoMSHRs, "no_mshrs")
3352810SN/A        .subname(Blocked_NoTargets, "no_targets")
3362810SN/A        ;
3372810SN/A
3382810SN/A    avg_blocked
3392810SN/A        .name(name() + ".avg_blocked_cycles")
3402810SN/A        .desc("average number of cycles each access was blocked")
3412810SN/A        .subname(Blocked_NoMSHRs, "no_mshrs")
3422810SN/A        .subname(Blocked_NoTargets, "no_targets")
3432810SN/A        ;
3442810SN/A
3452810SN/A    avg_blocked = blocked_cycles / blocked_causes;
3462810SN/A
3472810SN/A    fastWrites
3482810SN/A        .name(name() + ".fast_writes")
3492810SN/A        .desc("number of fast writes performed")
3502810SN/A        ;
3512810SN/A
3522810SN/A    cacheCopies
3532810SN/A        .name(name() + ".cache_copies")
3542810SN/A        .desc("number of cache copies performed")
3552810SN/A        ;
3562826SN/A
3574626SN/A    writebacks
3584626SN/A        .init(maxThreadsPerCPU)
3594626SN/A        .name(name() + ".writebacks")
3604626SN/A        .desc("number of writebacks")
3614626SN/A        .flags(total)
3624626SN/A        ;
3634626SN/A
3644626SN/A    // MSHR statistics
3654626SN/A    // MSHR hit statistics
3664626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
3674626SN/A        MemCmd cmd(access_idx);
3684626SN/A        const string &cstr = cmd.toString();
3694626SN/A
3704626SN/A        mshr_hits[access_idx]
3714626SN/A            .init(maxThreadsPerCPU)
3724626SN/A            .name(name() + "." + cstr + "_mshr_hits")
3734626SN/A            .desc("number of " + cstr + " MSHR hits")
3744626SN/A            .flags(total | nozero | nonan)
3754626SN/A            ;
3764626SN/A    }
3774626SN/A
3784626SN/A    demandMshrHits
3794626SN/A        .name(name() + ".demand_mshr_hits")
3804626SN/A        .desc("number of demand (read+write) MSHR hits")
3814626SN/A        .flags(total)
3824626SN/A        ;
3834871SN/A    demandMshrHits = SUM_DEMAND(mshr_hits);
3844626SN/A
3854626SN/A    overallMshrHits
3864626SN/A        .name(name() + ".overall_mshr_hits")
3874626SN/A        .desc("number of overall MSHR hits")
3884626SN/A        .flags(total)
3894626SN/A        ;
3904871SN/A    overallMshrHits = demandMshrHits + SUM_NON_DEMAND(mshr_hits);
3914626SN/A
3924626SN/A    // MSHR miss statistics
3934626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
3944626SN/A        MemCmd cmd(access_idx);
3954626SN/A        const string &cstr = cmd.toString();
3964626SN/A
3974626SN/A        mshr_misses[access_idx]
3984626SN/A            .init(maxThreadsPerCPU)
3994626SN/A            .name(name() + "." + cstr + "_mshr_misses")
4004626SN/A            .desc("number of " + cstr + " MSHR misses")
4014626SN/A            .flags(total | nozero | nonan)
4024626SN/A            ;
4034626SN/A    }
4044626SN/A
4054626SN/A    demandMshrMisses
4064626SN/A        .name(name() + ".demand_mshr_misses")
4074626SN/A        .desc("number of demand (read+write) MSHR misses")
4084626SN/A        .flags(total)
4094626SN/A        ;
4104871SN/A    demandMshrMisses = SUM_DEMAND(mshr_misses);
4114626SN/A
4124626SN/A    overallMshrMisses
4134626SN/A        .name(name() + ".overall_mshr_misses")
4144626SN/A        .desc("number of overall MSHR misses")
4154626SN/A        .flags(total)
4164626SN/A        ;
4174871SN/A    overallMshrMisses = demandMshrMisses + SUM_NON_DEMAND(mshr_misses);
4184626SN/A
4194626SN/A    // MSHR miss latency statistics
4204626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
4214626SN/A        MemCmd cmd(access_idx);
4224626SN/A        const string &cstr = cmd.toString();
4234626SN/A
4244626SN/A        mshr_miss_latency[access_idx]
4254626SN/A            .init(maxThreadsPerCPU)
4264626SN/A            .name(name() + "." + cstr + "_mshr_miss_latency")
4274626SN/A            .desc("number of " + cstr + " MSHR miss cycles")
4284626SN/A            .flags(total | nozero | nonan)
4294626SN/A            ;
4304626SN/A    }
4314626SN/A
4324626SN/A    demandMshrMissLatency
4334626SN/A        .name(name() + ".demand_mshr_miss_latency")
4344626SN/A        .desc("number of demand (read+write) MSHR miss cycles")
4354626SN/A        .flags(total)
4364626SN/A        ;
4374871SN/A    demandMshrMissLatency = SUM_DEMAND(mshr_miss_latency);
4384626SN/A
4394626SN/A    overallMshrMissLatency
4404626SN/A        .name(name() + ".overall_mshr_miss_latency")
4414626SN/A        .desc("number of overall MSHR miss cycles")
4424626SN/A        .flags(total)
4434626SN/A        ;
4444871SN/A    overallMshrMissLatency =
4454871SN/A        demandMshrMissLatency + SUM_NON_DEMAND(mshr_miss_latency);
4464626SN/A
4474626SN/A    // MSHR uncacheable statistics
4484626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
4494626SN/A        MemCmd cmd(access_idx);
4504626SN/A        const string &cstr = cmd.toString();
4514626SN/A
4524626SN/A        mshr_uncacheable[access_idx]
4534626SN/A            .init(maxThreadsPerCPU)
4544626SN/A            .name(name() + "." + cstr + "_mshr_uncacheable")
4554626SN/A            .desc("number of " + cstr + " MSHR uncacheable")
4564626SN/A            .flags(total | nozero | nonan)
4574626SN/A            ;
4584626SN/A    }
4594626SN/A
4604626SN/A    overallMshrUncacheable
4614626SN/A        .name(name() + ".overall_mshr_uncacheable_misses")
4624626SN/A        .desc("number of overall MSHR uncacheable misses")
4634626SN/A        .flags(total)
4644626SN/A        ;
4654871SN/A    overallMshrUncacheable =
4664871SN/A        SUM_DEMAND(mshr_uncacheable) + SUM_NON_DEMAND(mshr_uncacheable);
4674626SN/A
4684626SN/A    // MSHR miss latency statistics
4694626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
4704626SN/A        MemCmd cmd(access_idx);
4714626SN/A        const string &cstr = cmd.toString();
4724626SN/A
4734626SN/A        mshr_uncacheable_lat[access_idx]
4744626SN/A            .init(maxThreadsPerCPU)
4754626SN/A            .name(name() + "." + cstr + "_mshr_uncacheable_latency")
4764626SN/A            .desc("number of " + cstr + " MSHR uncacheable cycles")
4774626SN/A            .flags(total | nozero | nonan)
4784626SN/A            ;
4794626SN/A    }
4804626SN/A
4814626SN/A    overallMshrUncacheableLatency
4824626SN/A        .name(name() + ".overall_mshr_uncacheable_latency")
4834626SN/A        .desc("number of overall MSHR uncacheable cycles")
4844626SN/A        .flags(total)
4854626SN/A        ;
4864871SN/A    overallMshrUncacheableLatency =
4874871SN/A        SUM_DEMAND(mshr_uncacheable_lat) +
4884871SN/A        SUM_NON_DEMAND(mshr_uncacheable_lat);
4894626SN/A
4904626SN/A#if 0
4914626SN/A    // MSHR access formulas
4924626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
4934626SN/A        MemCmd cmd(access_idx);
4944626SN/A        const string &cstr = cmd.toString();
4954626SN/A
4964626SN/A        mshrAccesses[access_idx]
4974626SN/A            .name(name() + "." + cstr + "_mshr_accesses")
4984626SN/A            .desc("number of " + cstr + " mshr accesses(hits+misses)")
4994626SN/A            .flags(total | nozero | nonan)
5004626SN/A            ;
5014626SN/A        mshrAccesses[access_idx] =
5024626SN/A            mshr_hits[access_idx] + mshr_misses[access_idx]
5034626SN/A            + mshr_uncacheable[access_idx];
5044626SN/A    }
5054626SN/A
5064626SN/A    demandMshrAccesses
5074626SN/A        .name(name() + ".demand_mshr_accesses")
5084626SN/A        .desc("number of demand (read+write) mshr accesses")
5094626SN/A        .flags(total | nozero | nonan)
5104626SN/A        ;
5114626SN/A    demandMshrAccesses = demandMshrHits + demandMshrMisses;
5124626SN/A
5134626SN/A    overallMshrAccesses
5144626SN/A        .name(name() + ".overall_mshr_accesses")
5154626SN/A        .desc("number of overall (read+write) mshr accesses")
5164626SN/A        .flags(total | nozero | nonan)
5174626SN/A        ;
5184626SN/A    overallMshrAccesses = overallMshrHits + overallMshrMisses
5194626SN/A        + overallMshrUncacheable;
5204626SN/A#endif
5214626SN/A
5224626SN/A    // MSHR miss rate formulas
5234626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
5244626SN/A        MemCmd cmd(access_idx);
5254626SN/A        const string &cstr = cmd.toString();
5264626SN/A
5274626SN/A        mshrMissRate[access_idx]
5284626SN/A            .name(name() + "." + cstr + "_mshr_miss_rate")
5294626SN/A            .desc("mshr miss rate for " + cstr + " accesses")
5304626SN/A            .flags(total | nozero | nonan)
5314626SN/A            ;
5324626SN/A
5334626SN/A        mshrMissRate[access_idx] =
5344626SN/A            mshr_misses[access_idx] / accesses[access_idx];
5354626SN/A    }
5364626SN/A
5374626SN/A    demandMshrMissRate
5384626SN/A        .name(name() + ".demand_mshr_miss_rate")
5394626SN/A        .desc("mshr miss rate for demand accesses")
5404626SN/A        .flags(total)
5414626SN/A        ;
5424626SN/A    demandMshrMissRate = demandMshrMisses / demandAccesses;
5434626SN/A
5444626SN/A    overallMshrMissRate
5454626SN/A        .name(name() + ".overall_mshr_miss_rate")
5464626SN/A        .desc("mshr miss rate for overall accesses")
5474626SN/A        .flags(total)
5484626SN/A        ;
5494626SN/A    overallMshrMissRate = overallMshrMisses / overallAccesses;
5504626SN/A
5514626SN/A    // mshrMiss latency formulas
5524626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
5534626SN/A        MemCmd cmd(access_idx);
5544626SN/A        const string &cstr = cmd.toString();
5554626SN/A
5564626SN/A        avgMshrMissLatency[access_idx]
5574626SN/A            .name(name() + "." + cstr + "_avg_mshr_miss_latency")
5584626SN/A            .desc("average " + cstr + " mshr miss latency")
5594626SN/A            .flags(total | nozero | nonan)
5604626SN/A            ;
5614626SN/A
5624626SN/A        avgMshrMissLatency[access_idx] =
5634626SN/A            mshr_miss_latency[access_idx] / mshr_misses[access_idx];
5644626SN/A    }
5654626SN/A
5664626SN/A    demandAvgMshrMissLatency
5674626SN/A        .name(name() + ".demand_avg_mshr_miss_latency")
5684626SN/A        .desc("average overall mshr miss latency")
5694626SN/A        .flags(total)
5704626SN/A        ;
5714626SN/A    demandAvgMshrMissLatency = demandMshrMissLatency / demandMshrMisses;
5724626SN/A
5734626SN/A    overallAvgMshrMissLatency
5744626SN/A        .name(name() + ".overall_avg_mshr_miss_latency")
5754626SN/A        .desc("average overall mshr miss latency")
5764626SN/A        .flags(total)
5774626SN/A        ;
5784626SN/A    overallAvgMshrMissLatency = overallMshrMissLatency / overallMshrMisses;
5794626SN/A
5804626SN/A    // mshrUncacheable latency formulas
5814626SN/A    for (int access_idx = 0; access_idx < MemCmd::NUM_MEM_CMDS; ++access_idx) {
5824626SN/A        MemCmd cmd(access_idx);
5834626SN/A        const string &cstr = cmd.toString();
5844626SN/A
5854626SN/A        avgMshrUncacheableLatency[access_idx]
5864626SN/A            .name(name() + "." + cstr + "_avg_mshr_uncacheable_latency")
5874626SN/A            .desc("average " + cstr + " mshr uncacheable latency")
5884626SN/A            .flags(total | nozero | nonan)
5894626SN/A            ;
5904626SN/A
5914626SN/A        avgMshrUncacheableLatency[access_idx] =
5924626SN/A            mshr_uncacheable_lat[access_idx] / mshr_uncacheable[access_idx];
5934626SN/A    }
5944626SN/A
5954626SN/A    overallAvgMshrUncacheableLatency
5964626SN/A        .name(name() + ".overall_avg_mshr_uncacheable_latency")
5974626SN/A        .desc("average overall mshr uncacheable latency")
5984626SN/A        .flags(total)
5994626SN/A        ;
6004626SN/A    overallAvgMshrUncacheableLatency = overallMshrUncacheableLatency / overallMshrUncacheable;
6014626SN/A
6024626SN/A    mshr_cap_events
6034626SN/A        .init(maxThreadsPerCPU)
6044626SN/A        .name(name() + ".mshr_cap_events")
6054626SN/A        .desc("number of times MSHR cap was activated")
6064626SN/A        .flags(total)
6074626SN/A        ;
6084626SN/A
6094626SN/A    //software prefetching stats
6104626SN/A    soft_prefetch_mshr_full
6114626SN/A        .init(maxThreadsPerCPU)
6124626SN/A        .name(name() + ".soft_prefetch_mshr_full")
6134626SN/A        .desc("number of mshr full events for SW prefetching instrutions")
6144626SN/A        .flags(total)
6154626SN/A        ;
6164626SN/A
6174626SN/A    mshr_no_allocate_misses
6184626SN/A        .name(name() +".no_allocate_misses")
6194626SN/A        .desc("Number of misses that were no-allocate")
6204626SN/A        ;
6214626SN/A
6222810SN/A}
6233503SN/A
6243503SN/Aunsigned int
6253503SN/ABaseCache::drain(Event *de)
6263503SN/A{
6274626SN/A    int count = memSidePort->drain(de) + cpuSidePort->drain(de);
6284626SN/A
6293503SN/A    // Set status
6304626SN/A    if (count != 0) {
6313503SN/A        drainEvent = de;
6323503SN/A
6333503SN/A        changeState(SimObject::Draining);
6344626SN/A        return count;
6353503SN/A    }
6363503SN/A
6373503SN/A    changeState(SimObject::Drained);
6383503SN/A    return 0;
6393503SN/A}
640