// Profiler.hh revision 9747:fbe79534d024
1/* 2 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions are 7 * met: redistributions of source code must retain the above copyright 8 * notice, this list of conditions and the following disclaimer; 9 * redistributions in binary form must reproduce the above copyright 10 * notice, this list of conditions and the following disclaimer in the 11 * documentation and/or other materials provided with the distribution; 12 * neither the name of the copyright holders nor the names of its 13 * contributors may be used to endorse or promote products derived from 14 * this software without specific prior written permission. 15 * 16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 17 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 18 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 19 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 20 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 27 */ 28 29/* 30 This file has been modified by Kevin Moore and Dan Nussbaum of the 31 Scalable Systems Research Group at Sun Microsystems Laboratories 32 (http://research.sun.com/scalable/) to support the Adaptive 33 Transactional Memory Test Platform (ATMTP). 
34 35 Please send email to atmtp-interest@sun.com with feedback, questions, or 36 to request future announcements about ATMTP. 37 38 ---------------------------------------------------------------------- 39 40 File modification date: 2008-02-23 41 42 ---------------------------------------------------------------------- 43*/ 44 45#ifndef __MEM_RUBY_PROFILER_PROFILER_HH__ 46#define __MEM_RUBY_PROFILER_PROFILER_HH__ 47 48#include <iostream> 49#include <map> 50#include <string> 51#include <vector> 52 53#include "base/hashmap.hh" 54#include "mem/protocol/AccessType.hh" 55#include "mem/protocol/GenericMachineType.hh" 56#include "mem/protocol/PrefetchBit.hh" 57#include "mem/protocol/RubyAccessMode.hh" 58#include "mem/protocol/RubyRequestType.hh" 59#include "mem/ruby/common/Address.hh" 60#include "mem/ruby/common/Global.hh" 61#include "mem/ruby/common/Histogram.hh" 62#include "mem/ruby/common/Set.hh" 63#include "mem/ruby/system/MachineID.hh" 64#include "mem/ruby/system/MemoryControl.hh" 65#include "params/RubyProfiler.hh" 66#include "sim/sim_object.hh" 67 68class RubyRequest; 69class AddressProfiler; 70 71class Profiler : public SimObject 72{ 73 public: 74 typedef RubyProfilerParams Params; 75 Profiler(const Params *); 76 ~Profiler(); 77 78 void wakeup(); 79 80 void setPeriodicStatsFile(const std::string& filename); 81 void setPeriodicStatsInterval(int64_t period); 82 83 void printStats(std::ostream& out, bool short_stats=false); 84 void printShortStats(std::ostream& out) { printStats(out, true); } 85 void printTraceStats(std::ostream& out) const; 86 void clearStats(); 87 void printResourceUsage(std::ostream& out) const; 88 89 AddressProfiler* getAddressProfiler() { return m_address_profiler_ptr; } 90 AddressProfiler* getInstructionProfiler() { return m_inst_profiler_ptr; } 91 92 void addAddressTraceSample(const RubyRequest& msg, NodeID id); 93 94 void profileRequest(const std::string& requestStr); 95 void profileSharing(const Address& addr, AccessType type, 96 NodeID 
requestor, const Set& sharers, 97 const Set& owner); 98 99 void profileMulticastRetry(const Address& addr, int count); 100 101 void profileFilterAction(int action); 102 103 void profileConflictingRequests(const Address& addr); 104 105 void 106 profileAverageLatencyEstimate(int latency) 107 { 108 m_average_latency_estimate.add(latency); 109 } 110 111 void controllerBusy(MachineID machID); 112 void bankBusy(); 113 114 void missLatency(Cycles t, RubyRequestType type, 115 const GenericMachineType respondingMach); 116 117 void missLatencyWcc(Cycles issuedTime, Cycles initialRequestTime, 118 Cycles forwardRequestTime, Cycles firstResponseTime, 119 Cycles completionTime); 120 121 void missLatencyDir(Cycles issuedTime, Cycles initialRequestTime, 122 Cycles forwardRequestTime, Cycles firstResponseTime, 123 Cycles completionTime); 124 125 void swPrefetchLatency(Cycles t, RubyRequestType type, 126 const GenericMachineType respondingMach); 127 128 void print(std::ostream& out) const; 129 130 void rubyWatch(int proc); 131 bool watchAddress(Address addr); 132 133 // return Ruby's start time 134 Cycles getRubyStartTime() { return m_ruby_start; } 135 136 // added by SS 137 bool getHotLines() { return m_hot_lines; } 138 bool getAllInstructions() { return m_all_instructions; } 139 140 private: 141 void printRequestProfile(std::ostream &out) const; 142 void printDelayProfile(std::ostream &out) const; 143 void printOutstandingReqProfile(std::ostream &out) const; 144 145 private: 146 // Private copy constructor and assignment operator 147 Profiler(const Profiler& obj); 148 Profiler& operator=(const Profiler& obj); 149 150 AddressProfiler* m_address_profiler_ptr; 151 AddressProfiler* m_inst_profiler_ptr; 152 153 Cycles m_ruby_start; 154 time_t m_real_time_start_time; 155 156 int64_t m_busyBankCount; 157 158 Histogram m_read_sharing_histogram; 159 Histogram m_write_sharing_histogram; 160 Histogram m_all_sharing_histogram; 161 int64 m_cache_to_cache; 162 int64 m_memory_to_cache; 163 164 
std::vector<Histogram> m_missLatencyHistograms; 165 std::vector<Histogram> m_machLatencyHistograms; 166 std::vector< std::vector<Histogram> > m_missMachLatencyHistograms; 167 Histogram m_wCCIssueToInitialRequestHistogram; 168 Histogram m_wCCInitialRequestToForwardRequestHistogram; 169 Histogram m_wCCForwardRequestToFirstResponseHistogram; 170 Histogram m_wCCFirstResponseToCompleteHistogram; 171 int64 m_wCCIncompleteTimes; 172 Histogram m_dirIssueToInitialRequestHistogram; 173 Histogram m_dirInitialRequestToForwardRequestHistogram; 174 Histogram m_dirForwardRequestToFirstResponseHistogram; 175 Histogram m_dirFirstResponseToCompleteHistogram; 176 int64 m_dirIncompleteTimes; 177 178 Histogram m_allMissLatencyHistogram; 179 180 Histogram m_allSWPrefetchLatencyHistogram; 181 Histogram m_SWPrefetchL2MissLatencyHistogram; 182 std::vector<Histogram> m_SWPrefetchLatencyHistograms; 183 std::vector<Histogram> m_SWPrefetchMachLatencyHistograms; 184 185 Histogram m_average_latency_estimate; 186 m5::hash_set<Address> m_watch_address_set; 187 188 //added by SS 189 bool m_hot_lines; 190 bool m_all_instructions; 191 192 int m_num_of_sequencers; 193}; 194 195inline std::ostream& 196operator<<(std::ostream& out, const Profiler& obj) 197{ 198 obj.print(out); 199 out << std::flush; 200 return out; 201} 202 203#endif // __MEM_RUBY_PROFILER_PROFILER_HH__ 204