AddressProfiler.cc (6896:649e40aad897) AddressProfiler.cc (7048:2ab58c54de63)
1
2/*
3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are
8 * met: redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer;

--- 12 unchanged lines hidden (view full) ---

22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 */
29
1/*
2 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are
7 * met: redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer;

--- 12 unchanged lines hidden (view full) ---

21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 */
28
30/*
31 * AddressProfiler.cc
32 *
33 * Description: See AddressProfiler.hh
34 *
35 * $Id$
36 *
37 */
38
39#include "mem/ruby/profiler/AddressProfiler.hh"
29#include "mem/gems_common/Map.hh"
30#include "mem/gems_common/PrioHeap.hh"
40#include "mem/protocol/CacheMsg.hh"
41#include "mem/ruby/profiler/AccessTraceForAddress.hh"
31#include "mem/protocol/CacheMsg.hh"
32#include "mem/ruby/profiler/AccessTraceForAddress.hh"
42#include "mem/gems_common/PrioHeap.hh"
43#include "mem/gems_common/Map.hh"
44#include "mem/ruby/system/System.hh"
33#include "mem/ruby/profiler/AddressProfiler.hh"
45#include "mem/ruby/profiler/Profiler.hh"
34#include "mem/ruby/profiler/Profiler.hh"
35#include "mem/ruby/system/System.hh"
46
36
47// Helper functions
48static AccessTraceForAddress& lookupTraceForAddress(const Address& addr,
49 Map<Address,
50 AccessTraceForAddress>* record_map);
37typedef AddressProfiler::AddressMap AddressMap;
51
38
52static void printSorted(ostream& out,
53 int num_of_sequencers,
54 const Map<Address, AccessTraceForAddress>* record_map,
55 string description);
56
57AddressProfiler::AddressProfiler(int num_of_sequencers)
39// Helper functions
40AccessTraceForAddress&
41lookupTraceForAddress(const Address& addr, AddressMap* record_map)
58{
42{
59 m_dataAccessTrace = new Map<Address, AccessTraceForAddress>;
60 m_macroBlockAccessTrace = new Map<Address, AccessTraceForAddress>;
61 m_programCounterAccessTrace = new Map<Address, AccessTraceForAddress>;
62 m_retryProfileMap = new Map<Address, AccessTraceForAddress>;
63 m_num_of_sequencers = num_of_sequencers;
64 clearStats();
43 if (!record_map->exist(addr)) {
44 record_map->add(addr, AccessTraceForAddress(addr));
45 }
46 return record_map->lookup(addr);
65}
66
47}
48
67AddressProfiler::~AddressProfiler()
49void
50printSorted(ostream& out, int num_of_sequencers, const AddressMap* record_map,
51 string description)
68{
52{
69 delete m_dataAccessTrace;
70 delete m_macroBlockAccessTrace;
71 delete m_programCounterAccessTrace;
72 delete m_retryProfileMap;
73}
53 const int records_printed = 100;
74
54
75void AddressProfiler::setHotLines(bool hot_lines){
76 m_hot_lines = hot_lines;
77}
78void AddressProfiler::setAllInstructions(bool all_instructions){
79 m_all_instructions = all_instructions;
80}
55 uint64 misses = 0;
56 PrioHeap<AccessTraceForAddress*> heap;
57 Vector<Address> keys = record_map->keys();
58 for (int i = 0; i < keys.size(); i++) {
59 AccessTraceForAddress* record = &(record_map->lookup(keys[i]));
60 misses += record->getTotal();
61 heap.insert(record);
62 }
81
63
82void AddressProfiler::printStats(ostream& out) const
83{
84 if (m_hot_lines) {
85 out << endl;
86 out << "AddressProfiler Stats" << endl;
87 out << "---------------------" << endl;
64 out << "Total_entries_" << description << ": " << keys.size() << endl;
65 if (g_system_ptr->getProfiler()->getAllInstructions())
66 out << "Total_Instructions_" << description << ": " << misses << endl;
67 else
68 out << "Total_data_misses_" << description << ": " << misses << endl;
88
69
89 out << endl;
90 out << "sharing_misses: " << m_sharing_miss_counter << endl;
91 out << "getx_sharing_histogram: " << m_getx_sharing_histogram << endl;
92 out << "gets_sharing_histogram: " << m_gets_sharing_histogram << endl;
70 out << "total | load store atomic | user supervisor | sharing | touched-by"
71 << endl;
93
72
94 out << endl;
95 out << "Hot Data Blocks" << endl;
96 out << "---------------" << endl;
97 out << endl;
98 printSorted(out, m_num_of_sequencers, m_dataAccessTrace, "block_address");
73 Histogram remaining_records(1, 100);
74 Histogram all_records(1, 100);
75 Histogram remaining_records_log(-1);
76 Histogram all_records_log(-1);
99
77
100 out << endl;
101 out << "Hot MacroData Blocks" << endl;
102 out << "--------------------" << endl;
103 out << endl;
104 printSorted(out, m_num_of_sequencers, m_macroBlockAccessTrace, "macroblock_address");
78 // Allows us to track how many lines were touched by n processors
79 Vector<int64> m_touched_vec;
80 Vector<int64> m_touched_weighted_vec;
81 m_touched_vec.setSize(num_of_sequencers+1);
82 m_touched_weighted_vec.setSize(num_of_sequencers+1);
83 for (int i = 0; i < m_touched_vec.size(); i++) {
84 m_touched_vec[i] = 0;
85 m_touched_weighted_vec[i] = 0;
86 }
105
87
106 out << "Hot Instructions" << endl;
107 out << "----------------" << endl;
108 out << endl;
109 printSorted(out, m_num_of_sequencers, m_programCounterAccessTrace, "pc_address");
110 }
88 int counter = 0;
89 while (heap.size() > 0 && counter < records_printed) {
90 AccessTraceForAddress* record = heap.extractMin();
91 double percent = 100.0 * (record->getTotal() / double(misses));
92 out << description << " | " << percent << " % " << *record << endl;
93 all_records.add(record->getTotal());
94 all_records_log.add(record->getTotal());
95 counter++;
96 m_touched_vec[record->getTouchedBy()]++;
97 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal();
98 }
111
99
112 if (m_all_instructions){
100 while (heap.size() > 0) {
101 AccessTraceForAddress* record = heap.extractMin();
102 all_records.add(record->getTotal());
103 remaining_records.add(record->getTotal());
104 all_records_log.add(record->getTotal());
105 remaining_records_log.add(record->getTotal());
106 m_touched_vec[record->getTouchedBy()]++;
107 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal();
108 }
113 out << endl;
109 out << endl;
114 out << "All Instructions Profile:" << endl;
115 out << "-------------------------" << endl;
116 out << endl;
117 printSorted(out, m_num_of_sequencers, m_programCounterAccessTrace, "pc_address");
118 out << endl;
119 }
110 out << "all_records_" << description << ": "
111 << all_records << endl
112 << "all_records_log_" << description << ": "
113 << all_records_log << endl
114 << "remaining_records_" << description << ": "
115 << remaining_records << endl
116 << "remaining_records_log_" << description << ": "
117 << remaining_records_log << endl
118 << "touched_by_" << description << ": "
119 << m_touched_vec << endl
120 << "touched_by_weighted_" << description << ": "
121 << m_touched_weighted_vec << endl
122 << endl;
123}
120
124
121 if (m_retryProfileHisto.size() > 0) {
122 out << "Retry Profile" << endl;
123 out << "-------------" << endl;
124 out << endl;
125 out << "retry_histogram_absolute: " << m_retryProfileHisto << endl;
126 out << "retry_histogram_write: " << m_retryProfileHistoWrite << endl;
127 out << "retry_histogram_read: " << m_retryProfileHistoRead << endl;
128
129 out << "retry_histogram_percent: ";
130 m_retryProfileHisto.printPercent(out);
131 out << endl;
132
133 printSorted(out, m_num_of_sequencers, m_retryProfileMap, "block_address");
134 out << endl;
135 }
136
125AddressProfiler::AddressProfiler(int num_of_sequencers)
126{
127 m_dataAccessTrace = new AddressMap;
128 m_macroBlockAccessTrace = new AddressMap;
129 m_programCounterAccessTrace = new AddressMap;
130 m_retryProfileMap = new AddressMap;
131 m_num_of_sequencers = num_of_sequencers;
132 clearStats();
137}
138
133}
134
139void AddressProfiler::clearStats()
135AddressProfiler::~AddressProfiler()
140{
136{
141 // Clear the maps
142 m_sharing_miss_counter = 0;
143 m_dataAccessTrace->clear();
144 m_macroBlockAccessTrace->clear();
145 m_programCounterAccessTrace->clear();
146 m_retryProfileMap->clear();
147 m_retryProfileHisto.clear();
148 m_retryProfileHistoRead.clear();
149 m_retryProfileHistoWrite.clear();
150 m_getx_sharing_histogram.clear();
151 m_gets_sharing_histogram.clear();
137 delete m_dataAccessTrace;
138 delete m_macroBlockAccessTrace;
139 delete m_programCounterAccessTrace;
140 delete m_retryProfileMap;
152}
153
141}
142
154void AddressProfiler::profileGetX(const Address& datablock, const Address& PC, const Set& owner, const Set& sharers, NodeID requestor)
143void
144AddressProfiler::setHotLines(bool hot_lines)
155{
145{
156 Set indirection_set;
157 indirection_set.addSet(sharers);
158 indirection_set.addSet(owner);
159 indirection_set.remove(requestor);
160 int num_indirections = indirection_set.count();
146 m_hot_lines = hot_lines;
147}
161
148
162 m_getx_sharing_histogram.add(num_indirections);
163 bool indirection_miss = (num_indirections > 0);
164
165 addTraceSample(datablock, PC, CacheRequestType_ST, AccessModeType(0), requestor, indirection_miss);
149void
150AddressProfiler::setAllInstructions(bool all_instructions)
151{
152 m_all_instructions = all_instructions;
166}
167
153}
154
168void AddressProfiler::profileGetS(const Address& datablock, const Address& PC, const Set& owner, const Set& sharers, NodeID requestor)
155void
156AddressProfiler::printStats(ostream& out) const
169{
157{
170 Set indirection_set;
171 indirection_set.addSet(owner);
172 indirection_set.remove(requestor);
173 int num_indirections = indirection_set.count();
158 if (m_hot_lines) {
159 out << endl;
160 out << "AddressProfiler Stats" << endl;
161 out << "---------------------" << endl;
174
162
175 m_gets_sharing_histogram.add(num_indirections);
176 bool indirection_miss = (num_indirections > 0);
163 out << endl;
164 out << "sharing_misses: " << m_sharing_miss_counter << endl;
165 out << "getx_sharing_histogram: " << m_getx_sharing_histogram << endl;
166 out << "gets_sharing_histogram: " << m_gets_sharing_histogram << endl;
177
167
178 addTraceSample(datablock, PC, CacheRequestType_LD, AccessModeType(0), requestor, indirection_miss);
179}
168 out << endl;
169 out << "Hot Data Blocks" << endl;
170 out << "---------------" << endl;
171 out << endl;
172 printSorted(out, m_num_of_sequencers, m_dataAccessTrace,
173 "block_address");
180
174
181void AddressProfiler::addTraceSample(Address data_addr, Address pc_addr, CacheRequestType type, AccessModeType access_mode, NodeID id, bool sharing_miss)
182{
183 if (m_all_instructions) {
184 if (sharing_miss) {
185 m_sharing_miss_counter++;
175 out << endl;
176 out << "Hot MacroData Blocks" << endl;
177 out << "--------------------" << endl;
178 out << endl;
179 printSorted(out, m_num_of_sequencers, m_macroBlockAccessTrace,
180 "macroblock_address");
181
182 out << "Hot Instructions" << endl;
183 out << "----------------" << endl;
184 out << endl;
185 printSorted(out, m_num_of_sequencers, m_programCounterAccessTrace,
186 "pc_address");
186 }
187
187 }
188
188 // record data address trace info
189 data_addr.makeLineAddress();
190 lookupTraceForAddress(data_addr, m_dataAccessTrace).update(type, access_mode, id, sharing_miss);
189 if (m_all_instructions) {
190 out << endl;
191 out << "All Instructions Profile:" << endl;
192 out << "-------------------------" << endl;
193 out << endl;
194 printSorted(out, m_num_of_sequencers, m_programCounterAccessTrace,
195 "pc_address");
196 out << endl;
197 }
191
198
192 // record macro data address trace info
193 Address macro_addr(data_addr.maskLowOrderBits(10)); // 6 for datablock, 4 to make it 16x more coarse
194 lookupTraceForAddress(macro_addr, m_macroBlockAccessTrace).update(type, access_mode, id, sharing_miss);
199 if (m_retryProfileHisto.size() > 0) {
200 out << "Retry Profile" << endl;
201 out << "-------------" << endl;
202 out << endl;
203 out << "retry_histogram_absolute: " << m_retryProfileHisto << endl;
204 out << "retry_histogram_write: " << m_retryProfileHistoWrite << endl;
205 out << "retry_histogram_read: " << m_retryProfileHistoRead << endl;
195
206
196 // record program counter address trace info
197 lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).update(type, access_mode, id, sharing_miss);
198 }
207 out << "retry_histogram_percent: ";
208 m_retryProfileHisto.printPercent(out);
209 out << endl;
199
210
200 if (m_all_instructions) {
201 // This code is used if the address profiler is an all-instructions profiler
202 // record program counter address trace info
203 lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).update(type, access_mode, id, sharing_miss);
204 }
211 printSorted(out, m_num_of_sequencers, m_retryProfileMap,
212 "block_address");
213 out << endl;
214 }
205}
206
215}
216
207void AddressProfiler::profileRetry(const Address& data_addr, AccessType type, int count)
217void
218AddressProfiler::clearStats()
208{
219{
209 m_retryProfileHisto.add(count);
210 if (type == AccessType_Read) {
211 m_retryProfileHistoRead.add(count);
212 } else {
213 m_retryProfileHistoWrite.add(count);
214 }
215 if (count > 1) {
216 lookupTraceForAddress(data_addr, m_retryProfileMap).addSample(count);
217 }
220 // Clear the maps
221 m_sharing_miss_counter = 0;
222 m_dataAccessTrace->clear();
223 m_macroBlockAccessTrace->clear();
224 m_programCounterAccessTrace->clear();
225 m_retryProfileMap->clear();
226 m_retryProfileHisto.clear();
227 m_retryProfileHistoRead.clear();
228 m_retryProfileHistoWrite.clear();
229 m_getx_sharing_histogram.clear();
230 m_gets_sharing_histogram.clear();
218}
219
231}
232
220// ***** Normal Functions ******
233void
234AddressProfiler::profileGetX(const Address& datablock, const Address& PC,
235 const Set& owner, const Set& sharers,
236 NodeID requestor)
237{
238 Set indirection_set;
239 indirection_set.addSet(sharers);
240 indirection_set.addSet(owner);
241 indirection_set.remove(requestor);
242 int num_indirections = indirection_set.count();
221
243
222static void printSorted(ostream& out,
223 int num_of_sequencers,
224 const Map<Address, AccessTraceForAddress>* record_map,
225 string description)
244 m_getx_sharing_histogram.add(num_indirections);
245 bool indirection_miss = (num_indirections > 0);
246
247 addTraceSample(datablock, PC, CacheRequestType_ST, AccessModeType(0),
248 requestor, indirection_miss);
249}
250
251void
252AddressProfiler::profileGetS(const Address& datablock, const Address& PC,
253 const Set& owner, const Set& sharers,
254 NodeID requestor)
226{
255{
227 const int records_printed = 100;
256 Set indirection_set;
257 indirection_set.addSet(owner);
258 indirection_set.remove(requestor);
259 int num_indirections = indirection_set.count();
228
260
229 uint64 misses = 0;
230 PrioHeap<AccessTraceForAddress*> heap;
231 Vector<Address> keys = record_map->keys();
232 for(int i=0; i<keys.size(); i++){
233 AccessTraceForAddress* record = &(record_map->lookup(keys[i]));
234 misses += record->getTotal();
235 heap.insert(record);
236 }
261 m_gets_sharing_histogram.add(num_indirections);
262 bool indirection_miss = (num_indirections > 0);
237
263
238 out << "Total_entries_" << description << ": " << keys.size() << endl;
239 if (g_system_ptr->getProfiler()->getAllInstructions())
240 out << "Total_Instructions_" << description << ": " << misses << endl;
241 else
242 out << "Total_data_misses_" << description << ": " << misses << endl;
264 addTraceSample(datablock, PC, CacheRequestType_LD, AccessModeType(0),
265 requestor, indirection_miss);
266}
243
267
244 out << "total | load store atomic | user supervisor | sharing | touched-by" << endl;
268void
269AddressProfiler::addTraceSample(Address data_addr, Address pc_addr,
270 CacheRequestType type,
271 AccessModeType access_mode, NodeID id,
272 bool sharing_miss)
273{
274 if (m_all_instructions) {
275 if (sharing_miss) {
276 m_sharing_miss_counter++;
277 }
245
278
246 Histogram remaining_records(1, 100);
247 Histogram all_records(1, 100);
248 Histogram remaining_records_log(-1);
249 Histogram all_records_log(-1);
279 // record data address trace info
280 data_addr.makeLineAddress();
281 lookupTraceForAddress(data_addr, m_dataAccessTrace).
282 update(type, access_mode, id, sharing_miss);
250
283
251 // Allows us to track how many lines were touched by n processors
252 Vector<int64> m_touched_vec;
253 Vector<int64> m_touched_weighted_vec;
254 m_touched_vec.setSize(num_of_sequencers+1);
255 m_touched_weighted_vec.setSize(num_of_sequencers+1);
256 for (int i=0; i<m_touched_vec.size(); i++) {
257 m_touched_vec[i] = 0;
258 m_touched_weighted_vec[i] = 0;
259 }
284 // record macro data address trace info
260
285
261 int counter = 0;
262 while((heap.size() > 0) && (counter < records_printed)) {
263 AccessTraceForAddress* record = heap.extractMin();
264 double percent = 100.0*(record->getTotal()/double(misses));
265 out << description << " | " << percent << " % " << *record << endl;
266 all_records.add(record->getTotal());
267 all_records_log.add(record->getTotal());
268 counter++;
269 m_touched_vec[record->getTouchedBy()]++;
270 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal();
271 }
286 // 6 for datablock, 4 to make it 16x more coarse
287 Address macro_addr(data_addr.maskLowOrderBits(10));
288 lookupTraceForAddress(macro_addr, m_macroBlockAccessTrace).
289 update(type, access_mode, id, sharing_miss);
272
290
273 while(heap.size() > 0) {
274 AccessTraceForAddress* record = heap.extractMin();
275 all_records.add(record->getTotal());
276 remaining_records.add(record->getTotal());
277 all_records_log.add(record->getTotal());
278 remaining_records_log.add(record->getTotal());
279 m_touched_vec[record->getTouchedBy()]++;
280 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal();
281 }
282 out << endl;
283 out << "all_records_" << description << ": " << all_records << endl;
284 out << "all_records_log_" << description << ": " << all_records_log << endl;
285 out << "remaining_records_" << description << ": " << remaining_records << endl;
286 out << "remaining_records_log_" << description << ": " << remaining_records_log << endl;
287 out << "touched_by_" << description << ": " << m_touched_vec << endl;
288 out << "touched_by_weighted_" << description << ": " << m_touched_weighted_vec << endl;
289 out << endl;
291 // record program counter address trace info
292 lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).
293 update(type, access_mode, id, sharing_miss);
294 }
295
296 if (m_all_instructions) {
297 // This code is used if the address profiler is an
298 // all-instructions profiler: record program counter address
299 // trace info
300 lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).
301 update(type, access_mode, id, sharing_miss);
302 }
290}
291
303}
304
292static AccessTraceForAddress& lookupTraceForAddress(const Address& addr, Map<Address, AccessTraceForAddress>* record_map)
305void
306AddressProfiler::profileRetry(const Address& data_addr, AccessType type,
307 int count)
293{
308{
294 if(record_map->exist(addr) == false){
295 record_map->add(addr, AccessTraceForAddress(addr));
296 }
297 return record_map->lookup(addr);
309 m_retryProfileHisto.add(count);
310 if (type == AccessType_Read) {
311 m_retryProfileHistoRead.add(count);
312 } else {
313 m_retryProfileHistoWrite.add(count);
314 }
315 if (count > 1) {
316 lookupTraceForAddress(data_addr, m_retryProfileMap).addSample(count);
317 }
298}
318}