// AddressProfiler.cc revision 6145
12567SN/A 210037SARM gem5 Developers/* 37650SAli.Saidi@ARM.com * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood 47650SAli.Saidi@ARM.com * All rights reserved. 57650SAli.Saidi@ARM.com * 67650SAli.Saidi@ARM.com * Redistribution and use in source and binary forms, with or without 77650SAli.Saidi@ARM.com * modification, are permitted provided that the following conditions are 87650SAli.Saidi@ARM.com * met: redistributions of source code must retain the above copyright 97650SAli.Saidi@ARM.com * notice, this list of conditions and the following disclaimer; 107650SAli.Saidi@ARM.com * redistributions in binary form must reproduce the above copyright 117650SAli.Saidi@ARM.com * notice, this list of conditions and the following disclaimer in the 127650SAli.Saidi@ARM.com * documentation and/or other materials provided with the distribution; 137650SAli.Saidi@ARM.com * neither the name of the copyright holders nor the names of its 142567SN/A * contributors may be used to endorse or promote products derived from 152567SN/A * this software without specific prior written permission. 162567SN/A * 172567SN/A * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 182567SN/A * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 192567SN/A * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 202567SN/A * A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT 212567SN/A * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 222567SN/A * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 232567SN/A * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 242567SN/A * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 252567SN/A * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 262567SN/A * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 272567SN/A * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 282567SN/A */ 292567SN/A 302567SN/A/* 312567SN/A * AddressProfiler.C 322567SN/A * 332567SN/A * Description: See AddressProfiler.h 342567SN/A * 352567SN/A * $Id$ 362567SN/A * 372567SN/A */ 382567SN/A 392665SN/A#include "AddressProfiler.hh" 402665SN/A#include "CacheMsg.hh" 412567SN/A#include "AccessTraceForAddress.hh" 422567SN/A#include "PrioHeap.hh" 436757SAli.Saidi@ARM.com#include "Map.hh" 446757SAli.Saidi@ARM.com#include "System.hh" 452567SN/A#include "Profiler.hh" 462567SN/A 472567SN/A// Helper functions 482567SN/Astatic AccessTraceForAddress& lookupTraceForAddress(const Address& addr, Map<Address, AccessTraceForAddress>* record_map); 498229Snate@binkert.orgstatic void printSorted(ostream& out, const Map<Address, AccessTraceForAddress>* record_map, string description); 506757SAli.Saidi@ARM.com 5110810Sbr@bsdpad.comAddressProfiler::AddressProfiler() 522567SN/A{ 532567SN/A m_dataAccessTrace = new Map<Address, AccessTraceForAddress>; 542567SN/A m_macroBlockAccessTrace = new Map<Address, AccessTraceForAddress>; 5510844Sandreas.sandberg@arm.com m_programCounterAccessTrace = new Map<Address, AccessTraceForAddress>; 5610037SARM gem5 Developers m_retryProfileMap = new Map<Address, AccessTraceForAddress>; 5710037SARM gem5 Developers m_persistentPredictionProfileMap = new Map<Address, AccessTraceForAddress>; 586757SAli.Saidi@ARM.com clearStats(); 592567SN/A} 
608285SPrakash.Ramrakhyani@arm.com 617650SAli.Saidi@ARM.comAddressProfiler::~AddressProfiler() 627650SAli.Saidi@ARM.com{ 637650SAli.Saidi@ARM.com delete m_dataAccessTrace; 647650SAli.Saidi@ARM.com delete m_macroBlockAccessTrace; 657650SAli.Saidi@ARM.com delete m_programCounterAccessTrace; 667650SAli.Saidi@ARM.com delete m_retryProfileMap; 678286SAli.Saidi@ARM.com delete m_persistentPredictionProfileMap; 688286SAli.Saidi@ARM.com} 698286SAli.Saidi@ARM.com 708286SAli.Saidi@ARM.comvoid AddressProfiler::printStats(ostream& out) const 718286SAli.Saidi@ARM.com{ 7210037SARM gem5 Developers if (PROFILE_HOT_LINES) { 7310037SARM gem5 Developers out << endl; 7410037SARM gem5 Developers out << "AddressProfiler Stats" << endl; 7510037SARM gem5 Developers out << "---------------------" << endl; 7610037SARM gem5 Developers 7710037SARM gem5 Developers out << endl; 7810037SARM gem5 Developers out << "sharing_misses: " << m_sharing_miss_counter << endl; 7910037SARM gem5 Developers out << "getx_sharing_histogram: " << m_getx_sharing_histogram << endl; 8010037SARM gem5 Developers out << "gets_sharing_histogram: " << m_gets_sharing_histogram << endl; 8110037SARM gem5 Developers 8210037SARM gem5 Developers out << endl; 8310037SARM gem5 Developers out << "Hot Data Blocks" << endl; 8410037SARM gem5 Developers out << "---------------" << endl; 8510037SARM gem5 Developers out << endl; 8610037SARM gem5 Developers printSorted(out, m_dataAccessTrace, "block_address"); 8710037SARM gem5 Developers 8810037SARM gem5 Developers out << endl; 8910037SARM gem5 Developers out << "Hot MacroData Blocks" << endl; 9010037SARM gem5 Developers out << "--------------------" << endl; 9110037SARM gem5 Developers out << endl; 9210037SARM gem5 Developers printSorted(out, m_macroBlockAccessTrace, "macroblock_address"); 9310037SARM gem5 Developers 9410037SARM gem5 Developers out << "Hot Instructions" << endl; 9510037SARM gem5 Developers out << "----------------" << endl; 9610037SARM gem5 Developers out << endl; 
9710037SARM gem5 Developers printSorted(out, m_programCounterAccessTrace, "pc_address"); 9810037SARM gem5 Developers } 9910037SARM gem5 Developers 10010037SARM gem5 Developers if (PROFILE_ALL_INSTRUCTIONS){ 10110037SARM gem5 Developers out << endl; 10210037SARM gem5 Developers out << "All Instructions Profile:" << endl; 10310037SARM gem5 Developers out << "-------------------------" << endl; 10410037SARM gem5 Developers out << endl; 10510037SARM gem5 Developers printSorted(out, m_programCounterAccessTrace, "pc_address"); 10610037SARM gem5 Developers out << endl; 10710037SARM gem5 Developers } 10810037SARM gem5 Developers 10910037SARM gem5 Developers if (m_retryProfileHisto.size() > 0) { 11010037SARM gem5 Developers out << "Retry Profile" << endl; 11110037SARM gem5 Developers out << "-------------" << endl; 11210037SARM gem5 Developers out << endl; 11310037SARM gem5 Developers out << "retry_histogram_absolute: " << m_retryProfileHisto << endl; 11410037SARM gem5 Developers out << "retry_histogram_write: " << m_retryProfileHistoWrite << endl; 1152567SN/A out << "retry_histogram_read: " << m_retryProfileHistoRead << endl; 1166757SAli.Saidi@ARM.com 1178286SAli.Saidi@ARM.com out << "retry_histogram_percent: "; 1188286SAli.Saidi@ARM.com m_retryProfileHisto.printPercent(out); 1198286SAli.Saidi@ARM.com out << endl; 1208286SAli.Saidi@ARM.com 1218286SAli.Saidi@ARM.com out << "retry_histogram_per_instruction: "; 1228286SAli.Saidi@ARM.com m_retryProfileHisto.printWithMultiplier(out, 1.0 / double(g_system_ptr->getProfiler()->getTotalInstructionsExecuted())); 1236757SAli.Saidi@ARM.com out << endl; 1246757SAli.Saidi@ARM.com 1258286SAli.Saidi@ARM.com printSorted(out, m_retryProfileMap, "block_address"); 1268706Sandreas.hansson@arm.com out << endl; 1278706Sandreas.hansson@arm.com } 1288706Sandreas.hansson@arm.com 1298706Sandreas.hansson@arm.com if (m_persistentPredictionProfileHisto.size() > 0) { 1308286SAli.Saidi@ARM.com out << "Persistent Prediction Profile" << endl; 1313553SN/A 
out << "-------------" << endl; 1323553SN/A out << endl; 1337693SAli.Saidi@ARM.com out << "persistent prediction_histogram: " << m_persistentPredictionProfileHisto << endl; 1347693SAli.Saidi@ARM.com 1357693SAli.Saidi@ARM.com out << "persistent prediction_histogram_percent: "; 1367720Sgblack@eecs.umich.edu m_persistentPredictionProfileHisto.printPercent(out); 1373553SN/A out << endl; 1383553SN/A 1399050Schander.sudanthi@arm.com out << "persistentPrediction_histogram_per_instruction: "; 1409050Schander.sudanthi@arm.com m_persistentPredictionProfileHisto.printWithMultiplier(out, 1.0 / double(g_system_ptr->getProfiler()->getTotalInstructionsExecuted())); 1419050Schander.sudanthi@arm.com out << endl; 14210037SARM gem5 Developers 14310037SARM gem5 Developers printSorted(out, m_persistentPredictionProfileMap, "block_address"); 14410037SARM gem5 Developers out << endl; 14510037SARM gem5 Developers } 14610037SARM gem5 Developers} 14710037SARM gem5 Developers 14810037SARM gem5 Developersvoid AddressProfiler::clearStats() 14910037SARM gem5 Developers{ 15010037SARM gem5 Developers // Clear the maps 15110037SARM gem5 Developers m_sharing_miss_counter = 0; 15210037SARM gem5 Developers m_dataAccessTrace->clear(); 15310037SARM gem5 Developers m_macroBlockAccessTrace->clear(); 15410037SARM gem5 Developers m_programCounterAccessTrace->clear(); 15510037SARM gem5 Developers m_retryProfileMap->clear(); 15610037SARM gem5 Developers m_retryProfileHisto.clear(); 15710037SARM gem5 Developers m_retryProfileHistoRead.clear(); 15810037SARM gem5 Developers m_retryProfileHistoWrite.clear(); 15910037SARM gem5 Developers m_getx_sharing_histogram.clear(); 16010037SARM gem5 Developers m_gets_sharing_histogram.clear(); 16110844Sandreas.sandberg@arm.com} 16210844Sandreas.sandberg@arm.com 16310037SARM gem5 Developersvoid AddressProfiler::profileGetX(const Address& datablock, const Address& PC, const Set& owner, const Set& sharers, NodeID requestor) 16410037SARM gem5 Developers{ 16510037SARM gem5 
Developers Set indirection_set; 16610037SARM gem5 Developers indirection_set.addSet(sharers); 16710037SARM gem5 Developers indirection_set.addSet(owner); 16810037SARM gem5 Developers indirection_set.remove(requestor); 16910037SARM gem5 Developers int num_indirections = indirection_set.count(); 17010037SARM gem5 Developers 17110037SARM gem5 Developers m_getx_sharing_histogram.add(num_indirections); 17210037SARM gem5 Developers bool indirection_miss = (num_indirections > 0); 17310037SARM gem5 Developers 17410037SARM gem5 Developers addTraceSample(datablock, PC, CacheRequestType_ST, AccessModeType(0), requestor, indirection_miss); 17510037SARM gem5 Developers} 17610037SARM gem5 Developers 17710037SARM gem5 Developersvoid AddressProfiler::profileGetS(const Address& datablock, const Address& PC, const Set& owner, const Set& sharers, NodeID requestor) 17810037SARM gem5 Developers{ 17910037SARM gem5 Developers Set indirection_set; 18010037SARM gem5 Developers indirection_set.addSet(owner); 18110037SARM gem5 Developers indirection_set.remove(requestor); 18210037SARM gem5 Developers int num_indirections = indirection_set.count(); 18310037SARM gem5 Developers 18410037SARM gem5 Developers m_gets_sharing_histogram.add(num_indirections); 18510037SARM gem5 Developers bool indirection_miss = (num_indirections > 0); 18610037SARM gem5 Developers 18710037SARM gem5 Developers addTraceSample(datablock, PC, CacheRequestType_LD, AccessModeType(0), requestor, indirection_miss); 18810037SARM gem5 Developers} 18910037SARM gem5 Developers 19010037SARM gem5 Developersvoid AddressProfiler::addTraceSample(Address data_addr, Address pc_addr, CacheRequestType type, AccessModeType access_mode, NodeID id, bool sharing_miss) 19110037SARM gem5 Developers{ 19210037SARM gem5 Developers if (PROFILE_HOT_LINES) { 19310037SARM gem5 Developers if (sharing_miss) { 19410037SARM gem5 Developers m_sharing_miss_counter++; 19510037SARM gem5 Developers } 19610037SARM gem5 Developers 19710037SARM gem5 Developers 
// record data address trace info 19810037SARM gem5 Developers data_addr.makeLineAddress(); 19910037SARM gem5 Developers lookupTraceForAddress(data_addr, m_dataAccessTrace).update(type, access_mode, id, sharing_miss); 20010037SARM gem5 Developers 20110037SARM gem5 Developers // record macro data address trace info 20210037SARM gem5 Developers Address macro_addr(data_addr.maskLowOrderBits(10)); // 6 for datablock, 4 to make it 16x more coarse 20310037SARM gem5 Developers lookupTraceForAddress(macro_addr, m_macroBlockAccessTrace).update(type, access_mode, id, sharing_miss); 20410037SARM gem5 Developers 20510037SARM gem5 Developers // record program counter address trace info 20610037SARM gem5 Developers lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).update(type, access_mode, id, sharing_miss); 20710037SARM gem5 Developers } 20810037SARM gem5 Developers 20910037SARM gem5 Developers if (PROFILE_ALL_INSTRUCTIONS) { 21010037SARM gem5 Developers // This code is used if the address profiler is an all-instructions profiler 21110037SARM gem5 Developers // record program counter address trace info 21210037SARM gem5 Developers lookupTraceForAddress(pc_addr, m_programCounterAccessTrace).update(type, access_mode, id, sharing_miss); 21310037SARM gem5 Developers } 21410037SARM gem5 Developers} 21510037SARM gem5 Developers 21610037SARM gem5 Developersvoid AddressProfiler::profileRetry(const Address& data_addr, AccessType type, int count) 21710037SARM gem5 Developers{ 21810037SARM gem5 Developers m_retryProfileHisto.add(count); 21910037SARM gem5 Developers if (type == AccessType_Read) { 22010037SARM gem5 Developers m_retryProfileHistoRead.add(count); 22110037SARM gem5 Developers } else { 22210037SARM gem5 Developers m_retryProfileHistoWrite.add(count); 22310037SARM gem5 Developers } 22410037SARM gem5 Developers if (count > 1) { 22510037SARM gem5 Developers lookupTraceForAddress(data_addr, m_retryProfileMap).addSample(count); 22610037SARM gem5 Developers } 22710037SARM 
gem5 Developers} 22810037SARM gem5 Developers 22910037SARM gem5 Developersvoid AddressProfiler::profilePersistentPrediction(const Address& data_addr, AccessType type) 23010037SARM gem5 Developers{ 23110037SARM gem5 Developers m_persistentPredictionProfileHisto.add(1); 23210037SARM gem5 Developers lookupTraceForAddress(data_addr, m_persistentPredictionProfileMap).addSample(1); 23310037SARM gem5 Developers} 23410037SARM gem5 Developers 23510037SARM gem5 Developers// ***** Normal Functions ****** 23610037SARM gem5 Developers 23710037SARM gem5 Developersstatic void printSorted(ostream& out, const Map<Address, AccessTraceForAddress>* record_map, string description) 23810037SARM gem5 Developers{ 23910037SARM gem5 Developers const int records_printed = 100; 24010037SARM gem5 Developers 24110037SARM gem5 Developers uint64 misses = 0; 24210037SARM gem5 Developers PrioHeap<AccessTraceForAddress*> heap; 24310037SARM gem5 Developers Vector<Address> keys = record_map->keys(); 24410037SARM gem5 Developers for(int i=0; i<keys.size(); i++){ 24510037SARM gem5 Developers AccessTraceForAddress* record = &(record_map->lookup(keys[i])); 24610037SARM gem5 Developers misses += record->getTotal(); 24710037SARM gem5 Developers heap.insert(record); 24810037SARM gem5 Developers } 24910810Sbr@bsdpad.com 25010037SARM gem5 Developers out << "Total_entries_" << description << ": " << keys.size() << endl; 25110810Sbr@bsdpad.com if (PROFILE_ALL_INSTRUCTIONS) 25210810Sbr@bsdpad.com out << "Total_Instructions_" << description << ": " << misses << endl; 25310810Sbr@bsdpad.com else 25410810Sbr@bsdpad.com out << "Total_data_misses_" << description << ": " << misses << endl; 25510810Sbr@bsdpad.com 25610810Sbr@bsdpad.com out << "total | load store atomic | user supervisor | sharing | touched-by" << endl; 25710810Sbr@bsdpad.com 25810810Sbr@bsdpad.com Histogram remaining_records(1, 100); 25910810Sbr@bsdpad.com Histogram all_records(1, 100); 26010810Sbr@bsdpad.com Histogram remaining_records_log(-1); 
26110810Sbr@bsdpad.com Histogram all_records_log(-1); 26210810Sbr@bsdpad.com 26310810Sbr@bsdpad.com // Allows us to track how many lines where touched by n processors 26410810Sbr@bsdpad.com Vector<int64> m_touched_vec; 26510810Sbr@bsdpad.com Vector<int64> m_touched_weighted_vec; 26610810Sbr@bsdpad.com m_touched_vec.setSize(RubyConfig::numberOfProcessors()+1); 26710810Sbr@bsdpad.com m_touched_weighted_vec.setSize(RubyConfig::numberOfProcessors()+1); 2682567SN/A for (int i=0; i<m_touched_vec.size(); i++) { 2692567SN/A m_touched_vec[i] = 0; 2702567SN/A m_touched_weighted_vec[i] = 0; 271 } 272 273 int counter = 0; 274 while((heap.size() > 0) && (counter < records_printed)) { 275 AccessTraceForAddress* record = heap.extractMin(); 276 double percent = 100.0*(record->getTotal()/double(misses)); 277 out << description << " | " << percent << " % " << *record << endl; 278 all_records.add(record->getTotal()); 279 all_records_log.add(record->getTotal()); 280 counter++; 281 m_touched_vec[record->getTouchedBy()]++; 282 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal(); 283 } 284 285 while(heap.size() > 0) { 286 AccessTraceForAddress* record = heap.extractMin(); 287 all_records.add(record->getTotal()); 288 remaining_records.add(record->getTotal()); 289 all_records_log.add(record->getTotal()); 290 remaining_records_log.add(record->getTotal()); 291 m_touched_vec[record->getTouchedBy()]++; 292 m_touched_weighted_vec[record->getTouchedBy()] += record->getTotal(); 293 } 294 out << endl; 295 out << "all_records_" << description << ": " << all_records << endl; 296 out << "all_records_log_" << description << ": " << all_records_log << endl; 297 out << "remaining_records_" << description << ": " << remaining_records << endl; 298 out << "remaining_records_log_" << description << ": " << remaining_records_log << endl; 299 out << "touched_by_" << description << ": " << m_touched_vec << endl; 300 out << "touched_by_weighted_" << description << ": " << m_touched_weighted_vec 
<< endl; 301 out << endl; 302} 303 304static AccessTraceForAddress& lookupTraceForAddress(const Address& addr, Map<Address, AccessTraceForAddress>* record_map) 305{ 306 if(record_map->exist(addr) == false){ 307 record_map->add(addr, AccessTraceForAddress(addr)); 308 } 309 return record_map->lookup(addr); 310} 311