memtest.py revision 9928:9d3b979cd3ed
1# Copyright (c) 2006-2007 The Regents of The University of Michigan 2# All rights reserved. 3# 4# Redistribution and use in source and binary forms, with or without 5# modification, are permitted provided that the following conditions are 6# met: redistributions of source code must retain the above copyright 7# notice, this list of conditions and the following disclaimer; 8# redistributions in binary form must reproduce the above copyright 9# notice, this list of conditions and the following disclaimer in the 10# documentation and/or other materials provided with the distribution; 11# neither the name of the copyright holders nor the names of its 12# contributors may be used to endorse or promote products derived from 13# this software without specific prior written permission. 14# 15# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 16# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 17# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 18# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 19# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 20# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 21# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 22# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 23# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 24# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 25# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26# 27# Authors: Ron Dreslinski 28 29import optparse 30import sys 31 32import m5 33from m5.objects import * 34 35parser = optparse.OptionParser() 36 37parser.add_option("-a", "--atomic", action="store_true", 38 help="Use atomic (non-timing) mode") 39parser.add_option("-b", "--blocking", action="store_true", 40 help="Use blocking caches") 41parser.add_option("-l", "--maxloads", metavar="N", default=0, 42 help="Stop after N loads") 43parser.add_option("-m", "--maxtick", type="int", default=m5.MaxTick, 44 metavar="T", 45 help="Stop after T ticks") 46 47# 48# The "tree" specification is a colon-separated list of one or more 49# integers. The first integer is the number of caches/testers 50# connected directly to main memory. The last integer in the list is 51# the number of testers associated with the uppermost level of memory 52# (L1 cache, if there are caches, or main memory if no caches). Thus 53# if there is only one integer, there are no caches, and the integer 54# specifies the number of testers connected directly to main memory. 55# The other integers (if any) specify the number of caches at each 56# level of the hierarchy between. 57# 58# Examples: 59# 60# "2:1" Two caches connected to memory with a single tester behind each 61# (single-level hierarchy, two testers total) 62# 63# "2:2:1" Two-level hierarchy, 2 L1s behind each of 2 L2s, 4 testers total 64# 65parser.add_option("-t", "--treespec", type="string", default="8:1", 66 help="Colon-separated multilevel tree specification, " 67 "see script comments for details " 68 "[default: %default]") 69 70parser.add_option("--force-bus", action="store_true", 71 help="Use bus between levels even with single cache") 72 73parser.add_option("-f", "--functional", type="int", default=0, 74 metavar="PCT", 75 help="Target percentage of functional accesses " 76 "[default: %default]") 77parser.add_option("-u", "--uncacheable", type="int", default=0, 78 metavar="PCT", 79 help="Target percentage of uncacheable accesses " 80 "[default: %default]") 81 82parser.add_option("--progress", type="int", default=1000, 83 metavar="NLOADS", 84 help="Progress message interval " 85 "[default: %default]") 86parser.add_option("--sys-clock", action="store", type="string", 87 default='1GHz', 88 help = """Top-level clock for blocks running at system 89 speed""") 90 91(options, args) = parser.parse_args() 92 93if args: 94 print "Error: script doesn't take any positional arguments" 95 sys.exit(1) 96 97block_size = 64 98 99try: 100 treespec = [int(x) for x in options.treespec.split(':')] 101 numtesters = reduce(lambda x,y: x*y, treespec) 102except: 103 print "Error parsing treespec option" 104 sys.exit(1) 105 106if numtesters > block_size: 107 print "Error: Number of testers limited to %s because of false sharing" \ 108 % (block_size) 109 sys.exit(1) 110 111if len(treespec) < 1: 112 print "Error parsing treespec" 113 sys.exit(1) 114 115# define prototype L1 cache 116proto_l1 = BaseCache(size = '32kB', assoc = 4, 117 hit_latency = 1, response_latency = 1, 118 tgts_per_mshr = 8) 119 120if options.blocking: 121 proto_l1.mshrs = 1 122else: 123 proto_l1.mshrs = 4 124 125# build a list of prototypes, one for each level of treespec, starting 126# at the end (last entry is tester objects) 127prototypes = [ MemTest(atomic=options.atomic, max_loads=options.maxloads, 128 percent_functional=options.functional, 129 percent_uncacheable=options.uncacheable, 130 progress_interval=options.progress) ] 131 132# next comes L1 cache, if any 133if len(treespec) > 1: 134 prototypes.insert(0, proto_l1) 135 136# now add additional cache levels (if any) by scaling L1 params 137for scale in treespec[:-2]: 138 # clone previous level and update params 139 prev = prototypes[0] 140 next = prev() 141 next.size = prev.size * scale 142 next.latency = prev.latency * 10 143 next.assoc = prev.assoc * scale 144 next.mshrs = prev.mshrs * scale 145 prototypes.insert(0, next) 146 147# system simulated 148system = System(funcmem = SimpleMemory(in_addr_map = False), 149 funcbus = NoncoherentBus(), 150 physmem = SimpleMemory(latency = "100ns"), 151 cache_line_size = block_size) 152 153 154system.voltage_domain = VoltageDomain(voltage = '1V') 155 156system.clk_domain = SrcClockDomain(clock = options.sys_clock, 157 voltage_domain = system.voltage_domain) 158 159def make_level(spec, prototypes, attach_obj, attach_port): 160 fanout = spec[0] 161 parent = attach_obj # use attach obj as config parent too 162 if len(spec) > 1 and (fanout > 1 or options.force_bus): 163 port = getattr(attach_obj, attach_port) 164 new_bus = CoherentBus(width=16) 165 if (port.role == 'MASTER'): 166 new_bus.slave = port 167 attach_port = "master" 168 else: 169 new_bus.master = port 170 attach_port = "slave" 171 parent.cpu_side_bus = new_bus 172 attach_obj = new_bus 173 objs = [prototypes[0]() for i in xrange(fanout)] 174 if len(spec) > 1: 175 # we just built caches, more levels to go 176 parent.cache = objs 177 for cache in objs: 178 cache.mem_side = getattr(attach_obj, attach_port) 179 make_level(spec[1:], prototypes[1:], cache, "cpu_side") 180 else: 181 # we just built the MemTest objects 182 parent.cpu = objs 183 for t in objs: 184 t.test = getattr(attach_obj, attach_port) 185 t.functional = system.funcbus.slave 186 187make_level(treespec, prototypes, system.physmem, "port") 188 189# connect reference memory to funcbus 190system.funcbus.master = system.funcmem.port 191 192# ----------------------- 193# run simulation 194# ----------------------- 195 196root = Root( full_system = False, system = system ) 197if options.atomic: 198 root.system.mem_mode = 'atomic' 199else: 200 root.system.mem_mode = 'timing' 201 202# The system port is never used in the tester so merely connect it 203# to avoid problems 204root.system.system_port = root.system.funcbus.slave 205 206# Not much point in this being higher than the L1 latency 207m5.ticks.setGlobalFrequency('1ns') 208 209# instantiate configuration 210m5.instantiate() 211 212# simulate until program terminates 213exit_event = m5.simulate(options.maxtick) 214 215print 'Exiting @ tick', m5.curTick(), 'because', exit_event.getCause() 216