# sweep.py revision 11682
# Copyright (c) 2014-2015 ARM Limited
# All rights reserved.
#
# The license below extends only to copyright in the software and shall
# not be construed as granting a license to any other intellectual
# property including but not limited to intellectual property relating
# to a hardware implementation of the functionality of the software
# licensed hereunder.  You may use the software subject to the license
# terms below provided that you ensure that this notice is replicated
# unmodified and in its entirety in all distributions of the software,
# modified or unmodified, in source code or in binary form.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are
# met: redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer;
# redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution;
# neither the name of the copyright holders nor the names of its
# contributors may be used to endorse or promote products derived from
# this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#
# Authors: Andreas Hansson

import optparse
import sys

import m5
from m5.objects import *
from m5.util import addToPath
from m5.internal.stats import periodicStatDump

addToPath('../')

from common import MemConfig

# this script is helpful to sweep the efficiency of a specific memory
# controller configuration, by varying the number of banks accessed,
# and the sequential stride size (how many bytes per activate), and
# observe what bus utilisation (bandwidth) is achieved

parser = optparse.OptionParser()

# Use a single-channel DDR3-1600 x64 by default
parser.add_option("--mem-type", type="choice", default="DDR3_1600_x64",
                  choices=MemConfig.mem_names(),
                  help = "type of memory to use")

parser.add_option("--mem-ranks", "-r", type="int", default=1,
                  help = "Number of ranks to iterate across")

parser.add_option("--rd_perc", type="int", default=100,
                  help = "Percentage of read commands")

# the help text is built from adjacent string literals; a backslash
# continuation inside the literal would embed the indentation of the
# following source line in the text shown to the user
parser.add_option("--mode", type="choice", default="DRAM",
                  choices=["DRAM", "DRAM_ROTATE"],
                  help = "DRAM: Random traffic; "
                         "DRAM_ROTATE: Traffic rotating across banks and ranks")

parser.add_option("--addr_map", type="int", default=1,
                  help = "0: RoCoRaBaCh; 1: RoRaBaCoCh/RoRaBaChCo")

(options, args) = parser.parse_args()

# every setting is passed as a named option, so any leftover positional
# argument is treated as a usage error
if args:
    # a parenthesised single-argument print produces the same output
    # under Python 2 and Python 3
    print("Error: script doesn't take any positional arguments")
    sys.exit(1)

# at the moment we stay with the default open-adaptive page policy,
# and address mapping

# the system is built around a multi-layer crossbar clocked at
# 2.0 GHz; moving 64 bytes takes 3 cycles (one of them a header
# cycle), i.e. 42.7 GByte/s per layer and thus per port
system = System(membus = IOXBar(width = 32))
system.clk_domain = SrcClockDomain(
    clock = '2.0GHz',
    voltage_domain = VoltageDomain(voltage = '1V'))

# 256 MB of memory is plenty for this sweep
mem_range = AddrRange('256MB')
system.mem_ranges = [mem_range]

# no need to reserve space for the backing store
system.mmap_using_noreserve = True

# the DRAM traffic generator assumes a single channel, so force that
# here and switch the remaining MemConfig knobs off before building
# the memory system
options.mem_channels = 1
options.external_memory_system = 0
options.tlm_memory = 0
options.elastic_trace_en = 0
MemConfig.config_mem(options, system)

# everything below relies on the native DRAM controller, so verify
# that this is what we ended up with
dram_ctrl = system.mem_ctrls[0]
if not isinstance(dram_ctrl, m5.objects.DRAMCtrl):
    fatal("This script assumes the memory is a DRAMCtrl subclass")

# the data itself is irrelevant, so do not slow things down storing it
dram_ctrl.null = True

# translate the --addr_map argument into the controller's address
# mapping; the option default (1) selects RoRaBaCoCh
addr_mappings = {0: "RoCoRaBaCh", 1: "RoRaBaCoCh"}
if options.addr_map in addr_mappings:
    dram_ctrl.addr_mapping = addr_mappings[options.addr_map]
else:
    fatal("Did not specify a valid address map argument")

# stay in each state for 0.25 ms, long enough to warm things up, and
# short enough to avoid hitting a refresh
period = 250000000

# this is where we go off piste, and print the traffic generator
# configuration that we will later use, crazy but it works
cfg_file_name = "configs/dram/sweep.cfg"

# stay in each state as long as the dump/reset period, use the entire
# range, issue transactions of the right DRAM burst size, and match
# the DRAM maximum bandwidth to ensure that it is saturated

# get the number of banks
nbr_banks = system.mem_ctrls[0].banks_per_rank.value

# determine the burst length in bytes
burst_size = int((system.mem_ctrls[0].devices_per_rank.value *
                  system.mem_ctrls[0].device_bus_width.value *
                  system.mem_ctrls[0].burst_length.value) / 8)

# next, get the page size in bytes
page_size = system.mem_ctrls[0].devices_per_rank.value * \
    system.mem_ctrls[0].device_rowbuffer_size.value

# match the maximum bandwidth of the memory, the parameter is in seconds
# and we need it in ticks (ps); the product is a floating-point value
# that can land just below a whole number of ticks, and the "%d" used
# when writing the state would truncate it, so round to the nearest
# tick first
itt = int(round(system.mem_ctrls[0].tBURST.value * 1000000000000))

# assume we start at 0
max_addr = mem_range.end

# use min of the page size and 512 bytes as that should be more than
# enough
max_stride = min(512, page_size)

# the with-statement guarantees the file is flushed and closed before
# the traffic generator reads it, even if one of the writes raises
nxt_state = 0
with open(cfg_file_name, 'w') as cfg_file:
    # now we create the state by iterating over the stride size from
    # burst size to the max stride, and from using only a single bank
    # up to the number of banks available
    for bank in range(1, nbr_banks + 1):
        for stride_size in range(burst_size, max_stride + 1, burst_size):
            cfg_file.write("STATE %d %d %s %d 0 %d %d "
                           "%d %d %d %d %d %d %d %d %d\n" %
                           (nxt_state, period, options.mode, options.rd_perc,
                            max_addr, burst_size, itt, itt, 0, stride_size,
                            page_size, nbr_banks, bank, options.addr_map,
                            options.mem_ranks))
            nxt_state = nxt_state + 1

    cfg_file.write("INIT 0\n")

    # go through the states one by one
    for state in range(1, nxt_state):
        cfg_file.write("TRANSITION %d %d 1\n" % (state - 1, state))

    # the last state transitions to itself
    cfg_file.write("TRANSITION %d %d 1\n" % (nxt_state - 1, nxt_state - 1))

# create a traffic generator, and point it to the file we just created
system.tgen = TrafficGen(config_file = cfg_file_name)

# add a communication monitor
system.monitor = CommMonitor()

# connect the traffic generator to the bus via a communication monitor
system.tgen.port = system.monitor.slave
system.monitor.master = system.membus.slave

# connect the system port even if it is not used in this example
system.system_port = system.membus.slave

# every period, dump and reset all stats
periodicStatDump(period)

# run Forrest, run!
root = Root(full_system = False, system = system)
root.system.mem_mode = 'timing'

m5.instantiate()

# one period per generated state, so every state is visited once
m5.simulate(nxt_state * period)

# a parenthesised single-argument print produces the same output under
# Python 2 and Python 3
print("DRAM sweep with burst: %d, banks: %d, max stride: %d" %
      (burst_size, nbr_banks, max_stride))