ruby_gpu_random_test.py revision 11682
#
# Copyright (c) 2010-2015 Advanced Micro Devices, Inc.
# All rights reserved.
#
# For use for simulation and test purposes only
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# 1. Redistributions of source code must retain the above copyright notice,
#    this list of conditions and the following disclaimer.
#
# 2. Redistributions in binary form must reproduce the above copyright notice,
#    this list of conditions and the following disclaimer in the documentation
#    and/or other materials provided with the distribution.
#
# 3. Neither the name of the copyright holder nor the names of its contributors
#    may be used to endorse or promote products derived from this software
#    without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
#
# Author: Brad Beckmann
#

import m5
from m5.objects import *
from m5.defines import buildEnv
from m5.util import addToPath
import os
import optparse
import sys

# The two imports below come after this call on purpose: presumably it puts
# the parent directory on the module search path so that the 'common' and
# 'ruby' packages resolve -- confirm against m5.util.addToPath.
addToPath('../')

from common import Options
from ruby import Ruby

# Get paths we might need.
config_path = os.path.dirname(os.path.abspath(__file__))
config_root = os.path.dirname(config_path)
m5_root = os.path.dirname(config_root)

# Command-line parser: the shared options first, then the knobs that are
# specific to this tester script.
parser = optparse.OptionParser()
Options.addCommonOptions(parser)

parser.add_option("--maxloads", metavar="N", default=100,
                  help="Stop after N loads")
parser.add_option("-f", "--wakeup_freq", metavar="N", default=10,
                  help="Wakeup every N cycles")
parser.add_option("-u", "--num-compute-units", type="int", default=1,
                  help="number of compute units in the GPU")
parser.add_option("--num-cp", type="int", default=0,
                  help="Number of GPU Command Processors (CP)")
# not super important now, but to avoid putting the number 4 everywhere, make
# it an option/knob
#
# The help text is built from adjacent string literals rather than a
# backslash continuation inside the literal, which would embed the source
# indentation in the message shown by --help.
parser.add_option("--cu-per-sqc", type="int", default=4,
                  help="number of CUs sharing an SQC (icache, and thus "
                       "icache TLB)")
parser.add_option("--simds-per-cu", type="int", default=4,
                  help="SIMD units per CU")
parser.add_option("--wf-size", type="int", default=64,
                  help="Wavefront size(in workitems)")
parser.add_option("--wfs-per-simd", type="int", default=10,
                  help="Number of WF slots per SIMD")

#
# Add the ruby specific and protocol specific options
#
Ruby.define_options(parser)

# NOTE(review): Options is already imported and its common options are
# already registered on the parser; this additionally executes Options.py in
# this script's namespace. Confirm whether it is still needed.
execfile(os.path.join(config_root, "common", "Options.py"))

(options, args) = parser.parse_args()

#
# Force the cache sizes and associativities to be very small to encourage
# races between requests and writebacks. These assignments run after the
# command line has been parsed, so they replace whatever was parsed.
#
options.l1d_size = "256B"
options.l1i_size = "256B"
options.l2_size = "512B"
options.l3_size = "1kB"
options.l1d_assoc = 2
options.l1i_assoc = 2
options.l2_assoc = 2
options.l3_assoc = 2

# This file can support multiple compute units, but needs at least one.
# Checked explicitly (not with assert) so the check cannot be optimized away
# and the user gets a readable message.
if options.num_compute_units < 1:
    print("Error: --num-compute-units must be at least 1")
    sys.exit(1)
n_cu = options.num_compute_units

# The value is used as a divisor just below, so zero or negative is rejected.
if options.cu_per_sqc < 1:
    print("Error: --cu-per-sqc must be at least 1")
    sys.exit(1)

# Number of SQCs = ceil(n_cu / cu_per_sqc), computed in integer arithmetic.
options.num_sqc = (n_cu + options.cu_per_sqc - 1) // options.cu_per_sqc

if args:
    print("Error: script doesn't take any positional arguments")
    sys.exit(1)

#
# Create the ruby random tester
#

# Only the GPU_RfO protocol is accepted. Other GPU protocols are non-SC and
# will not work with the Ruby random tester.
assert buildEnv['PROTOCOL'] == 'GPU_RfO'

# The GPU_RfO protocol does not support cache flushes
check_flush = False

tester = RubyTester(
    check_flush=check_flush,
    checks_to_complete=options.maxloads,
    wakeup_frequency=options.wakeup_freq,
    deadlock_threshold=1000000,
)

#
# Create the M5 system. Note that the Memory Object isn't
# actually used by the rubytester, but is included to support the
# M5 memory size == Ruby memory size checks
#
system = System(cpu=tester, mem_ranges=[AddrRange(options.mem_size)])

# Create a top-level voltage domain and clock domain
system.voltage_domain = VoltageDomain(voltage=options.sys_voltage)

system.clk_domain = SrcClockDomain(
    clock=options.sys_clock,
    voltage_domain=system.voltage_domain,
)

Ruby.create_system(options, False, system)

# Create a separate clock domain for Ruby
system.ruby.clk_domain = SrcClockDomain(
    clock=options.ruby_clock,
    voltage_domain=system.voltage_domain,
)

tester.num_cpus = len(system.ruby._cpu_ports)

#
# The tester is most effective when randomization is turned on and
# artificial delay is randomly inserted on messages
#
system.ruby.randomization = True

for port in system.ruby._cpu_ports:

    #
    # Tie the ruby tester ports to the ruby cpu read and write ports,
    # choosing the tester port by the kinds of request this port supports
    #
    if port.support_data_reqs:
        if port.support_inst_reqs:
            tester.cpuInstDataPort = port.slave
        else:
            tester.cpuDataPort = port.slave
    elif port.support_inst_reqs:
        tester.cpuInstPort = port.slave

    # Do not automatically retry stalled Ruby requests
    port.no_retry_on_stall = True

    #
    # Tell each sequencer this is the ruby tester so that it
    # copies the subblock back to the checker
    #
    port.using_ruby_tester = True

# -----------------------
# run simulation
# -----------------------

root = Root(full_system=False, system=system)
root.system.mem_mode = 'timing'

# Not much point in this being higher than the L1 latency
m5.ticks.setGlobalFrequency('1ns')

# instantiate configuration
m5.instantiate()

# simulate until program terminates
exit_event = m5.simulate(options.abs_max_tick)

# Same text as a space-separated print of the four items.
print("Exiting @ tick %s because %s" % (m5.curTick(), exit_event.getCause()))