1# Copyright (c) 2012 ARM Limited
2# All rights reserved
3#
4# The license below extends only to copyright in the software and shall
5# not be construed as granting a license to any other intellectual
6# property including but not limited to intellectual property relating
7# to a hardware implementation of the functionality of the software
8# licensed hereunder. You may use the software subject to the license
9# terms below provided that you ensure that this notice is replicated
10# unmodified and in its entirety in all distributions of the software,
11# modified or unmodified, in source code or in binary form.
12#
13# Copyright (c) 2006-2008 The Regents of The University of Michigan
14# Copyright (c) 2010 Advanced Micro Devices, Inc.
15# All rights reserved.
16#
17# Redistribution and use in source and binary forms, with or without
18# modification, are permitted provided that the following conditions are
19# met: redistributions of source code must retain the above copyright
20# notice, this list of conditions and the following disclaimer;
21# redistributions in binary form must reproduce the above copyright
22# notice, this list of conditions and the following disclaimer in the
23# documentation and/or other materials provided with the distribution;
24# neither the name of the copyright holders nor the names of its
25# contributors may be used to endorse or promote products derived from
26# this software without specific prior written permission.
27#
28# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
29# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
30# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
31# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
32# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
33# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
34# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
35# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
36# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
37# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
38# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
39#
40# Authors: Lisa Hsu
41
42import sys
43from os import getcwd
44from os.path import join as joinpath
45
46import m5
47from m5.defines import buildEnv
48from m5.objects import *
49from m5.util import *
50from O3_ARM_v7a import *
51
52addToPath('../common')
53
54def getCPUClass(cpu_type):
55 """Returns the required cpu class and the mode of operation.
56 """
57
58 if cpu_type == "timing":
59 return TimingSimpleCPU, 'timing'
60 elif cpu_type == "detailed":
61 return DerivO3CPU, 'timing'
62 elif cpu_type == "arm_detailed":
63 return O3_ARM_v7a_3, 'timing'
64 elif cpu_type == "inorder":
65 return InOrderCPU, 'timing'
66 else:
67 return AtomicSimpleCPU, 'atomic'
68
69def setCPUClass(options):
70 """Returns two cpu classes and the initial mode of operation.
71
72 Restoring from a checkpoint or fast forwarding through a benchmark
73 can be done using one type of cpu, and then the actual
74 simulation can be carried out using another type. This function
75 returns these two types of cpus and the initial mode of operation
76 depending on the options provided.
77 """
78
67 if options.cpu_type == "detailed" or \
68 options.cpu_type == "arm_detailed" or \
69 options.cpu_type == "inorder" :
70 if not options.caches and not options.ruby:
71 fatal("O3/Inorder CPU must be used with caches")
72
79 TmpClass, test_mem_mode = getCPUClass(options.cpu_type)
80 CPUClass = None
81 if TmpClass.require_caches() and \
82 not options.caches and not options.ruby:
83 fatal("%s must be used with caches" % options.cpu_type)
84
85 if options.checkpoint_restore != None:
86 if options.restore_with_cpu != options.cpu_type:
87 CPUClass = TmpClass
88 TmpClass, test_mem_mode = getCPUClass(options.restore_with_cpu)
89 elif options.fast_forward:
90 CPUClass = TmpClass
91 TmpClass = AtomicSimpleCPU
92 test_mem_mode = 'atomic'
93
94 return (TmpClass, test_mem_mode, CPUClass)
95
96def setWorkCountOptions(system, options):
97 if options.work_item_id != None:
98 system.work_item_id = options.work_item_id
99 if options.work_begin_cpu_id_exit != None:
100 system.work_begin_cpu_id_exit = options.work_begin_cpu_id_exit
101 if options.work_end_exit_count != None:
102 system.work_end_exit_count = options.work_end_exit_count
103 if options.work_end_checkpoint_count != None:
104 system.work_end_ckpt_count = options.work_end_checkpoint_count
105 if options.work_begin_exit_count != None:
106 system.work_begin_exit_count = options.work_begin_exit_count
107 if options.work_begin_checkpoint_count != None:
108 system.work_begin_ckpt_count = options.work_begin_checkpoint_count
109 if options.work_cpus_checkpoint_count != None:
110 system.work_cpus_ckpt_count = options.work_cpus_checkpoint_count
111
112def findCptDir(options, maxtick, cptdir, testsys):
113 """Figures out the directory from which the checkpointed state is read.
114
115 There are two different ways in which the directories holding checkpoints
116 can be named --
117 1. cpt.<benchmark name>.<instruction count when the checkpoint was taken>
118 2. cpt.<some number, usually the tick value when the checkpoint was taken>
119
120 This function parses through the options to figure out which one of the
121 above should be used for selecting the checkpoint, and then figures out
122 the appropriate directory.
123
124 It also sets the value of the maximum tick value till which the simulation
125 will run.
126 """
127
128 from os.path import isdir, exists
129 from os import listdir
130 import re
131
132 if not isdir(cptdir):
133 fatal("checkpoint dir %s does not exist!", cptdir)
134
135 if options.at_instruction or options.simpoint:
136 inst = options.checkpoint_restore
137 if options.simpoint:
138 # assume workload 0 has the simpoint
139 if testsys.cpu[0].workload[0].simpoint == 0:
140 fatal('Unable to find simpoint')
141 inst += int(testsys.cpu[0].workload[0].simpoint)
142
143 checkpoint_dir = joinpath(cptdir, "cpt.%s.%s" % (options.bench, inst))
144 if not exists(checkpoint_dir):
145 fatal("Unable to find checkpoint directory %s", checkpoint_dir)
146 else:
147 dirs = listdir(cptdir)
148 expr = re.compile('cpt\.([0-9]*)')
149 cpts = []
150 for dir in dirs:
151 match = expr.match(dir)
152 if match:
153 cpts.append(match.group(1))
154
155 cpts.sort(lambda a,b: cmp(long(a), long(b)))
156
157 cpt_num = options.checkpoint_restore
158 if cpt_num > len(cpts):
159 fatal('Checkpoint %d not found', cpt_num)
160
161 maxtick = maxtick - int(cpts[cpt_num - 1])
162 checkpoint_dir = joinpath(cptdir, "cpt.%s" % cpts[cpt_num - 1])
163
164 return maxtick, checkpoint_dir
165
166def scriptCheckpoints(options, maxtick, cptdir):
167 if options.at_instruction or options.simpoint:
168 checkpoint_inst = int(options.take_checkpoints)
169
170 # maintain correct offset if we restored from some instruction
171 if options.checkpoint_restore != None:
172 checkpoint_inst += options.checkpoint_restore
173
174 print "Creating checkpoint at inst:%d" % (checkpoint_inst)
175 exit_event = m5.simulate()
176 exit_cause = exit_event.getCause()
177 print "exit cause = %s" % exit_cause
178
179 # skip checkpoint instructions should they exist
180 while exit_cause == "checkpoint":
181 exit_event = m5.simulate()
182 exit_cause = exit_event.getCause()
183
184 if exit_cause == "a thread reached the max instruction count":
185 m5.checkpoint(joinpath(cptdir, "cpt.%s.%d" % \
186 (options.bench, checkpoint_inst)))
187 print "Checkpoint written."
188
189 else:
190 when, period = options.take_checkpoints.split(",", 1)
191 when = int(when)
192 period = int(period)
193 num_checkpoints = 0
194
195 exit_event = m5.simulate(when)
196 exit_cause = exit_event.getCause()
197 while exit_cause == "checkpoint":
198 exit_event = m5.simulate(when - m5.curTick())
199 exit_cause = exit_event.getCause()
200
201 if exit_cause == "simulate() limit reached":
202 m5.checkpoint(joinpath(cptdir, "cpt.%d"))
203 num_checkpoints += 1
204
205 sim_ticks = when
206 max_checkpoints = options.max_checkpoints
207
208 while num_checkpoints < max_checkpoints and \
209 exit_cause == "simulate() limit reached":
210 if (sim_ticks + period) > maxtick:
211 exit_event = m5.simulate(maxtick - sim_ticks)
212 exit_cause = exit_event.getCause()
213 break
214 else:
215 exit_event = m5.simulate(period)
216 exit_cause = exit_event.getCause()
217 sim_ticks += period
218 while exit_event.getCause() == "checkpoint":
219 exit_event = m5.simulate(sim_ticks - m5.curTick())
220 if exit_event.getCause() == "simulate() limit reached":
221 m5.checkpoint(joinpath(cptdir, "cpt.%d"))
222 num_checkpoints += 1
223
224 return exit_cause
225
226def benchCheckpoints(options, maxtick, cptdir):
227 exit_event = m5.simulate(maxtick)
228 exit_cause = exit_event.getCause()
229
230 num_checkpoints = 0
231 max_checkpoints = options.max_checkpoints
232
233 while exit_cause == "checkpoint":
234 m5.checkpoint(joinpath(cptdir, "cpt.%d"))
235 num_checkpoints += 1
236 if num_checkpoints == max_checkpoints:
237 exit_cause = "maximum %d checkpoints dropped" % max_checkpoints
238 break
239
240 exit_event = m5.simulate(maxtick - m5.curTick())
241 exit_cause = exit_event.getCause()
242
243 return exit_event
244
245def repeatSwitch(testsys, repeat_switch_cpu_list, maxtick, switch_freq):
246 print "starting switch loop"
247 while True:
248 exit_event = m5.simulate(switch_freq)
249 exit_cause = exit_event.getCause()
250
251 if exit_cause != "simulate() limit reached":
252 return exit_event
253
254 print "draining the system"
255 m5.drain(testsys)
256 m5.switchCpus(repeat_switch_cpu_list)
257 m5.resume(testsys)
258
259 tmp_cpu_list = []
260 for old_cpu, new_cpu in repeat_switch_cpu_list:
261 tmp_cpu_list.append((new_cpu, old_cpu))
262 repeat_switch_cpu_list = tmp_cpu_list
263
264 if (maxtick - m5.curTick()) <= switch_freq:
265 exit_event = m5.simulate(maxtick - m5.curTick())
266 return exit_event
267
268def run(options, root, testsys, cpu_class):
269 if options.maxtick:
270 maxtick = options.maxtick
271 elif options.maxtime:
272 simtime = m5.ticks.seconds(simtime)
273 print "simulating for: ", simtime
274 maxtick = simtime
275 else:
276 maxtick = m5.MaxTick
277
278 if options.checkpoint_dir:
279 cptdir = options.checkpoint_dir
280 elif m5.options.outdir:
281 cptdir = m5.options.outdir
282 else:
283 cptdir = getcwd()
284
285 if options.fast_forward and options.checkpoint_restore != None:
286 fatal("Can't specify both --fast-forward and --checkpoint-restore")
287
288 if options.standard_switch and not options.caches:
289 fatal("Must specify --caches when using --standard-switch")
290
291 if options.standard_switch and options.repeat_switch:
292 fatal("Can't specify both --standard-switch and --repeat-switch")
293
294 if options.repeat_switch and options.take_checkpoints:
295 fatal("Can't specify both --repeat-switch and --take-checkpoints")
296
297 np = options.num_cpus
298 switch_cpus = None
299
300 if options.prog_interval:
301 for i in xrange(np):
302 testsys.cpu[i].progress_interval = options.prog_interval
303
304 if options.maxinsts:
305 for i in xrange(np):
306 testsys.cpu[i].max_insts_any_thread = options.maxinsts
307
308 if cpu_class:
309 switch_cpus = [cpu_class(switched_out=True, cpu_id=(i))
310 for i in xrange(np)]
311
312 for i in xrange(np):
313 if options.fast_forward:
314 testsys.cpu[i].max_insts_any_thread = int(options.fast_forward)
315 switch_cpus[i].system = testsys
316 switch_cpus[i].workload = testsys.cpu[i].workload
317 switch_cpus[i].clock = testsys.cpu[i].clock
318 # simulation period
319 if options.maxinsts:
320 switch_cpus[i].max_insts_any_thread = options.maxinsts
321 # Add checker cpu if selected
322 if options.checker:
323 switch_cpus[i].addCheckerCpu()
324
325 testsys.switch_cpus = switch_cpus
326 switch_cpu_list = [(testsys.cpu[i], switch_cpus[i]) for i in xrange(np)]
327
328 if options.repeat_switch:
320 if options.cpu_type == "arm_detailed":
321 if not options.caches:
322 print "O3 CPU must be used with caches"
323 sys.exit(1)
324
325 repeat_switch_cpus = [O3_ARM_v7a_3(switched_out=True, \
326 cpu_id=(i)) for i in xrange(np)]
327 elif options.cpu_type == "detailed":
328 if not options.caches:
329 print "O3 CPU must be used with caches"
330 sys.exit(1)
331
332 repeat_switch_cpus = [DerivO3CPU(switched_out=True, \
333 cpu_id=(i)) for i in xrange(np)]
334 elif options.cpu_type == "inorder":
335 print "inorder CPU switching not supported"
329 switch_class = getCPUClass(options.cpu_type)[0]
330 if switch_class.require_caches() and \
331 not options.caches:
332 print "%s: Must be used with caches" % str(switch_class)
333 sys.exit(1)
337 elif options.cpu_type == "timing":
338 repeat_switch_cpus = [TimingSimpleCPU(switched_out=True, \
339 cpu_id=(i)) for i in xrange(np)]
340 else:
341 repeat_switch_cpus = [AtomicSimpleCPU(switched_out=True, \
342 cpu_id=(i)) for i in xrange(np)]
334 if not switch_class.support_take_over():
335 print "%s: CPU switching not supported" % str(switch_class)
336 sys.exit(1)
337
338 repeat_switch_cpus = [switch_class(switched_out=True, \
339 cpu_id=(i)) for i in xrange(np)]
340
341 for i in xrange(np):
342 repeat_switch_cpus[i].system = testsys
343 repeat_switch_cpus[i].workload = testsys.cpu[i].workload
344 repeat_switch_cpus[i].clock = testsys.cpu[i].clock
345
346 if options.maxinsts:
347 repeat_switch_cpus[i].max_insts_any_thread = options.maxinsts
348
349 if options.checker:
350 repeat_switch_cpus[i].addCheckerCpu()
351
352 testsys.repeat_switch_cpus = repeat_switch_cpus
353
354 if cpu_class:
355 repeat_switch_cpu_list = [(switch_cpus[i], repeat_switch_cpus[i])
356 for i in xrange(np)]
357 else:
358 repeat_switch_cpu_list = [(testsys.cpu[i], repeat_switch_cpus[i])
359 for i in xrange(np)]
360
361 if options.standard_switch:
362 switch_cpus = [TimingSimpleCPU(switched_out=True, cpu_id=(i))
363 for i in xrange(np)]
364 switch_cpus_1 = [DerivO3CPU(switched_out=True, cpu_id=(i))
365 for i in xrange(np)]
366
367 for i in xrange(np):
368 switch_cpus[i].system = testsys
369 switch_cpus_1[i].system = testsys
370 switch_cpus[i].workload = testsys.cpu[i].workload
371 switch_cpus_1[i].workload = testsys.cpu[i].workload
372 switch_cpus[i].clock = testsys.cpu[i].clock
373 switch_cpus_1[i].clock = testsys.cpu[i].clock
374
375 # if restoring, make atomic cpu simulate only a few instructions
376 if options.checkpoint_restore != None:
377 testsys.cpu[i].max_insts_any_thread = 1
378 # Fast forward to specified location if we are not restoring
379 elif options.fast_forward:
380 testsys.cpu[i].max_insts_any_thread = int(options.fast_forward)
381 # Fast forward to a simpoint (warning: time consuming)
382 elif options.simpoint:
383 if testsys.cpu[i].workload[0].simpoint == 0:
384 fatal('simpoint not found')
385 testsys.cpu[i].max_insts_any_thread = \
386 testsys.cpu[i].workload[0].simpoint
387 # No distance specified, just switch
388 else:
389 testsys.cpu[i].max_insts_any_thread = 1
390
391 # warmup period
392 if options.warmup_insts:
393 switch_cpus[i].max_insts_any_thread = options.warmup_insts
394
395 # simulation period
396 if options.maxinsts:
397 switch_cpus_1[i].max_insts_any_thread = options.maxinsts
398
399 # attach the checker cpu if selected
400 if options.checker:
401 switch_cpus[i].addCheckerCpu()
402 switch_cpus_1[i].addCheckerCpu()
403
404 testsys.switch_cpus = switch_cpus
405 testsys.switch_cpus_1 = switch_cpus_1
406 switch_cpu_list = [(testsys.cpu[i], switch_cpus[i]) for i in xrange(np)]
407 switch_cpu_list1 = [(switch_cpus[i], switch_cpus_1[i]) for i in xrange(np)]
408
409 # set the checkpoint in the cpu before m5.instantiate is called
410 if options.take_checkpoints != None and \
411 (options.simpoint or options.at_instruction):
412 offset = int(options.take_checkpoints)
413 # Set an instruction break point
414 if options.simpoint:
415 for i in xrange(np):
416 if testsys.cpu[i].workload[0].simpoint == 0:
417 fatal('no simpoint for testsys.cpu[%d].workload[0]', i)
418 checkpoint_inst = int(testsys.cpu[i].workload[0].simpoint) + offset
419 testsys.cpu[i].max_insts_any_thread = checkpoint_inst
420 # used for output below
421 options.take_checkpoints = checkpoint_inst
422 else:
423 options.take_checkpoints = offset
424 # Set all test cpus with the right number of instructions
425 # for the upcoming simulation
426 for i in xrange(np):
427 testsys.cpu[i].max_insts_any_thread = offset
428
429 checkpoint_dir = None
430 if options.checkpoint_restore != None:
431 maxtick, checkpoint_dir = findCptDir(options, maxtick, cptdir, testsys)
432 m5.instantiate(checkpoint_dir)
433
434 if options.standard_switch or cpu_class:
435 if options.standard_switch:
436 print "Switch at instruction count:%s" % \
437 str(testsys.cpu[0].max_insts_any_thread)
438 exit_event = m5.simulate()
439 elif cpu_class and options.fast_forward:
440 print "Switch at instruction count:%s" % \
441 str(testsys.cpu[0].max_insts_any_thread)
442 exit_event = m5.simulate()
443 else:
444 print "Switch at curTick count:%s" % str(10000)
445 exit_event = m5.simulate(10000)
446 print "Switched CPUS @ tick %s" % (m5.curTick())
447
448 # when you change to Timing (or Atomic), you halt the system
449 # given as argument. When you are finished with the system
450 # changes (including switchCpus), you must resume the system
451 # manually. You DON'T need to resume after just switching
452 # CPUs if you haven't changed anything on the system level.
453
454 m5.changeToTiming(testsys)
455 m5.switchCpus(switch_cpu_list)
456 m5.resume(testsys)
457
458 if options.standard_switch:
459 print "Switch at instruction count:%d" % \
460 (testsys.switch_cpus[0].max_insts_any_thread)
461
462 #warmup instruction count may have already been set
463 if options.warmup_insts:
464 exit_event = m5.simulate()
465 else:
466 exit_event = m5.simulate(options.standard_switch)
467 print "Switching CPUS @ tick %s" % (m5.curTick())
468 print "Simulation ends instruction count:%d" % \
469 (testsys.switch_cpus_1[0].max_insts_any_thread)
470 m5.drain(testsys)
471 m5.switchCpus(switch_cpu_list1)
472 m5.resume(testsys)
473
474 # If we're taking and restoring checkpoints, use checkpoint_dir
475 # option only for finding the checkpoints to restore from. This
476 # lets us test checkpointing by restoring from one set of
477 # checkpoints, generating a second set, and then comparing them.
478 if options.take_checkpoints and options.checkpoint_restore:
479 if m5.options.outdir:
480 cptdir = m5.options.outdir
481 else:
482 cptdir = getcwd()
483
484 if options.take_checkpoints != None :
485 # Checkpoints being taken via the command line at <when> and at
486 # subsequent periods of <period>. Checkpoint instructions
487 # received from the benchmark running are ignored and skipped in
488 # favor of command line checkpoint instructions.
489 exit_cause = scriptCheckpoints(options, maxtick, cptdir)
490 else:
491 if options.fast_forward:
492 m5.stats.reset()
493 print "**** REAL SIMULATION ****"
494
495 # If checkpoints are being taken, then the checkpoint instruction
496 # will occur in the benchmark code it self.
497 if options.repeat_switch and maxtick > options.repeat_switch:
498 exit_event = repeatSwitch(testsys, repeat_switch_cpu_list,
499 maxtick, options.repeat_switch)
500 else:
501 exit_event = benchCheckpoints(options, maxtick, cptdir)
502
503 print 'Exiting @ tick %i because %s' % (m5.curTick(), exit_event.getCause())
504 if options.checkpoint_at_end:
505 m5.checkpoint(joinpath(cptdir, "cpt.%d"))
506
507 if not m5.options.interactive:
508 sys.exit(exit_event.getCode())