2 # Copyright (c) 2010-2015 Advanced Micro Devices, Inc.
5 # For use for simulation and test purposes only
7 # Redistribution and use in source and binary forms, with or without
8 # modification, are permitted provided that the following conditions are met:
10 # 1. Redistributions of source code must retain the above copyright notice,
11 # this list of conditions and the following disclaimer.
13 # 2. Redistributions in binary form must reproduce the above copyright notice,
14 # this list of conditions and the following disclaimer in the documentation
15 # and/or other materials provided with the distribution.
17 # 3. Neither the name of the copyright holder nor the names of its contributors
18 # may be used to endorse or promote products derived from this software
19 # without specific prior written permission.
21 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25 # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31 # POSSIBILITY OF SUCH DAMAGE.
33 # Author: Brad Beckmann
37 from m5
.objects
import *
38 from m5
.defines
import buildEnv
39 from m5
.util
import addToPath
40 import os
, optparse
, sys
41 addToPath('../common')
43 addToPath('../topologies')
# Resolve the directory holding this script, then its parent and
# grandparent directories, so later code can build paths relative to them.
config_path = os.path.dirname(os.path.abspath(__file__))
config_root = os.path.dirname(config_path)
m5_root = os.path.dirname(config_root)
# Build the command-line parser: let Options register the common options
# first, then add the knobs that are specific to this script.
parser = optparse.OptionParser()
Options.addCommonOptions(parser)

# Tester run length and wakeup interval.
parser.add_option(
    "--maxloads",
    metavar="N",
    default=100,
    help="Stop after N loads",
)
parser.add_option(
    "-f", "--wakeup_freq",
    metavar="N",
    default=10,
    help="Wakeup every N cycles",
)

# GPU shape: compute units and command processors.
parser.add_option(
    "-u", "--num-compute-units",
    type="int",
    default=1,
    help="number of compute units in the GPU",
)
parser.add_option(
    "--num-cp",
    type="int",
    default=0,
    help="Number of GPU Command Processors (CP)",
)
# Not critical right now, but expose the number of CUs sharing one SQC as an
# option so the number 4 does not have to be repeated everywhere.
#
# The help text is built from adjacent string literals. A backslash
# line-continuation inside a single literal would embed the following line's
# leading indentation in the displayed message.
parser.add_option(
    "--cu-per-sqc",
    type="int",
    default=4,
    help="number of CUs "
         "sharing an SQC (icache, and thus icache TLB)",
)
68 parser
.add_option("--simds-per-cu", type="int", default
=4, help="SIMD units" \
# Wavefront width, counted in work-items.
parser.add_option(
    "--wf-size",
    type="int",
    default=64,
    help="Wavefront size(in workitems)",
)
72 parser
.add_option("--wfs-per-simd", type="int", default
=10, help="Number of " \
# Let Ruby register its own options, including the protocol-specific ones.
Ruby.define_options(parser)

# Execute common/Options.py (found under config_root) in this script's
# namespace.
execfile(os.path.join(config_root, "common", "Options.py"))

# Parse the command line into option values and leftover positional args.
options, args = parser.parse_args()
# Force very small L1 data, L1 instruction and L2 cache sizes so that
# requests and writebacks race against each other as often as possible.
options.l1d_size = "256B"
options.l1i_size = "256B"
options.l2_size = "512B"
# Any number of compute units is supported, as long as there is at least one.
assert options.num_compute_units >= 1
n_cu = options.num_compute_units

# Number of SQCs = ceil(n_cu / cu_per_sqc). Floor division ("//") keeps the
# round-up arithmetic in integers no matter how "/" behaves for ints.
options.num_sqc = int((n_cu + options.cu_per_sqc - 1) // options.cu_per_sqc)
104 print "Error: script doesn't take any positional arguments"
# Create the Ruby random tester.
#
# Only the GPU_RfO protocol is accepted here: the other GPU protocols are
# non-SC and will not work with the Ruby random tester.
assert buildEnv['PROTOCOL'] == 'GPU_RfO'

# The GPU_RfO protocol does not support cache flushes; check_flush is handed
# to the tester unchanged.
tester = RubyTester(
    check_flush=check_flush,
    checks_to_complete=options.maxloads,
    wakeup_frequency=options.wakeup_freq,
    deadlock_threshold=1000000,
)
# Create the M5 system. The tester does not actually use the memory object;
# the memory range is supplied only so that the "M5 memory size == Ruby
# memory size" checks are satisfied.
system = System(
    cpu=tester,
    mem_ranges=[AddrRange(options.mem_size)],
)
# Top-level voltage domain, driven by the sys_voltage option.
system.voltage_domain = VoltageDomain(voltage=options.sys_voltage)

# Top-level clock domain, clocked by the sys_clock option and tied to the
# voltage domain created above.
system.clk_domain = SrcClockDomain(
    clock=options.sys_clock,
    voltage_domain=system.voltage_domain,
)
# Have Ruby build its part of the system; the second argument is passed as
# False.
Ruby.create_system(options, False, system)

# Give Ruby a separate clock domain, clocked by the ruby_clock option but
# sharing the system voltage domain.
system.ruby.clk_domain = SrcClockDomain(
    clock=options.ruby_clock,
    voltage_domain=system.voltage_domain,
)

# The tester's CPU count is the number of CPU ports Ruby created.
tester.num_cpus = len(system.ruby._cpu_ports)
# The tester is most effective when randomization is turned on and
# artificial delay is randomly inserted on messages.
system.ruby.randomization = True

for ruby_port in system.ruby._cpu_ports:
    # Tie the tester to this Ruby port. Which tester port is used depends on
    # the request kinds the Ruby port supports: both, data only, or
    # instruction only.
    if ruby_port.support_data_reqs:
        if ruby_port.support_inst_reqs:
            tester.cpuInstDataPort = ruby_port.slave
        else:
            tester.cpuDataPort = ruby_port.slave
    elif ruby_port.support_inst_reqs:
        tester.cpuInstPort = ruby_port.slave

    # Do not automatically retry stalled Ruby requests.
    ruby_port.no_retry_on_stall = True

    # Tell each sequencer this is the ruby tester so that it copies the
    # subblock back to the checker.
    ruby_port.using_ruby_tester = True
# Wrap the system in the root object with full-system mode off, and select
# the 'timing' memory mode.
root = Root(full_system=False, system=system)
root.system.mem_mode = 'timing'

# Not much point in this being higher than the L1 latency.
m5.ticks.setGlobalFrequency('1ns')
181 # instantiate configuration
# Run the simulation until the program terminates, handing
# options.abs_max_tick to m5.simulate().
exit_event = m5.simulate(options.abs_max_tick)

# Report the final tick and the exit cause. The message is formatted into a
# single argument so the same text is printed whether print is a statement
# or a function.
print('Exiting @ tick %s because %s' % (m5.curTick(), exit_event.getCause()))