2 # Copyright (c) 2010-2015 Advanced Micro Devices, Inc.
5 # For use for simulation and test purposes only
7 # Redistribution and use in source and binary forms, with or without
8 # modification, are permitted provided that the following conditions are met:
10 # 1. Redistributions of source code must retain the above copyright notice,
11 # this list of conditions and the following disclaimer.
13 # 2. Redistributions in binary form must reproduce the above copyright notice,
14 # this list of conditions and the following disclaimer in the documentation
15 # and/or other materials provided with the distribution.
17 # 3. Neither the name of the copyright holder nor the names of its contributors
18 # may be used to endorse or promote products derived from this software
19 # without specific prior written permission.
21 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25 # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31 # POSSIBILITY OF SUCH DAMAGE.
33 # Author: Brad Beckmann
import os
import optparse
import sys

import m5
from m5.objects import *
from m5.defines import buildEnv
from m5.util import addToPath

# NOTE(review): addToPath is imported but never called in the visible part of
# this file, so `common` must already be importable here -- confirm.
from common import Options
# Get paths we might need.  config_path is the directory containing this
# script; config_root and m5_root are its parent and grandparent directories.
config_path = os.path.dirname(os.path.abspath(__file__))
config_root = os.path.dirname(config_path)
m5_root = os.path.dirname(config_root)
# Build the command-line parser and let the shared Options module register
# its options via addNoISAOptions before the tester-specific ones are added.
parser = optparse.OptionParser()
Options.addNoISAOptions(parser)

# Random-tester knobs.
parser.add_option("--maxloads", metavar="N", default=100,
                  help="Stop after N loads")
parser.add_option("-f", "--wakeup_freq", metavar="N", default=10,
                  help="Wakeup every N cycles")

# GPU size knobs.
parser.add_option("-u", "--num-compute-units", type="int", default=1,
                  help="number of compute units in the GPU")
parser.add_option("--num-cp", type="int", default=0,
                  help="Number of GPU Command Processors (CP)")
# Not super important now, but to avoid putting the number 4 everywhere, make
# it an option.
# The help text is a single literal (no backslash continuation inside the
# string) so that no source-layout whitespace ends up in the --help output.
parser.add_option("--cu-per-sqc", type="int", default=4,
                  help="number of CUs sharing an SQC "
                       "(icache, and thus icache TLB)")
# NOTE(review): the help text for this option appears truncated in this copy
# of the file (a continuation line is missing) -- confirm the full wording.
parser.add_option("--simds-per-cu", type="int", default=4,
                  help="SIMD units")
parser.add_option("--wf-size", type="int", default=64,
                  help="Wavefront size(in workitems)")
# NOTE(review): the help text for this option appears truncated in this copy
# of the file (a continuation line is missing) -- confirm the full wording.
parser.add_option("--wfs-per-simd", type="int", default=10,
                  help="Number of ")
#
# Add the ruby specific and protocol specific options
#
# NOTE(review): no import of `Ruby` is visible in this file -- confirm it is
# brought into scope before this point.
Ruby.define_options(parser)

# Run common/Options.py in this script's namespace.
# execfile is a Python 2 builtin; this script targets Python 2.
execfile(os.path.join(config_root, "common", "Options.py"))

# `options` holds the parsed option values, `args` any leftover positionals.
(options, args) = parser.parse_args()
#
# Set the default cache size and associativity to be very small to encourage
# races between requests and writebacks.
#
# These assignments overwrite whatever values the parser produced.
options.l1d_size = "256B"
options.l1i_size = "256B"
options.l2_size = "512B"
# This file can support multiple compute units
assert(options.num_compute_units >= 1)
n_cu = options.num_compute_units

# Number of SQCs is ceil(n_cu / cu_per_sqc).  Floor division (//) is used
# explicitly so the result does not depend on how `/` treats integers.
options.num_sqc = (n_cu + options.cu_per_sqc - 1) // options.cu_per_sqc
# The script is configured through options only; bail out if the parser left
# any positional arguments behind.
if args:
    print("Error: script doesn't take any positional arguments")
    sys.exit(1)
#
# Create the ruby random tester
#

# Check for the GPU_RfO protocol.  Other GPU protocols are non-SC and will
# not work with the Ruby random tester.
assert(buildEnv['PROTOCOL'] == 'GPU_RfO')

# The GPU_RfO protocol does not support cache flushes
check_flush = False

tester = RubyTester(check_flush=check_flush,
                    checks_to_complete=options.maxloads,
                    wakeup_frequency=options.wakeup_freq,
                    deadlock_threshold=1000000)
#
# Create the M5 system.  Note that the Memory Object isn't
# actually used by the rubytester, but is included to support the
# M5 memory size == Ruby memory size checks
#
system = System(cpu=tester, mem_ranges=[AddrRange(options.mem_size)])

# Create a top-level voltage domain and clock domain
system.voltage_domain = VoltageDomain(voltage=options.sys_voltage)

system.clk_domain = SrcClockDomain(clock=options.sys_clock,
                                   voltage_domain=system.voltage_domain)

# Attach Ruby to the system; this must come before system.ruby is accessed.
Ruby.create_system(options, False, system)

# Create a separate clock domain for Ruby
system.ruby.clk_domain = SrcClockDomain(clock=options.ruby_clock,
                                        voltage_domain=system.voltage_domain)

# The tester's CPU count is the number of Ruby CPU ports.
tester.num_cpus = len(system.ruby._cpu_ports)
#
# The tester is most effective when randomization is turned on and
# artificial delay is randomly inserted on messages
#
system.ruby.randomization = True

for ruby_port in system.ruby._cpu_ports:

    #
    # Tie the ruby tester ports to the ruby cpu read and write ports
    #
    # The tester port is chosen by which request kinds the Ruby port supports.
    if ruby_port.support_data_reqs and ruby_port.support_inst_reqs:
        tester.cpuInstDataPort = ruby_port.slave
    elif ruby_port.support_data_reqs:
        tester.cpuDataPort = ruby_port.slave
    elif ruby_port.support_inst_reqs:
        tester.cpuInstPort = ruby_port.slave

    # Do not automatically retry stalled Ruby requests
    ruby_port.no_retry_on_stall = True

    #
    # Tell each sequencer this is the ruby tester so that it
    # copies the subblock back to the checker
    #
    ruby_port.using_ruby_tester = True
170 # -----------------------
172 # -----------------------
# Wrap the system in the simulation root and select timing-mode memory.
root = Root(full_system=False, system=system)
root.system.mem_mode = 'timing'

# Not much point in this being higher than the L1 latency
m5.ticks.setGlobalFrequency('1ns')
# instantiate configuration
m5.instantiate()

# simulate until program terminates
exit_event = m5.simulate(options.abs_max_tick)

# A single pre-formatted string keeps the output identical whether print is
# parsed as a statement or called as a function.
print('Exiting @ tick %s because %s'
      % (m5.curTick(), exit_event.getCause()))