3 * Copyright © 2020 Intel Corporation
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
25 #ifndef BRW_IR_PERFORMANCE_H
26 #define BRW_IR_PERFORMANCE_H
34 * Various estimates of the performance of a shader based on static analysis.
/**
 * Declaration with no return type, taking a read-only pointer to an
 * fs_visitor. Only the declaration is visible here; the definition lives
 * elsewhere.
 *
 * NOTE(review): presumably this computes the estimates stored in this
 * object from the program held by \p v -- confirm against the definition.
 */
38 performance(const fs_visitor
*v
);
/**
 * Overload of the declaration above that takes a read-only pointer to a
 * vec4_visitor instead. Only the declaration is visible here.
 *
 * NOTE(review): presumably the vec4 counterpart of the fs_visitor overload
 * -- confirm against the definition.
 */
39 performance(const vec4_visitor
*v
);
/**
 * Const member returning an analysis_dependency_class value.
 *
 * The visible part of the return expression ORs DEPENDENCY_INSTRUCTIONS
 * with at least one further operand that is not visible in this excerpt.
 *
 * NOTE(review): presumably the result tells an analysis framework which
 * kinds of program change invalidate these estimates -- confirm against
 * the declaration of analysis_dependency_class.
 */
42 analysis_dependency_class
43 dependency_class() const
45 return (DEPENDENCY_INSTRUCTIONS
|
/**
 * Const member taking an unnamed read-only backend_shader pointer; because
 * the parameter is unnamed, the argument cannot be referenced by the body.
 * The return type and the body are not visible in this excerpt.
 *
 * NOTE(review): presumably a consistency-check hook for the analysis
 * framework -- confirm what it returns.
 */
50 validate(const backend_shader
*) const
56 * Array containing estimates of the runtime of each basic block of the
57 * program in cycle units.
/* Raw pointer to unsigned values. The allocation, the element count and
 * the owner of this storage are not visible in this excerpt.
 * NOTE(review): presumably one entry per basic block -- confirm where it
 * is allocated and freed.
 */
59 unsigned *block_latency
;
62 * Estimate of the runtime of the whole program in cycle units assuming
63 * uncontended execution.
68 * Estimate of the throughput of the whole program in
69 * invocations-per-cycle units.
71 * Note that this might be lower than the ratio between the dispatch
72 * width of the program and its latency estimate in cases where
73 * performance doesn't scale without limits as a function of its thread
74 * parallelism, e.g. due to the existence of a bottleneck in a shared function.
/**
 * Copy-constructor-shaped declaration: takes a const reference to another
 * performance object. No definition is visible in this excerpt.
 *
 * NOTE(review): the object holds a raw pointer (block_latency), so a
 * member-wise copy would alias that storage. Confirm whether this
 * declaration exists to forbid copying (e.g. declared in a private section
 * and never defined) or whether a deep copy is implemented elsewhere.
 */
80 performance(const performance
&perf
);
/**
 * Assignment operator declaration taking its right-hand side by value
 * (a performance object, not a reference). The return type and any
 * definition are not visible in this excerpt.
 *
 * NOTE(review): passing by value requires an accessible copy constructor
 * at the call site -- confirm whether assignment is meant to be usable or
 * is declared only to forbid it.
 */
82 operator=(performance u
);