intel/nir: Stop using nir_lower_vars_to_scratch
[mesa.git] / src / intel / compiler / brw_ir_performance.h
1 /* -*- c++ -*- */
2 /*
3 * Copyright © 2020 Intel Corporation
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24
25 #ifndef BRW_IR_PERFORMANCE_H
26 #define BRW_IR_PERFORMANCE_H
27
28 class fs_visitor;
29
30 namespace brw {
31 class vec4_visitor;
32
33 /**
34 * Various estimates of the performance of a shader based on static
35 * analysis.
36 */
37 struct performance {
38 performance(const fs_visitor *v);
39 performance(const vec4_visitor *v);
40 ~performance();
41
42 analysis_dependency_class
43 dependency_class() const
44 {
45 return (DEPENDENCY_INSTRUCTIONS |
46 DEPENDENCY_BLOCKS);
47 }
48
49 bool
50 validate(const backend_shader *) const
51 {
52 return true;
53 }
54
55 /**
56 * Array containing estimates of the runtime of each basic block of the
57 * program in cycle units.
58 */
59 unsigned *block_latency;
60
61 /**
62 * Estimate of the runtime of the whole program in cycle units assuming
63 * uncontended execution.
64 */
65 unsigned latency;
66
67 /**
68 * Estimate of the throughput of the whole program in
69 * invocations-per-cycle units.
70 *
71 * Note that this might be lower than the ratio between the dispatch
72 * width of the program and its latency estimate in cases where
73 * performance doesn't scale without limits as a function of its thread
74 * parallelism, e.g. due to the existence of a bottleneck in a shared
75 * function.
76 */
77 float throughput;
78
79 private:
80 performance(const performance &perf);
81 performance &
82 operator=(performance u);
83 };
84 }
85
86 #endif