ac: fix num_good_cu_per_sh for harvested chips
[mesa.git] / src / amd / common / ac_rtld.h
/*
 * Copyright 2014-2019 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
23
24 #ifndef AC_RTLD_H
25 #define AC_RTLD_H
26
27 #include <stdbool.h>
28 #include <stdint.h>
29 #include <stddef.h>
30
31 #include "util/u_dynarray.h"
32 #include "compiler/shader_enums.h"
33
/* Opaque types: this header only refers to them through pointers, so
 * forward declarations are sufficient here. */
struct ac_rtld_part;
struct ac_shader_config;
struct radeon_info;
37
/**
 * Description of a named symbol with a size and an alignment requirement.
 *
 * NOTE(review): presumably these describe LDS symbols, since the type is used
 * for the shared_lds_symbols array of struct ac_rtld_open_info -- confirm
 * against the implementation.
 */
struct ac_rtld_symbol {
   const char *name;
   uint32_t size;
   uint32_t align;
   uint64_t offset;   /* filled in by ac_rtld_open */
   unsigned part_idx; /* shader part in which this symbol appears */
};
45
/** Flags that adjust how the loader prepares a binary. */
struct ac_rtld_options {
   /* Loader will insert an s_sethalt 1 instruction as the
    * first instruction. */
   bool halt_at_entry : 1;
};
51
52 /* Lightweight wrapper around underlying ELF objects. */
53 struct ac_rtld_binary {
54 struct ac_rtld_options options;
55 unsigned wave_size;
56
57 /* Required buffer sizes, currently read/executable only. */
58 uint64_t rx_size;
59
60 /* Size of executable code, for reporting purposes. */
61 uint64_t exec_size;
62
63 uint64_t rx_end_markers;
64
65 unsigned num_parts;
66 struct ac_rtld_part *parts;
67
68 struct util_dynarray lds_symbols;
69 uint32_t lds_size;
70 };
71
/**
 * Callback function type used during upload to resolve external symbols,
 * i.e. symbols that are not defined in any of the ELF binaries available to
 * the linker.
 *
 * \param cb_data caller-defined data
 * \param symbol  NUL-terminated symbol name
 * \param value   to be filled in by the callback
 * \return whether the symbol was found successfully
 */
typedef bool (*ac_rtld_get_external_symbol_cb)(void *cb_data,
                                               const char *symbol,
                                               uint64_t *value);
83
84 /**
85 * Lifetimes of \ref info, in-memory ELF objects, and the names of
86 * \ref shared_lds_symbols must extend until \ref ac_rtld_close is called on
87 * the opened binary.
88 */
89 struct ac_rtld_open_info {
90 const struct radeon_info *info;
91 struct ac_rtld_options options;
92 gl_shader_stage shader_type;
93 unsigned wave_size;
94
95 unsigned num_parts;
96 const char * const *elf_ptrs; /* in-memory ELF objects of each part */
97 const size_t *elf_sizes; /* sizes of corresponding in-memory ELF objects in bytes */
98
99 /* Shared LDS symbols are layouted such that they are accessible from
100 * all shader parts. Non-shared (private) LDS symbols of one part may
101 * overlap private LDS symbols of another shader part.
102 */
103 unsigned num_shared_lds_symbols;
104 const struct ac_rtld_symbol *shared_lds_symbols;
105 };
106
/**
 * Open \p binary from the description given in \p i.
 *
 * The lifetime requirements documented on struct ac_rtld_open_info apply
 * until ac_rtld_close is called on \p binary. The offset field of
 * struct ac_rtld_symbol entries is filled in by this function.
 *
 * NOTE(review): the bool result presumably reports success -- confirm against
 * the implementation.
 */
bool ac_rtld_open(struct ac_rtld_binary *binary,
                  struct ac_rtld_open_info i);
109
/**
 * Close a binary that was opened with ac_rtld_open.
 *
 * Per the documentation of struct ac_rtld_open_info, the data referenced by
 * the open info only has to stay alive until this call.
 */
void ac_rtld_close(struct ac_rtld_binary *binary);
111
/**
 * Look up a section of \p binary by its \p name.
 *
 * NOTE(review): \p data and \p nbytes are presumably output parameters that
 * receive the section contents and their size, and the result presumably
 * reports whether the section was found -- confirm against the
 * implementation.
 */
bool ac_rtld_get_section_by_name(struct ac_rtld_binary *binary, const char *name,
                                 const char **data, size_t *nbytes);
114
/**
 * Read the shader configuration of \p binary into \p config.
 *
 * NOTE(review): the bool result presumably reports success; where the
 * configuration is read from is not visible in this header -- confirm
 * against the implementation.
 */
bool ac_rtld_read_config(struct ac_rtld_binary *binary,
                         struct ac_shader_config *config);
117
118 struct ac_rtld_upload_info {
119 struct ac_rtld_binary *binary;
120
121 /** GPU mapping of the read/executable buffer. */
122 uint64_t rx_va;
123
124 /** CPU mapping of the read/executable buffer */
125 char *rx_ptr;
126
127 /** Optional callback function that will be queried for symbols not
128 * defined in any of the binary's parts. */
129 ac_rtld_get_external_symbol_cb get_external_symbol;
130
131 /** Caller-defined data that will be passed to callback functions. */
132 void *cb_data;
133 };
134
/**
 * Upload the binary described by \p u.
 *
 * NOTE(review): presumably writes through u->rx_ptr and resolves symbols
 * relative to u->rx_va, with the bool result reporting success -- confirm
 * against the implementation.
 */
bool ac_rtld_upload(struct ac_rtld_upload_info *u);
136
137 #endif /* AC_RTLD_H */