2 * Copyright 2014 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 * Authors: Tom Stellard <thomas.stellard@amd.com>
27 #include "radeon_elf_util.h"
28 #include "r600_pipe_common.h"
30 #include "util/u_memory.h"
36 static void parse_symbol_table(Elf_Data
*symbol_table_data
,
37 const GElf_Shdr
*symbol_table_header
,
38 struct radeon_shader_binary
*binary
)
42 unsigned symbol_count
=
43 symbol_table_header
->sh_size
/ symbol_table_header
->sh_entsize
;
45 /* We are over allocating this list, because symbol_count gives the
46 * total number of symbols, and we will only be filling the list
47 * with offsets of global symbols. The memory savings from
48 * allocating the correct size of this list will be small, and
49 * I don't think it is worth the cost of pre-computing the number
52 binary
->global_symbol_offsets
= CALLOC(symbol_count
, sizeof(uint64_t));
54 while (gelf_getsym(symbol_table_data
, i
++, &symbol
)) {
56 if (GELF_ST_BIND(symbol
.st_info
) != STB_GLOBAL
||
57 symbol
.st_shndx
== 0 /* Undefined symbol */) {
61 binary
->global_symbol_offsets
[binary
->global_symbol_count
] =
64 /* Sort the list using bubble sort. This list will usually
66 for (i
= binary
->global_symbol_count
; i
> 0; --i
) {
67 uint64_t lhs
= binary
->global_symbol_offsets
[i
- 1];
68 uint64_t rhs
= binary
->global_symbol_offsets
[i
];
72 binary
->global_symbol_offsets
[i
] = lhs
;
73 binary
->global_symbol_offsets
[i
- 1] = rhs
;
75 ++binary
->global_symbol_count
;
79 static void parse_relocs(Elf
*elf
, Elf_Data
*relocs
, Elf_Data
*symbols
,
80 unsigned symbol_sh_link
,
81 struct radeon_shader_binary
*binary
)
85 if (!relocs
|| !symbols
|| !binary
->reloc_count
) {
88 binary
->relocs
= CALLOC(binary
->reloc_count
,
89 sizeof(struct radeon_shader_reloc
));
90 for (i
= 0; i
< binary
->reloc_count
; i
++) {
94 struct radeon_shader_reloc
*reloc
= &binary
->relocs
[i
];
96 gelf_getrel(relocs
, i
, &rel
);
97 gelf_getsym(symbols
, GELF_R_SYM(rel
.r_info
), &symbol
);
98 symbol_name
= elf_strptr(elf
, symbol_sh_link
, symbol
.st_name
);
100 reloc
->offset
= rel
.r_offset
;
101 reloc
->name
= strdup(symbol_name
);
105 void radeon_elf_read(const char *elf_data
, unsigned elf_size
,
106 struct radeon_shader_binary
*binary
)
110 Elf_Scn
*section
= NULL
;
111 Elf_Data
*symbols
= NULL
, *relocs
= NULL
;
112 size_t section_str_index
;
113 unsigned symbol_sh_link
= 0;
115 /* One of the libelf implementations
116 * (http://www.mr511.de/software/english.htm) requires calling
117 * elf_version() before elf_memory().
119 elf_version(EV_CURRENT
);
120 elf_buffer
= MALLOC(elf_size
);
121 memcpy(elf_buffer
, elf_data
, elf_size
);
123 elf
= elf_memory(elf_buffer
, elf_size
);
125 elf_getshdrstrndx(elf
, §ion_str_index
);
127 while ((section
= elf_nextscn(elf
, section
))) {
129 Elf_Data
*section_data
= NULL
;
130 GElf_Shdr section_header
;
131 if (gelf_getshdr(section
, §ion_header
) != §ion_header
) {
132 fprintf(stderr
, "Failed to read ELF section header\n");
135 name
= elf_strptr(elf
, section_str_index
, section_header
.sh_name
);
136 if (!strcmp(name
, ".text")) {
137 section_data
= elf_getdata(section
, section_data
);
138 binary
->code_size
= section_data
->d_size
;
139 binary
->code
= MALLOC(binary
->code_size
* sizeof(unsigned char));
140 memcpy(binary
->code
, section_data
->d_buf
, binary
->code_size
);
141 } else if (!strcmp(name
, ".AMDGPU.config")) {
142 section_data
= elf_getdata(section
, section_data
);
143 binary
->config_size
= section_data
->d_size
;
144 binary
->config
= MALLOC(binary
->config_size
* sizeof(unsigned char));
145 memcpy(binary
->config
, section_data
->d_buf
, binary
->config_size
);
146 } else if (!strcmp(name
, ".AMDGPU.disasm")) {
147 /* Always read disassembly if it's available. */
148 section_data
= elf_getdata(section
, section_data
);
149 binary
->disasm_string
= strndup(section_data
->d_buf
,
150 section_data
->d_size
);
151 } else if (!strncmp(name
, ".rodata", 7)) {
152 section_data
= elf_getdata(section
, section_data
);
153 binary
->rodata_size
= section_data
->d_size
;
154 binary
->rodata
= MALLOC(binary
->rodata_size
* sizeof(unsigned char));
155 memcpy(binary
->rodata
, section_data
->d_buf
, binary
->rodata_size
);
156 } else if (!strncmp(name
, ".symtab", 7)) {
157 symbols
= elf_getdata(section
, section_data
);
158 symbol_sh_link
= section_header
.sh_link
;
159 parse_symbol_table(symbols
, §ion_header
, binary
);
160 } else if (!strcmp(name
, ".rel.text")) {
161 relocs
= elf_getdata(section
, section_data
);
162 binary
->reloc_count
= section_header
.sh_size
/
163 section_header
.sh_entsize
;
167 parse_relocs(elf
, relocs
, symbols
, symbol_sh_link
, binary
);
174 /* Cache the config size per symbol */
175 if (binary
->global_symbol_count
) {
176 binary
->config_size_per_symbol
=
177 binary
->config_size
/ binary
->global_symbol_count
;
179 binary
->global_symbol_count
= 1;
180 binary
->config_size_per_symbol
= binary
->config_size
;
184 const unsigned char *radeon_shader_binary_config_start(
185 const struct radeon_shader_binary
*binary
,
186 uint64_t symbol_offset
)
189 for (i
= 0; i
< binary
->global_symbol_count
; ++i
) {
190 if (binary
->global_symbol_offsets
[i
] == symbol_offset
) {
191 unsigned offset
= i
* binary
->config_size_per_symbol
;
192 return binary
->config
+ offset
;
195 return binary
->config
;
198 void radeon_shader_binary_free_relocs(struct radeon_shader_reloc
*relocs
,
199 unsigned reloc_count
)
202 for (i
= 0; i
< reloc_count
; i
++) {
203 FREE(relocs
[i
].name
);
208 void radeon_shader_binary_free_members(struct radeon_shader_binary
*binary
,
209 unsigned free_relocs
)
212 FREE(binary
->config
);
213 FREE(binary
->rodata
);
216 radeon_shader_binary_free_relocs(binary
->relocs
,
217 binary
->reloc_count
);