Introduce partial_symtab::read_symtab method
[binutils-gdb.git] / gdb / dwarf-index-write.c
1 /* DWARF index writing support for GDB.
2
3 Copyright (C) 1994-2020 Free Software Foundation, Inc.
4
5 This file is part of GDB.
6
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
11
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with this program. If not, see <http://www.gnu.org/licenses/>. */
19
20 #include "defs.h"
21
22 #include "dwarf-index-write.h"
23
24 #include "addrmap.h"
25 #include "cli/cli-decode.h"
26 #include "gdbsupport/byte-vector.h"
27 #include "gdbsupport/filestuff.h"
28 #include "gdbsupport/gdb_unlinker.h"
29 #include "gdbsupport/pathstuff.h"
30 #include "gdbsupport/scoped_fd.h"
31 #include "complaints.h"
32 #include "dwarf-index-common.h"
33 #include "dwarf2.h"
34 #include "dwarf2read.h"
35 #include "gdb/gdb-index.h"
36 #include "gdbcmd.h"
37 #include "objfiles.h"
38 #include "psympriv.h"
39 #include "ada-lang.h"
40
41 #include <algorithm>
42 #include <cmath>
43 #include <set>
44 #include <unordered_map>
45 #include <unordered_set>
46
47 /* Ensure only legit values are used. */
48 #define DW2_GDB_INDEX_SYMBOL_STATIC_SET_VALUE(cu_index, value) \
49 do { \
50 gdb_assert ((unsigned int) (value) <= 1); \
51 GDB_INDEX_SYMBOL_STATIC_SET_VALUE((cu_index), (value)); \
52 } while (0)
53
54 /* Ensure only legit values are used. */
55 #define DW2_GDB_INDEX_SYMBOL_KIND_SET_VALUE(cu_index, value) \
56 do { \
57 gdb_assert ((value) >= GDB_INDEX_SYMBOL_KIND_TYPE \
58 && (value) <= GDB_INDEX_SYMBOL_KIND_OTHER); \
59 GDB_INDEX_SYMBOL_KIND_SET_VALUE((cu_index), (value)); \
60 } while (0)
61
62 /* Ensure we don't use more than the allotted number of bits for the CU. */
63 #define DW2_GDB_INDEX_CU_SET_VALUE(cu_index, value) \
64 do { \
65 gdb_assert (((value) & ~GDB_INDEX_CU_MASK) == 0); \
66 GDB_INDEX_CU_SET_VALUE((cu_index), (value)); \
67 } while (0)
68
69 /* The "save gdb-index" command. */
70
71 /* Write SIZE bytes from the buffer pointed to by DATA to FILE, with
72 error checking. */
73
74 static void
75 file_write (FILE *file, const void *data, size_t size)
76 {
77 if (fwrite (data, 1, size, file) != size)
78 error (_("couldn't data write to file"));
79 }
80
81 /* Write the contents of VEC to FILE, with error checking. */
82
83 template<typename Elem, typename Alloc>
84 static void
85 file_write (FILE *file, const std::vector<Elem, Alloc> &vec)
86 {
87 if (!vec.empty ())
88 file_write (file, vec.data (), vec.size () * sizeof (vec[0]));
89 }
90
91 /* In-memory buffer to prepare data to be written later to a file. */
92 class data_buf
93 {
94 public:
95 /* Copy DATA to the end of the buffer. */
96 template<typename T>
97 void append_data (const T &data)
98 {
99 std::copy (reinterpret_cast<const gdb_byte *> (&data),
100 reinterpret_cast<const gdb_byte *> (&data + 1),
101 grow (sizeof (data)));
102 }
103
104 /* Copy CSTR (a zero-terminated string) to the end of buffer. The
105 terminating zero is appended too. */
106 void append_cstr0 (const char *cstr)
107 {
108 const size_t size = strlen (cstr) + 1;
109 std::copy (cstr, cstr + size, grow (size));
110 }
111
112 /* Store INPUT as ULEB128 to the end of buffer. */
113 void append_unsigned_leb128 (ULONGEST input)
114 {
115 for (;;)
116 {
117 gdb_byte output = input & 0x7f;
118 input >>= 7;
119 if (input)
120 output |= 0x80;
121 append_data (output);
122 if (input == 0)
123 break;
124 }
125 }
126
127 /* Accept a host-format integer in VAL and append it to the buffer
128 as a target-format integer which is LEN bytes long. */
129 void append_uint (size_t len, bfd_endian byte_order, ULONGEST val)
130 {
131 ::store_unsigned_integer (grow (len), len, byte_order, val);
132 }
133
134 /* Return the size of the buffer. */
135 size_t size () const
136 {
137 return m_vec.size ();
138 }
139
140 /* Return true iff the buffer is empty. */
141 bool empty () const
142 {
143 return m_vec.empty ();
144 }
145
146 /* Write the buffer to FILE. */
147 void file_write (FILE *file) const
148 {
149 ::file_write (file, m_vec);
150 }
151
152 private:
153 /* Grow SIZE bytes at the end of the buffer. Returns a pointer to
154 the start of the new block. */
155 gdb_byte *grow (size_t size)
156 {
157 m_vec.resize (m_vec.size () + size);
158 return &*(m_vec.end () - size);
159 }
160
161 gdb::byte_vector m_vec;
162 };
163
164 /* An entry in the symbol table. */
165 struct symtab_index_entry
166 {
167 /* The name of the symbol. */
168 const char *name;
169 /* The offset of the name in the constant pool. */
170 offset_type index_offset;
171 /* A sorted vector of the indices of all the CUs that hold an object
172 of this name. */
173 std::vector<offset_type> cu_indices;
174 };
175
176 /* The symbol table. This is a power-of-2-sized hash table. */
177 struct mapped_symtab
178 {
179 mapped_symtab ()
180 {
181 data.resize (1024);
182 }
183
184 offset_type n_elements = 0;
185 std::vector<symtab_index_entry> data;
186 };
187
188 /* Find a slot in SYMTAB for the symbol NAME. Returns a reference to
189 the slot.
190
191 Function is used only during write_hash_table so no index format backward
192 compatibility is needed. */
193
194 static symtab_index_entry &
195 find_slot (struct mapped_symtab *symtab, const char *name)
196 {
197 offset_type index, step, hash = mapped_index_string_hash (INT_MAX, name);
198
199 index = hash & (symtab->data.size () - 1);
200 step = ((hash * 17) & (symtab->data.size () - 1)) | 1;
201
202 for (;;)
203 {
204 if (symtab->data[index].name == NULL
205 || strcmp (name, symtab->data[index].name) == 0)
206 return symtab->data[index];
207 index = (index + step) & (symtab->data.size () - 1);
208 }
209 }
210
211 /* Expand SYMTAB's hash table. */
212
213 static void
214 hash_expand (struct mapped_symtab *symtab)
215 {
216 auto old_entries = std::move (symtab->data);
217
218 symtab->data.clear ();
219 symtab->data.resize (old_entries.size () * 2);
220
221 for (auto &it : old_entries)
222 if (it.name != NULL)
223 {
224 auto &ref = find_slot (symtab, it.name);
225 ref = std::move (it);
226 }
227 }
228
229 /* Add an entry to SYMTAB. NAME is the name of the symbol.
230 CU_INDEX is the index of the CU in which the symbol appears.
231 IS_STATIC is one if the symbol is static, otherwise zero (global). */
232
233 static void
234 add_index_entry (struct mapped_symtab *symtab, const char *name,
235 int is_static, gdb_index_symbol_kind kind,
236 offset_type cu_index)
237 {
238 offset_type cu_index_and_attrs;
239
240 ++symtab->n_elements;
241 if (4 * symtab->n_elements / 3 >= symtab->data.size ())
242 hash_expand (symtab);
243
244 symtab_index_entry &slot = find_slot (symtab, name);
245 if (slot.name == NULL)
246 {
247 slot.name = name;
248 /* index_offset is set later. */
249 }
250
251 cu_index_and_attrs = 0;
252 DW2_GDB_INDEX_CU_SET_VALUE (cu_index_and_attrs, cu_index);
253 DW2_GDB_INDEX_SYMBOL_STATIC_SET_VALUE (cu_index_and_attrs, is_static);
254 DW2_GDB_INDEX_SYMBOL_KIND_SET_VALUE (cu_index_and_attrs, kind);
255
256 /* We don't want to record an index value twice as we want to avoid the
257 duplication.
258 We process all global symbols and then all static symbols
259 (which would allow us to avoid the duplication by only having to check
260 the last entry pushed), but a symbol could have multiple kinds in one CU.
261 To keep things simple we don't worry about the duplication here and
262 sort and uniquify the list after we've processed all symbols. */
263 slot.cu_indices.push_back (cu_index_and_attrs);
264 }
265
266 /* Sort and remove duplicates of all symbols' cu_indices lists. */
267
268 static void
269 uniquify_cu_indices (struct mapped_symtab *symtab)
270 {
271 for (auto &entry : symtab->data)
272 {
273 if (entry.name != NULL && !entry.cu_indices.empty ())
274 {
275 auto &cu_indices = entry.cu_indices;
276 std::sort (cu_indices.begin (), cu_indices.end ());
277 auto from = std::unique (cu_indices.begin (), cu_indices.end ());
278 cu_indices.erase (from, cu_indices.end ());
279 }
280 }
281 }
282
283 /* A form of 'const char *' suitable for container keys. Only the
284 pointer is stored. The strings themselves are compared, not the
285 pointers. */
286 class c_str_view
287 {
288 public:
289 c_str_view (const char *cstr)
290 : m_cstr (cstr)
291 {}
292
293 bool operator== (const c_str_view &other) const
294 {
295 return strcmp (m_cstr, other.m_cstr) == 0;
296 }
297
298 /* Return the underlying C string. Note, the returned string is
299 only a reference with lifetime of this object. */
300 const char *c_str () const
301 {
302 return m_cstr;
303 }
304
305 private:
306 friend class c_str_view_hasher;
307 const char *const m_cstr;
308 };
309
310 /* A std::unordered_map::hasher for c_str_view that uses the right
311 hash function for strings in a mapped index. */
312 class c_str_view_hasher
313 {
314 public:
315 size_t operator () (const c_str_view &x) const
316 {
317 return mapped_index_string_hash (INT_MAX, x.m_cstr);
318 }
319 };
320
321 /* A std::unordered_map::hasher for std::vector<>. */
322 template<typename T>
323 class vector_hasher
324 {
325 public:
326 size_t operator () (const std::vector<T> &key) const
327 {
328 return iterative_hash (key.data (),
329 sizeof (key.front ()) * key.size (), 0);
330 }
331 };
332
333 /* Write the mapped hash table SYMTAB to the data buffer OUTPUT, with
334 constant pool entries going into the data buffer CPOOL. */
335
336 static void
337 write_hash_table (mapped_symtab *symtab, data_buf &output, data_buf &cpool)
338 {
339 {
340 /* Elements are sorted vectors of the indices of all the CUs that
341 hold an object of this name. */
342 std::unordered_map<std::vector<offset_type>, offset_type,
343 vector_hasher<offset_type>>
344 symbol_hash_table;
345
346 /* We add all the index vectors to the constant pool first, to
347 ensure alignment is ok. */
348 for (symtab_index_entry &entry : symtab->data)
349 {
350 if (entry.name == NULL)
351 continue;
352 gdb_assert (entry.index_offset == 0);
353
354 /* Finding before inserting is faster than always trying to
355 insert, because inserting always allocates a node, does the
356 lookup, and then destroys the new node if another node
357 already had the same key. C++17 try_emplace will avoid
358 this. */
359 const auto found
360 = symbol_hash_table.find (entry.cu_indices);
361 if (found != symbol_hash_table.end ())
362 {
363 entry.index_offset = found->second;
364 continue;
365 }
366
367 symbol_hash_table.emplace (entry.cu_indices, cpool.size ());
368 entry.index_offset = cpool.size ();
369 cpool.append_data (MAYBE_SWAP (entry.cu_indices.size ()));
370 for (const auto index : entry.cu_indices)
371 cpool.append_data (MAYBE_SWAP (index));
372 }
373 }
374
375 /* Now write out the hash table. */
376 std::unordered_map<c_str_view, offset_type, c_str_view_hasher> str_table;
377 for (const auto &entry : symtab->data)
378 {
379 offset_type str_off, vec_off;
380
381 if (entry.name != NULL)
382 {
383 const auto insertpair = str_table.emplace (entry.name, cpool.size ());
384 if (insertpair.second)
385 cpool.append_cstr0 (entry.name);
386 str_off = insertpair.first->second;
387 vec_off = entry.index_offset;
388 }
389 else
390 {
391 /* While 0 is a valid constant pool index, it is not valid
392 to have 0 for both offsets. */
393 str_off = 0;
394 vec_off = 0;
395 }
396
397 output.append_data (MAYBE_SWAP (str_off));
398 output.append_data (MAYBE_SWAP (vec_off));
399 }
400 }
401
402 typedef std::unordered_map<dwarf2_psymtab *, unsigned int> psym_index_map;
403
404 /* Helper struct for building the address table. */
405 struct addrmap_index_data
406 {
407 addrmap_index_data (data_buf &addr_vec_, psym_index_map &cu_index_htab_)
408 : addr_vec (addr_vec_), cu_index_htab (cu_index_htab_)
409 {}
410
411 struct objfile *objfile;
412 data_buf &addr_vec;
413 psym_index_map &cu_index_htab;
414
415 /* Non-zero if the previous_* fields are valid.
416 We can't write an entry until we see the next entry (since it is only then
417 that we know the end of the entry). */
418 int previous_valid;
419 /* Index of the CU in the table of all CUs in the index file. */
420 unsigned int previous_cu_index;
421 /* Start address of the CU. */
422 CORE_ADDR previous_cu_start;
423 };
424
425 /* Write an address entry to ADDR_VEC. */
426
427 static void
428 add_address_entry (struct objfile *objfile, data_buf &addr_vec,
429 CORE_ADDR start, CORE_ADDR end, unsigned int cu_index)
430 {
431 addr_vec.append_uint (8, BFD_ENDIAN_LITTLE, start);
432 addr_vec.append_uint (8, BFD_ENDIAN_LITTLE, end);
433 addr_vec.append_data (MAYBE_SWAP (cu_index));
434 }
435
436 /* Worker function for traversing an addrmap to build the address table. */
437
438 static int
439 add_address_entry_worker (void *datap, CORE_ADDR start_addr, void *obj)
440 {
441 struct addrmap_index_data *data = (struct addrmap_index_data *) datap;
442 dwarf2_psymtab *pst = (dwarf2_psymtab *) obj;
443
444 if (data->previous_valid)
445 add_address_entry (data->objfile, data->addr_vec,
446 data->previous_cu_start, start_addr,
447 data->previous_cu_index);
448
449 data->previous_cu_start = start_addr;
450 if (pst != NULL)
451 {
452 const auto it = data->cu_index_htab.find (pst);
453 gdb_assert (it != data->cu_index_htab.cend ());
454 data->previous_cu_index = it->second;
455 data->previous_valid = 1;
456 }
457 else
458 data->previous_valid = 0;
459
460 return 0;
461 }
462
463 /* Write OBJFILE's address map to ADDR_VEC.
464 CU_INDEX_HTAB is used to map addrmap entries to their CU indices
465 in the index file. */
466
467 static void
468 write_address_map (struct objfile *objfile, data_buf &addr_vec,
469 psym_index_map &cu_index_htab)
470 {
471 struct addrmap_index_data addrmap_index_data (addr_vec, cu_index_htab);
472
473 /* When writing the address table, we have to cope with the fact that
474 the addrmap iterator only provides the start of a region; we have to
475 wait until the next invocation to get the start of the next region. */
476
477 addrmap_index_data.objfile = objfile;
478 addrmap_index_data.previous_valid = 0;
479
480 addrmap_foreach (objfile->partial_symtabs->psymtabs_addrmap,
481 add_address_entry_worker, &addrmap_index_data);
482
483 /* It's highly unlikely the last entry (end address = 0xff...ff)
484 is valid, but we should still handle it.
485 The end address is recorded as the start of the next region, but that
486 doesn't work here. To cope we pass 0xff...ff, this is a rare situation
487 anyway. */
488 if (addrmap_index_data.previous_valid)
489 add_address_entry (objfile, addr_vec,
490 addrmap_index_data.previous_cu_start, (CORE_ADDR) -1,
491 addrmap_index_data.previous_cu_index);
492 }
493
494 /* Return the symbol kind of PSYM. */
495
496 static gdb_index_symbol_kind
497 symbol_kind (struct partial_symbol *psym)
498 {
499 domain_enum domain = psym->domain;
500 enum address_class aclass = psym->aclass;
501
502 switch (domain)
503 {
504 case VAR_DOMAIN:
505 switch (aclass)
506 {
507 case LOC_BLOCK:
508 return GDB_INDEX_SYMBOL_KIND_FUNCTION;
509 case LOC_TYPEDEF:
510 return GDB_INDEX_SYMBOL_KIND_TYPE;
511 case LOC_COMPUTED:
512 case LOC_CONST_BYTES:
513 case LOC_OPTIMIZED_OUT:
514 case LOC_STATIC:
515 return GDB_INDEX_SYMBOL_KIND_VARIABLE;
516 case LOC_CONST:
517 /* Note: It's currently impossible to recognize psyms as enum values
518 short of reading the type info. For now punt. */
519 return GDB_INDEX_SYMBOL_KIND_VARIABLE;
520 default:
521 /* There are other LOC_FOO values that one might want to classify
522 as variables, but dwarf2read.c doesn't currently use them. */
523 return GDB_INDEX_SYMBOL_KIND_OTHER;
524 }
525 case STRUCT_DOMAIN:
526 return GDB_INDEX_SYMBOL_KIND_TYPE;
527 default:
528 return GDB_INDEX_SYMBOL_KIND_OTHER;
529 }
530 }
531
532 /* Add a list of partial symbols to SYMTAB. */
533
534 static void
535 write_psymbols (struct mapped_symtab *symtab,
536 std::unordered_set<partial_symbol *> &psyms_seen,
537 struct partial_symbol **psymp,
538 int count,
539 offset_type cu_index,
540 int is_static)
541 {
542 for (; count-- > 0; ++psymp)
543 {
544 struct partial_symbol *psym = *psymp;
545
546 if (psym->ginfo.language () == language_ada)
547 error (_("Ada is not currently supported by the index; "
548 "use the DWARF 5 index instead"));
549
550 /* Only add a given psymbol once. */
551 if (psyms_seen.insert (psym).second)
552 {
553 gdb_index_symbol_kind kind = symbol_kind (psym);
554
555 add_index_entry (symtab, psym->ginfo.search_name (),
556 is_static, kind, cu_index);
557 }
558 }
559 }
560
561 /* A helper struct used when iterating over debug_types. */
562 struct signatured_type_index_data
563 {
564 signatured_type_index_data (data_buf &types_list_,
565 std::unordered_set<partial_symbol *> &psyms_seen_)
566 : types_list (types_list_), psyms_seen (psyms_seen_)
567 {}
568
569 struct objfile *objfile;
570 struct mapped_symtab *symtab;
571 data_buf &types_list;
572 std::unordered_set<partial_symbol *> &psyms_seen;
573 int cu_index;
574 };
575
576 /* A helper function that writes a single signatured_type to an
577 obstack. */
578
579 static int
580 write_one_signatured_type (void **slot, void *d)
581 {
582 struct signatured_type_index_data *info
583 = (struct signatured_type_index_data *) d;
584 struct signatured_type *entry = (struct signatured_type *) *slot;
585 dwarf2_psymtab *psymtab = entry->per_cu.v.psymtab;
586
587 write_psymbols (info->symtab,
588 info->psyms_seen,
589 (info->objfile->partial_symtabs->global_psymbols.data ()
590 + psymtab->globals_offset),
591 psymtab->n_global_syms, info->cu_index,
592 0);
593 write_psymbols (info->symtab,
594 info->psyms_seen,
595 (info->objfile->partial_symtabs->static_psymbols.data ()
596 + psymtab->statics_offset),
597 psymtab->n_static_syms, info->cu_index,
598 1);
599
600 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE,
601 to_underlying (entry->per_cu.sect_off));
602 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE,
603 to_underlying (entry->type_offset_in_tu));
604 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE, entry->signature);
605
606 ++info->cu_index;
607
608 return 1;
609 }
610
611 /* Recurse into all "included" dependencies and count their symbols as
612 if they appeared in this psymtab. */
613
614 static void
615 recursively_count_psymbols (dwarf2_psymtab *psymtab,
616 size_t &psyms_seen)
617 {
618 for (int i = 0; i < psymtab->number_of_dependencies; ++i)
619 if (psymtab->dependencies[i]->user != NULL)
620 recursively_count_psymbols ((dwarf2_psymtab *) psymtab->dependencies[i],
621 psyms_seen);
622
623 psyms_seen += psymtab->n_global_syms;
624 psyms_seen += psymtab->n_static_syms;
625 }
626
627 /* Recurse into all "included" dependencies and write their symbols as
628 if they appeared in this psymtab. */
629
630 static void
631 recursively_write_psymbols (struct objfile *objfile,
632 dwarf2_psymtab *psymtab,
633 struct mapped_symtab *symtab,
634 std::unordered_set<partial_symbol *> &psyms_seen,
635 offset_type cu_index)
636 {
637 int i;
638
639 for (i = 0; i < psymtab->number_of_dependencies; ++i)
640 if (psymtab->dependencies[i]->user != NULL)
641 recursively_write_psymbols (objfile,
642 (dwarf2_psymtab *) psymtab->dependencies[i],
643 symtab, psyms_seen, cu_index);
644
645 write_psymbols (symtab,
646 psyms_seen,
647 (objfile->partial_symtabs->global_psymbols.data ()
648 + psymtab->globals_offset),
649 psymtab->n_global_syms, cu_index,
650 0);
651 write_psymbols (symtab,
652 psyms_seen,
653 (objfile->partial_symtabs->static_psymbols.data ()
654 + psymtab->statics_offset),
655 psymtab->n_static_syms, cu_index,
656 1);
657 }
658
659 /* DWARF-5 .debug_names builder. */
660 class debug_names
661 {
662 public:
663 debug_names (struct dwarf2_per_objfile *dwarf2_per_objfile, bool is_dwarf64,
664 bfd_endian dwarf5_byte_order)
665 : m_dwarf5_byte_order (dwarf5_byte_order),
666 m_dwarf32 (dwarf5_byte_order),
667 m_dwarf64 (dwarf5_byte_order),
668 m_dwarf (is_dwarf64
669 ? static_cast<dwarf &> (m_dwarf64)
670 : static_cast<dwarf &> (m_dwarf32)),
671 m_name_table_string_offs (m_dwarf.name_table_string_offs),
672 m_name_table_entry_offs (m_dwarf.name_table_entry_offs),
673 m_debugstrlookup (dwarf2_per_objfile)
674 {}
675
676 int dwarf5_offset_size () const
677 {
678 const bool dwarf5_is_dwarf64 = &m_dwarf == &m_dwarf64;
679 return dwarf5_is_dwarf64 ? 8 : 4;
680 }
681
682 /* Is this symbol from DW_TAG_compile_unit or DW_TAG_type_unit? */
683 enum class unit_kind { cu, tu };
684
685 /* Insert one symbol. */
686 void insert (const partial_symbol *psym, int cu_index, bool is_static,
687 unit_kind kind)
688 {
689 const int dwarf_tag = psymbol_tag (psym);
690 if (dwarf_tag == 0)
691 return;
692 const char *name = psym->ginfo.search_name ();
693
694 if (psym->ginfo.language () == language_ada)
695 {
696 /* We want to ensure that the Ada main function's name appears
697 verbatim in the index. However, this name will be of the
698 form "_ada_mumble", and will be rewritten by ada_decode.
699 So, recognize it specially here and add it to the index by
700 hand. */
701 if (strcmp (main_name (), name) == 0)
702 {
703 const auto insertpair
704 = m_name_to_value_set.emplace (c_str_view (name),
705 std::set<symbol_value> ());
706 std::set<symbol_value> &value_set = insertpair.first->second;
707 value_set.emplace (symbol_value (dwarf_tag, cu_index, is_static,
708 kind));
709 }
710
711 /* In order for the index to work when read back into gdb, it
712 has to supply a funny form of the name: it should be the
713 encoded name, with any suffixes stripped. Using the
714 ordinary encoded name will not work properly with the
715 searching logic in find_name_components_bounds; nor will
716 using the decoded name. Furthermore, an Ada "verbatim"
717 name (of the form "<MumBle>") must be entered without the
718 angle brackets. Note that the current index is unusual,
719 see PR symtab/24820 for details. */
720 std::string decoded = ada_decode (name);
721 if (decoded[0] == '<')
722 name = (char *) obstack_copy0 (&m_string_obstack,
723 decoded.c_str () + 1,
724 decoded.length () - 2);
725 else
726 name = obstack_strdup (&m_string_obstack,
727 ada_encode (decoded.c_str ()));
728 }
729
730 const auto insertpair
731 = m_name_to_value_set.emplace (c_str_view (name),
732 std::set<symbol_value> ());
733 std::set<symbol_value> &value_set = insertpair.first->second;
734 value_set.emplace (symbol_value (dwarf_tag, cu_index, is_static, kind));
735 }
736
737 /* Build all the tables. All symbols must be already inserted.
738 This function does not call file_write, caller has to do it
739 afterwards. */
740 void build ()
741 {
742 /* Verify the build method has not be called twice. */
743 gdb_assert (m_abbrev_table.empty ());
744 const size_t name_count = m_name_to_value_set.size ();
745 m_bucket_table.resize
746 (std::pow (2, std::ceil (std::log2 (name_count * 4 / 3))));
747 m_hash_table.reserve (name_count);
748 m_name_table_string_offs.reserve (name_count);
749 m_name_table_entry_offs.reserve (name_count);
750
751 /* Map each hash of symbol to its name and value. */
752 struct hash_it_pair
753 {
754 uint32_t hash;
755 decltype (m_name_to_value_set)::const_iterator it;
756 };
757 std::vector<std::forward_list<hash_it_pair>> bucket_hash;
758 bucket_hash.resize (m_bucket_table.size ());
759 for (decltype (m_name_to_value_set)::const_iterator it
760 = m_name_to_value_set.cbegin ();
761 it != m_name_to_value_set.cend ();
762 ++it)
763 {
764 const char *const name = it->first.c_str ();
765 const uint32_t hash = dwarf5_djb_hash (name);
766 hash_it_pair hashitpair;
767 hashitpair.hash = hash;
768 hashitpair.it = it;
769 auto &slot = bucket_hash[hash % bucket_hash.size()];
770 slot.push_front (std::move (hashitpair));
771 }
772 for (size_t bucket_ix = 0; bucket_ix < bucket_hash.size (); ++bucket_ix)
773 {
774 const std::forward_list<hash_it_pair> &hashitlist
775 = bucket_hash[bucket_ix];
776 if (hashitlist.empty ())
777 continue;
778 uint32_t &bucket_slot = m_bucket_table[bucket_ix];
779 /* The hashes array is indexed starting at 1. */
780 store_unsigned_integer (reinterpret_cast<gdb_byte *> (&bucket_slot),
781 sizeof (bucket_slot), m_dwarf5_byte_order,
782 m_hash_table.size () + 1);
783 for (const hash_it_pair &hashitpair : hashitlist)
784 {
785 m_hash_table.push_back (0);
786 store_unsigned_integer (reinterpret_cast<gdb_byte *>
787 (&m_hash_table.back ()),
788 sizeof (m_hash_table.back ()),
789 m_dwarf5_byte_order, hashitpair.hash);
790 const c_str_view &name = hashitpair.it->first;
791 const std::set<symbol_value> &value_set = hashitpair.it->second;
792 m_name_table_string_offs.push_back_reorder
793 (m_debugstrlookup.lookup (name.c_str ()));
794 m_name_table_entry_offs.push_back_reorder (m_entry_pool.size ());
795 gdb_assert (!value_set.empty ());
796 for (const symbol_value &value : value_set)
797 {
798 int &idx = m_indexkey_to_idx[index_key (value.dwarf_tag,
799 value.is_static,
800 value.kind)];
801 if (idx == 0)
802 {
803 idx = m_idx_next++;
804 m_abbrev_table.append_unsigned_leb128 (idx);
805 m_abbrev_table.append_unsigned_leb128 (value.dwarf_tag);
806 m_abbrev_table.append_unsigned_leb128
807 (value.kind == unit_kind::cu ? DW_IDX_compile_unit
808 : DW_IDX_type_unit);
809 m_abbrev_table.append_unsigned_leb128 (DW_FORM_udata);
810 m_abbrev_table.append_unsigned_leb128 (value.is_static
811 ? DW_IDX_GNU_internal
812 : DW_IDX_GNU_external);
813 m_abbrev_table.append_unsigned_leb128 (DW_FORM_flag_present);
814
815 /* Terminate attributes list. */
816 m_abbrev_table.append_unsigned_leb128 (0);
817 m_abbrev_table.append_unsigned_leb128 (0);
818 }
819
820 m_entry_pool.append_unsigned_leb128 (idx);
821 m_entry_pool.append_unsigned_leb128 (value.cu_index);
822 }
823
824 /* Terminate the list of CUs. */
825 m_entry_pool.append_unsigned_leb128 (0);
826 }
827 }
828 gdb_assert (m_hash_table.size () == name_count);
829
830 /* Terminate tags list. */
831 m_abbrev_table.append_unsigned_leb128 (0);
832 }
833
834 /* Return .debug_names bucket count. This must be called only after
835 calling the build method. */
836 uint32_t bucket_count () const
837 {
838 /* Verify the build method has been already called. */
839 gdb_assert (!m_abbrev_table.empty ());
840 const uint32_t retval = m_bucket_table.size ();
841
842 /* Check for overflow. */
843 gdb_assert (retval == m_bucket_table.size ());
844 return retval;
845 }
846
847 /* Return .debug_names names count. This must be called only after
848 calling the build method. */
849 uint32_t name_count () const
850 {
851 /* Verify the build method has been already called. */
852 gdb_assert (!m_abbrev_table.empty ());
853 const uint32_t retval = m_hash_table.size ();
854
855 /* Check for overflow. */
856 gdb_assert (retval == m_hash_table.size ());
857 return retval;
858 }
859
860 /* Return number of bytes of .debug_names abbreviation table. This
861 must be called only after calling the build method. */
862 uint32_t abbrev_table_bytes () const
863 {
864 gdb_assert (!m_abbrev_table.empty ());
865 return m_abbrev_table.size ();
866 }
867
868 /* Recurse into all "included" dependencies and store their symbols
869 as if they appeared in this psymtab. */
870 void recursively_write_psymbols
871 (struct objfile *objfile,
872 dwarf2_psymtab *psymtab,
873 std::unordered_set<partial_symbol *> &psyms_seen,
874 int cu_index)
875 {
876 for (int i = 0; i < psymtab->number_of_dependencies; ++i)
877 if (psymtab->dependencies[i]->user != NULL)
878 recursively_write_psymbols
879 (objfile, (dwarf2_psymtab *) psymtab->dependencies[i], psyms_seen, cu_index);
880
881 write_psymbols (psyms_seen,
882 (objfile->partial_symtabs->global_psymbols.data ()
883 + psymtab->globals_offset),
884 psymtab->n_global_syms, cu_index, false, unit_kind::cu);
885 write_psymbols (psyms_seen,
886 (objfile->partial_symtabs->static_psymbols.data ()
887 + psymtab->statics_offset),
888 psymtab->n_static_syms, cu_index, true, unit_kind::cu);
889 }
890
891 /* Return number of bytes the .debug_names section will have. This
892 must be called only after calling the build method. */
893 size_t bytes () const
894 {
895 /* Verify the build method has been already called. */
896 gdb_assert (!m_abbrev_table.empty ());
897 size_t expected_bytes = 0;
898 expected_bytes += m_bucket_table.size () * sizeof (m_bucket_table[0]);
899 expected_bytes += m_hash_table.size () * sizeof (m_hash_table[0]);
900 expected_bytes += m_name_table_string_offs.bytes ();
901 expected_bytes += m_name_table_entry_offs.bytes ();
902 expected_bytes += m_abbrev_table.size ();
903 expected_bytes += m_entry_pool.size ();
904 return expected_bytes;
905 }
906
907 /* Write .debug_names to FILE_NAMES and .debug_str addition to
908 FILE_STR. This must be called only after calling the build
909 method. */
910 void file_write (FILE *file_names, FILE *file_str) const
911 {
912 /* Verify the build method has been already called. */
913 gdb_assert (!m_abbrev_table.empty ());
914 ::file_write (file_names, m_bucket_table);
915 ::file_write (file_names, m_hash_table);
916 m_name_table_string_offs.file_write (file_names);
917 m_name_table_entry_offs.file_write (file_names);
918 m_abbrev_table.file_write (file_names);
919 m_entry_pool.file_write (file_names);
920 m_debugstrlookup.file_write (file_str);
921 }
922
923 /* A helper user data for write_one_signatured_type. */
924 class write_one_signatured_type_data
925 {
926 public:
927 write_one_signatured_type_data (debug_names &nametable_,
928 signatured_type_index_data &&info_)
929 : nametable (nametable_), info (std::move (info_))
930 {}
931 debug_names &nametable;
932 struct signatured_type_index_data info;
933 };
934
935 /* A helper function to pass write_one_signatured_type to
936 htab_traverse_noresize. */
937 static int
938 write_one_signatured_type (void **slot, void *d)
939 {
940 write_one_signatured_type_data *data = (write_one_signatured_type_data *) d;
941 struct signatured_type_index_data *info = &data->info;
942 struct signatured_type *entry = (struct signatured_type *) *slot;
943
944 data->nametable.write_one_signatured_type (entry, info);
945
946 return 1;
947 }
948
949 private:
950
951 /* Storage for symbol names mapping them to their .debug_str section
952 offsets. */
953 class debug_str_lookup
954 {
955 public:
956
957 /* Object constructor to be called for current DWARF2_PER_OBJFILE.
958 All .debug_str section strings are automatically stored. */
959 debug_str_lookup (struct dwarf2_per_objfile *dwarf2_per_objfile)
960 : m_abfd (dwarf2_per_objfile->objfile->obfd),
961 m_dwarf2_per_objfile (dwarf2_per_objfile)
962 {
963 dwarf2_read_section (dwarf2_per_objfile->objfile,
964 &dwarf2_per_objfile->str);
965 if (dwarf2_per_objfile->str.buffer == NULL)
966 return;
967 for (const gdb_byte *data = dwarf2_per_objfile->str.buffer;
968 data < (dwarf2_per_objfile->str.buffer
969 + dwarf2_per_objfile->str.size);)
970 {
971 const char *const s = reinterpret_cast<const char *> (data);
972 const auto insertpair
973 = m_str_table.emplace (c_str_view (s),
974 data - dwarf2_per_objfile->str.buffer);
975 if (!insertpair.second)
976 complaint (_("Duplicate string \"%s\" in "
977 ".debug_str section [in module %s]"),
978 s, bfd_get_filename (m_abfd));
979 data += strlen (s) + 1;
980 }
981 }
982
983 /* Return offset of symbol name S in the .debug_str section. Add
984 such symbol to the section's end if it does not exist there
985 yet. */
986 size_t lookup (const char *s)
987 {
988 const auto it = m_str_table.find (c_str_view (s));
989 if (it != m_str_table.end ())
990 return it->second;
991 const size_t offset = (m_dwarf2_per_objfile->str.size
992 + m_str_add_buf.size ());
993 m_str_table.emplace (c_str_view (s), offset);
994 m_str_add_buf.append_cstr0 (s);
995 return offset;
996 }
997
998 /* Append the end of the .debug_str section to FILE. */
999 void file_write (FILE *file) const
1000 {
1001 m_str_add_buf.file_write (file);
1002 }
1003
1004 private:
1005 std::unordered_map<c_str_view, size_t, c_str_view_hasher> m_str_table;
1006 bfd *const m_abfd;
1007 struct dwarf2_per_objfile *m_dwarf2_per_objfile;
1008
1009 /* Data to add at the end of .debug_str for new needed symbol names. */
1010 data_buf m_str_add_buf;
1011 };
1012
1013 /* Container to map used DWARF tags to their .debug_names abbreviation
1014 tags. */
1015 class index_key
1016 {
1017 public:
1018 index_key (int dwarf_tag_, bool is_static_, unit_kind kind_)
1019 : dwarf_tag (dwarf_tag_), is_static (is_static_), kind (kind_)
1020 {
1021 }
1022
1023 bool
1024 operator== (const index_key &other) const
1025 {
1026 return (dwarf_tag == other.dwarf_tag && is_static == other.is_static
1027 && kind == other.kind);
1028 }
1029
1030 const int dwarf_tag;
1031 const bool is_static;
1032 const unit_kind kind;
1033 };
1034
1035 /* Provide std::unordered_map::hasher for index_key. */
1036 class index_key_hasher
1037 {
1038 public:
1039 size_t
1040 operator () (const index_key &key) const
1041 {
1042 return (std::hash<int>() (key.dwarf_tag) << 1) | key.is_static;
1043 }
1044 };
1045
1046 /* Parameters of one symbol entry. */
1047 class symbol_value
1048 {
1049 public:
1050 const int dwarf_tag, cu_index;
1051 const bool is_static;
1052 const unit_kind kind;
1053
1054 symbol_value (int dwarf_tag_, int cu_index_, bool is_static_,
1055 unit_kind kind_)
1056 : dwarf_tag (dwarf_tag_), cu_index (cu_index_), is_static (is_static_),
1057 kind (kind_)
1058 {}
1059
1060 bool
1061 operator< (const symbol_value &other) const
1062 {
1063 #define X(n) \
1064 do \
1065 { \
1066 if (n < other.n) \
1067 return true; \
1068 if (n > other.n) \
1069 return false; \
1070 } \
1071 while (0)
1072 X (dwarf_tag);
1073 X (is_static);
1074 X (kind);
1075 X (cu_index);
1076 #undef X
1077 return false;
1078 }
1079 };
1080
1081 /* Abstract base class to unify DWARF-32 and DWARF-64 name table
1082 output. */
1083 class offset_vec
1084 {
1085 protected:
1086 const bfd_endian dwarf5_byte_order;
1087 public:
1088 explicit offset_vec (bfd_endian dwarf5_byte_order_)
1089 : dwarf5_byte_order (dwarf5_byte_order_)
1090 {}
1091
1092 /* Call std::vector::reserve for NELEM elements. */
1093 virtual void reserve (size_t nelem) = 0;
1094
1095 /* Call std::vector::push_back with store_unsigned_integer byte
1096 reordering for ELEM. */
1097 virtual void push_back_reorder (size_t elem) = 0;
1098
1099 /* Return expected output size in bytes. */
1100 virtual size_t bytes () const = 0;
1101
1102 /* Write name table to FILE. */
1103 virtual void file_write (FILE *file) const = 0;
1104 };
1105
1106 /* Template to unify DWARF-32 and DWARF-64 output. */
1107 template<typename OffsetSize>
1108 class offset_vec_tmpl : public offset_vec
1109 {
1110 public:
1111 explicit offset_vec_tmpl (bfd_endian dwarf5_byte_order_)
1112 : offset_vec (dwarf5_byte_order_)
1113 {}
1114
1115 /* Implement offset_vec::reserve. */
1116 void reserve (size_t nelem) override
1117 {
1118 m_vec.reserve (nelem);
1119 }
1120
1121 /* Implement offset_vec::push_back_reorder. */
1122 void push_back_reorder (size_t elem) override
1123 {
1124 m_vec.push_back (elem);
1125 /* Check for overflow. */
1126 gdb_assert (m_vec.back () == elem);
1127 store_unsigned_integer (reinterpret_cast<gdb_byte *> (&m_vec.back ()),
1128 sizeof (m_vec.back ()), dwarf5_byte_order, elem);
1129 }
1130
1131 /* Implement offset_vec::bytes. */
1132 size_t bytes () const override
1133 {
1134 return m_vec.size () * sizeof (m_vec[0]);
1135 }
1136
1137 /* Implement offset_vec::file_write. */
1138 void file_write (FILE *file) const override
1139 {
1140 ::file_write (file, m_vec);
1141 }
1142
1143 private:
1144 std::vector<OffsetSize> m_vec;
1145 };
1146
1147 /* Base class to unify DWARF-32 and DWARF-64 .debug_names output
1148 respecting name table width. */
1149 class dwarf
1150 {
1151 public:
1152 offset_vec &name_table_string_offs, &name_table_entry_offs;
1153
1154 dwarf (offset_vec &name_table_string_offs_,
1155 offset_vec &name_table_entry_offs_)
1156 : name_table_string_offs (name_table_string_offs_),
1157 name_table_entry_offs (name_table_entry_offs_)
1158 {
1159 }
1160 };
1161
1162 /* Template to unify DWARF-32 and DWARF-64 .debug_names output
1163 respecting name table width. */
1164 template<typename OffsetSize>
1165 class dwarf_tmpl : public dwarf
1166 {
1167 public:
1168 explicit dwarf_tmpl (bfd_endian dwarf5_byte_order_)
1169 : dwarf (m_name_table_string_offs, m_name_table_entry_offs),
1170 m_name_table_string_offs (dwarf5_byte_order_),
1171 m_name_table_entry_offs (dwarf5_byte_order_)
1172 {}
1173
1174 private:
1175 offset_vec_tmpl<OffsetSize> m_name_table_string_offs;
1176 offset_vec_tmpl<OffsetSize> m_name_table_entry_offs;
1177 };
1178
1179 /* Try to reconstruct original DWARF tag for given partial_symbol.
1180 This function is not DWARF-5 compliant but it is sufficient for
1181 GDB as a DWARF-5 index consumer. */
1182 static int psymbol_tag (const struct partial_symbol *psym)
1183 {
1184 domain_enum domain = psym->domain;
1185 enum address_class aclass = psym->aclass;
1186
1187 switch (domain)
1188 {
1189 case VAR_DOMAIN:
1190 switch (aclass)
1191 {
1192 case LOC_BLOCK:
1193 return DW_TAG_subprogram;
1194 case LOC_TYPEDEF:
1195 return DW_TAG_typedef;
1196 case LOC_COMPUTED:
1197 case LOC_CONST_BYTES:
1198 case LOC_OPTIMIZED_OUT:
1199 case LOC_STATIC:
1200 return DW_TAG_variable;
1201 case LOC_CONST:
1202 /* Note: It's currently impossible to recognize psyms as enum values
1203 short of reading the type info. For now punt. */
1204 return DW_TAG_variable;
1205 default:
1206 /* There are other LOC_FOO values that one might want to classify
1207 as variables, but dwarf2read.c doesn't currently use them. */
1208 return DW_TAG_variable;
1209 }
1210 case STRUCT_DOMAIN:
1211 return DW_TAG_structure_type;
1212 default:
1213 return 0;
1214 }
1215 }
1216
1217 /* Call insert for all partial symbols and mark them in PSYMS_SEEN. */
1218 void write_psymbols (std::unordered_set<partial_symbol *> &psyms_seen,
1219 struct partial_symbol **psymp, int count, int cu_index,
1220 bool is_static, unit_kind kind)
1221 {
1222 for (; count-- > 0; ++psymp)
1223 {
1224 struct partial_symbol *psym = *psymp;
1225
1226 /* Only add a given psymbol once. */
1227 if (psyms_seen.insert (psym).second)
1228 insert (psym, cu_index, is_static, kind);
1229 }
1230 }
1231
1232 /* A helper function that writes a single signatured_type
1233 to a debug_names. */
1234 void
1235 write_one_signatured_type (struct signatured_type *entry,
1236 struct signatured_type_index_data *info)
1237 {
1238 dwarf2_psymtab *psymtab = entry->per_cu.v.psymtab;
1239
1240 write_psymbols (info->psyms_seen,
1241 (info->objfile->partial_symtabs->global_psymbols.data ()
1242 + psymtab->globals_offset),
1243 psymtab->n_global_syms, info->cu_index, false,
1244 unit_kind::tu);
1245 write_psymbols (info->psyms_seen,
1246 (info->objfile->partial_symtabs->static_psymbols.data ()
1247 + psymtab->statics_offset),
1248 psymtab->n_static_syms, info->cu_index, true,
1249 unit_kind::tu);
1250
1251 info->types_list.append_uint (dwarf5_offset_size (), m_dwarf5_byte_order,
1252 to_underlying (entry->per_cu.sect_off));
1253
1254 ++info->cu_index;
1255 }
1256
1257 /* Store value of each symbol. */
1258 std::unordered_map<c_str_view, std::set<symbol_value>, c_str_view_hasher>
1259 m_name_to_value_set;
1260
1261 /* Tables of DWARF-5 .debug_names. They are in object file byte
1262 order. */
1263 std::vector<uint32_t> m_bucket_table;
1264 std::vector<uint32_t> m_hash_table;
1265
1266 const bfd_endian m_dwarf5_byte_order;
1267 dwarf_tmpl<uint32_t> m_dwarf32;
1268 dwarf_tmpl<uint64_t> m_dwarf64;
1269 dwarf &m_dwarf;
1270 offset_vec &m_name_table_string_offs, &m_name_table_entry_offs;
1271 debug_str_lookup m_debugstrlookup;
1272
1273 /* Map each used .debug_names abbreviation tag parameter to its
1274 index value. */
1275 std::unordered_map<index_key, int, index_key_hasher> m_indexkey_to_idx;
1276
1277 /* Next unused .debug_names abbreviation tag for
1278 m_indexkey_to_idx. */
1279 int m_idx_next = 1;
1280
1281 /* .debug_names abbreviation table. */
1282 data_buf m_abbrev_table;
1283
1284 /* .debug_names entry pool. */
1285 data_buf m_entry_pool;
1286
1287 /* Temporary storage for Ada names. */
1288 auto_obstack m_string_obstack;
1289 };
1290
1291 /* Return iff any of the needed offsets does not fit into 32-bit
1292 .debug_names section. */
1293
1294 static bool
1295 check_dwarf64_offsets (struct dwarf2_per_objfile *dwarf2_per_objfile)
1296 {
1297 for (dwarf2_per_cu_data *per_cu : dwarf2_per_objfile->all_comp_units)
1298 {
1299 if (to_underlying (per_cu->sect_off) >= (static_cast<uint64_t> (1) << 32))
1300 return true;
1301 }
1302 for (const signatured_type *sigtype : dwarf2_per_objfile->all_type_units)
1303 {
1304 const dwarf2_per_cu_data &per_cu = sigtype->per_cu;
1305
1306 if (to_underlying (per_cu.sect_off) >= (static_cast<uint64_t> (1) << 32))
1307 return true;
1308 }
1309 return false;
1310 }
1311
1312 /* The psyms_seen set is potentially going to be largish (~40k
1313 elements when indexing a -g3 build of GDB itself). Estimate the
1314 number of elements in order to avoid too many rehashes, which
1315 require rebuilding buckets and thus many trips to
1316 malloc/free. */
1317
1318 static size_t
1319 psyms_seen_size (struct dwarf2_per_objfile *dwarf2_per_objfile)
1320 {
1321 size_t psyms_count = 0;
1322 for (dwarf2_per_cu_data *per_cu : dwarf2_per_objfile->all_comp_units)
1323 {
1324 dwarf2_psymtab *psymtab = per_cu->v.psymtab;
1325
1326 if (psymtab != NULL && psymtab->user == NULL)
1327 recursively_count_psymbols (psymtab, psyms_count);
1328 }
1329 /* Generating an index for gdb itself shows a ratio of
1330 TOTAL_SEEN_SYMS/UNIQUE_SYMS or ~5. 4 seems like a good bet. */
1331 return psyms_count / 4;
1332 }
1333
1334 /* Assert that FILE's size is EXPECTED_SIZE. Assumes file's seek
1335 position is at the end of the file. */
1336
1337 static void
1338 assert_file_size (FILE *file, size_t expected_size)
1339 {
1340 const auto file_size = ftell (file);
1341 if (file_size == -1)
1342 perror_with_name (("ftell"));
1343 gdb_assert (file_size == expected_size);
1344 }
1345
1346 /* Write a gdb index file to OUT_FILE from all the sections passed as
1347 arguments. */
1348
1349 static void
1350 write_gdbindex_1 (FILE *out_file,
1351 const data_buf &cu_list,
1352 const data_buf &types_cu_list,
1353 const data_buf &addr_vec,
1354 const data_buf &symtab_vec,
1355 const data_buf &constant_pool)
1356 {
1357 data_buf contents;
1358 const offset_type size_of_header = 6 * sizeof (offset_type);
1359 offset_type total_len = size_of_header;
1360
1361 /* The version number. */
1362 contents.append_data (MAYBE_SWAP (8));
1363
1364 /* The offset of the CU list from the start of the file. */
1365 contents.append_data (MAYBE_SWAP (total_len));
1366 total_len += cu_list.size ();
1367
1368 /* The offset of the types CU list from the start of the file. */
1369 contents.append_data (MAYBE_SWAP (total_len));
1370 total_len += types_cu_list.size ();
1371
1372 /* The offset of the address table from the start of the file. */
1373 contents.append_data (MAYBE_SWAP (total_len));
1374 total_len += addr_vec.size ();
1375
1376 /* The offset of the symbol table from the start of the file. */
1377 contents.append_data (MAYBE_SWAP (total_len));
1378 total_len += symtab_vec.size ();
1379
1380 /* The offset of the constant pool from the start of the file. */
1381 contents.append_data (MAYBE_SWAP (total_len));
1382 total_len += constant_pool.size ();
1383
1384 gdb_assert (contents.size () == size_of_header);
1385
1386 contents.file_write (out_file);
1387 cu_list.file_write (out_file);
1388 types_cu_list.file_write (out_file);
1389 addr_vec.file_write (out_file);
1390 symtab_vec.file_write (out_file);
1391 constant_pool.file_write (out_file);
1392
1393 assert_file_size (out_file, total_len);
1394 }
1395
1396 /* Write contents of a .gdb_index section for OBJFILE into OUT_FILE.
1397 If OBJFILE has an associated dwz file, write contents of a .gdb_index
1398 section for that dwz file into DWZ_OUT_FILE. If OBJFILE does not have an
1399 associated dwz file, DWZ_OUT_FILE must be NULL. */
1400
1401 static void
1402 write_gdbindex (struct dwarf2_per_objfile *dwarf2_per_objfile, FILE *out_file,
1403 FILE *dwz_out_file)
1404 {
1405 struct objfile *objfile = dwarf2_per_objfile->objfile;
1406 mapped_symtab symtab;
1407 data_buf objfile_cu_list;
1408 data_buf dwz_cu_list;
1409
1410 /* While we're scanning CU's create a table that maps a psymtab pointer
1411 (which is what addrmap records) to its index (which is what is recorded
1412 in the index file). This will later be needed to write the address
1413 table. */
1414 psym_index_map cu_index_htab;
1415 cu_index_htab.reserve (dwarf2_per_objfile->all_comp_units.size ());
1416
1417 /* The CU list is already sorted, so we don't need to do additional
1418 work here. Also, the debug_types entries do not appear in
1419 all_comp_units, but only in their own hash table. */
1420
1421 std::unordered_set<partial_symbol *> psyms_seen
1422 (psyms_seen_size (dwarf2_per_objfile));
1423 for (int i = 0; i < dwarf2_per_objfile->all_comp_units.size (); ++i)
1424 {
1425 struct dwarf2_per_cu_data *per_cu
1426 = dwarf2_per_objfile->all_comp_units[i];
1427 dwarf2_psymtab *psymtab = per_cu->v.psymtab;
1428
1429 /* CU of a shared file from 'dwz -m' may be unused by this main file.
1430 It may be referenced from a local scope but in such case it does not
1431 need to be present in .gdb_index. */
1432 if (psymtab == NULL)
1433 continue;
1434
1435 if (psymtab->user == NULL)
1436 recursively_write_psymbols (objfile, psymtab, &symtab,
1437 psyms_seen, i);
1438
1439 const auto insertpair = cu_index_htab.emplace (psymtab, i);
1440 gdb_assert (insertpair.second);
1441
1442 /* The all_comp_units list contains CUs read from the objfile as well as
1443 from the eventual dwz file. We need to place the entry in the
1444 corresponding index. */
1445 data_buf &cu_list = per_cu->is_dwz ? dwz_cu_list : objfile_cu_list;
1446 cu_list.append_uint (8, BFD_ENDIAN_LITTLE,
1447 to_underlying (per_cu->sect_off));
1448 cu_list.append_uint (8, BFD_ENDIAN_LITTLE, per_cu->length);
1449 }
1450
1451 /* Dump the address map. */
1452 data_buf addr_vec;
1453 write_address_map (objfile, addr_vec, cu_index_htab);
1454
1455 /* Write out the .debug_type entries, if any. */
1456 data_buf types_cu_list;
1457 if (dwarf2_per_objfile->signatured_types)
1458 {
1459 signatured_type_index_data sig_data (types_cu_list,
1460 psyms_seen);
1461
1462 sig_data.objfile = objfile;
1463 sig_data.symtab = &symtab;
1464 sig_data.cu_index = dwarf2_per_objfile->all_comp_units.size ();
1465 htab_traverse_noresize (dwarf2_per_objfile->signatured_types,
1466 write_one_signatured_type, &sig_data);
1467 }
1468
1469 /* Now that we've processed all symbols we can shrink their cu_indices
1470 lists. */
1471 uniquify_cu_indices (&symtab);
1472
1473 data_buf symtab_vec, constant_pool;
1474 write_hash_table (&symtab, symtab_vec, constant_pool);
1475
1476 write_gdbindex_1(out_file, objfile_cu_list, types_cu_list, addr_vec,
1477 symtab_vec, constant_pool);
1478
1479 if (dwz_out_file != NULL)
1480 write_gdbindex_1 (dwz_out_file, dwz_cu_list, {}, {}, {}, {});
1481 else
1482 gdb_assert (dwz_cu_list.empty ());
1483 }
1484
1485 /* DWARF-5 augmentation string for GDB's DW_IDX_GNU_* extension. */
1486 static const gdb_byte dwarf5_gdb_augmentation[] = { 'G', 'D', 'B', 0 };
1487
1488 /* Write a new .debug_names section for OBJFILE into OUT_FILE, write
1489 needed addition to .debug_str section to OUT_FILE_STR. Return how
1490 many bytes were expected to be written into OUT_FILE. */
1491
1492 static void
1493 write_debug_names (struct dwarf2_per_objfile *dwarf2_per_objfile,
1494 FILE *out_file, FILE *out_file_str)
1495 {
1496 const bool dwarf5_is_dwarf64 = check_dwarf64_offsets (dwarf2_per_objfile);
1497 struct objfile *objfile = dwarf2_per_objfile->objfile;
1498 const enum bfd_endian dwarf5_byte_order
1499 = gdbarch_byte_order (get_objfile_arch (objfile));
1500
1501 /* The CU list is already sorted, so we don't need to do additional
1502 work here. Also, the debug_types entries do not appear in
1503 all_comp_units, but only in their own hash table. */
1504 data_buf cu_list;
1505 debug_names nametable (dwarf2_per_objfile, dwarf5_is_dwarf64,
1506 dwarf5_byte_order);
1507 std::unordered_set<partial_symbol *>
1508 psyms_seen (psyms_seen_size (dwarf2_per_objfile));
1509 for (int i = 0; i < dwarf2_per_objfile->all_comp_units.size (); ++i)
1510 {
1511 const dwarf2_per_cu_data *per_cu = dwarf2_per_objfile->all_comp_units[i];
1512 dwarf2_psymtab *psymtab = per_cu->v.psymtab;
1513
1514 /* CU of a shared file from 'dwz -m' may be unused by this main
1515 file. It may be referenced from a local scope but in such
1516 case it does not need to be present in .debug_names. */
1517 if (psymtab == NULL)
1518 continue;
1519
1520 if (psymtab->user == NULL)
1521 nametable.recursively_write_psymbols (objfile, psymtab, psyms_seen, i);
1522
1523 cu_list.append_uint (nametable.dwarf5_offset_size (), dwarf5_byte_order,
1524 to_underlying (per_cu->sect_off));
1525 }
1526
1527 /* Write out the .debug_type entries, if any. */
1528 data_buf types_cu_list;
1529 if (dwarf2_per_objfile->signatured_types)
1530 {
1531 debug_names::write_one_signatured_type_data sig_data (nametable,
1532 signatured_type_index_data (types_cu_list, psyms_seen));
1533
1534 sig_data.info.objfile = objfile;
1535 /* It is used only for gdb_index. */
1536 sig_data.info.symtab = nullptr;
1537 sig_data.info.cu_index = 0;
1538 htab_traverse_noresize (dwarf2_per_objfile->signatured_types,
1539 debug_names::write_one_signatured_type,
1540 &sig_data);
1541 }
1542
1543 nametable.build ();
1544
1545 /* No addr_vec - DWARF-5 uses .debug_aranges generated by GCC. */
1546
1547 const offset_type bytes_of_header
1548 = ((dwarf5_is_dwarf64 ? 12 : 4)
1549 + 2 + 2 + 7 * 4
1550 + sizeof (dwarf5_gdb_augmentation));
1551 size_t expected_bytes = 0;
1552 expected_bytes += bytes_of_header;
1553 expected_bytes += cu_list.size ();
1554 expected_bytes += types_cu_list.size ();
1555 expected_bytes += nametable.bytes ();
1556 data_buf header;
1557
1558 if (!dwarf5_is_dwarf64)
1559 {
1560 const uint64_t size64 = expected_bytes - 4;
1561 gdb_assert (size64 < 0xfffffff0);
1562 header.append_uint (4, dwarf5_byte_order, size64);
1563 }
1564 else
1565 {
1566 header.append_uint (4, dwarf5_byte_order, 0xffffffff);
1567 header.append_uint (8, dwarf5_byte_order, expected_bytes - 12);
1568 }
1569
1570 /* The version number. */
1571 header.append_uint (2, dwarf5_byte_order, 5);
1572
1573 /* Padding. */
1574 header.append_uint (2, dwarf5_byte_order, 0);
1575
1576 /* comp_unit_count - The number of CUs in the CU list. */
1577 header.append_uint (4, dwarf5_byte_order,
1578 dwarf2_per_objfile->all_comp_units.size ());
1579
1580 /* local_type_unit_count - The number of TUs in the local TU
1581 list. */
1582 header.append_uint (4, dwarf5_byte_order,
1583 dwarf2_per_objfile->all_type_units.size ());
1584
1585 /* foreign_type_unit_count - The number of TUs in the foreign TU
1586 list. */
1587 header.append_uint (4, dwarf5_byte_order, 0);
1588
1589 /* bucket_count - The number of hash buckets in the hash lookup
1590 table. */
1591 header.append_uint (4, dwarf5_byte_order, nametable.bucket_count ());
1592
1593 /* name_count - The number of unique names in the index. */
1594 header.append_uint (4, dwarf5_byte_order, nametable.name_count ());
1595
1596 /* abbrev_table_size - The size in bytes of the abbreviations
1597 table. */
1598 header.append_uint (4, dwarf5_byte_order, nametable.abbrev_table_bytes ());
1599
1600 /* augmentation_string_size - The size in bytes of the augmentation
1601 string. This value is rounded up to a multiple of 4. */
1602 static_assert (sizeof (dwarf5_gdb_augmentation) % 4 == 0, "");
1603 header.append_uint (4, dwarf5_byte_order, sizeof (dwarf5_gdb_augmentation));
1604 header.append_data (dwarf5_gdb_augmentation);
1605
1606 gdb_assert (header.size () == bytes_of_header);
1607
1608 header.file_write (out_file);
1609 cu_list.file_write (out_file);
1610 types_cu_list.file_write (out_file);
1611 nametable.file_write (out_file, out_file_str);
1612
1613 assert_file_size (out_file, expected_bytes);
1614 }
1615
1616 /* This represents an index file being written (work-in-progress).
1617
1618 The data is initially written to a temporary file. When the finalize method
1619 is called, the file is closed and moved to its final location.
1620
1621 On failure (if this object is being destroyed with having called finalize),
1622 the temporary file is closed and deleted. */
1623
1624 struct index_wip_file
1625 {
1626 index_wip_file (const char *dir, const char *basename,
1627 const char *suffix)
1628 {
1629 filename = (std::string (dir) + SLASH_STRING + basename
1630 + suffix);
1631
1632 filename_temp = make_temp_filename (filename);
1633
1634 scoped_fd out_file_fd (gdb_mkostemp_cloexec (filename_temp.data (),
1635 O_BINARY));
1636 if (out_file_fd.get () == -1)
1637 perror_with_name (("mkstemp"));
1638
1639 out_file = out_file_fd.to_file ("wb");
1640
1641 if (out_file == nullptr)
1642 error (_("Can't open `%s' for writing"), filename_temp.data ());
1643
1644 unlink_file.emplace (filename_temp.data ());
1645 }
1646
1647 void finalize ()
1648 {
1649 /* We want to keep the file. */
1650 unlink_file->keep ();
1651
1652 /* Close and move the str file in place. */
1653 unlink_file.reset ();
1654 if (rename (filename_temp.data (), filename.c_str ()) != 0)
1655 perror_with_name (("rename"));
1656 }
1657
1658 std::string filename;
1659 gdb::char_vector filename_temp;
1660
1661 /* Order matters here; we want FILE to be closed before
1662 FILENAME_TEMP is unlinked, because on MS-Windows one cannot
1663 delete a file that is still open. So, we wrap the unlinker in an
1664 optional and emplace it once we know the file name. */
1665 gdb::optional<gdb::unlinker> unlink_file;
1666
1667 gdb_file_up out_file;
1668 };
1669
1670 /* See dwarf-index-write.h. */
1671
1672 void
1673 write_psymtabs_to_index (struct dwarf2_per_objfile *dwarf2_per_objfile,
1674 const char *dir, const char *basename,
1675 const char *dwz_basename,
1676 dw_index_kind index_kind)
1677 {
1678 struct objfile *objfile = dwarf2_per_objfile->objfile;
1679
1680 if (dwarf2_per_objfile->using_index)
1681 error (_("Cannot use an index to create the index"));
1682
1683 if (dwarf2_per_objfile->types.size () > 1)
1684 error (_("Cannot make an index when the file has multiple .debug_types sections"));
1685
1686 if (!objfile->partial_symtabs->psymtabs
1687 || !objfile->partial_symtabs->psymtabs_addrmap)
1688 return;
1689
1690 struct stat st;
1691 if (stat (objfile_name (objfile), &st) < 0)
1692 perror_with_name (objfile_name (objfile));
1693
1694 const char *index_suffix = (index_kind == dw_index_kind::DEBUG_NAMES
1695 ? INDEX5_SUFFIX : INDEX4_SUFFIX);
1696
1697 index_wip_file objfile_index_wip (dir, basename, index_suffix);
1698 gdb::optional<index_wip_file> dwz_index_wip;
1699
1700 if (dwz_basename != NULL)
1701 dwz_index_wip.emplace (dir, dwz_basename, index_suffix);
1702
1703 if (index_kind == dw_index_kind::DEBUG_NAMES)
1704 {
1705 index_wip_file str_wip_file (dir, basename, DEBUG_STR_SUFFIX);
1706
1707 write_debug_names (dwarf2_per_objfile, objfile_index_wip.out_file.get (),
1708 str_wip_file.out_file.get ());
1709
1710 str_wip_file.finalize ();
1711 }
1712 else
1713 write_gdbindex (dwarf2_per_objfile, objfile_index_wip.out_file.get (),
1714 (dwz_index_wip.has_value ()
1715 ? dwz_index_wip->out_file.get () : NULL));
1716
1717 objfile_index_wip.finalize ();
1718
1719 if (dwz_index_wip.has_value ())
1720 dwz_index_wip->finalize ();
1721 }
1722
1723 /* Implementation of the `save gdb-index' command.
1724
1725 Note that the .gdb_index file format used by this command is
1726 documented in the GDB manual. Any changes here must be documented
1727 there. */
1728
1729 static void
1730 save_gdb_index_command (const char *arg, int from_tty)
1731 {
1732 const char dwarf5space[] = "-dwarf-5 ";
1733 dw_index_kind index_kind = dw_index_kind::GDB_INDEX;
1734
1735 if (!arg)
1736 arg = "";
1737
1738 arg = skip_spaces (arg);
1739 if (strncmp (arg, dwarf5space, strlen (dwarf5space)) == 0)
1740 {
1741 index_kind = dw_index_kind::DEBUG_NAMES;
1742 arg += strlen (dwarf5space);
1743 arg = skip_spaces (arg);
1744 }
1745
1746 if (!*arg)
1747 error (_("usage: save gdb-index [-dwarf-5] DIRECTORY"));
1748
1749 for (objfile *objfile : current_program_space->objfiles ())
1750 {
1751 struct stat st;
1752
1753 /* If the objfile does not correspond to an actual file, skip it. */
1754 if (stat (objfile_name (objfile), &st) < 0)
1755 continue;
1756
1757 struct dwarf2_per_objfile *dwarf2_per_objfile
1758 = get_dwarf2_per_objfile (objfile);
1759
1760 if (dwarf2_per_objfile != NULL)
1761 {
1762 try
1763 {
1764 const char *basename = lbasename (objfile_name (objfile));
1765 const dwz_file *dwz = dwarf2_get_dwz_file (dwarf2_per_objfile);
1766 const char *dwz_basename = NULL;
1767
1768 if (dwz != NULL)
1769 dwz_basename = lbasename (dwz->filename ());
1770
1771 write_psymtabs_to_index (dwarf2_per_objfile, arg, basename,
1772 dwz_basename, index_kind);
1773 }
1774 catch (const gdb_exception_error &except)
1775 {
1776 exception_fprintf (gdb_stderr, except,
1777 _("Error while writing index for `%s': "),
1778 objfile_name (objfile));
1779 }
1780 }
1781
1782 }
1783 }
1784
1785 void _initialize_dwarf_index_write ();
1786 void
1787 _initialize_dwarf_index_write ()
1788 {
1789 cmd_list_element *c = add_cmd ("gdb-index", class_files,
1790 save_gdb_index_command, _("\
1791 Save a gdb-index file.\n\
1792 Usage: save gdb-index [-dwarf-5] DIRECTORY\n\
1793 \n\
1794 No options create one file with .gdb-index extension for pre-DWARF-5\n\
1795 compatible .gdb_index section. With -dwarf-5 creates two files with\n\
1796 extension .debug_names and .debug_str for DWARF-5 .debug_names section."),
1797 &save_cmdlist);
1798 set_cmd_completer (c, filename_completer);
1799 }