[gdb] Fix more typos in comments
[deliverable/binutils-gdb.git] / gdb / dwarf-index-write.c
1 /* DWARF index writing support for GDB.
2
3 Copyright (C) 1994-2019 Free Software Foundation, Inc.
4
5 This file is part of GDB.
6
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
11
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with this program. If not, see <http://www.gnu.org/licenses/>. */
19
20 #include "defs.h"
21
22 #include "addrmap.h"
23 #include "cli/cli-decode.h"
24 #include "gdbsupport/byte-vector.h"
25 #include "gdbsupport/filestuff.h"
26 #include "gdbsupport/gdb_unlinker.h"
27 #include "gdbsupport/pathstuff.h"
28 #include "gdbsupport/scoped_fd.h"
29 #include "complaints.h"
30 #include "dwarf-index-common.h"
31 #include "dwarf2.h"
32 #include "dwarf2read.h"
33 #include "gdb/gdb-index.h"
34 #include "gdbcmd.h"
35 #include "objfiles.h"
36 #include "psympriv.h"
37 #include "ada-lang.h"
38
39 #include <algorithm>
40 #include <cmath>
41 #include <set>
42 #include <unordered_map>
43 #include <unordered_set>
44
45 /* Ensure only legit values are used. */
46 #define DW2_GDB_INDEX_SYMBOL_STATIC_SET_VALUE(cu_index, value) \
47 do { \
48 gdb_assert ((unsigned int) (value) <= 1); \
49 GDB_INDEX_SYMBOL_STATIC_SET_VALUE((cu_index), (value)); \
50 } while (0)
51
52 /* Ensure only legit values are used. */
53 #define DW2_GDB_INDEX_SYMBOL_KIND_SET_VALUE(cu_index, value) \
54 do { \
55 gdb_assert ((value) >= GDB_INDEX_SYMBOL_KIND_TYPE \
56 && (value) <= GDB_INDEX_SYMBOL_KIND_OTHER); \
57 GDB_INDEX_SYMBOL_KIND_SET_VALUE((cu_index), (value)); \
58 } while (0)
59
60 /* Ensure we don't use more than the allotted number of bits for the CU. */
61 #define DW2_GDB_INDEX_CU_SET_VALUE(cu_index, value) \
62 do { \
63 gdb_assert (((value) & ~GDB_INDEX_CU_MASK) == 0); \
64 GDB_INDEX_CU_SET_VALUE((cu_index), (value)); \
65 } while (0)
66
67 /* The "save gdb-index" command. */
68
69 /* Write SIZE bytes from the buffer pointed to by DATA to FILE, with
70 error checking. */
71
72 static void
73 file_write (FILE *file, const void *data, size_t size)
74 {
75 if (fwrite (data, 1, size, file) != size)
76 error (_("couldn't data write to file"));
77 }
78
79 /* Write the contents of VEC to FILE, with error checking. */
80
81 template<typename Elem, typename Alloc>
82 static void
83 file_write (FILE *file, const std::vector<Elem, Alloc> &vec)
84 {
85 if (!vec.empty ())
86 file_write (file, vec.data (), vec.size () * sizeof (vec[0]));
87 }
88
89 /* In-memory buffer to prepare data to be written later to a file. */
90 class data_buf
91 {
92 public:
93 /* Copy DATA to the end of the buffer. */
94 template<typename T>
95 void append_data (const T &data)
96 {
97 std::copy (reinterpret_cast<const gdb_byte *> (&data),
98 reinterpret_cast<const gdb_byte *> (&data + 1),
99 grow (sizeof (data)));
100 }
101
102 /* Copy CSTR (a zero-terminated string) to the end of buffer. The
103 terminating zero is appended too. */
104 void append_cstr0 (const char *cstr)
105 {
106 const size_t size = strlen (cstr) + 1;
107 std::copy (cstr, cstr + size, grow (size));
108 }
109
110 /* Store INPUT as ULEB128 to the end of buffer. */
111 void append_unsigned_leb128 (ULONGEST input)
112 {
113 for (;;)
114 {
115 gdb_byte output = input & 0x7f;
116 input >>= 7;
117 if (input)
118 output |= 0x80;
119 append_data (output);
120 if (input == 0)
121 break;
122 }
123 }
124
125 /* Accept a host-format integer in VAL and append it to the buffer
126 as a target-format integer which is LEN bytes long. */
127 void append_uint (size_t len, bfd_endian byte_order, ULONGEST val)
128 {
129 ::store_unsigned_integer (grow (len), len, byte_order, val);
130 }
131
132 /* Return the size of the buffer. */
133 size_t size () const
134 {
135 return m_vec.size ();
136 }
137
138 /* Return true iff the buffer is empty. */
139 bool empty () const
140 {
141 return m_vec.empty ();
142 }
143
144 /* Write the buffer to FILE. */
145 void file_write (FILE *file) const
146 {
147 ::file_write (file, m_vec);
148 }
149
150 private:
151 /* Grow SIZE bytes at the end of the buffer. Returns a pointer to
152 the start of the new block. */
153 gdb_byte *grow (size_t size)
154 {
155 m_vec.resize (m_vec.size () + size);
156 return &*(m_vec.end () - size);
157 }
158
159 gdb::byte_vector m_vec;
160 };
161
162 /* An entry in the symbol table. */
163 struct symtab_index_entry
164 {
165 /* The name of the symbol. */
166 const char *name;
167 /* The offset of the name in the constant pool. */
168 offset_type index_offset;
169 /* A sorted vector of the indices of all the CUs that hold an object
170 of this name. */
171 std::vector<offset_type> cu_indices;
172 };
173
174 /* The symbol table. This is a power-of-2-sized hash table. */
175 struct mapped_symtab
176 {
177 mapped_symtab ()
178 {
179 data.resize (1024);
180 }
181
182 offset_type n_elements = 0;
183 std::vector<symtab_index_entry> data;
184 };
185
186 /* Find a slot in SYMTAB for the symbol NAME. Returns a reference to
187 the slot.
188
189 Function is used only during write_hash_table so no index format backward
190 compatibility is needed. */
191
192 static symtab_index_entry &
193 find_slot (struct mapped_symtab *symtab, const char *name)
194 {
195 offset_type index, step, hash = mapped_index_string_hash (INT_MAX, name);
196
197 index = hash & (symtab->data.size () - 1);
198 step = ((hash * 17) & (symtab->data.size () - 1)) | 1;
199
200 for (;;)
201 {
202 if (symtab->data[index].name == NULL
203 || strcmp (name, symtab->data[index].name) == 0)
204 return symtab->data[index];
205 index = (index + step) & (symtab->data.size () - 1);
206 }
207 }
208
209 /* Expand SYMTAB's hash table. */
210
211 static void
212 hash_expand (struct mapped_symtab *symtab)
213 {
214 auto old_entries = std::move (symtab->data);
215
216 symtab->data.clear ();
217 symtab->data.resize (old_entries.size () * 2);
218
219 for (auto &it : old_entries)
220 if (it.name != NULL)
221 {
222 auto &ref = find_slot (symtab, it.name);
223 ref = std::move (it);
224 }
225 }
226
227 /* Add an entry to SYMTAB. NAME is the name of the symbol.
228 CU_INDEX is the index of the CU in which the symbol appears.
229 IS_STATIC is one if the symbol is static, otherwise zero (global). */
230
231 static void
232 add_index_entry (struct mapped_symtab *symtab, const char *name,
233 int is_static, gdb_index_symbol_kind kind,
234 offset_type cu_index)
235 {
236 offset_type cu_index_and_attrs;
237
238 ++symtab->n_elements;
239 if (4 * symtab->n_elements / 3 >= symtab->data.size ())
240 hash_expand (symtab);
241
242 symtab_index_entry &slot = find_slot (symtab, name);
243 if (slot.name == NULL)
244 {
245 slot.name = name;
246 /* index_offset is set later. */
247 }
248
249 cu_index_and_attrs = 0;
250 DW2_GDB_INDEX_CU_SET_VALUE (cu_index_and_attrs, cu_index);
251 DW2_GDB_INDEX_SYMBOL_STATIC_SET_VALUE (cu_index_and_attrs, is_static);
252 DW2_GDB_INDEX_SYMBOL_KIND_SET_VALUE (cu_index_and_attrs, kind);
253
254 /* We don't want to record an index value twice as we want to avoid the
255 duplication.
256 We process all global symbols and then all static symbols
257 (which would allow us to avoid the duplication by only having to check
258 the last entry pushed), but a symbol could have multiple kinds in one CU.
259 To keep things simple we don't worry about the duplication here and
260 sort and uniquify the list after we've processed all symbols. */
261 slot.cu_indices.push_back (cu_index_and_attrs);
262 }
263
264 /* Sort and remove duplicates of all symbols' cu_indices lists. */
265
266 static void
267 uniquify_cu_indices (struct mapped_symtab *symtab)
268 {
269 for (auto &entry : symtab->data)
270 {
271 if (entry.name != NULL && !entry.cu_indices.empty ())
272 {
273 auto &cu_indices = entry.cu_indices;
274 std::sort (cu_indices.begin (), cu_indices.end ());
275 auto from = std::unique (cu_indices.begin (), cu_indices.end ());
276 cu_indices.erase (from, cu_indices.end ());
277 }
278 }
279 }
280
281 /* A form of 'const char *' suitable for container keys. Only the
282 pointer is stored. The strings themselves are compared, not the
283 pointers. */
284 class c_str_view
285 {
286 public:
287 c_str_view (const char *cstr)
288 : m_cstr (cstr)
289 {}
290
291 bool operator== (const c_str_view &other) const
292 {
293 return strcmp (m_cstr, other.m_cstr) == 0;
294 }
295
296 /* Return the underlying C string. Note, the returned string is
297 only a reference with lifetime of this object. */
298 const char *c_str () const
299 {
300 return m_cstr;
301 }
302
303 private:
304 friend class c_str_view_hasher;
305 const char *const m_cstr;
306 };
307
308 /* A std::unordered_map::hasher for c_str_view that uses the right
309 hash function for strings in a mapped index. */
310 class c_str_view_hasher
311 {
312 public:
313 size_t operator () (const c_str_view &x) const
314 {
315 return mapped_index_string_hash (INT_MAX, x.m_cstr);
316 }
317 };
318
319 /* A std::unordered_map::hasher for std::vector<>. */
320 template<typename T>
321 class vector_hasher
322 {
323 public:
324 size_t operator () (const std::vector<T> &key) const
325 {
326 return iterative_hash (key.data (),
327 sizeof (key.front ()) * key.size (), 0);
328 }
329 };
330
331 /* Write the mapped hash table SYMTAB to the data buffer OUTPUT, with
332 constant pool entries going into the data buffer CPOOL. */
333
334 static void
335 write_hash_table (mapped_symtab *symtab, data_buf &output, data_buf &cpool)
336 {
337 {
338 /* Elements are sorted vectors of the indices of all the CUs that
339 hold an object of this name. */
340 std::unordered_map<std::vector<offset_type>, offset_type,
341 vector_hasher<offset_type>>
342 symbol_hash_table;
343
344 /* We add all the index vectors to the constant pool first, to
345 ensure alignment is ok. */
346 for (symtab_index_entry &entry : symtab->data)
347 {
348 if (entry.name == NULL)
349 continue;
350 gdb_assert (entry.index_offset == 0);
351
352 /* Finding before inserting is faster than always trying to
353 insert, because inserting always allocates a node, does the
354 lookup, and then destroys the new node if another node
355 already had the same key. C++17 try_emplace will avoid
356 this. */
357 const auto found
358 = symbol_hash_table.find (entry.cu_indices);
359 if (found != symbol_hash_table.end ())
360 {
361 entry.index_offset = found->second;
362 continue;
363 }
364
365 symbol_hash_table.emplace (entry.cu_indices, cpool.size ());
366 entry.index_offset = cpool.size ();
367 cpool.append_data (MAYBE_SWAP (entry.cu_indices.size ()));
368 for (const auto index : entry.cu_indices)
369 cpool.append_data (MAYBE_SWAP (index));
370 }
371 }
372
373 /* Now write out the hash table. */
374 std::unordered_map<c_str_view, offset_type, c_str_view_hasher> str_table;
375 for (const auto &entry : symtab->data)
376 {
377 offset_type str_off, vec_off;
378
379 if (entry.name != NULL)
380 {
381 const auto insertpair = str_table.emplace (entry.name, cpool.size ());
382 if (insertpair.second)
383 cpool.append_cstr0 (entry.name);
384 str_off = insertpair.first->second;
385 vec_off = entry.index_offset;
386 }
387 else
388 {
389 /* While 0 is a valid constant pool index, it is not valid
390 to have 0 for both offsets. */
391 str_off = 0;
392 vec_off = 0;
393 }
394
395 output.append_data (MAYBE_SWAP (str_off));
396 output.append_data (MAYBE_SWAP (vec_off));
397 }
398 }
399
400 typedef std::unordered_map<partial_symtab *, unsigned int> psym_index_map;
401
402 /* Helper struct for building the address table. */
403 struct addrmap_index_data
404 {
405 addrmap_index_data (data_buf &addr_vec_, psym_index_map &cu_index_htab_)
406 : addr_vec (addr_vec_), cu_index_htab (cu_index_htab_)
407 {}
408
409 struct objfile *objfile;
410 data_buf &addr_vec;
411 psym_index_map &cu_index_htab;
412
413 /* Non-zero if the previous_* fields are valid.
414 We can't write an entry until we see the next entry (since it is only then
415 that we know the end of the entry). */
416 int previous_valid;
417 /* Index of the CU in the table of all CUs in the index file. */
418 unsigned int previous_cu_index;
419 /* Start address of the CU. */
420 CORE_ADDR previous_cu_start;
421 };
422
423 /* Write an address entry to ADDR_VEC. */
424
425 static void
426 add_address_entry (struct objfile *objfile, data_buf &addr_vec,
427 CORE_ADDR start, CORE_ADDR end, unsigned int cu_index)
428 {
429 addr_vec.append_uint (8, BFD_ENDIAN_LITTLE, start);
430 addr_vec.append_uint (8, BFD_ENDIAN_LITTLE, end);
431 addr_vec.append_data (MAYBE_SWAP (cu_index));
432 }
433
434 /* Worker function for traversing an addrmap to build the address table. */
435
436 static int
437 add_address_entry_worker (void *datap, CORE_ADDR start_addr, void *obj)
438 {
439 struct addrmap_index_data *data = (struct addrmap_index_data *) datap;
440 struct partial_symtab *pst = (struct partial_symtab *) obj;
441
442 if (data->previous_valid)
443 add_address_entry (data->objfile, data->addr_vec,
444 data->previous_cu_start, start_addr,
445 data->previous_cu_index);
446
447 data->previous_cu_start = start_addr;
448 if (pst != NULL)
449 {
450 const auto it = data->cu_index_htab.find (pst);
451 gdb_assert (it != data->cu_index_htab.cend ());
452 data->previous_cu_index = it->second;
453 data->previous_valid = 1;
454 }
455 else
456 data->previous_valid = 0;
457
458 return 0;
459 }
460
461 /* Write OBJFILE's address map to ADDR_VEC.
462 CU_INDEX_HTAB is used to map addrmap entries to their CU indices
463 in the index file. */
464
465 static void
466 write_address_map (struct objfile *objfile, data_buf &addr_vec,
467 psym_index_map &cu_index_htab)
468 {
469 struct addrmap_index_data addrmap_index_data (addr_vec, cu_index_htab);
470
471 /* When writing the address table, we have to cope with the fact that
472 the addrmap iterator only provides the start of a region; we have to
473 wait until the next invocation to get the start of the next region. */
474
475 addrmap_index_data.objfile = objfile;
476 addrmap_index_data.previous_valid = 0;
477
478 addrmap_foreach (objfile->partial_symtabs->psymtabs_addrmap,
479 add_address_entry_worker, &addrmap_index_data);
480
481 /* It's highly unlikely the last entry (end address = 0xff...ff)
482 is valid, but we should still handle it.
483 The end address is recorded as the start of the next region, but that
484 doesn't work here. To cope we pass 0xff...ff, this is a rare situation
485 anyway. */
486 if (addrmap_index_data.previous_valid)
487 add_address_entry (objfile, addr_vec,
488 addrmap_index_data.previous_cu_start, (CORE_ADDR) -1,
489 addrmap_index_data.previous_cu_index);
490 }
491
492 /* Return the symbol kind of PSYM. */
493
494 static gdb_index_symbol_kind
495 symbol_kind (struct partial_symbol *psym)
496 {
497 domain_enum domain = psym->domain;
498 enum address_class aclass = psym->aclass;
499
500 switch (domain)
501 {
502 case VAR_DOMAIN:
503 switch (aclass)
504 {
505 case LOC_BLOCK:
506 return GDB_INDEX_SYMBOL_KIND_FUNCTION;
507 case LOC_TYPEDEF:
508 return GDB_INDEX_SYMBOL_KIND_TYPE;
509 case LOC_COMPUTED:
510 case LOC_CONST_BYTES:
511 case LOC_OPTIMIZED_OUT:
512 case LOC_STATIC:
513 return GDB_INDEX_SYMBOL_KIND_VARIABLE;
514 case LOC_CONST:
515 /* Note: It's currently impossible to recognize psyms as enum values
516 short of reading the type info. For now punt. */
517 return GDB_INDEX_SYMBOL_KIND_VARIABLE;
518 default:
519 /* There are other LOC_FOO values that one might want to classify
520 as variables, but dwarf2read.c doesn't currently use them. */
521 return GDB_INDEX_SYMBOL_KIND_OTHER;
522 }
523 case STRUCT_DOMAIN:
524 return GDB_INDEX_SYMBOL_KIND_TYPE;
525 default:
526 return GDB_INDEX_SYMBOL_KIND_OTHER;
527 }
528 }
529
530 /* Add a list of partial symbols to SYMTAB. */
531
532 static void
533 write_psymbols (struct mapped_symtab *symtab,
534 std::unordered_set<partial_symbol *> &psyms_seen,
535 struct partial_symbol **psymp,
536 int count,
537 offset_type cu_index,
538 int is_static)
539 {
540 for (; count-- > 0; ++psymp)
541 {
542 struct partial_symbol *psym = *psymp;
543
544 if (psym->ginfo.language == language_ada)
545 error (_("Ada is not currently supported by the index; "
546 "use the DWARF 5 index instead"));
547
548 /* Only add a given psymbol once. */
549 if (psyms_seen.insert (psym).second)
550 {
551 gdb_index_symbol_kind kind = symbol_kind (psym);
552
553 add_index_entry (symtab, symbol_search_name (&psym->ginfo),
554 is_static, kind, cu_index);
555 }
556 }
557 }
558
559 /* A helper struct used when iterating over debug_types. */
560 struct signatured_type_index_data
561 {
562 signatured_type_index_data (data_buf &types_list_,
563 std::unordered_set<partial_symbol *> &psyms_seen_)
564 : types_list (types_list_), psyms_seen (psyms_seen_)
565 {}
566
567 struct objfile *objfile;
568 struct mapped_symtab *symtab;
569 data_buf &types_list;
570 std::unordered_set<partial_symbol *> &psyms_seen;
571 int cu_index;
572 };
573
574 /* A helper function that writes a single signatured_type to an
575 obstack. */
576
577 static int
578 write_one_signatured_type (void **slot, void *d)
579 {
580 struct signatured_type_index_data *info
581 = (struct signatured_type_index_data *) d;
582 struct signatured_type *entry = (struct signatured_type *) *slot;
583 struct partial_symtab *psymtab = entry->per_cu.v.psymtab;
584
585 write_psymbols (info->symtab,
586 info->psyms_seen,
587 (info->objfile->partial_symtabs->global_psymbols.data ()
588 + psymtab->globals_offset),
589 psymtab->n_global_syms, info->cu_index,
590 0);
591 write_psymbols (info->symtab,
592 info->psyms_seen,
593 (info->objfile->partial_symtabs->static_psymbols.data ()
594 + psymtab->statics_offset),
595 psymtab->n_static_syms, info->cu_index,
596 1);
597
598 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE,
599 to_underlying (entry->per_cu.sect_off));
600 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE,
601 to_underlying (entry->type_offset_in_tu));
602 info->types_list.append_uint (8, BFD_ENDIAN_LITTLE, entry->signature);
603
604 ++info->cu_index;
605
606 return 1;
607 }
608
609 /* Recurse into all "included" dependencies and count their symbols as
610 if they appeared in this psymtab. */
611
612 static void
613 recursively_count_psymbols (struct partial_symtab *psymtab,
614 size_t &psyms_seen)
615 {
616 for (int i = 0; i < psymtab->number_of_dependencies; ++i)
617 if (psymtab->dependencies[i]->user != NULL)
618 recursively_count_psymbols (psymtab->dependencies[i],
619 psyms_seen);
620
621 psyms_seen += psymtab->n_global_syms;
622 psyms_seen += psymtab->n_static_syms;
623 }
624
625 /* Recurse into all "included" dependencies and write their symbols as
626 if they appeared in this psymtab. */
627
628 static void
629 recursively_write_psymbols (struct objfile *objfile,
630 struct partial_symtab *psymtab,
631 struct mapped_symtab *symtab,
632 std::unordered_set<partial_symbol *> &psyms_seen,
633 offset_type cu_index)
634 {
635 int i;
636
637 for (i = 0; i < psymtab->number_of_dependencies; ++i)
638 if (psymtab->dependencies[i]->user != NULL)
639 recursively_write_psymbols (objfile, psymtab->dependencies[i],
640 symtab, psyms_seen, cu_index);
641
642 write_psymbols (symtab,
643 psyms_seen,
644 (objfile->partial_symtabs->global_psymbols.data ()
645 + psymtab->globals_offset),
646 psymtab->n_global_syms, cu_index,
647 0);
648 write_psymbols (symtab,
649 psyms_seen,
650 (objfile->partial_symtabs->static_psymbols.data ()
651 + psymtab->statics_offset),
652 psymtab->n_static_syms, cu_index,
653 1);
654 }
655
656 /* DWARF-5 .debug_names builder. */
657 class debug_names
658 {
659 public:
660 debug_names (struct dwarf2_per_objfile *dwarf2_per_objfile, bool is_dwarf64,
661 bfd_endian dwarf5_byte_order)
662 : m_dwarf5_byte_order (dwarf5_byte_order),
663 m_dwarf32 (dwarf5_byte_order),
664 m_dwarf64 (dwarf5_byte_order),
665 m_dwarf (is_dwarf64
666 ? static_cast<dwarf &> (m_dwarf64)
667 : static_cast<dwarf &> (m_dwarf32)),
668 m_name_table_string_offs (m_dwarf.name_table_string_offs),
669 m_name_table_entry_offs (m_dwarf.name_table_entry_offs),
670 m_debugstrlookup (dwarf2_per_objfile)
671 {}
672
673 int dwarf5_offset_size () const
674 {
675 const bool dwarf5_is_dwarf64 = &m_dwarf == &m_dwarf64;
676 return dwarf5_is_dwarf64 ? 8 : 4;
677 }
678
679 /* Is this symbol from DW_TAG_compile_unit or DW_TAG_type_unit? */
680 enum class unit_kind { cu, tu };
681
682 /* Insert one symbol. */
683 void insert (const partial_symbol *psym, int cu_index, bool is_static,
684 unit_kind kind)
685 {
686 const int dwarf_tag = psymbol_tag (psym);
687 if (dwarf_tag == 0)
688 return;
689 const char *name = symbol_search_name (&psym->ginfo);
690
691 if (psym->ginfo.language == language_ada)
692 {
693 /* We want to ensure that the Ada main function's name appears
694 verbatim in the index. However, this name will be of the
695 form "_ada_mumble", and will be rewritten by ada_decode.
696 So, recognize it specially here and add it to the index by
697 hand. */
698 if (strcmp (main_name (), name) == 0)
699 {
700 const auto insertpair
701 = m_name_to_value_set.emplace (c_str_view (name),
702 std::set<symbol_value> ());
703 std::set<symbol_value> &value_set = insertpair.first->second;
704 value_set.emplace (symbol_value (dwarf_tag, cu_index, is_static,
705 kind));
706 }
707
708 /* In order for the index to work when read back into gdb, it
709 has to supply a funny form of the name: it should be the
710 encoded name, with any suffixes stripped. Using the
711 ordinary encoded name will not work properly with the
712 searching logic in find_name_components_bounds; nor will
713 using the decoded name. Furthermore, an Ada "verbatim"
714 name (of the form "<MumBle>") must be entered without the
715 angle brackets. Note that the current index is unusual,
716 see PR symtab/24820 for details. */
717 std::string decoded = ada_decode (name);
718 if (decoded[0] == '<')
719 name = (char *) obstack_copy0 (&m_string_obstack,
720 decoded.c_str () + 1,
721 decoded.length () - 2);
722 else
723 name = obstack_strdup (&m_string_obstack,
724 ada_encode (decoded.c_str ()));
725 }
726
727 const auto insertpair
728 = m_name_to_value_set.emplace (c_str_view (name),
729 std::set<symbol_value> ());
730 std::set<symbol_value> &value_set = insertpair.first->second;
731 value_set.emplace (symbol_value (dwarf_tag, cu_index, is_static, kind));
732 }
733
734 /* Build all the tables. All symbols must be already inserted.
735 This function does not call file_write, caller has to do it
736 afterwards. */
737 void build ()
738 {
739 /* Verify the build method has not be called twice. */
740 gdb_assert (m_abbrev_table.empty ());
741 const size_t name_count = m_name_to_value_set.size ();
742 m_bucket_table.resize
743 (std::pow (2, std::ceil (std::log2 (name_count * 4 / 3))));
744 m_hash_table.reserve (name_count);
745 m_name_table_string_offs.reserve (name_count);
746 m_name_table_entry_offs.reserve (name_count);
747
748 /* Map each hash of symbol to its name and value. */
749 struct hash_it_pair
750 {
751 uint32_t hash;
752 decltype (m_name_to_value_set)::const_iterator it;
753 };
754 std::vector<std::forward_list<hash_it_pair>> bucket_hash;
755 bucket_hash.resize (m_bucket_table.size ());
756 for (decltype (m_name_to_value_set)::const_iterator it
757 = m_name_to_value_set.cbegin ();
758 it != m_name_to_value_set.cend ();
759 ++it)
760 {
761 const char *const name = it->first.c_str ();
762 const uint32_t hash = dwarf5_djb_hash (name);
763 hash_it_pair hashitpair;
764 hashitpair.hash = hash;
765 hashitpair.it = it;
766 auto &slot = bucket_hash[hash % bucket_hash.size()];
767 slot.push_front (std::move (hashitpair));
768 }
769 for (size_t bucket_ix = 0; bucket_ix < bucket_hash.size (); ++bucket_ix)
770 {
771 const std::forward_list<hash_it_pair> &hashitlist
772 = bucket_hash[bucket_ix];
773 if (hashitlist.empty ())
774 continue;
775 uint32_t &bucket_slot = m_bucket_table[bucket_ix];
776 /* The hashes array is indexed starting at 1. */
777 store_unsigned_integer (reinterpret_cast<gdb_byte *> (&bucket_slot),
778 sizeof (bucket_slot), m_dwarf5_byte_order,
779 m_hash_table.size () + 1);
780 for (const hash_it_pair &hashitpair : hashitlist)
781 {
782 m_hash_table.push_back (0);
783 store_unsigned_integer (reinterpret_cast<gdb_byte *>
784 (&m_hash_table.back ()),
785 sizeof (m_hash_table.back ()),
786 m_dwarf5_byte_order, hashitpair.hash);
787 const c_str_view &name = hashitpair.it->first;
788 const std::set<symbol_value> &value_set = hashitpair.it->second;
789 m_name_table_string_offs.push_back_reorder
790 (m_debugstrlookup.lookup (name.c_str ()));
791 m_name_table_entry_offs.push_back_reorder (m_entry_pool.size ());
792 gdb_assert (!value_set.empty ());
793 for (const symbol_value &value : value_set)
794 {
795 int &idx = m_indexkey_to_idx[index_key (value.dwarf_tag,
796 value.is_static,
797 value.kind)];
798 if (idx == 0)
799 {
800 idx = m_idx_next++;
801 m_abbrev_table.append_unsigned_leb128 (idx);
802 m_abbrev_table.append_unsigned_leb128 (value.dwarf_tag);
803 m_abbrev_table.append_unsigned_leb128
804 (value.kind == unit_kind::cu ? DW_IDX_compile_unit
805 : DW_IDX_type_unit);
806 m_abbrev_table.append_unsigned_leb128 (DW_FORM_udata);
807 m_abbrev_table.append_unsigned_leb128 (value.is_static
808 ? DW_IDX_GNU_internal
809 : DW_IDX_GNU_external);
810 m_abbrev_table.append_unsigned_leb128 (DW_FORM_flag_present);
811
812 /* Terminate attributes list. */
813 m_abbrev_table.append_unsigned_leb128 (0);
814 m_abbrev_table.append_unsigned_leb128 (0);
815 }
816
817 m_entry_pool.append_unsigned_leb128 (idx);
818 m_entry_pool.append_unsigned_leb128 (value.cu_index);
819 }
820
821 /* Terminate the list of CUs. */
822 m_entry_pool.append_unsigned_leb128 (0);
823 }
824 }
825 gdb_assert (m_hash_table.size () == name_count);
826
827 /* Terminate tags list. */
828 m_abbrev_table.append_unsigned_leb128 (0);
829 }
830
831 /* Return .debug_names bucket count. This must be called only after
832 calling the build method. */
833 uint32_t bucket_count () const
834 {
835 /* Verify the build method has been already called. */
836 gdb_assert (!m_abbrev_table.empty ());
837 const uint32_t retval = m_bucket_table.size ();
838
839 /* Check for overflow. */
840 gdb_assert (retval == m_bucket_table.size ());
841 return retval;
842 }
843
844 /* Return .debug_names names count. This must be called only after
845 calling the build method. */
846 uint32_t name_count () const
847 {
848 /* Verify the build method has been already called. */
849 gdb_assert (!m_abbrev_table.empty ());
850 const uint32_t retval = m_hash_table.size ();
851
852 /* Check for overflow. */
853 gdb_assert (retval == m_hash_table.size ());
854 return retval;
855 }
856
857 /* Return number of bytes of .debug_names abbreviation table. This
858 must be called only after calling the build method. */
859 uint32_t abbrev_table_bytes () const
860 {
861 gdb_assert (!m_abbrev_table.empty ());
862 return m_abbrev_table.size ();
863 }
864
865 /* Recurse into all "included" dependencies and store their symbols
866 as if they appeared in this psymtab. */
867 void recursively_write_psymbols
868 (struct objfile *objfile,
869 struct partial_symtab *psymtab,
870 std::unordered_set<partial_symbol *> &psyms_seen,
871 int cu_index)
872 {
873 for (int i = 0; i < psymtab->number_of_dependencies; ++i)
874 if (psymtab->dependencies[i]->user != NULL)
875 recursively_write_psymbols (objfile, psymtab->dependencies[i],
876 psyms_seen, cu_index);
877
878 write_psymbols (psyms_seen,
879 (objfile->partial_symtabs->global_psymbols.data ()
880 + psymtab->globals_offset),
881 psymtab->n_global_syms, cu_index, false, unit_kind::cu);
882 write_psymbols (psyms_seen,
883 (objfile->partial_symtabs->static_psymbols.data ()
884 + psymtab->statics_offset),
885 psymtab->n_static_syms, cu_index, true, unit_kind::cu);
886 }
887
888 /* Return number of bytes the .debug_names section will have. This
889 must be called only after calling the build method. */
890 size_t bytes () const
891 {
892 /* Verify the build method has been already called. */
893 gdb_assert (!m_abbrev_table.empty ());
894 size_t expected_bytes = 0;
895 expected_bytes += m_bucket_table.size () * sizeof (m_bucket_table[0]);
896 expected_bytes += m_hash_table.size () * sizeof (m_hash_table[0]);
897 expected_bytes += m_name_table_string_offs.bytes ();
898 expected_bytes += m_name_table_entry_offs.bytes ();
899 expected_bytes += m_abbrev_table.size ();
900 expected_bytes += m_entry_pool.size ();
901 return expected_bytes;
902 }
903
904 /* Write .debug_names to FILE_NAMES and .debug_str addition to
905 FILE_STR. This must be called only after calling the build
906 method. */
907 void file_write (FILE *file_names, FILE *file_str) const
908 {
909 /* Verify the build method has been already called. */
910 gdb_assert (!m_abbrev_table.empty ());
911 ::file_write (file_names, m_bucket_table);
912 ::file_write (file_names, m_hash_table);
913 m_name_table_string_offs.file_write (file_names);
914 m_name_table_entry_offs.file_write (file_names);
915 m_abbrev_table.file_write (file_names);
916 m_entry_pool.file_write (file_names);
917 m_debugstrlookup.file_write (file_str);
918 }
919
920 /* A helper user data for write_one_signatured_type. */
921 class write_one_signatured_type_data
922 {
923 public:
924 write_one_signatured_type_data (debug_names &nametable_,
925 signatured_type_index_data &&info_)
926 : nametable (nametable_), info (std::move (info_))
927 {}
928 debug_names &nametable;
929 struct signatured_type_index_data info;
930 };
931
932 /* A helper function to pass write_one_signatured_type to
933 htab_traverse_noresize. */
934 static int
935 write_one_signatured_type (void **slot, void *d)
936 {
937 write_one_signatured_type_data *data = (write_one_signatured_type_data *) d;
938 struct signatured_type_index_data *info = &data->info;
939 struct signatured_type *entry = (struct signatured_type *) *slot;
940
941 data->nametable.write_one_signatured_type (entry, info);
942
943 return 1;
944 }
945
946 private:
947
948 /* Storage for symbol names mapping them to their .debug_str section
949 offsets. */
950 class debug_str_lookup
951 {
952 public:
953
954 /* Object costructor to be called for current DWARF2_PER_OBJFILE.
955 All .debug_str section strings are automatically stored. */
956 debug_str_lookup (struct dwarf2_per_objfile *dwarf2_per_objfile)
957 : m_abfd (dwarf2_per_objfile->objfile->obfd),
958 m_dwarf2_per_objfile (dwarf2_per_objfile)
959 {
960 dwarf2_read_section (dwarf2_per_objfile->objfile,
961 &dwarf2_per_objfile->str);
962 if (dwarf2_per_objfile->str.buffer == NULL)
963 return;
964 for (const gdb_byte *data = dwarf2_per_objfile->str.buffer;
965 data < (dwarf2_per_objfile->str.buffer
966 + dwarf2_per_objfile->str.size);)
967 {
968 const char *const s = reinterpret_cast<const char *> (data);
969 const auto insertpair
970 = m_str_table.emplace (c_str_view (s),
971 data - dwarf2_per_objfile->str.buffer);
972 if (!insertpair.second)
973 complaint (_("Duplicate string \"%s\" in "
974 ".debug_str section [in module %s]"),
975 s, bfd_get_filename (m_abfd));
976 data += strlen (s) + 1;
977 }
978 }
979
980 /* Return offset of symbol name S in the .debug_str section. Add
981 such symbol to the section's end if it does not exist there
982 yet. */
983 size_t lookup (const char *s)
984 {
985 const auto it = m_str_table.find (c_str_view (s));
986 if (it != m_str_table.end ())
987 return it->second;
988 const size_t offset = (m_dwarf2_per_objfile->str.size
989 + m_str_add_buf.size ());
990 m_str_table.emplace (c_str_view (s), offset);
991 m_str_add_buf.append_cstr0 (s);
992 return offset;
993 }
994
995 /* Append the end of the .debug_str section to FILE. */
996 void file_write (FILE *file) const
997 {
998 m_str_add_buf.file_write (file);
999 }
1000
1001 private:
1002 std::unordered_map<c_str_view, size_t, c_str_view_hasher> m_str_table;
1003 bfd *const m_abfd;
1004 struct dwarf2_per_objfile *m_dwarf2_per_objfile;
1005
1006 /* Data to add at the end of .debug_str for new needed symbol names. */
1007 data_buf m_str_add_buf;
1008 };
1009
1010 /* Container to map used DWARF tags to their .debug_names abbreviation
1011 tags. */
1012 class index_key
1013 {
1014 public:
1015 index_key (int dwarf_tag_, bool is_static_, unit_kind kind_)
1016 : dwarf_tag (dwarf_tag_), is_static (is_static_), kind (kind_)
1017 {
1018 }
1019
1020 bool
1021 operator== (const index_key &other) const
1022 {
1023 return (dwarf_tag == other.dwarf_tag && is_static == other.is_static
1024 && kind == other.kind);
1025 }
1026
1027 const int dwarf_tag;
1028 const bool is_static;
1029 const unit_kind kind;
1030 };
1031
1032 /* Provide std::unordered_map::hasher for index_key. */
1033 class index_key_hasher
1034 {
1035 public:
1036 size_t
1037 operator () (const index_key &key) const
1038 {
1039 return (std::hash<int>() (key.dwarf_tag) << 1) | key.is_static;
1040 }
1041 };
1042
1043 /* Parameters of one symbol entry. */
1044 class symbol_value
1045 {
1046 public:
1047 const int dwarf_tag, cu_index;
1048 const bool is_static;
1049 const unit_kind kind;
1050
1051 symbol_value (int dwarf_tag_, int cu_index_, bool is_static_,
1052 unit_kind kind_)
1053 : dwarf_tag (dwarf_tag_), cu_index (cu_index_), is_static (is_static_),
1054 kind (kind_)
1055 {}
1056
1057 bool
1058 operator< (const symbol_value &other) const
1059 {
1060 #define X(n) \
1061 do \
1062 { \
1063 if (n < other.n) \
1064 return true; \
1065 if (n > other.n) \
1066 return false; \
1067 } \
1068 while (0)
1069 X (dwarf_tag);
1070 X (is_static);
1071 X (kind);
1072 X (cu_index);
1073 #undef X
1074 return false;
1075 }
1076 };
1077
1078 /* Abstract base class to unify DWARF-32 and DWARF-64 name table
1079 output. */
1080 class offset_vec
1081 {
1082 protected:
1083 const bfd_endian dwarf5_byte_order;
1084 public:
1085 explicit offset_vec (bfd_endian dwarf5_byte_order_)
1086 : dwarf5_byte_order (dwarf5_byte_order_)
1087 {}
1088
1089 /* Call std::vector::reserve for NELEM elements. */
1090 virtual void reserve (size_t nelem) = 0;
1091
1092 /* Call std::vector::push_back with store_unsigned_integer byte
1093 reordering for ELEM. */
1094 virtual void push_back_reorder (size_t elem) = 0;
1095
1096 /* Return expected output size in bytes. */
1097 virtual size_t bytes () const = 0;
1098
1099 /* Write name table to FILE. */
1100 virtual void file_write (FILE *file) const = 0;
1101 };
1102
1103 /* Template to unify DWARF-32 and DWARF-64 output. */
1104 template<typename OffsetSize>
1105 class offset_vec_tmpl : public offset_vec
1106 {
1107 public:
1108 explicit offset_vec_tmpl (bfd_endian dwarf5_byte_order_)
1109 : offset_vec (dwarf5_byte_order_)
1110 {}
1111
1112 /* Implement offset_vec::reserve. */
1113 void reserve (size_t nelem) override
1114 {
1115 m_vec.reserve (nelem);
1116 }
1117
1118 /* Implement offset_vec::push_back_reorder. */
1119 void push_back_reorder (size_t elem) override
1120 {
1121 m_vec.push_back (elem);
1122 /* Check for overflow. */
1123 gdb_assert (m_vec.back () == elem);
1124 store_unsigned_integer (reinterpret_cast<gdb_byte *> (&m_vec.back ()),
1125 sizeof (m_vec.back ()), dwarf5_byte_order, elem);
1126 }
1127
1128 /* Implement offset_vec::bytes. */
1129 size_t bytes () const override
1130 {
1131 return m_vec.size () * sizeof (m_vec[0]);
1132 }
1133
1134 /* Implement offset_vec::file_write. */
1135 void file_write (FILE *file) const override
1136 {
1137 ::file_write (file, m_vec);
1138 }
1139
1140 private:
1141 std::vector<OffsetSize> m_vec;
1142 };
1143
1144 /* Base class to unify DWARF-32 and DWARF-64 .debug_names output
1145 respecting name table width. */
1146 class dwarf
1147 {
1148 public:
1149 offset_vec &name_table_string_offs, &name_table_entry_offs;
1150
1151 dwarf (offset_vec &name_table_string_offs_,
1152 offset_vec &name_table_entry_offs_)
1153 : name_table_string_offs (name_table_string_offs_),
1154 name_table_entry_offs (name_table_entry_offs_)
1155 {
1156 }
1157 };
1158
1159 /* Template to unify DWARF-32 and DWARF-64 .debug_names output
1160 respecting name table width. */
1161 template<typename OffsetSize>
1162 class dwarf_tmpl : public dwarf
1163 {
1164 public:
1165 explicit dwarf_tmpl (bfd_endian dwarf5_byte_order_)
1166 : dwarf (m_name_table_string_offs, m_name_table_entry_offs),
1167 m_name_table_string_offs (dwarf5_byte_order_),
1168 m_name_table_entry_offs (dwarf5_byte_order_)
1169 {}
1170
1171 private:
1172 offset_vec_tmpl<OffsetSize> m_name_table_string_offs;
1173 offset_vec_tmpl<OffsetSize> m_name_table_entry_offs;
1174 };
1175
1176 /* Try to reconstruct original DWARF tag for given partial_symbol.
1177 This function is not DWARF-5 compliant but it is sufficient for
1178 GDB as a DWARF-5 index consumer. */
1179 static int psymbol_tag (const struct partial_symbol *psym)
1180 {
1181 domain_enum domain = psym->domain;
1182 enum address_class aclass = psym->aclass;
1183
1184 switch (domain)
1185 {
1186 case VAR_DOMAIN:
1187 switch (aclass)
1188 {
1189 case LOC_BLOCK:
1190 return DW_TAG_subprogram;
1191 case LOC_TYPEDEF:
1192 return DW_TAG_typedef;
1193 case LOC_COMPUTED:
1194 case LOC_CONST_BYTES:
1195 case LOC_OPTIMIZED_OUT:
1196 case LOC_STATIC:
1197 return DW_TAG_variable;
1198 case LOC_CONST:
1199 /* Note: It's currently impossible to recognize psyms as enum values
1200 short of reading the type info. For now punt. */
1201 return DW_TAG_variable;
1202 default:
1203 /* There are other LOC_FOO values that one might want to classify
1204 as variables, but dwarf2read.c doesn't currently use them. */
1205 return DW_TAG_variable;
1206 }
1207 case STRUCT_DOMAIN:
1208 return DW_TAG_structure_type;
1209 default:
1210 return 0;
1211 }
1212 }
1213
1214 /* Call insert for all partial symbols and mark them in PSYMS_SEEN. */
1215 void write_psymbols (std::unordered_set<partial_symbol *> &psyms_seen,
1216 struct partial_symbol **psymp, int count, int cu_index,
1217 bool is_static, unit_kind kind)
1218 {
1219 for (; count-- > 0; ++psymp)
1220 {
1221 struct partial_symbol *psym = *psymp;
1222
1223 /* Only add a given psymbol once. */
1224 if (psyms_seen.insert (psym).second)
1225 insert (psym, cu_index, is_static, kind);
1226 }
1227 }
1228
1229 /* A helper function that writes a single signatured_type
1230 to a debug_names. */
1231 void
1232 write_one_signatured_type (struct signatured_type *entry,
1233 struct signatured_type_index_data *info)
1234 {
1235 struct partial_symtab *psymtab = entry->per_cu.v.psymtab;
1236
1237 write_psymbols (info->psyms_seen,
1238 (info->objfile->partial_symtabs->global_psymbols.data ()
1239 + psymtab->globals_offset),
1240 psymtab->n_global_syms, info->cu_index, false,
1241 unit_kind::tu);
1242 write_psymbols (info->psyms_seen,
1243 (info->objfile->partial_symtabs->static_psymbols.data ()
1244 + psymtab->statics_offset),
1245 psymtab->n_static_syms, info->cu_index, true,
1246 unit_kind::tu);
1247
1248 info->types_list.append_uint (dwarf5_offset_size (), m_dwarf5_byte_order,
1249 to_underlying (entry->per_cu.sect_off));
1250
1251 ++info->cu_index;
1252 }
1253
1254 /* Store value of each symbol. */
1255 std::unordered_map<c_str_view, std::set<symbol_value>, c_str_view_hasher>
1256 m_name_to_value_set;
1257
1258 /* Tables of DWARF-5 .debug_names. They are in object file byte
1259 order. */
1260 std::vector<uint32_t> m_bucket_table;
1261 std::vector<uint32_t> m_hash_table;
1262
1263 const bfd_endian m_dwarf5_byte_order;
1264 dwarf_tmpl<uint32_t> m_dwarf32;
1265 dwarf_tmpl<uint64_t> m_dwarf64;
1266 dwarf &m_dwarf;
1267 offset_vec &m_name_table_string_offs, &m_name_table_entry_offs;
1268 debug_str_lookup m_debugstrlookup;
1269
1270 /* Map each used .debug_names abbreviation tag parameter to its
1271 index value. */
1272 std::unordered_map<index_key, int, index_key_hasher> m_indexkey_to_idx;
1273
1274 /* Next unused .debug_names abbreviation tag for
1275 m_indexkey_to_idx. */
1276 int m_idx_next = 1;
1277
1278 /* .debug_names abbreviation table. */
1279 data_buf m_abbrev_table;
1280
1281 /* .debug_names entry pool. */
1282 data_buf m_entry_pool;
1283
1284 /* Temporary storage for Ada names. */
1285 auto_obstack m_string_obstack;
1286 };
1287
1288 /* Return iff any of the needed offsets does not fit into 32-bit
1289 .debug_names section. */
1290
1291 static bool
1292 check_dwarf64_offsets (struct dwarf2_per_objfile *dwarf2_per_objfile)
1293 {
1294 for (dwarf2_per_cu_data *per_cu : dwarf2_per_objfile->all_comp_units)
1295 {
1296 if (to_underlying (per_cu->sect_off) >= (static_cast<uint64_t> (1) << 32))
1297 return true;
1298 }
1299 for (const signatured_type *sigtype : dwarf2_per_objfile->all_type_units)
1300 {
1301 const dwarf2_per_cu_data &per_cu = sigtype->per_cu;
1302
1303 if (to_underlying (per_cu.sect_off) >= (static_cast<uint64_t> (1) << 32))
1304 return true;
1305 }
1306 return false;
1307 }
1308
1309 /* The psyms_seen set is potentially going to be largish (~40k
1310 elements when indexing a -g3 build of GDB itself). Estimate the
1311 number of elements in order to avoid too many rehashes, which
1312 require rebuilding buckets and thus many trips to
1313 malloc/free. */
1314
1315 static size_t
1316 psyms_seen_size (struct dwarf2_per_objfile *dwarf2_per_objfile)
1317 {
1318 size_t psyms_count = 0;
1319 for (dwarf2_per_cu_data *per_cu : dwarf2_per_objfile->all_comp_units)
1320 {
1321 struct partial_symtab *psymtab = per_cu->v.psymtab;
1322
1323 if (psymtab != NULL && psymtab->user == NULL)
1324 recursively_count_psymbols (psymtab, psyms_count);
1325 }
1326 /* Generating an index for gdb itself shows a ratio of
1327 TOTAL_SEEN_SYMS/UNIQUE_SYMS or ~5. 4 seems like a good bet. */
1328 return psyms_count / 4;
1329 }
1330
1331 /* Assert that FILE's size is EXPECTED_SIZE. Assumes file's seek
1332 position is at the end of the file. */
1333
1334 static void
1335 assert_file_size (FILE *file, size_t expected_size)
1336 {
1337 const auto file_size = ftell (file);
1338 if (file_size == -1)
1339 perror_with_name (("ftell"));
1340 gdb_assert (file_size == expected_size);
1341 }
1342
1343 /* Write a gdb index file to OUT_FILE from all the sections passed as
1344 arguments. */
1345
1346 static void
1347 write_gdbindex_1 (FILE *out_file,
1348 const data_buf &cu_list,
1349 const data_buf &types_cu_list,
1350 const data_buf &addr_vec,
1351 const data_buf &symtab_vec,
1352 const data_buf &constant_pool)
1353 {
1354 data_buf contents;
1355 const offset_type size_of_header = 6 * sizeof (offset_type);
1356 offset_type total_len = size_of_header;
1357
1358 /* The version number. */
1359 contents.append_data (MAYBE_SWAP (8));
1360
1361 /* The offset of the CU list from the start of the file. */
1362 contents.append_data (MAYBE_SWAP (total_len));
1363 total_len += cu_list.size ();
1364
1365 /* The offset of the types CU list from the start of the file. */
1366 contents.append_data (MAYBE_SWAP (total_len));
1367 total_len += types_cu_list.size ();
1368
1369 /* The offset of the address table from the start of the file. */
1370 contents.append_data (MAYBE_SWAP (total_len));
1371 total_len += addr_vec.size ();
1372
1373 /* The offset of the symbol table from the start of the file. */
1374 contents.append_data (MAYBE_SWAP (total_len));
1375 total_len += symtab_vec.size ();
1376
1377 /* The offset of the constant pool from the start of the file. */
1378 contents.append_data (MAYBE_SWAP (total_len));
1379 total_len += constant_pool.size ();
1380
1381 gdb_assert (contents.size () == size_of_header);
1382
1383 contents.file_write (out_file);
1384 cu_list.file_write (out_file);
1385 types_cu_list.file_write (out_file);
1386 addr_vec.file_write (out_file);
1387 symtab_vec.file_write (out_file);
1388 constant_pool.file_write (out_file);
1389
1390 assert_file_size (out_file, total_len);
1391 }
1392
1393 /* Write contents of a .gdb_index section for OBJFILE into OUT_FILE.
1394 If OBJFILE has an associated dwz file, write contents of a .gdb_index
1395 section for that dwz file into DWZ_OUT_FILE. If OBJFILE does not have an
1396 associated dwz file, DWZ_OUT_FILE must be NULL. */
1397
1398 static void
1399 write_gdbindex (struct dwarf2_per_objfile *dwarf2_per_objfile, FILE *out_file,
1400 FILE *dwz_out_file)
1401 {
1402 struct objfile *objfile = dwarf2_per_objfile->objfile;
1403 mapped_symtab symtab;
1404 data_buf objfile_cu_list;
1405 data_buf dwz_cu_list;
1406
1407 /* While we're scanning CU's create a table that maps a psymtab pointer
1408 (which is what addrmap records) to its index (which is what is recorded
1409 in the index file). This will later be needed to write the address
1410 table. */
1411 psym_index_map cu_index_htab;
1412 cu_index_htab.reserve (dwarf2_per_objfile->all_comp_units.size ());
1413
1414 /* The CU list is already sorted, so we don't need to do additional
1415 work here. Also, the debug_types entries do not appear in
1416 all_comp_units, but only in their own hash table. */
1417
1418 std::unordered_set<partial_symbol *> psyms_seen
1419 (psyms_seen_size (dwarf2_per_objfile));
1420 for (int i = 0; i < dwarf2_per_objfile->all_comp_units.size (); ++i)
1421 {
1422 struct dwarf2_per_cu_data *per_cu
1423 = dwarf2_per_objfile->all_comp_units[i];
1424 struct partial_symtab *psymtab = per_cu->v.psymtab;
1425
1426 /* CU of a shared file from 'dwz -m' may be unused by this main file.
1427 It may be referenced from a local scope but in such case it does not
1428 need to be present in .gdb_index. */
1429 if (psymtab == NULL)
1430 continue;
1431
1432 if (psymtab->user == NULL)
1433 recursively_write_psymbols (objfile, psymtab, &symtab,
1434 psyms_seen, i);
1435
1436 const auto insertpair = cu_index_htab.emplace (psymtab, i);
1437 gdb_assert (insertpair.second);
1438
1439 /* The all_comp_units list contains CUs read from the objfile as well as
1440 from the eventual dwz file. We need to place the entry in the
1441 corresponding index. */
1442 data_buf &cu_list = per_cu->is_dwz ? dwz_cu_list : objfile_cu_list;
1443 cu_list.append_uint (8, BFD_ENDIAN_LITTLE,
1444 to_underlying (per_cu->sect_off));
1445 cu_list.append_uint (8, BFD_ENDIAN_LITTLE, per_cu->length);
1446 }
1447
1448 /* Dump the address map. */
1449 data_buf addr_vec;
1450 write_address_map (objfile, addr_vec, cu_index_htab);
1451
1452 /* Write out the .debug_type entries, if any. */
1453 data_buf types_cu_list;
1454 if (dwarf2_per_objfile->signatured_types)
1455 {
1456 signatured_type_index_data sig_data (types_cu_list,
1457 psyms_seen);
1458
1459 sig_data.objfile = objfile;
1460 sig_data.symtab = &symtab;
1461 sig_data.cu_index = dwarf2_per_objfile->all_comp_units.size ();
1462 htab_traverse_noresize (dwarf2_per_objfile->signatured_types,
1463 write_one_signatured_type, &sig_data);
1464 }
1465
1466 /* Now that we've processed all symbols we can shrink their cu_indices
1467 lists. */
1468 uniquify_cu_indices (&symtab);
1469
1470 data_buf symtab_vec, constant_pool;
1471 write_hash_table (&symtab, symtab_vec, constant_pool);
1472
1473 write_gdbindex_1(out_file, objfile_cu_list, types_cu_list, addr_vec,
1474 symtab_vec, constant_pool);
1475
1476 if (dwz_out_file != NULL)
1477 write_gdbindex_1 (dwz_out_file, dwz_cu_list, {}, {}, {}, {});
1478 else
1479 gdb_assert (dwz_cu_list.empty ());
1480 }
1481
1482 /* DWARF-5 augmentation string for GDB's DW_IDX_GNU_* extension. */
1483 static const gdb_byte dwarf5_gdb_augmentation[] = { 'G', 'D', 'B', 0 };
1484
1485 /* Write a new .debug_names section for OBJFILE into OUT_FILE, write
1486 needed addition to .debug_str section to OUT_FILE_STR. Return how
1487 many bytes were expected to be written into OUT_FILE. */
1488
1489 static void
1490 write_debug_names (struct dwarf2_per_objfile *dwarf2_per_objfile,
1491 FILE *out_file, FILE *out_file_str)
1492 {
1493 const bool dwarf5_is_dwarf64 = check_dwarf64_offsets (dwarf2_per_objfile);
1494 struct objfile *objfile = dwarf2_per_objfile->objfile;
1495 const enum bfd_endian dwarf5_byte_order
1496 = gdbarch_byte_order (get_objfile_arch (objfile));
1497
1498 /* The CU list is already sorted, so we don't need to do additional
1499 work here. Also, the debug_types entries do not appear in
1500 all_comp_units, but only in their own hash table. */
1501 data_buf cu_list;
1502 debug_names nametable (dwarf2_per_objfile, dwarf5_is_dwarf64,
1503 dwarf5_byte_order);
1504 std::unordered_set<partial_symbol *>
1505 psyms_seen (psyms_seen_size (dwarf2_per_objfile));
1506 for (int i = 0; i < dwarf2_per_objfile->all_comp_units.size (); ++i)
1507 {
1508 const dwarf2_per_cu_data *per_cu = dwarf2_per_objfile->all_comp_units[i];
1509 partial_symtab *psymtab = per_cu->v.psymtab;
1510
1511 /* CU of a shared file from 'dwz -m' may be unused by this main
1512 file. It may be referenced from a local scope but in such
1513 case it does not need to be present in .debug_names. */
1514 if (psymtab == NULL)
1515 continue;
1516
1517 if (psymtab->user == NULL)
1518 nametable.recursively_write_psymbols (objfile, psymtab, psyms_seen, i);
1519
1520 cu_list.append_uint (nametable.dwarf5_offset_size (), dwarf5_byte_order,
1521 to_underlying (per_cu->sect_off));
1522 }
1523
1524 /* Write out the .debug_type entries, if any. */
1525 data_buf types_cu_list;
1526 if (dwarf2_per_objfile->signatured_types)
1527 {
1528 debug_names::write_one_signatured_type_data sig_data (nametable,
1529 signatured_type_index_data (types_cu_list, psyms_seen));
1530
1531 sig_data.info.objfile = objfile;
1532 /* It is used only for gdb_index. */
1533 sig_data.info.symtab = nullptr;
1534 sig_data.info.cu_index = 0;
1535 htab_traverse_noresize (dwarf2_per_objfile->signatured_types,
1536 debug_names::write_one_signatured_type,
1537 &sig_data);
1538 }
1539
1540 nametable.build ();
1541
1542 /* No addr_vec - DWARF-5 uses .debug_aranges generated by GCC. */
1543
1544 const offset_type bytes_of_header
1545 = ((dwarf5_is_dwarf64 ? 12 : 4)
1546 + 2 + 2 + 7 * 4
1547 + sizeof (dwarf5_gdb_augmentation));
1548 size_t expected_bytes = 0;
1549 expected_bytes += bytes_of_header;
1550 expected_bytes += cu_list.size ();
1551 expected_bytes += types_cu_list.size ();
1552 expected_bytes += nametable.bytes ();
1553 data_buf header;
1554
1555 if (!dwarf5_is_dwarf64)
1556 {
1557 const uint64_t size64 = expected_bytes - 4;
1558 gdb_assert (size64 < 0xfffffff0);
1559 header.append_uint (4, dwarf5_byte_order, size64);
1560 }
1561 else
1562 {
1563 header.append_uint (4, dwarf5_byte_order, 0xffffffff);
1564 header.append_uint (8, dwarf5_byte_order, expected_bytes - 12);
1565 }
1566
1567 /* The version number. */
1568 header.append_uint (2, dwarf5_byte_order, 5);
1569
1570 /* Padding. */
1571 header.append_uint (2, dwarf5_byte_order, 0);
1572
1573 /* comp_unit_count - The number of CUs in the CU list. */
1574 header.append_uint (4, dwarf5_byte_order,
1575 dwarf2_per_objfile->all_comp_units.size ());
1576
1577 /* local_type_unit_count - The number of TUs in the local TU
1578 list. */
1579 header.append_uint (4, dwarf5_byte_order,
1580 dwarf2_per_objfile->all_type_units.size ());
1581
1582 /* foreign_type_unit_count - The number of TUs in the foreign TU
1583 list. */
1584 header.append_uint (4, dwarf5_byte_order, 0);
1585
1586 /* bucket_count - The number of hash buckets in the hash lookup
1587 table. */
1588 header.append_uint (4, dwarf5_byte_order, nametable.bucket_count ());
1589
1590 /* name_count - The number of unique names in the index. */
1591 header.append_uint (4, dwarf5_byte_order, nametable.name_count ());
1592
1593 /* abbrev_table_size - The size in bytes of the abbreviations
1594 table. */
1595 header.append_uint (4, dwarf5_byte_order, nametable.abbrev_table_bytes ());
1596
1597 /* augmentation_string_size - The size in bytes of the augmentation
1598 string. This value is rounded up to a multiple of 4. */
1599 static_assert (sizeof (dwarf5_gdb_augmentation) % 4 == 0, "");
1600 header.append_uint (4, dwarf5_byte_order, sizeof (dwarf5_gdb_augmentation));
1601 header.append_data (dwarf5_gdb_augmentation);
1602
1603 gdb_assert (header.size () == bytes_of_header);
1604
1605 header.file_write (out_file);
1606 cu_list.file_write (out_file);
1607 types_cu_list.file_write (out_file);
1608 nametable.file_write (out_file, out_file_str);
1609
1610 assert_file_size (out_file, expected_bytes);
1611 }
1612
1613 /* This represents an index file being written (work-in-progress).
1614
1615 The data is initially written to a temporary file. When the finalize method
1616 is called, the file is closed and moved to its final location.
1617
1618 On failure (if this object is being destroyed with having called finalize),
1619 the temporary file is closed and deleted. */
1620
1621 struct index_wip_file
1622 {
1623 index_wip_file (const char *dir, const char *basename,
1624 const char *suffix)
1625 {
1626 filename = (std::string (dir) + SLASH_STRING + basename
1627 + suffix);
1628
1629 filename_temp = make_temp_filename (filename);
1630
1631 scoped_fd out_file_fd (gdb_mkostemp_cloexec (filename_temp.data (),
1632 O_BINARY));
1633 if (out_file_fd.get () == -1)
1634 perror_with_name (("mkstemp"));
1635
1636 out_file = out_file_fd.to_file ("wb");
1637
1638 if (out_file == nullptr)
1639 error (_("Can't open `%s' for writing"), filename_temp.data ());
1640
1641 unlink_file.emplace (filename_temp.data ());
1642 }
1643
1644 void finalize ()
1645 {
1646 /* We want to keep the file. */
1647 unlink_file->keep ();
1648
1649 /* Close and move the str file in place. */
1650 unlink_file.reset ();
1651 if (rename (filename_temp.data (), filename.c_str ()) != 0)
1652 perror_with_name (("rename"));
1653 }
1654
1655 std::string filename;
1656 gdb::char_vector filename_temp;
1657
1658 /* Order matters here; we want FILE to be closed before
1659 FILENAME_TEMP is unlinked, because on MS-Windows one cannot
1660 delete a file that is still open. So, we wrap the unlinker in an
1661 optional and emplace it once we know the file name. */
1662 gdb::optional<gdb::unlinker> unlink_file;
1663
1664 gdb_file_up out_file;
1665 };
1666
1667 /* See dwarf-index-write.h. */
1668
1669 void
1670 write_psymtabs_to_index (struct dwarf2_per_objfile *dwarf2_per_objfile,
1671 const char *dir, const char *basename,
1672 const char *dwz_basename,
1673 dw_index_kind index_kind)
1674 {
1675 struct objfile *objfile = dwarf2_per_objfile->objfile;
1676
1677 if (dwarf2_per_objfile->using_index)
1678 error (_("Cannot use an index to create the index"));
1679
1680 if (dwarf2_per_objfile->types.size () > 1)
1681 error (_("Cannot make an index when the file has multiple .debug_types sections"));
1682
1683 if (!objfile->partial_symtabs->psymtabs
1684 || !objfile->partial_symtabs->psymtabs_addrmap)
1685 return;
1686
1687 struct stat st;
1688 if (stat (objfile_name (objfile), &st) < 0)
1689 perror_with_name (objfile_name (objfile));
1690
1691 const char *index_suffix = (index_kind == dw_index_kind::DEBUG_NAMES
1692 ? INDEX5_SUFFIX : INDEX4_SUFFIX);
1693
1694 index_wip_file objfile_index_wip (dir, basename, index_suffix);
1695 gdb::optional<index_wip_file> dwz_index_wip;
1696
1697 if (dwz_basename != NULL)
1698 dwz_index_wip.emplace (dir, dwz_basename, index_suffix);
1699
1700 if (index_kind == dw_index_kind::DEBUG_NAMES)
1701 {
1702 index_wip_file str_wip_file (dir, basename, DEBUG_STR_SUFFIX);
1703
1704 write_debug_names (dwarf2_per_objfile, objfile_index_wip.out_file.get (),
1705 str_wip_file.out_file.get ());
1706
1707 str_wip_file.finalize ();
1708 }
1709 else
1710 write_gdbindex (dwarf2_per_objfile, objfile_index_wip.out_file.get (),
1711 (dwz_index_wip.has_value ()
1712 ? dwz_index_wip->out_file.get () : NULL));
1713
1714 objfile_index_wip.finalize ();
1715
1716 if (dwz_index_wip.has_value ())
1717 dwz_index_wip->finalize ();
1718 }
1719
1720 /* Implementation of the `save gdb-index' command.
1721
1722 Note that the .gdb_index file format used by this command is
1723 documented in the GDB manual. Any changes here must be documented
1724 there. */
1725
1726 static void
1727 save_gdb_index_command (const char *arg, int from_tty)
1728 {
1729 const char dwarf5space[] = "-dwarf-5 ";
1730 dw_index_kind index_kind = dw_index_kind::GDB_INDEX;
1731
1732 if (!arg)
1733 arg = "";
1734
1735 arg = skip_spaces (arg);
1736 if (strncmp (arg, dwarf5space, strlen (dwarf5space)) == 0)
1737 {
1738 index_kind = dw_index_kind::DEBUG_NAMES;
1739 arg += strlen (dwarf5space);
1740 arg = skip_spaces (arg);
1741 }
1742
1743 if (!*arg)
1744 error (_("usage: save gdb-index [-dwarf-5] DIRECTORY"));
1745
1746 for (objfile *objfile : current_program_space->objfiles ())
1747 {
1748 struct stat st;
1749
1750 /* If the objfile does not correspond to an actual file, skip it. */
1751 if (stat (objfile_name (objfile), &st) < 0)
1752 continue;
1753
1754 struct dwarf2_per_objfile *dwarf2_per_objfile
1755 = get_dwarf2_per_objfile (objfile);
1756
1757 if (dwarf2_per_objfile != NULL)
1758 {
1759 try
1760 {
1761 const char *basename = lbasename (objfile_name (objfile));
1762 const dwz_file *dwz = dwarf2_get_dwz_file (dwarf2_per_objfile);
1763 const char *dwz_basename = NULL;
1764
1765 if (dwz != NULL)
1766 dwz_basename = lbasename (dwz->filename ());
1767
1768 write_psymtabs_to_index (dwarf2_per_objfile, arg, basename,
1769 dwz_basename, index_kind);
1770 }
1771 catch (const gdb_exception_error &except)
1772 {
1773 exception_fprintf (gdb_stderr, except,
1774 _("Error while writing index for `%s': "),
1775 objfile_name (objfile));
1776 }
1777 }
1778
1779 }
1780 }
1781
1782 void
1783 _initialize_dwarf_index_write ()
1784 {
1785 cmd_list_element *c = add_cmd ("gdb-index", class_files,
1786 save_gdb_index_command, _("\
1787 Save a gdb-index file.\n\
1788 Usage: save gdb-index [-dwarf-5] DIRECTORY\n\
1789 \n\
1790 No options create one file with .gdb-index extension for pre-DWARF-5\n\
1791 compatible .gdb_index section. With -dwarf-5 creates two files with\n\
1792 extension .debug_names and .debug_str for DWARF-5 .debug_names section."),
1793 &save_cmdlist);
1794 set_cmd_completer (c, filename_completer);
1795 }
This page took 0.129056 seconds and 5 git commands to generate.