2 Copyright (C) 2001-2019 Free Software Foundation, Inc.
3 Written by Jakub Jelinek <jakub@redhat.com>.
5 This file is part of BFD, the Binary File Descriptor library.
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, write to the Free Software
19 Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
20 MA 02110-1301, USA. */
23 /* This file contains support for merging duplicate entities within sections,
24 as used in ELF SHF_MERGE. */
32 #include "libiberty.h"
34 struct sec_merge_sec_info
;
36 /* An entry in the section merge hash table. */
38 struct sec_merge_hash_entry
40 struct bfd_hash_entry root
;
41 /* Length of this entry. This includes the zero terminator. */
43 /* Start of this string needs to be aligned to
44 alignment octets (not 1 << align). */
45 unsigned int alignment
;
48 /* Index within the merged section. */
50 /* Entry this is a suffix of (if alignment is 0). */
51 struct sec_merge_hash_entry
*suffix
;
53 /* Which section is it in. */
54 struct sec_merge_sec_info
*secinfo
;
55 /* Next entity in the hash table. */
56 struct sec_merge_hash_entry
*next
;
59 /* The section merge hash table. */
63 struct bfd_hash_table table
;
64 /* Next available index. */
66 /* First entity in the SEC_MERGE sections of this type. */
67 struct sec_merge_hash_entry
*first
;
68 /* Last entity in the SEC_MERGE sections of this type. */
69 struct sec_merge_hash_entry
*last
;
72 /* Are entries fixed size or zero terminated strings? */
78 /* Chain of sec_merge_infos. */
79 struct sec_merge_info
*next
;
80 /* Chain of sec_merge_sec_infos. */
81 struct sec_merge_sec_info
*chain
;
82 /* A hash table used to hold section content. */
83 struct sec_merge_hash
*htab
;
86 struct sec_merge_sec_info
88 /* Chain of sec_merge_sec_infos. */
89 struct sec_merge_sec_info
*next
;
90 /* The corresponding section. */
92 /* Pointer to merge_info pointing to us. */
94 /* A hash table used to hold section content. */
95 struct sec_merge_hash
*htab
;
96 /* First string in this section. */
97 struct sec_merge_hash_entry
*first_str
;
98 /* Original section content. */
99 unsigned char contents
[1];
103 /* Routine to create an entry in a section merge hashtab. */
105 static struct bfd_hash_entry
*
106 sec_merge_hash_newfunc (struct bfd_hash_entry
*entry
,
107 struct bfd_hash_table
*table
, const char *string
)
109 /* Allocate the structure if it has not already been allocated by a subclass. */
112 entry
= (struct bfd_hash_entry
*)
113 bfd_hash_allocate (table
, sizeof (struct sec_merge_hash_entry
));
117 /* Call the allocation method of the superclass. */
118 entry
= bfd_hash_newfunc (entry
, table
, string
);
122 /* Initialize the local fields. */
123 struct sec_merge_hash_entry
*ret
= (struct sec_merge_hash_entry
*) entry
;
125 ret
->u
.suffix
= NULL
;
134 /* Look up an entry in a section merge hash table. */
136 static struct sec_merge_hash_entry
*
137 sec_merge_hash_lookup (struct sec_merge_hash
*table
, const char *string
,
138 unsigned int alignment
, bfd_boolean create
)
140 const unsigned char *s
;
143 struct sec_merge_hash_entry
*hashp
;
149 s
= (const unsigned char *) string
;
152 if (table
->entsize
== 1)
154 while ((c
= *s
++) != '\0')
156 hash
+= c
+ (c
<< 17);
160 hash
+= len
+ (len
<< 17);
166 for (i
= 0; i
< table
->entsize
; ++i
)
169 if (i
== table
->entsize
)
171 for (i
= 0; i
< table
->entsize
; ++i
)
174 hash
+= c
+ (c
<< 17);
179 hash
+= len
+ (len
<< 17);
180 len
*= table
->entsize
;
183 len
+= table
->entsize
;
187 for (i
= 0; i
< table
->entsize
; ++i
)
190 hash
+= c
+ (c
<< 17);
193 len
= table
->entsize
;
196 _index
= hash
% table
->table
.size
;
197 for (hashp
= (struct sec_merge_hash_entry
*) table
->table
.table
[_index
];
199 hashp
= (struct sec_merge_hash_entry
*) hashp
->root
.next
)
201 if (hashp
->root
.hash
== hash
203 && memcmp (hashp
->root
.string
, string
, len
) == 0)
205 /* If the string we found does not have at least the required
206 alignment, we need to insert another copy. */
207 if (hashp
->alignment
< alignment
)
211 /* Mark the less aligned copy as deleted. */
213 hashp
->alignment
= 0;
224 hashp
= ((struct sec_merge_hash_entry
*)
225 bfd_hash_insert (&table
->table
, string
, hash
));
229 hashp
->alignment
= alignment
;
233 /* Create a new hash table. */
235 static struct sec_merge_hash
*
236 sec_merge_init (unsigned int entsize
, bfd_boolean strings
)
238 struct sec_merge_hash
*table
;
240 table
= (struct sec_merge_hash
*) bfd_malloc (sizeof (struct sec_merge_hash
));
244 if (! bfd_hash_table_init_n (&table
->table
, sec_merge_hash_newfunc
,
245 sizeof (struct sec_merge_hash_entry
), 16699))
254 table
->entsize
= entsize
;
255 table
->strings
= strings
;
260 /* Get the index of an entity in a hash table, adding it if it is not already present. */
263 static struct sec_merge_hash_entry
*
264 sec_merge_add (struct sec_merge_hash
*tab
, const char *str
,
265 unsigned int alignment
, struct sec_merge_sec_info
*secinfo
)
267 struct sec_merge_hash_entry
*entry
;
269 entry
= sec_merge_hash_lookup (tab
, str
, alignment
, TRUE
);
273 if (entry
->secinfo
== NULL
)
276 entry
->secinfo
= secinfo
;
277 if (tab
->first
== NULL
)
280 tab
->last
->next
= entry
;
288 sec_merge_emit (bfd
*abfd
, struct sec_merge_hash_entry
*entry
,
289 unsigned char *contents
, file_ptr offset
)
291 struct sec_merge_sec_info
*secinfo
= entry
->secinfo
;
292 asection
*sec
= secinfo
->sec
;
294 bfd_size_type off
= 0;
295 int alignment_power
= sec
->output_section
->alignment_power
;
296 bfd_size_type pad_len
;
298 /* FIXME: If alignment_power is 0 then really we should scan the
299 entry list for the largest required alignment and use that. */
300 pad_len
= alignment_power
? ((bfd_size_type
) 1 << alignment_power
) : 16;
302 pad
= (char *) bfd_zmalloc (pad_len
);
306 for (; entry
!= NULL
&& entry
->secinfo
== secinfo
; entry
= entry
->next
)
311 len
= -off
& (entry
->alignment
- 1);
314 BFD_ASSERT (len
<= pad_len
);
317 memcpy (contents
+ offset
, pad
, len
);
320 else if (bfd_bwrite (pad
, len
, abfd
) != len
)
325 str
= entry
->root
.string
;
330 memcpy (contents
+ offset
, str
, len
);
333 else if (bfd_bwrite (str
, len
, abfd
) != len
)
339 /* Trailing alignment needed? */
340 off
= sec
->size
- off
;
343 BFD_ASSERT (off
<= pad_len
);
345 memcpy (contents
+ offset
, pad
, off
);
346 else if (bfd_bwrite (pad
, off
, abfd
) != off
)
358 /* Register a SEC_MERGE section as a candidate for merging.
359 This function is called for all non-dynamic SEC_MERGE input sections. */
362 _bfd_add_merge_section (bfd
*abfd
, void **psinfo
, asection
*sec
,
365 struct sec_merge_info
*sinfo
;
366 struct sec_merge_sec_info
*secinfo
;
371 if ((abfd
->flags
& DYNAMIC
) != 0
372 || (sec
->flags
& SEC_MERGE
) == 0)
376 || (sec
->flags
& SEC_EXCLUDE
) != 0
377 || sec
->entsize
== 0)
380 if (sec
->size
% sec
->entsize
!= 0)
383 if ((sec
->flags
& SEC_RELOC
) != 0)
385 /* We aren't prepared to handle relocations in merged sections. */
392 if (sec
->alignment_power
>= sizeof (align
) * CHAR_BIT
)
395 align
= 1u << sec
->alignment_power
;
396 if ((sec
->entsize
< align
397 && ((sec
->entsize
& (sec
->entsize
- 1))
398 || !(sec
->flags
& SEC_STRINGS
)))
399 || (sec
->entsize
> align
400 && (sec
->entsize
& (align
- 1))))
402 /* Sanity check. If string character size is smaller than
403 alignment, then we require character size to be a power
404 of 2, otherwise character size must be integer multiple
405 of alignment. For non-string constants, alignment must
406 be smaller than or equal to entity size and entity size
407 must be integer multiple of alignment. */
411 for (sinfo
= (struct sec_merge_info
*) *psinfo
; sinfo
; sinfo
= sinfo
->next
)
412 if ((secinfo
= sinfo
->chain
)
413 && ! ((secinfo
->sec
->flags
^ sec
->flags
) & (SEC_MERGE
| SEC_STRINGS
))
414 && secinfo
->sec
->entsize
== sec
->entsize
415 && secinfo
->sec
->alignment_power
== sec
->alignment_power
416 && secinfo
->sec
->output_section
== sec
->output_section
)
421 /* Initialize the information we need to keep track of. */
422 sinfo
= (struct sec_merge_info
*)
423 bfd_alloc (abfd
, sizeof (struct sec_merge_info
));
426 sinfo
->next
= (struct sec_merge_info
*) *psinfo
;
429 sinfo
->htab
= sec_merge_init (sec
->entsize
, (sec
->flags
& SEC_STRINGS
));
430 if (sinfo
->htab
== NULL
)
434 /* Read the section from abfd. */
436 amt
= sizeof (struct sec_merge_sec_info
) - 1 + sec
->size
;
437 if (sec
->flags
& SEC_STRINGS
)
438 /* Some versions of gcc may emit a string without a zero terminator.
439 See http://gcc.gnu.org/ml/gcc-patches/2006-06/msg01004.html
440 Allocate space for an extra zero. */
442 *psecinfo
= bfd_alloc (abfd
, amt
);
443 if (*psecinfo
== NULL
)
446 secinfo
= (struct sec_merge_sec_info
*) *psecinfo
;
449 secinfo
->next
= sinfo
->chain
->next
;
450 sinfo
->chain
->next
= secinfo
;
453 secinfo
->next
= secinfo
;
454 sinfo
->chain
= secinfo
;
456 secinfo
->psecinfo
= psecinfo
;
457 secinfo
->htab
= sinfo
->htab
;
458 secinfo
->first_str
= NULL
;
460 sec
->rawsize
= sec
->size
;
461 if (sec
->flags
& SEC_STRINGS
)
462 memset (secinfo
->contents
+ sec
->size
, 0, sec
->entsize
);
463 contents
= secinfo
->contents
;
464 if (! bfd_get_full_section_contents (sec
->owner
, sec
, &contents
))
474 /* Record one section into the hash table. */
476 record_section (struct sec_merge_info
*sinfo
,
477 struct sec_merge_sec_info
*secinfo
)
479 asection
*sec
= secinfo
->sec
;
480 struct sec_merge_hash_entry
*entry
;
482 unsigned char *p
, *end
;
483 bfd_vma mask
, eltalign
;
484 unsigned int align
, i
;
486 align
= sec
->alignment_power
;
487 end
= secinfo
->contents
+ sec
->size
;
489 mask
= ((bfd_vma
) 1 << align
) - 1;
490 if (sec
->flags
& SEC_STRINGS
)
492 for (p
= secinfo
->contents
; p
< end
; )
494 eltalign
= p
- secinfo
->contents
;
495 eltalign
= ((eltalign
^ (eltalign
- 1)) + 1) >> 1;
496 if (!eltalign
|| eltalign
> mask
)
498 entry
= sec_merge_add (sinfo
->htab
, (char *) p
, (unsigned) eltalign
,
503 if (sec
->entsize
== 1)
505 while (p
< end
&& *p
== 0)
507 if (!nul
&& !((p
- secinfo
->contents
) & mask
))
510 entry
= sec_merge_add (sinfo
->htab
, "",
511 (unsigned) mask
+ 1, secinfo
);
522 for (i
= 0; i
< sec
->entsize
; i
++)
525 if (i
!= sec
->entsize
)
527 if (!nul
&& !((p
- secinfo
->contents
) & mask
))
530 entry
= sec_merge_add (sinfo
->htab
, (char *) p
,
531 (unsigned) mask
+ 1, secinfo
);
542 for (p
= secinfo
->contents
; p
< end
; p
+= sec
->entsize
)
544 entry
= sec_merge_add (sinfo
->htab
, (char *) p
, 1, secinfo
);
553 for (secinfo
= sinfo
->chain
; secinfo
; secinfo
= secinfo
->next
)
554 *secinfo
->psecinfo
= NULL
;
559 strrevcmp (const void *a
, const void *b
)
561 struct sec_merge_hash_entry
*A
= *(struct sec_merge_hash_entry
**) a
;
562 struct sec_merge_hash_entry
*B
= *(struct sec_merge_hash_entry
**) b
;
563 unsigned int lenA
= A
->len
;
564 unsigned int lenB
= B
->len
;
565 const unsigned char *s
= (const unsigned char *) A
->root
.string
+ lenA
- 1;
566 const unsigned char *t
= (const unsigned char *) B
->root
.string
+ lenB
- 1;
567 int l
= lenA
< lenB
? lenA
: lenB
;
572 return (int) *s
- (int) *t
;
580 /* Like strrevcmp, but for the case where all strings have the same
581 alignment > entsize. */
584 strrevcmp_align (const void *a
, const void *b
)
586 struct sec_merge_hash_entry
*A
= *(struct sec_merge_hash_entry
**) a
;
587 struct sec_merge_hash_entry
*B
= *(struct sec_merge_hash_entry
**) b
;
588 unsigned int lenA
= A
->len
;
589 unsigned int lenB
= B
->len
;
590 const unsigned char *s
= (const unsigned char *) A
->root
.string
+ lenA
- 1;
591 const unsigned char *t
= (const unsigned char *) B
->root
.string
+ lenB
- 1;
592 int l
= lenA
< lenB
? lenA
: lenB
;
593 int tail_align
= (lenA
& (A
->alignment
- 1)) - (lenB
& (A
->alignment
- 1));
601 return (int) *s
- (int) *t
;
610 is_suffix (const struct sec_merge_hash_entry
*A
,
611 const struct sec_merge_hash_entry
*B
)
613 if (A
->len
<= B
->len
)
614 /* B cannot be a suffix of A unless A is equal to B, and the hash table
615 guarantees that two distinct entries are never equal. */
618 return memcmp (A
->root
.string
+ (A
->len
- B
->len
),
619 B
->root
.string
, B
->len
) == 0;
622 /* This is a helper function for _bfd_merge_sections. It attempts to
623 merge strings matching suffixes of longer strings. */
624 static struct sec_merge_sec_info
*
625 merge_strings (struct sec_merge_info
*sinfo
)
627 struct sec_merge_hash_entry
**array
, **a
, *e
;
628 struct sec_merge_sec_info
*secinfo
;
629 bfd_size_type size
, amt
;
630 unsigned int alignment
= 0;
632 /* Now sort the strings */
633 amt
= sinfo
->htab
->size
* sizeof (struct sec_merge_hash_entry
*);
634 array
= (struct sec_merge_hash_entry
**) bfd_malloc (amt
);
638 for (e
= sinfo
->htab
->first
, a
= array
; e
; e
= e
->next
)
642 /* Adjust the length to not include the zero terminator. */
643 e
->len
-= sinfo
->htab
->entsize
;
644 if (alignment
!= e
->alignment
)
647 alignment
= e
->alignment
;
649 alignment
= (unsigned) -1;
653 sinfo
->htab
->size
= a
- array
;
654 if (sinfo
->htab
->size
!= 0)
656 qsort (array
, (size_t) sinfo
->htab
->size
,
657 sizeof (struct sec_merge_hash_entry
*),
658 (alignment
!= (unsigned) -1 && alignment
> sinfo
->htab
->entsize
659 ? strrevcmp_align
: strrevcmp
));
661 /* Loop over the sorted array and merge suffixes */
663 e
->len
+= sinfo
->htab
->entsize
;
666 struct sec_merge_hash_entry
*cmp
= *a
;
668 cmp
->len
+= sinfo
->htab
->entsize
;
669 if (e
->alignment
>= cmp
->alignment
670 && !((e
->len
- cmp
->len
) & (cmp
->alignment
- 1))
671 && is_suffix (e
, cmp
))
683 /* Now assign positions to the strings we want to keep. */
685 secinfo
= sinfo
->htab
->first
->secinfo
;
686 for (e
= sinfo
->htab
->first
; e
; e
= e
->next
)
688 if (e
->secinfo
!= secinfo
)
690 secinfo
->sec
->size
= size
;
691 secinfo
= e
->secinfo
;
695 if (e
->secinfo
->first_str
== NULL
)
697 e
->secinfo
->first_str
= e
;
700 size
= (size
+ e
->alignment
- 1) & ~((bfd_vma
) e
->alignment
- 1);
705 secinfo
->sec
->size
= size
;
707 /* And now adjust the rest, removing them from the chain (but not hashtable) at the same time. */
709 for (a
= &sinfo
->htab
->first
, e
= *a
; e
; e
= e
->next
)
717 e
->secinfo
= e
->u
.suffix
->secinfo
;
718 e
->alignment
= e
->u
.suffix
->alignment
;
719 e
->u
.index
= e
->u
.suffix
->u
.index
+ (e
->u
.suffix
->len
- e
->len
);
725 /* This function is called once after all SEC_MERGE sections are registered
726 with _bfd_add_merge_section. */
729 _bfd_merge_sections (bfd
*abfd
,
730 struct bfd_link_info
*info ATTRIBUTE_UNUSED
,
732 void (*remove_hook
) (bfd
*, asection
*))
734 struct sec_merge_info
*sinfo
;
736 for (sinfo
= (struct sec_merge_info
*) xsinfo
; sinfo
; sinfo
= sinfo
->next
)
738 struct sec_merge_sec_info
*secinfo
;
744 /* Move sinfo->chain to head of the chain, terminate it. */
745 secinfo
= sinfo
->chain
;
746 sinfo
->chain
= secinfo
->next
;
747 secinfo
->next
= NULL
;
749 /* Record the sections into the hash table. */
751 for (secinfo
= sinfo
->chain
; secinfo
; secinfo
= secinfo
->next
)
752 if (secinfo
->sec
->flags
& SEC_EXCLUDE
)
754 *secinfo
->psecinfo
= NULL
;
756 (*remove_hook
) (abfd
, secinfo
->sec
);
760 if (!record_section (sinfo
, secinfo
))
764 align
= (bfd_size_type
) 1 << secinfo
->sec
->alignment_power
;
765 if ((secinfo
->sec
->size
& (align
- 1)) != 0)
770 if (sinfo
->htab
->first
== NULL
)
773 if (sinfo
->htab
->strings
)
775 secinfo
= merge_strings (sinfo
);
781 struct sec_merge_hash_entry
*e
;
782 bfd_size_type size
= 0;
784 /* Things are much simpler for non-strings.
785 Just assign them slots in the section. */
787 for (e
= sinfo
->htab
->first
; e
; e
= e
->next
)
789 if (e
->secinfo
->first_str
== NULL
)
792 secinfo
->sec
->size
= size
;
793 e
->secinfo
->first_str
= e
;
796 size
= (size
+ e
->alignment
- 1) & ~((bfd_vma
) e
->alignment
- 1);
799 secinfo
= e
->secinfo
;
801 secinfo
->sec
->size
= size
;
804 /* If the input sections were padded according to their alignments,
805 then pad the output too. */
807 secinfo
->sec
->size
= (secinfo
->sec
->size
+ align
- 1) & -align
;
809 /* Finally remove all input sections which have not made it into
810 the hash table at all. */
811 for (secinfo
= sinfo
->chain
; secinfo
; secinfo
= secinfo
->next
)
812 if (secinfo
->first_str
== NULL
)
813 secinfo
->sec
->flags
|= SEC_EXCLUDE
| SEC_KEEP
;
819 /* Write out the merged section. */
822 _bfd_write_merged_section (bfd
*output_bfd
, asection
*sec
, void *psecinfo
)
824 struct sec_merge_sec_info
*secinfo
;
826 unsigned char *contents
;
827 Elf_Internal_Shdr
*hdr
;
829 secinfo
= (struct sec_merge_sec_info
*) psecinfo
;
834 if (secinfo
->first_str
== NULL
)
837 /* FIXME: octets_per_byte. */
838 hdr
= &elf_section_data (sec
->output_section
)->this_hdr
;
839 if (hdr
->sh_offset
== (file_ptr
) -1)
841 /* We must compress this section. Write output to the buffer. */
843 contents
= hdr
->contents
;
844 if ((sec
->output_section
->flags
& SEC_ELF_COMPRESS
) == 0
851 pos
= sec
->output_section
->filepos
+ sec
->output_offset
;
852 if (bfd_seek (output_bfd
, pos
, SEEK_SET
) != 0)
856 if (! sec_merge_emit (output_bfd
, secinfo
->first_str
, contents
,
863 /* Adjust an address in the SEC_MERGE section. Given OFFSET within
864 *PSEC, this returns the new offset in the adjusted SEC_MERGE
865 section and writes the new section back into *PSEC. */
868 _bfd_merged_section_offset (bfd
*output_bfd ATTRIBUTE_UNUSED
, asection
**psec
,
869 void *psecinfo
, bfd_vma offset
)
871 struct sec_merge_sec_info
*secinfo
;
872 struct sec_merge_hash_entry
*entry
;
874 asection
*sec
= *psec
;
876 secinfo
= (struct sec_merge_sec_info
*) psecinfo
;
881 if (offset
>= sec
->rawsize
)
883 if (offset
> sec
->rawsize
)
885 /* xgettext:c-format */
886 (_("%pB: access beyond end of merged section (%" PRId64
")"),
887 sec
->owner
, (int64_t) offset
);
888 return secinfo
->first_str
? sec
->size
: 0;
891 if (secinfo
->htab
->strings
)
893 if (sec
->entsize
== 1)
895 p
= secinfo
->contents
+ offset
- 1;
896 while (p
>= secinfo
->contents
&& *p
)
902 p
= secinfo
->contents
+ (offset
/ sec
->entsize
) * sec
->entsize
;
904 while (p
>= secinfo
->contents
)
908 for (i
= 0; i
< sec
->entsize
; ++i
)
911 if (i
== sec
->entsize
)
920 p
= secinfo
->contents
+ (offset
/ sec
->entsize
) * sec
->entsize
;
922 entry
= sec_merge_hash_lookup (secinfo
->htab
, (char *) p
, 0, FALSE
);
925 if (! secinfo
->htab
->strings
)
927 /* This should only happen if somebody points into the padding
928 after a NUL character but before next entity. */
931 if (! secinfo
->htab
->first
)
933 entry
= secinfo
->htab
->first
;
934 p
= (secinfo
->contents
+ (offset
/ sec
->entsize
+ 1) * sec
->entsize
938 *psec
= entry
->secinfo
->sec
;
939 return entry
->u
.index
+ (secinfo
->contents
+ offset
- p
);
942 /* Tidy up when done. */
945 _bfd_merge_sections_free (void *xsinfo
)
947 struct sec_merge_info
*sinfo
;
949 for (sinfo
= (struct sec_merge_info
*) xsinfo
; sinfo
; sinfo
= sinfo
->next
)
951 bfd_hash_table_free (&sinfo
->htab
->table
);