BR 2413272: Warn about byte displacement overflow
[nasm/avx512.git] / output / outmacho.c
blob06ae8ee8c35202cbfaad0a99cf5741f2cf22eee4
1 /* outmacho.c output routines for the Netwide Assembler to produce
2 * NeXTstep/OpenStep/Rhapsody/Darwin/MacOS X object files
4 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
5 * Julian Hall. All rights reserved. The software is
6 * redistributable under the license given in the file "LICENSE"
7 * distributed in the NASM archive.
8 */
10 /* Most of this file is, like Mach-O itself, based on a.out. For more
11 * guidelines see outaout.c. */
13 #include "compiler.h"
15 #include <stdio.h>
16 #include <stdlib.h>
17 #include <string.h>
18 #include <ctype.h>
19 #include <inttypes.h>
21 #include "nasm.h"
22 #include "nasmlib.h"
23 #include "saa.h"
24 #include "raa.h"
25 #include "outform.h"
26 #include "outlib.h"
28 #if defined(OF_MACHO)
/* Byte sizes of the Mach-O structures as they are laid out in the file */
#define MACHO_HEADER_SIZE       (28)
#define MACHO_SEGCMD_SIZE       (56)
#define MACHO_SECTCMD_SIZE      (68)
#define MACHO_SYMCMD_SIZE       (24)
#define MACHO_NLIST_SIZE        (12)
#define MACHO_RELINFO_SIZE      (8)

/* Values placed in the Mach-O file header */
#define MH_MAGIC                (0xfeedface)
#define CPU_TYPE_I386           (7)     /* x86 platform */
#define CPU_SUBTYPE_I386_ALL    (3)     /* all-x86 compatible */
#define MH_OBJECT               (0x1)   /* object file */

/* Load command identifiers */
#define LC_SEGMENT              (0x1)   /* segment load command */
#define LC_SYMTAB               (0x2)   /* symbol table load command */

/* Virtual memory protection bits */
#define VM_PROT_NONE            (0x00)
#define VM_PROT_READ            (0x01)
#define VM_PROT_WRITE           (0x02)
#define VM_PROT_EXECUTE         (0x04)

/* Both names below expand to read | write | execute in this file */
#define VM_PROT_DEFAULT (VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE)
#define VM_PROT_ALL     (VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE)
/* One output section: assembler-side bookkeeping followed by the
 * fields that end up in the section header of the object file. */
struct section {
    /* nasm internal data */
    struct section *next;       /* next section in the list */
    struct SAA *data;           /* accumulated section contents */
    int32_t index;              /* nasm's index for this section */
    struct reloc *relocs;       /* relocation list for this section */
    int align;                  /* alignment as a power of two, -1 if unset */

    /* data that goes into the file */
    char sectname[16];          /* what this section is called */
    char segname[16];           /* segment this section will be in */
    uint32_t size;              /* in-memory and -file size */
    uint32_t nreloc;            /* relocation entry count */
    uint32_t flags;             /* type and attributes (masked) */
};

#define SECTION_TYPE            0x000000ff  /* section type mask */

#define S_REGULAR               (0x0)   /* standard section */
#define S_ZEROFILL              (0x1)   /* zerofill, in-memory only */

#define SECTION_ATTRIBUTES_SYS   0x00ffff00 /* system setable attributes */
#define S_ATTR_SOME_INSTRUCTIONS 0x00000400 /* section contains some
                                               machine instructions */
#define S_ATTR_EXT_RELOC         0x00000200 /* section has external
                                               relocation entries */
#define S_ATTR_LOC_RELOC         0x00000100 /* section has local
                                               relocation entries */
85 static struct sectmap {
86 const char *nasmsect;
87 const char *segname;
88 const char *sectname;
89 const int32_t flags;
90 } sectmap[] = {
91 {".text", "__TEXT", "__text", S_REGULAR|S_ATTR_SOME_INSTRUCTIONS},
92 {".data", "__DATA", "__data", S_REGULAR},
93 {".rodata", "__DATA", "__const", S_REGULAR},
94 {".bss", "__DATA", "__bss", S_ZEROFILL},
95 {NULL, NULL, NULL, 0}
/* One relocation entry; kept in a singly linked list per section. */
struct reloc {
    /* nasm internal data */
    struct reloc *next;

    /* data that goes into the file */
    int32_t addr;               /* op's offset in section */
    unsigned int snum:24,       /* contains symbol index if
                                ** ext otherwise in-file
                                ** section number */
        pcrel:1,                /* relative relocation */
        length:2,               /* 0=byte, 1=word, 2=int32_t */
        ext:1,                  /* external symbol referenced */
        type:4;                 /* reloc type, 0 for us */
};

#define R_ABS           0       /* absolute relocation */
#define R_SCATTERED     0x80000000      /* reloc entry is scattered if
                                        ** highest bit == 1 */
/* One symbol table entry; kept in a singly linked list in definition
 * order. */
struct symbol {
    /* nasm internal data */
    struct symbol *next;        /* next symbol in the list */
    char *name;                 /* name of this symbol */
    int32_t initial_snum;       /* symbol number used above in
                                   reloc */
    int32_t snum;               /* true snum for reloc */

    /* data that goes into the file */
    int32_t strx;               /* string table index */
    uint8_t type;               /* symbol type */
    uint8_t sect;               /* NO_SECT or section number */
    int16_t desc;               /* for stab debugging, 0 for us */
    uint32_t value;             /* offset of symbol in section */
};

/* symbol type bits */
#define N_EXT   0x01            /* global or external symbol */

#define N_UNDF  0x0             /* undefined symbol | n_sect == */
#define N_ABS   0x2             /* absolute symbol  |  NO_SECT */
#define N_SECT  0xe             /* defined symbol, n_sect holds
                                ** section number */

#define N_TYPE  0x0e            /* type bit mask */

#define DEFAULT_SECTION_ALIGNMENT 0 /* byte (i.e. no) alignment */

/* special section number values */
#define NO_SECT         0       /* no section, invalid */
#define MAX_SECT        255     /* maximum number of sections */
149 static struct section *sects, **sectstail;
150 static struct symbol *syms, **symstail;
151 static uint32_t nsyms;
153 /* These variables are set by macho_layout_symbols() to organize
154 the symbol table and string table in order the dynamic linker
155 expects. They are then used in macho_write() to put out the
156 symbols and strings in that order.
158 The order of the symbol table is:
159 local symbols
160 defined external symbols (sorted by name)
161 undefined external symbols (sorted by name)
163 The order of the string table is:
164 strings for external symbols
165 strings for local symbols
167 static uint32_t ilocalsym = 0;
168 static uint32_t iextdefsym = 0;
169 static uint32_t iundefsym = 0;
170 static uint32_t nlocalsym;
171 static uint32_t nextdefsym;
172 static uint32_t nundefsym;
173 static struct symbol **extdefsyms = NULL;
174 static struct symbol **undefsyms = NULL;
176 static struct RAA *extsyms;
177 static struct SAA *strs;
178 static uint32_t strslen;
180 static FILE *machofp;
181 static efunc error;
182 static evalfunc evaluate;
184 extern struct ofmt of_macho;
186 /* Global file information. This should be cleaned up into either
187 a structure or as function arguments. */
188 uint32_t head_ncmds = 0;
189 uint32_t head_sizeofcmds = 0;
190 uint32_t seg_filesize = 0;
191 uint32_t seg_vmsize = 0;
192 uint32_t seg_nsects = 0;
193 uint32_t rel_padcnt = 0;
/*
 * Copy the string xsrc into the character ARRAY xdst (sizeof is applied
 * to xdst, so a pointer will not do): the whole buffer is zeroed first,
 * the copy is truncated to the buffer size and the result is always
 * NUL-terminated.
 *
 * The body is wrapped in do { } while (0) so the macro expands to one
 * statement and behaves correctly under an unbraced if/else.
 */
#define xstrncpy(xdst, xsrc)                                              \
    do {                                                                  \
        memset((xdst), '\0', sizeof(xdst));  /* zero out whole buffer */  \
        strncpy((xdst), (xsrc), sizeof(xdst)); /* copy over string */     \
        (xdst)[sizeof(xdst) - 1] = '\0';     /* proper null-termination */ \
    } while (0)

/* Round x up to a multiple of y; y must be a power of two. */
#define align(x, y)                                                     \
    (((x) + (y) - 1) & ~((y) - 1))      /* align x to multiple of y */

#define alignint32_t(x)                                                 \
    align(x, sizeof(int32_t))           /* align x to int32_t boundary */
207 static void debug_reloc (struct reloc *);
208 static void debug_section_relocs (struct section *) _unused;
/*
 * Return log2(align) when align is a power of two, 0 when align is 0,
 * and -1 when align has more than one bit set.
 */
static int exact_log2 (uint32_t align)
{
    if (align == 0)
        return 0;

    if ((align & (align - 1)) != 0)
        return -1;              /* Not a power of 2 */

#ifdef HAVE_GNUC_4
    return __builtin_ctzl (align);
#else
    {
        /* Exactly one bit is set here.  Mask k selects the bit
           positions whose index has bit k set, so each matching mask
           contributes one bit of the answer. */
        static const uint32_t index_bit_mask[5] = {
            0xaaaaaaaa, 0xcccccccc, 0xf0f0f0f0, 0xff00ff00, 0xffff0000
        };
        uint32_t log = 0;
        int k;

        for (k = 0; k < 5; k++) {
            if (align & index_bit_mask[k])
                log |= (uint32_t)1 << k;
        }

        return log;
    }
#endif
}
239 static struct section *get_section_by_name(const char *segname,
240 const char *sectname)
242 struct section *s;
244 for (s = sects; s != NULL; s = s->next)
245 if (!strcmp(s->segname, segname) && !strcmp(s->sectname, sectname))
246 break;
248 return s;
251 static struct section *get_section_by_index(const int32_t index)
253 struct section *s;
255 for (s = sects; s != NULL; s = s->next)
256 if (index == s->index)
257 break;
259 return s;
262 static int32_t get_section_index_by_name(const char *segname,
263 const char *sectname)
265 struct section *s;
267 for (s = sects; s != NULL; s = s->next)
268 if (!strcmp(s->segname, segname) && !strcmp(s->sectname, sectname))
269 return s->index;
271 return -1;
274 static char *get_section_name_by_index(const int32_t index)
276 struct section *s;
278 for (s = sects; s != NULL; s = s->next)
279 if (index == s->index)
280 return s->sectname;
282 return NULL;
285 static uint8_t get_section_fileindex_by_index(const int32_t index)
287 struct section *s;
288 uint8_t i = 1;
290 for (s = sects; s != NULL && i < MAX_SECT; s = s->next, ++i)
291 if (index == s->index)
292 return i;
294 if (i == MAX_SECT)
295 error(ERR_WARNING,
296 "too many sections (>255) - clipped by fileindex");
298 return NO_SECT;
301 static void macho_init(FILE * fp, efunc errfunc, ldfunc ldef,
302 evalfunc eval)
304 char zero = 0;
306 machofp = fp;
307 error = errfunc;
308 evaluate = eval;
310 (void)ldef; /* placate optimisers */
312 sects = NULL;
313 sectstail = &sects;
315 syms = NULL;
316 symstail = &syms;
317 nsyms = 0;
318 nlocalsym = 0;
319 nextdefsym = 0;
320 nundefsym = 0;
322 extsyms = raa_init();
323 strs = saa_init(1L);
325 /* string table starts with a zero byte - don't ask why */
326 saa_wbytes(strs, &zero, sizeof(char));
327 strslen = 1;
330 static int macho_setinfo(enum geninfo type, char **val)
332 (void)type;
333 (void)val;
334 return 0;
337 static void sect_write(struct section *sect,
338 const uint8_t *data, uint32_t len)
340 saa_wbytes(sect->data, data, len);
341 sect->size += len;
344 static void add_reloc(struct section *sect, int32_t section,
345 int pcrel, int bytes)
347 struct reloc *r;
348 int32_t fi;
350 /* NeXT as puts relocs in reversed order (address-wise) into the
351 ** files, so we do the same, doesn't seem to make much of a
352 ** difference either way */
353 r = nasm_malloc(sizeof(struct reloc));
354 r->next = sect->relocs;
355 sect->relocs = r;
357 /* the current end of the section will be the symbol's address for
358 ** now, might have to be fixed by macho_fixup_relocs() later on. make
359 ** sure we don't make the symbol scattered by setting the highest
360 ** bit by accident */
361 r->addr = sect->size & ~R_SCATTERED;
362 r->ext = 0;
363 r->pcrel = pcrel;
365 /* match byte count 1, 2, 4 to length codes 0, 1, 2 respectively */
366 r->length = bytes >> 1;
368 /* vanilla relocation (GENERIC_RELOC_VANILLA) */
369 r->type = 0;
371 if (section == NO_SEG) {
372 /* absolute local symbol if no section index given */
373 r->snum = R_ABS;
374 } else {
375 fi = get_section_fileindex_by_index(section);
377 if (fi == NO_SECT) {
378 /* external symbol if no section with that index known,
379 ** symbol number was saved in macho_symdef() */
380 r->snum = raa_read(extsyms, section);
381 r->ext = 1;
382 } else {
383 /* local symbol in section fi */
384 r->snum = fi;
388 ++sect->nreloc;
391 static void macho_output(int32_t secto, const void *data,
392 enum out_type type, uint64_t size,
393 int32_t section, int32_t wrt)
395 struct section *s, *sbss;
396 int32_t addr;
397 uint8_t mydata[4], *p;
399 if (wrt != NO_SEG) {
400 wrt = NO_SEG;
401 error(ERR_NONFATAL, "WRT not supported by Mach-O output format");
402 /* continue to do _something_ */
405 if (secto == NO_SEG) {
406 if (type != OUT_RESERVE)
407 error(ERR_NONFATAL, "attempt to assemble code in "
408 "[ABSOLUTE] space");
410 return;
413 s = get_section_by_index(secto);
415 if (s == NULL) {
416 error(ERR_WARNING, "attempt to assemble code in"
417 " section %d: defaulting to `.text'", secto);
418 s = get_section_by_name("__TEXT", "__text");
420 /* should never happen */
421 if (s == NULL)
422 error(ERR_PANIC, "text section not found");
425 sbss = get_section_by_name("__DATA", "__bss");
427 if (s == sbss && type != OUT_RESERVE) {
428 error(ERR_WARNING, "attempt to initialize memory in the"
429 " BSS section: ignored");
430 s->size += realsize(type, size);
431 return;
434 switch (type) {
435 case OUT_RESERVE:
436 if (s != sbss) {
437 error(ERR_WARNING, "uninitialized space declared in"
438 " %s section: zeroing",
439 get_section_name_by_index(secto));
441 sect_write(s, NULL, size);
442 } else
443 s->size += size;
445 break;
447 case OUT_RAWDATA:
448 if (section != NO_SEG)
449 error(ERR_PANIC, "OUT_RAWDATA with other than NO_SEG");
451 sect_write(s, data, size);
452 break;
454 case OUT_ADDRESS:
455 addr = *(int64_t *)data;
457 if (section != NO_SEG) {
458 if (section % 2) {
459 error(ERR_NONFATAL, "Mach-O format does not support"
460 " section base references");
461 } else
462 add_reloc(s, section, 0, size);
465 p = mydata;
466 WRITEADDR(p, addr, size);
467 sect_write(s, mydata, size);
468 break;
470 case OUT_REL2ADR:
471 if (section == secto)
472 error(ERR_PANIC, "intra-section OUT_REL2ADR");
474 if (section != NO_SEG && section % 2) {
475 error(ERR_NONFATAL, "Mach-O format does not support"
476 " section base references");
477 } else
478 add_reloc(s, section, 1, 2);
480 p = mydata;
481 WRITESHORT(p, *(int32_t *)data - (size + s->size));
482 sect_write(s, mydata, 2L);
483 break;
485 case OUT_REL4ADR:
486 if (section == secto)
487 error(ERR_PANIC, "intra-section OUT_REL4ADR");
489 if (section != NO_SEG && section % 2) {
490 error(ERR_NONFATAL, "Mach-O format does not support"
491 " section base references");
492 } else
493 add_reloc(s, section, 1, 4);
495 p = mydata;
496 WRITELONG(p, *(int32_t *)data - (size + s->size));
497 sect_write(s, mydata, 4L);
498 break;
500 default:
501 error(ERR_PANIC, "unknown output type?");
502 break;
506 static int32_t macho_section(char *name, int pass, int *bits)
508 int32_t index, originalIndex;
509 char *sectionAttributes;
510 struct sectmap *sm;
511 struct section *s;
513 (void)pass;
515 /* Default to 32 bits. */
516 if (!name) {
517 *bits = 32;
518 name = ".text";
519 sectionAttributes = NULL;
520 } else {
521 sectionAttributes = name;
522 name = nasm_strsep(&sectionAttributes, " \t");
525 for (sm = sectmap; sm->nasmsect != NULL; ++sm) {
526 /* make lookup into section name translation table */
527 if (!strcmp(name, sm->nasmsect)) {
528 char *currentAttribute;
530 /* try to find section with that name */
531 originalIndex = index = get_section_index_by_name(sm->segname,
532 sm->sectname);
534 /* create it if it doesn't exist yet */
535 if (index == -1) {
536 s = *sectstail = nasm_malloc(sizeof(struct section));
537 s->next = NULL;
538 sectstail = &s->next;
540 s->data = saa_init(1L);
541 s->index = seg_alloc();
542 s->relocs = NULL;
543 s->align = -1;
545 xstrncpy(s->segname, sm->segname);
546 xstrncpy(s->sectname, sm->sectname);
547 s->size = 0;
548 s->nreloc = 0;
549 s->flags = sm->flags;
551 index = s->index;
552 } else {
553 s = get_section_by_index(index);
556 while ((NULL != sectionAttributes)
557 && (currentAttribute = nasm_strsep(&sectionAttributes, " \t"))) {
558 if (0 != *currentAttribute) {
559 if (!nasm_strnicmp("align=", currentAttribute, 6)) {
560 char *end;
561 int newAlignment, value;
563 value = strtoul(currentAttribute + 6, (char**)&end, 0);
564 newAlignment = exact_log2(value);
566 if (0 != *end) {
567 error(ERR_PANIC,
568 "unknown or missing alignment value \"%s\" "
569 "specified for section \"%s\"",
570 currentAttribute + 6,
571 name);
572 return NO_SEG;
573 } else if (0 > newAlignment) {
574 error(ERR_PANIC,
575 "alignment of %d (for section \"%s\") is not "
576 "a power of two",
577 value,
578 name);
579 return NO_SEG;
582 if ((-1 != originalIndex)
583 && (s->align != newAlignment)
584 && (s->align != -1)) {
585 error(ERR_PANIC,
586 "section \"%s\" has already been specified "
587 "with alignment %d, conflicts with new "
588 "alignment of %d",
589 name,
590 (1 << s->align),
591 value);
592 return NO_SEG;
595 s->align = newAlignment;
596 } else if (!nasm_stricmp("data", currentAttribute)) {
597 /* Do nothing; 'data' is implicit */
598 } else {
599 error(ERR_PANIC,
600 "unknown section attribute %s for section %s",
601 currentAttribute,
602 name);
603 return NO_SEG;
608 return index;
612 error(ERR_PANIC, "invalid section name %s", name);
613 return NO_SEG;
616 static void macho_symdef(char *name, int32_t section, int64_t offset,
617 int is_global, char *special)
619 struct symbol *sym;
621 if (special) {
622 error(ERR_NONFATAL, "The Mach-O output format does "
623 "not support any special symbol types");
624 return;
627 if (is_global == 3) {
628 error(ERR_NONFATAL, "The Mach-O format does not "
629 "(yet) support forward reference fixups.");
630 return;
633 sym = *symstail = nasm_malloc(sizeof(struct symbol));
634 sym->next = NULL;
635 symstail = &sym->next;
637 sym->name = name;
638 sym->strx = strslen;
639 sym->type = 0;
640 sym->desc = 0;
641 sym->value = offset;
642 sym->initial_snum = -1;
644 /* external and common symbols get N_EXT */
645 if (is_global != 0)
646 sym->type |= N_EXT;
648 if (section == NO_SEG) {
649 /* symbols in no section get absolute */
650 sym->type |= N_ABS;
651 sym->sect = NO_SECT;
652 } else {
653 sym->type |= N_SECT;
655 /* get the in-file index of the section the symbol was defined in */
656 sym->sect = get_section_fileindex_by_index(section);
658 if (sym->sect == NO_SECT) {
659 /* remember symbol number of references to external
660 ** symbols, this works because every external symbol gets
661 ** its own section number allocated internally by nasm and
662 ** can so be used as a key */
663 extsyms = raa_write(extsyms, section, nsyms);
664 sym->initial_snum = nsyms;
666 switch (is_global) {
667 case 1:
668 case 2:
669 /* there isn't actually a difference between global
670 ** and common symbols, both even have their size in
671 ** sym->value */
672 sym->type = N_EXT;
673 break;
675 default:
676 /* give an error on unfound section if it's not an
677 ** external or common symbol (assemble_file() does a
678 ** seg_alloc() on every call for them) */
679 error(ERR_PANIC, "in-file index for section %d not found",
680 section);
685 ++nsyms;
/* The segment base of a section is the section itself: the argument
 * is returned unchanged. */
static int32_t macho_segbase(int32_t section)
{
    const int32_t base = section;

    return base;
}
/* No format-specific directives are handled: every argument is
 * ignored and 0 is returned. */
static int macho_directive(char *directive, char *value, int pass)
{
    (void)pass;
    (void)value;
    (void)directive;

    return 0;
}
701 static void macho_filename(char *inname, char *outname, efunc error)
703 standard_extension(inname, outname, ".o", error);
706 extern macros_t macho_stdmac[];
708 /* Comparison function for qsort symbol layout. */
709 static int layout_compare (const struct symbol **s1,
710 const struct symbol **s2)
712 return (strcmp ((*s1)->name, (*s2)->name));
715 /* The native assembler does a few things in a similar function
717 * Remove temporary labels
718 * Sort symbols according to local, external, undefined (by name)
719 * Order the string table
721 We do not remove temporary labels right now.
723 numsyms is the total number of symbols we have. strtabsize is the
724 number entries in the string table. */
726 static void macho_layout_symbols (uint32_t *numsyms,
727 uint32_t *strtabsize)
729 struct symbol *sym, **symp;
730 uint32_t i,j;
732 *numsyms = 0;
733 *strtabsize = sizeof (char);
735 symp = &syms;
737 while ((sym = *symp)) {
738 /* Undefined symbols are now external. */
739 if (sym->type == N_UNDF)
740 sym->type |= N_EXT;
742 if ((sym->type & N_EXT) == 0) {
743 sym->snum = *numsyms;
744 *numsyms = *numsyms + 1;
745 nlocalsym++;
747 else {
748 if ((sym->type & N_TYPE) != N_UNDF)
749 nextdefsym++;
750 else
751 nundefsym++;
753 /* If we handle debug info we'll want
754 to check for it here instead of just
755 adding the symbol to the string table. */
756 sym->strx = *strtabsize;
757 saa_wbytes (strs, sym->name, (int32_t)(strlen(sym->name) + 1));
758 *strtabsize += strlen(sym->name) + 1;
760 symp = &(sym->next);
763 /* Next, sort the symbols. Most of this code is a direct translation from
764 the Apple cctools symbol layout. We need to keep compatibility with that. */
765 /* Set the indexes for symbol groups into the symbol table */
766 ilocalsym = 0;
767 iextdefsym = nlocalsym;
768 iundefsym = nlocalsym + nextdefsym;
770 /* allocate arrays for sorting externals by name */
771 extdefsyms = nasm_malloc(nextdefsym * sizeof(struct symbol *));
772 undefsyms = nasm_malloc(nundefsym * sizeof(struct symbol *));
774 i = 0;
775 j = 0;
777 symp = &syms;
779 while ((sym = *symp)) {
781 if((sym->type & N_EXT) == 0) {
782 sym->strx = *strtabsize;
783 saa_wbytes (strs, sym->name, (int32_t)(strlen (sym->name) + 1));
784 *strtabsize += strlen(sym->name) + 1;
786 else {
787 if((sym->type & N_TYPE) != N_UNDF)
788 extdefsyms[i++] = sym;
789 else
790 undefsyms[j++] = sym;
792 symp = &(sym->next);
795 qsort(extdefsyms, nextdefsym, sizeof(struct symbol *),
796 (int (*)(const void *, const void *))layout_compare);
797 qsort(undefsyms, nundefsym, sizeof(struct symbol *),
798 (int (*)(const void *, const void *))layout_compare);
800 for(i = 0; i < nextdefsym; i++) {
801 extdefsyms[i]->snum = *numsyms;
802 *numsyms += 1;
804 for(j = 0; j < nundefsym; j++) {
805 undefsyms[j]->snum = *numsyms;
806 *numsyms += 1;
810 /* Calculate some values we'll need for writing later. */
812 static void macho_calculate_sizes (void)
814 struct section *s;
816 /* count sections and calculate in-memory and in-file offsets */
817 for (s = sects; s != NULL; s = s->next) {
818 /* zerofill sections aren't actually written to the file */
819 if ((s->flags & SECTION_TYPE) != S_ZEROFILL)
820 seg_filesize += s->size;
822 seg_vmsize += s->size;
823 ++seg_nsects;
826 /* calculate size of all headers, load commands and sections to
827 ** get a pointer to the start of all the raw data */
828 if (seg_nsects > 0) {
829 ++head_ncmds;
830 head_sizeofcmds +=
831 MACHO_SEGCMD_SIZE + seg_nsects * MACHO_SECTCMD_SIZE;
834 if (nsyms > 0) {
835 ++head_ncmds;
836 head_sizeofcmds += MACHO_SYMCMD_SIZE;
840 /* Write out the header information for the file. */
842 static void macho_write_header (void)
844 fwriteint32_t(MH_MAGIC, machofp); /* magic */
845 fwriteint32_t(CPU_TYPE_I386, machofp); /* CPU type */
846 fwriteint32_t(CPU_SUBTYPE_I386_ALL, machofp); /* CPU subtype */
847 fwriteint32_t(MH_OBJECT, machofp); /* Mach-O file type */
848 fwriteint32_t(head_ncmds, machofp); /* number of load commands */
849 fwriteint32_t(head_sizeofcmds, machofp); /* size of load commands */
850 fwriteint32_t(0, machofp); /* no flags */
853 /* Write out the segment load command at offset. */
855 static uint32_t macho_write_segment (uint32_t offset)
857 uint32_t s_addr = 0;
858 uint32_t rel_base = alignint32_t (offset + seg_filesize);
859 uint32_t s_reloff = 0;
860 struct section *s;
862 fwriteint32_t(LC_SEGMENT, machofp); /* cmd == LC_SEGMENT */
864 /* size of load command including section load commands */
865 fwriteint32_t(MACHO_SEGCMD_SIZE + seg_nsects *
866 MACHO_SECTCMD_SIZE, machofp);
868 /* in an MH_OBJECT file all sections are in one unnamed (name
869 ** all zeros) segment */
870 fwrite("\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0", 16, 1, machofp);
871 fwriteint32_t(0, machofp); /* in-memory offset */
872 fwriteint32_t(seg_vmsize, machofp); /* in-memory size */
873 fwriteint32_t(offset, machofp); /* in-file offset to data */
874 fwriteint32_t(seg_filesize, machofp); /* in-file size */
875 fwriteint32_t(VM_PROT_DEFAULT, machofp); /* maximum vm protection */
876 fwriteint32_t(VM_PROT_DEFAULT, machofp); /* initial vm protection */
877 fwriteint32_t(seg_nsects, machofp); /* number of sections */
878 fwriteint32_t(0, machofp); /* no flags */
880 /* emit section headers */
881 for (s = sects; s != NULL; s = s->next) {
882 fwrite(s->sectname, sizeof(s->sectname), 1, machofp);
883 fwrite(s->segname, sizeof(s->segname), 1, machofp);
884 fwriteint32_t(s_addr, machofp);
885 fwriteint32_t(s->size, machofp);
887 /* dummy data for zerofill sections or proper values */
888 if ((s->flags & SECTION_TYPE) != S_ZEROFILL) {
889 fwriteint32_t(offset, machofp);
890 /* Write out section alignment, as a power of two.
891 e.g. 32-bit word alignment would be 2 (2^^2 = 4). */
892 if (s->align == -1)
893 s->align = DEFAULT_SECTION_ALIGNMENT;
894 fwriteint32_t(s->align, machofp);
895 /* To be compatible with cctools as we emit
896 a zero reloff if we have no relocations. */
897 fwriteint32_t(s->nreloc ? rel_base + s_reloff : 0, machofp);
898 fwriteint32_t(s->nreloc, machofp);
900 offset += s->size;
901 s_reloff += s->nreloc * MACHO_RELINFO_SIZE;
902 } else {
903 fwriteint32_t(0, machofp);
904 fwriteint32_t(0, machofp);
905 fwriteint32_t(0, machofp);
906 fwriteint32_t(0, machofp);
909 fwriteint32_t(s->flags, machofp); /* flags */
910 fwriteint32_t(0, machofp); /* reserved */
911 fwriteint32_t(0, machofp); /* reserved */
913 s_addr += s->size;
916 rel_padcnt = rel_base - offset;
917 offset = rel_base + s_reloff;
919 return offset;
922 /* For a given chain of relocs r, write out the entire relocation
923 chain to the object file. */
925 static void macho_write_relocs (struct reloc *r)
927 while (r) {
928 uint32_t word2;
930 fwriteint32_t(r->addr, machofp); /* reloc offset */
932 word2 = r->snum;
933 word2 |= r->pcrel << 24;
934 word2 |= r->length << 25;
935 word2 |= r->ext << 27;
936 word2 |= r->type << 28;
937 fwriteint32_t(word2, machofp); /* reloc data */
939 r = r->next;
943 /* Write out the section data. */
944 static void macho_write_section (void)
946 struct section *s, *s2;
947 struct reloc *r;
948 char *rel_paddata = "\0\0\0";
949 uint8_t fi, *p, *q, blk[4];
950 int32_t l;
952 for (s = sects; s != NULL; s = s->next) {
953 if ((s->flags & SECTION_TYPE) == S_ZEROFILL)
954 continue;
956 /* no padding needs to be done to the sections */
958 /* Like a.out Mach-O references things in the data or bss
959 * sections by addresses which are actually relative to the
960 * start of the _text_ section, in the _file_. See outaout.c
961 * for more information. */
962 saa_rewind(s->data);
963 for (r = s->relocs; r != NULL; r = r->next) {
964 saa_fread(s->data, r->addr, blk, (int32_t)r->length << 1);
965 p = q = blk;
966 l = *p++;
968 /* get offset based on relocation type */
969 if (r->length > 0) {
970 l += ((int32_t)*p++) << 8;
972 if (r->length == 2) {
973 l += ((int32_t)*p++) << 16;
974 l += ((int32_t)*p++) << 24;
978 /* If the relocation is internal add to the current section
979 offset. Otherwise the only value we need is the symbol
980 offset which we already have. The linker takes care
981 of the rest of the address. */
982 if (!r->ext) {
983 /* add sizes of previous sections to current offset */
984 for (s2 = sects, fi = 1;
985 s2 != NULL && fi < r->snum; s2 = s2->next, fi++)
986 l += s2->size;
989 /* write new offset back */
990 if (r->length == 2)
991 WRITELONG(q, l);
992 else if (r->length == 1)
993 WRITESHORT(q, l);
994 else
995 *q++ = l & 0xFF;
997 saa_fwrite(s->data, r->addr, blk, (int32_t)r->length << 1);
1000 /* dump the section data to file */
1001 saa_fpwrite(s->data, machofp);
1004 /* pad last section up to reloc entries on int32_t boundary */
1005 fwrite(rel_paddata, rel_padcnt, 1, machofp);
1007 /* emit relocation entries */
1008 for (s = sects; s != NULL; s = s->next)
1009 macho_write_relocs (s->relocs);
1012 /* Write out the symbol table. We should already have sorted this
1013 before now. */
1014 static void macho_write_symtab (void)
1016 struct symbol *sym;
1017 struct section *s;
1018 int32_t fi;
1019 uint32_t i;
1021 /* we don't need to pad here since MACHO_RELINFO_SIZE == 8 */
1023 for (sym = syms; sym != NULL; sym = sym->next) {
1024 if ((sym->type & N_EXT) == 0) {
1025 fwriteint32_t(sym->strx, machofp); /* string table entry number */
1026 fwrite(&sym->type, 1, 1, machofp); /* symbol type */
1027 fwrite(&sym->sect, 1, 1, machofp); /* section */
1028 fwriteint16_t(sym->desc, machofp); /* description */
1030 /* Fix up the symbol value now that we know the final section
1031 sizes. */
1032 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1033 for (s = sects, fi = 1;
1034 s != NULL && fi < sym->sect; s = s->next, ++fi)
1035 sym->value += s->size;
1038 fwriteint32_t(sym->value, machofp); /* value (i.e. offset) */
1042 for (i = 0; i < nextdefsym; i++) {
1043 sym = extdefsyms[i];
1044 fwriteint32_t(sym->strx, machofp);
1045 fwrite(&sym->type, 1, 1, machofp); /* symbol type */
1046 fwrite(&sym->sect, 1, 1, machofp); /* section */
1047 fwriteint16_t(sym->desc, machofp); /* description */
1049 /* Fix up the symbol value now that we know the final section
1050 sizes. */
1051 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1052 for (s = sects, fi = 1;
1053 s != NULL && fi < sym->sect; s = s->next, ++fi)
1054 sym->value += s->size;
1057 fwriteint32_t(sym->value, machofp); /* value (i.e. offset) */
1060 for (i = 0; i < nundefsym; i++) {
1061 sym = undefsyms[i];
1062 fwriteint32_t(sym->strx, machofp);
1063 fwrite(&sym->type, 1, 1, machofp); /* symbol type */
1064 fwrite(&sym->sect, 1, 1, machofp); /* section */
1065 fwriteint16_t(sym->desc, machofp); /* description */
1067 /* Fix up the symbol value now that we know the final section
1068 sizes. */
1069 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1070 for (s = sects, fi = 1;
1071 s != NULL && fi < sym->sect; s = s->next, ++fi)
1072 sym->value += s->size;
1075 fwriteint32_t(sym->value, machofp); /* value (i.e. offset) */
1079 /* Fixup the snum in the relocation entries, we should be
1080 doing this only for externally undefined symbols. */
1081 static void macho_fixup_relocs (struct reloc *r)
1083 struct symbol *sym;
1084 uint32_t i;
1086 while (r != NULL) {
1087 if (r->ext) {
1088 for (i = 0; i < nundefsym; i++) {
1089 sym = undefsyms[i];
1090 if (sym->initial_snum == r->snum) {
1091 r->snum = sym->snum;
1092 break;
1096 r = r->next;
1100 /* Write out the object file. */
1102 static void macho_write (void)
1104 uint32_t offset = 0;
1106 /* mach-o object file structure:
1108 ** mach header
1109 ** uint32_t magic
1110 ** int cpu type
1111 ** int cpu subtype
1112 ** uint32_t mach file type
1113 ** uint32_t number of load commands
1114 ** uint32_t size of all load commands
1115 ** (includes section struct size of segment command)
1116 ** uint32_t flags
1118 ** segment command
1119 ** uint32_t command type == LC_SEGMENT
1120 ** uint32_t size of load command
1121 ** (including section load commands)
1122 ** char[16] segment name
1123 ** uint32_t in-memory offset
1124 ** uint32_t in-memory size
1125 ** uint32_t in-file offset to data area
1126 ** uint32_t in-file size
1127 ** (in-memory size excluding zerofill sections)
1128 ** int maximum vm protection
1129 ** int initial vm protection
1130 ** uint32_t number of sections
1131 ** uint32_t flags
1133 ** section commands
1134 ** char[16] section name
1135 ** char[16] segment name
1136 ** uint32_t in-memory offset
1137 ** uint32_t in-memory size
1138 ** uint32_t in-file offset
1139 ** uint32_t alignment
1140 ** (irrelevant in MH_OBJECT)
1141 ** uint32_t in-file offset of relocation entires
1142 ** uint32_t number of relocations
1143 ** uint32_t flags
1144 ** uint32_t reserved
1145 ** uint32_t reserved
1147 ** symbol table command
1148 ** uint32_t command type == LC_SYMTAB
1149 ** uint32_t size of load command
1150 ** uint32_t symbol table offset
1151 ** uint32_t number of symbol table entries
1152 ** uint32_t string table offset
1153 ** uint32_t string table size
1155 ** raw section data
1157 ** padding to int32_t boundary
1159 ** relocation data (struct reloc)
1160 ** int32_t offset
1161 ** uint data (symbolnum, pcrel, length, extern, type)
1163 ** symbol table data (struct nlist)
1164 ** int32_t string table entry number
1165 ** uint8_t type
1166 ** (extern, absolute, defined in section)
1167 ** uint8_t section
1168 ** (0 for global symbols, section number of definition (>= 1, <=
1169 ** 254) for local symbols, size of variable for common symbols
1170 ** [type == extern])
1171 ** int16_t description
1172 ** (for stab debugging format)
1173 ** uint32_t value (i.e. file offset) of symbol or stab offset
1175 ** string table data
1176 ** list of null-terminated strings
1179 /* Emit the Mach-O header. */
1180 macho_write_header();
1182 offset = MACHO_HEADER_SIZE + head_sizeofcmds;
1184 /* emit the segment load command */
1185 if (seg_nsects > 0)
1186 offset = macho_write_segment (offset);
1187 else
1188 error(ERR_WARNING, "no sections?");
1190 if (nsyms > 0) {
1191 /* write out symbol command */
1192 fwriteint32_t(LC_SYMTAB, machofp); /* cmd == LC_SYMTAB */
1193 fwriteint32_t(MACHO_SYMCMD_SIZE, machofp); /* size of load command */
1194 fwriteint32_t(offset, machofp); /* symbol table offset */
1195 fwriteint32_t(nsyms, machofp); /* number of symbol
1196 ** table entries */
1198 offset += nsyms * MACHO_NLIST_SIZE;
1199 fwriteint32_t(offset, machofp); /* string table offset */
1200 fwriteint32_t(strslen, machofp); /* string table size */
1203 /* emit section data */
1204 if (seg_nsects > 0)
1205 macho_write_section ();
1207 /* emit symbol table if we have symbols */
1208 if (nsyms > 0)
1209 macho_write_symtab ();
1211 /* we don't need to pad here since MACHO_NLIST_SIZE == 12 */
1213 /* emit string table */
1214 saa_fpwrite(strs, machofp);
1216 /* We do quite a bit here, starting with finalizing all of the data
1217 for the object file, writing, and then freeing all of the data from
1218 the file. */
1220 static void macho_cleanup(int debuginfo)
1222 struct section *s;
1223 struct reloc *r;
1224 struct symbol *sym;
1226 (void)debuginfo;
1228 /* Sort all symbols. */
1229 macho_layout_symbols (&nsyms, &strslen);
1231 /* Fixup relocation entries */
1232 for (s = sects; s != NULL; s = s->next) {
1233 macho_fixup_relocs (s->relocs);
1236 /* First calculate and finalize needed values. */
1237 macho_calculate_sizes();
1238 macho_write();
1240 /* done - yay! */
1241 fclose(machofp);
1243 /* free up everything */
1244 while (sects->next) {
1245 s = sects;
1246 sects = sects->next;
1248 saa_free(s->data);
1249 while (s->relocs != NULL) {
1250 r = s->relocs;
1251 s->relocs = s->relocs->next;
1252 nasm_free(r);
1255 nasm_free(s);
1258 saa_free(strs);
1259 raa_free(extsyms);
1261 if (syms) {
1262 while (syms->next) {
1263 sym = syms;
1264 syms = syms->next;
1266 nasm_free (sym);
1271 /* Debugging routines. */
1272 static void debug_reloc (struct reloc *r)
1274 fprintf (stdout, "reloc:\n");
1275 fprintf (stdout, "\taddr: %"PRId32"\n", r->addr);
1276 fprintf (stdout, "\tsnum: %d\n", r->snum);
1277 fprintf (stdout, "\tpcrel: %d\n", r->pcrel);
1278 fprintf (stdout, "\tlength: %d\n", r->length);
1279 fprintf (stdout, "\text: %d\n", r->ext);
1280 fprintf (stdout, "\ttype: %d\n", r->type);
1283 static void debug_section_relocs (struct section *s)
1285 struct reloc *r = s->relocs;
1287 fprintf (stdout, "relocs for section %s:\n\n", s->sectname);
1289 while (r != NULL) {
1290 debug_reloc (r);
1291 r = r->next;
1295 struct ofmt of_macho = {
1296 "NeXTstep/OpenStep/Rhapsody/Darwin/MacOS X object files",
1297 "macho",
1298 NULL,
1299 null_debug_arr,
1300 &null_debug_form,
1301 macho_stdmac,
1302 macho_init,
1303 macho_setinfo,
1304 macho_output,
1305 macho_symdef,
1306 macho_section,
1307 macho_segbase,
1308 macho_directive,
1309 macho_filename,
1310 macho_cleanup
1313 #endif
1316 * Local Variables:
1317 * mode:c
1318 * c-basic-offset:4
1319 * End:
1321 * end of file */