preproc: Convert tabs to spaces
[nasm/externdefs.git] / output / outmac64.c
blobabad84aa7e6b7cbd0b489690528ee708a5d6c265
1 /* ----------------------------------------------------------------------- *
2 *
3 * Copyright 1996-2013 The NASM Authors - All Rights Reserved
4 * See the file AUTHORS included with the NASM distribution for
5 * the specific copyright holders.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following
9 * conditions are met:
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following
15 * disclaimer in the documentation and/or other materials provided
16 * with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
19 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
20 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
21 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
26 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
29 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
30 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 * ----------------------------------------------------------------------- */
35 * outmac64.c output routines for the Netwide Assembler to produce
36 * NeXTstep/OpenStep/Rhapsody/Darwin/MacOS X (x86_64) object files
39 /* Most of this file is, like Mach-O itself, based on a.out. For more
40 * guidelines see outaout.c. */
42 #include "compiler.h"
44 #include <stdio.h>
45 #include <stdlib.h>
46 #include <string.h>
47 #include <ctype.h>
48 #include <inttypes.h>
50 #include "nasm.h"
51 #include "nasmlib.h"
52 #include "saa.h"
53 #include "raa.h"
54 #include "output/outform.h"
55 #include "output/outlib.h"
57 #if defined(OF_MACHO64)
59 /* Mach-O in-file header structure sizes */
60 #define MACHO_HEADER64_SIZE (32)
61 #define MACHO_SEGCMD64_SIZE (72)
62 #define MACHO_SECTCMD64_SIZE (80)
63 #define MACHO_SYMCMD_SIZE (24)
64 #define MACHO_NLIST64_SIZE (16)
65 #define MACHO_RELINFO64_SIZE (8)
67 /* Mach-O file header values */
68 #define MH_MAGIC_64 (0xfeedfacf)
69 #define CPU_TYPE_X86_64 (0x01000007) /* x86-64 platform */
70 #define CPU_SUBTYPE_I386_ALL (3) /* all-x86 compatible */
71 #define MH_OBJECT (0x1) /* object file */
73 #define LC_SEGMENT_64 (0x19) /* segment load command */
74 #define LC_SYMTAB (0x2) /* symbol table load command */
76 #define VM_PROT_NONE (0x00)
77 #define VM_PROT_READ (0x01)
78 #define VM_PROT_WRITE (0x02)
79 #define VM_PROT_EXECUTE (0x04)
81 #define VM_PROT_DEFAULT (VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE)
82 #define VM_PROT_ALL (VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE)
84 struct section {
85 /* nasm internal data */
86 struct section *next;
87 struct SAA *data;
88 int32_t index;
89 struct reloc *relocs;
90 int align;
92 /* data that goes into the file */
93 char sectname[16]; /* what this section is called */
94 char segname[16]; /* segment this section will be in */
95 uint64_t addr; /* in-memory address (subject to alignment) */
96 uint64_t size; /* in-memory and -file size */
97 uint32_t nreloc; /* relocation entry count */
98 uint32_t flags; /* type and attributes (masked) */
99 uint32_t extreloc; /* external relocations */
102 #define SECTION_TYPE 0x000000ff /* section type mask */
104 #define S_REGULAR (0x0) /* standard section */
105 #define S_ZEROFILL (0x1) /* zerofill, in-memory only */
107 #define SECTION_ATTRIBUTES_SYS 0x00ffff00 /* system setable attributes */
108 #define S_ATTR_SOME_INSTRUCTIONS 0x00000400 /* section contains some
109 machine instructions */
110 #define S_ATTR_EXT_RELOC 0x00000200 /* section has external
111 relocation entries */
112 #define S_ATTR_LOC_RELOC 0x00000100 /* section has local
113 relocation entries */
114 #define S_ATTR_PURE_INSTRUCTIONS 0x80000000 /* section uses pure
115 machine instructions */
117 static struct sectmap {
118 const char *nasmsect;
119 const char *segname;
120 const char *sectname;
121 const int32_t flags;
122 } sectmap[] = {
123 {".text", "__TEXT", "__text", S_REGULAR|S_ATTR_SOME_INSTRUCTIONS|S_ATTR_PURE_INSTRUCTIONS},
124 {".data", "__DATA", "__data", S_REGULAR},
125 {".rodata", "__DATA", "__const", S_REGULAR},
126 {".bss", "__DATA", "__bss", S_ZEROFILL},
127 {NULL, NULL, NULL, 0}
130 struct reloc {
131 /* nasm internal data */
132 struct reloc *next;
134 /* data that goes into the file */
135 int32_t addr; /* op's offset in section */
136 uint32_t snum:24, /* contains symbol index if
137 ** ext otherwise in-file
138 ** section number */
139 pcrel:1, /* relative relocation */
140 length:2, /* 0=byte, 1=word, 2=int32_t, 3=int64_t */
141 ext:1, /* external symbol referenced */
142 type:4; /* reloc type */
145 #define R_ABS 0 /* absolute relocation */
146 #define R_SCATTERED 0x80000000 /* reloc entry is scattered if
147 ** highest bit == 1 */
149 struct symbol {
150 /* nasm internal data */
151 struct symbol *next; /* next symbol in the list */
152 char *name; /* name of this symbol */
153 int32_t initial_snum; /* symbol number used above in
154 reloc */
155 int32_t snum; /* true snum for reloc */
157 /* data that goes into the file */
158 uint32_t strx; /* string table index */
159 uint8_t type; /* symbol type */
160 uint8_t sect; /* NO_SECT or section number */
161 uint16_t desc; /* for stab debugging, 0 for us */
162 uint64_t value; /* offset of symbol in section */
165 /* symbol type bits */
166 #define N_EXT 0x01 /* global or external symbol */
168 #define N_UNDF 0x0 /* undefined symbol | n_sect == */
169 #define N_ABS 0x2 /* absolute symbol | NO_SECT */
170 #define N_SECT 0xe /* defined symbol, n_sect holds
171 ** section number */
173 #define N_TYPE 0x0e /* type bit mask */
175 #define DEFAULT_SECTION_ALIGNMENT 0 /* byte (i.e. no) alignment */
177 /* special section number values */
178 #define NO_SECT 0 /* no section, invalid */
179 #define MAX_SECT 255 /* maximum number of sections */
181 static struct section *sects, **sectstail;
182 static struct symbol *syms, **symstail;
183 static uint32_t nsyms;
185 /* These variables are set by macho_layout_symbols() to organize
186 the symbol table and string table in order the dynamic linker
187 expects. They are then used in macho_write() to put out the
188 symbols and strings in that order.
190 The order of the symbol table is:
191 local symbols
192 defined external symbols (sorted by name)
193 undefined external symbols (sorted by name)
195 The order of the string table is:
196 strings for external symbols
197 strings for local symbols
199 static uint32_t ilocalsym = 0;
200 static uint32_t iextdefsym = 0;
201 static uint32_t iundefsym = 0;
202 static uint32_t nlocalsym;
203 static uint32_t nextdefsym;
204 static uint32_t nundefsym;
205 static struct symbol **extdefsyms = NULL;
206 static struct symbol **undefsyms = NULL;
208 static struct RAA *extsyms;
209 static struct SAA *strs;
210 static uint32_t strslen;
212 extern struct ofmt of_macho64;
214 /* Global file information. This should be cleaned up into either
215 a structure or as function arguments. */
216 uint32_t head_ncmds64 = 0;
217 uint32_t head_sizeofcmds64 = 0;
218 uint64_t seg_filesize64 = 0;
219 uint64_t seg_vmsize64 = 0;
220 uint32_t seg_nsects64 = 0;
221 uint64_t rel_padcnt64 = 0;
224 #define xstrncpy(xdst, xsrc) \
225 memset(xdst, '\0', sizeof(xdst)); /* zero out whole buffer */ \
226 strncpy(xdst, xsrc, sizeof(xdst)); /* copy over string */ \
227 xdst[sizeof(xdst) - 1] = '\0'; /* proper null-termination */
229 #define alignint32_t(x) \
230 ALIGN(x, sizeof(int32_t)) /* align x to int32_t boundary */
232 #define alignint64_t(x) \
233 ALIGN(x, sizeof(int64_t)) /* align x to int64_t boundary */
235 static void debug_reloc (struct reloc *);
236 static void debug_section_relocs (struct section *) _unused;
238 static struct section *get_section_by_name(const char *segname,
239 const char *sectname)
241 struct section *s;
243 for (s = sects; s != NULL; s = s->next)
244 if (!strcmp(s->segname, segname) && !strcmp(s->sectname, sectname))
245 break;
247 return s;
250 static struct section *get_section_by_index(const int32_t index)
252 struct section *s;
254 for (s = sects; s != NULL; s = s->next)
255 if (index == s->index)
256 break;
258 return s;
261 static int32_t get_section_index_by_name(const char *segname,
262 const char *sectname)
264 struct section *s;
266 for (s = sects; s != NULL; s = s->next)
267 if (!strcmp(s->segname, segname) && !strcmp(s->sectname, sectname))
268 return s->index;
270 return -1;
273 static char *get_section_name_by_index(const int32_t index)
275 struct section *s;
277 for (s = sects; s != NULL; s = s->next)
278 if (index == s->index)
279 return s->sectname;
281 return NULL;
284 static uint8_t get_section_fileindex_by_index(const int32_t index)
286 struct section *s;
287 uint8_t i = 1;
289 for (s = sects; s != NULL && i < MAX_SECT; s = s->next, ++i)
290 if (index == s->index)
291 return i;
293 if (i == MAX_SECT)
294 nasm_error(ERR_WARNING,
295 "too many sections (>255) - clipped by fileindex");
297 return NO_SECT;
300 static struct symbol *get_closest_section_symbol_by_offset(uint8_t fileindex, int64_t offset)
302 struct symbol *nearest = NULL;
303 struct symbol *sym;
305 for (sym = syms; sym; sym = sym->next) {
306 if ((sym->sect != NO_SECT) && (sym->sect == fileindex)) {
307 if ((int64_t)sym->value > offset)
308 break;
309 nearest = sym;
313 return nearest;
317 * Special section numbers which are used to define Mach-O special
318 * symbols, which can be used with WRT to provide PIC relocation
319 * types.
321 static int32_t macho_gotpcrel_sect;
323 static void macho_init(void)
325 char zero = 0;
327 maxbits = 64;
329 sects = NULL;
330 sectstail = &sects;
332 syms = NULL;
333 symstail = &syms;
334 nsyms = 0;
335 nlocalsym = 0;
336 nextdefsym = 0;
337 nundefsym = 0;
339 extsyms = raa_init();
340 strs = saa_init(1L);
342 /* string table starts with a zero byte - don't ask why */
343 saa_wbytes(strs, &zero, sizeof(char));
344 strslen = 1;
346 /* add special symbol for ..gotpcrel */
347 macho_gotpcrel_sect = seg_alloc();
348 macho_gotpcrel_sect++;
349 define_label("..gotpcrel", macho_gotpcrel_sect, 0L, NULL, false, false);
352 static void sect_write(struct section *sect,
353 const uint8_t *data, uint32_t len)
355 saa_wbytes(sect->data, data, len);
356 sect->size += len;
359 static int32_t add_reloc(struct section *sect, int32_t section,
360 int pcrel, int bytes, int64_t reloff)
362 struct reloc *r;
363 struct symbol *sym;
364 int32_t fi;
365 int32_t adjustment = 0;
367 /* NeXT as puts relocs in reversed order (address-wise) into the
368 ** files, so we do the same, doesn't seem to make much of a
369 ** difference either way */
370 r = nasm_malloc(sizeof(struct reloc));
371 r->next = sect->relocs;
372 sect->relocs = r;
374 /* the current end of the section will be the symbol's address for
375 ** now, might have to be fixed by macho_fixup_relocs() later on. make
376 ** sure we don't make the symbol scattered by setting the highest
377 ** bit by accident */
378 r->addr = sect->size & ~R_SCATTERED;
379 r->ext = 1;
380 r->pcrel = (pcrel ? 1 : 0);
382 /* match byte count 1, 2, 4, 8 to length codes 0, 1, 2, 3 respectively */
383 switch(bytes){
384 case 1:
385 r->length = 0;
386 break;
387 case 2:
388 r->length = 1;
389 break;
390 case 4:
391 r->length = 2;
392 break;
393 case 8:
394 r->length = 3;
395 break;
396 default:
397 break;
400 /* set default relocation values */
401 r->type = 0; // X86_64_RELOC_UNSIGNED
402 r->snum = R_ABS; // Absolute Symbol (indicates no relocation)
404 /* absolute relocation */
405 if (pcrel == 0) {
407 /* intra-section */
408 if (section == NO_SEG) {
409 // r->snum = R_ABS; // Set above
411 /* inter-section */
412 } else {
413 fi = get_section_fileindex_by_index(section);
415 /* external */
416 if (fi == NO_SECT) {
417 r->snum = raa_read(extsyms, section);
419 /* local */
420 } else {
421 sym = get_closest_section_symbol_by_offset(fi, reloff);
422 r->snum = sym->initial_snum;
423 adjustment = sym->value;
427 /* relative relocation */
428 } else if (pcrel == 1) {
430 /* intra-section */
431 if (section == NO_SEG) {
432 r->type = 1; // X86_64_RELOC_SIGNED
434 /* inter-section */
435 } else {
436 r->type = 2; // X86_64_RELOC_BRANCH
437 fi = get_section_fileindex_by_index(section);
439 /* external */
440 if (fi == NO_SECT) {
441 sect->extreloc = 1;
442 r->snum = raa_read(extsyms, section);
444 /* local */
445 } else {
446 sym = get_closest_section_symbol_by_offset(fi, reloff);
447 r->snum = sym->initial_snum;
448 adjustment = sym->value;
452 /* subtractor */
453 } else if (pcrel == 2) {
454 r->pcrel = 0;
455 r->type = 5; // X86_64_RELOC_SUBTRACTOR
457 /* gotpcrel */
458 } else if (pcrel == 3) {
459 r->type = 4; // X86_64_RELOC_GOT
460 r->snum = macho_gotpcrel_sect;
462 /* gotpcrel MOVQ load */
463 } else if (pcrel == 4) {
464 r->type = 3; // X86_64_RELOC_GOT_LOAD
465 r->snum = macho_gotpcrel_sect;
468 ++sect->nreloc;
470 return adjustment;
473 static void macho_output(int32_t secto, const void *data,
474 enum out_type type, uint64_t size,
475 int32_t section, int32_t wrt)
477 struct section *s, *sbss;
478 int64_t addr;
479 uint8_t mydata[16], *p, gotload;
481 if (secto == NO_SEG) {
482 if (type != OUT_RESERVE)
483 nasm_error(ERR_NONFATAL, "attempt to assemble code in "
484 "[ABSOLUTE] space");
486 return;
489 s = get_section_by_index(secto);
491 if (s == NULL) {
492 nasm_error(ERR_WARNING, "attempt to assemble code in"
493 " section %d: defaulting to `.text'", secto);
494 s = get_section_by_name("__TEXT", "__text");
496 /* should never happen */
497 if (s == NULL)
498 nasm_error(ERR_PANIC, "text section not found");
501 sbss = get_section_by_name("__DATA", "__bss");
503 if (s == sbss && type != OUT_RESERVE) {
504 nasm_error(ERR_WARNING, "attempt to initialize memory in the"
505 " BSS section: ignored");
506 s->size += realsize(type, size);
507 return;
510 switch (type) {
511 case OUT_RESERVE:
512 if (s != sbss) {
513 nasm_error(ERR_WARNING, "uninitialized space declared in"
514 " %s section: zeroing",
515 get_section_name_by_index(secto));
517 sect_write(s, NULL, size);
518 } else
519 s->size += size;
521 break;
523 case OUT_RAWDATA:
524 if (section != NO_SEG)
525 nasm_error(ERR_PANIC, "OUT_RAWDATA with other than NO_SEG");
527 sect_write(s, data, size);
528 break;
530 case OUT_ADDRESS:
532 int asize = abs(size);
534 addr = *(int64_t *)data;
535 if (section != NO_SEG) {
536 if (section % 2) {
537 nasm_error(ERR_NONFATAL, "Mach-O format does not support"
538 " section base references");
539 } else {
540 if (wrt == NO_SEG) {
541 if (asize < 8) {
542 nasm_error(ERR_NONFATAL, "Mach-O 64-bit format does not support"
543 " 32-bit absolute addresses");
545 Seemingly, Mach-O's X86_64_RELOC_SUBTRACTOR would require
546 pre-determined knowledge of where the image base would be,
547 making it impractical for use in intermediate object files
549 } else {
550 addr -= add_reloc(s, section, 0, asize, addr); // X86_64_RELOC_UNSIGNED
552 } else {
553 nasm_error(ERR_NONFATAL, "Mach-O format does not support"
554 " this use of WRT");
559 p = mydata;
560 WRITEADDR(p, addr, asize);
561 sect_write(s, mydata, asize);
562 break;
565 case OUT_REL2ADR:
566 p = mydata;
567 WRITESHORT(p, *(int64_t *)data);
569 if (section == secto)
570 nasm_error(ERR_PANIC, "intra-section OUT_REL2ADR");
572 if (section == NO_SEG) {
573 /* Do nothing */
574 } else if (section % 2) {
575 nasm_error(ERR_NONFATAL, "Mach-O format does not support"
576 " section base references");
577 } else {
578 nasm_error(ERR_NONFATAL, "Unsupported non-32-bit"
579 " Macho-O relocation [2]");
582 sect_write(s, mydata, 2L);
583 break;
585 case OUT_REL4ADR:
586 p = mydata;
587 WRITELONG(p, *(int64_t *)data + 4 - size);
589 if (section == secto)
590 nasm_error(ERR_PANIC, "intra-section OUT_REL4ADR");
592 if (section != NO_SEG && section % 2) {
593 nasm_error(ERR_NONFATAL, "Mach-O format does not support"
594 " section base references");
595 } else {
596 if (wrt == NO_SEG) {
597 *mydata -= add_reloc(s, section, 1, 4, (int64_t)*mydata); // X86_64_RELOC_SIGNED/BRANCH
598 } else if (wrt == macho_gotpcrel_sect) {
599 if (s->data->datalen > 1) {
600 saa_fread(s->data, s->data->datalen-2, &gotload, 1); // Retrieve Instruction Opcode
601 } else {
602 gotload = 0;
604 if (gotload == 0x8B) { // Check for MOVQ Opcode
605 *mydata -= add_reloc(s, section, 4, 4, (int64_t)*mydata); // X86_64_GOT_LOAD (MOVQ load)
606 } else {
607 *mydata -= add_reloc(s, section, 3, 4, (int64_t)*mydata); // X86_64_GOT
609 } else {
610 nasm_error(ERR_NONFATAL, "Mach-O format does not support"
611 " this use of WRT");
612 wrt = NO_SEG; /* we can at least _try_ to continue */
616 sect_write(s, mydata, 4L);
617 break;
619 default:
620 nasm_error(ERR_PANIC, "unknown output type?");
621 break;
625 static int32_t macho_section(char *name, int pass, int *bits)
627 int32_t index, originalIndex;
628 char *sectionAttributes;
629 struct sectmap *sm;
630 struct section *s;
632 (void)pass;
634 /* Default to 64 bits. */
635 if (!name) {
636 *bits = 64;
637 name = ".text";
638 sectionAttributes = NULL;
639 } else {
640 sectionAttributes = name;
641 name = nasm_strsep(&sectionAttributes, " \t");
644 for (sm = sectmap; sm->nasmsect != NULL; ++sm) {
645 /* make lookup into section name translation table */
646 if (!strcmp(name, sm->nasmsect)) {
647 char *currentAttribute;
649 /* try to find section with that name */
650 originalIndex = index = get_section_index_by_name(sm->segname,
651 sm->sectname);
653 /* create it if it doesn't exist yet */
654 if (index == -1) {
655 s = *sectstail = nasm_malloc(sizeof(struct section));
656 s->next = NULL;
657 sectstail = &s->next;
659 s->data = saa_init(1L);
660 s->index = seg_alloc();
661 s->relocs = NULL;
662 s->align = -1;
664 xstrncpy(s->segname, sm->segname);
665 xstrncpy(s->sectname, sm->sectname);
666 s->size = 0;
667 s->nreloc = 0;
668 s->flags = sm->flags;
670 index = s->index;
671 } else {
672 s = get_section_by_index(index);
675 while ((NULL != sectionAttributes)
676 && (currentAttribute = nasm_strsep(&sectionAttributes, " \t"))) {
677 if (0 != *currentAttribute) {
678 if (!nasm_strnicmp("align=", currentAttribute, 6)) {
679 char *end;
680 int newAlignment, value;
682 value = strtoul(currentAttribute + 6, (char**)&end, 0);
683 newAlignment = alignlog2_32(value);
685 if (0 != *end) {
686 nasm_error(ERR_PANIC,
687 "unknown or missing alignment value \"%s\" "
688 "specified for section \"%s\"",
689 currentAttribute + 6,
690 name);
691 return NO_SEG;
692 } else if (0 > newAlignment) {
693 nasm_error(ERR_PANIC,
694 "alignment of %d (for section \"%s\") is not "
695 "a power of two",
696 value,
697 name);
698 return NO_SEG;
701 if ((-1 != originalIndex)
702 && (s->align != newAlignment)
703 && (s->align != -1)) {
704 nasm_error(ERR_PANIC,
705 "section \"%s\" has already been specified "
706 "with alignment %d, conflicts with new "
707 "alignment of %d",
708 name,
709 (1 << s->align),
710 value);
711 return NO_SEG;
714 s->align = newAlignment;
715 } else if (!nasm_stricmp("data", currentAttribute)) {
716 /* Do nothing; 'data' is implicit */
717 } else {
718 nasm_error(ERR_PANIC,
719 "unknown section attribute %s for section %s",
720 currentAttribute,
721 name);
722 return NO_SEG;
727 return index;
731 nasm_error(ERR_PANIC, "invalid section name %s", name);
732 return NO_SEG;
735 static void macho_symdef(char *name, int32_t section, int64_t offset,
736 int is_global, char *special)
738 struct symbol *sym;
740 if (special) {
741 nasm_error(ERR_NONFATAL, "The Mach-O output format does "
742 "not support any special symbol types");
743 return;
746 if (is_global == 3) {
747 nasm_error(ERR_NONFATAL, "The Mach-O format does not "
748 "(yet) support forward reference fixups.");
749 return;
752 if (name[0] == '.' && name[1] == '.' && name[2] != '@') {
754 * This is a NASM special symbol. We never allow it into
755 * the Macho-O symbol table, even if it's a valid one. If it
756 * _isn't_ a valid one, we should barf immediately.
758 if (strcmp(name, "..gotpcrel"))
759 nasm_error(ERR_NONFATAL, "unrecognized special symbol `%s'", name);
760 return;
763 sym = *symstail = nasm_malloc(sizeof(struct symbol));
764 sym->next = NULL;
765 symstail = &sym->next;
767 sym->name = name;
768 sym->strx = strslen;
769 sym->type = 0;
770 sym->desc = 0;
771 sym->value = offset;
772 sym->initial_snum = -1;
774 /* external and common symbols get N_EXT */
775 if (is_global != 0) {
776 sym->type |= N_EXT;
779 if (section == NO_SEG) {
780 /* symbols in no section get absolute */
781 sym->type |= N_ABS;
782 sym->sect = NO_SECT;
783 } else {
784 sym->type |= N_SECT;
786 /* get the in-file index of the section the symbol was defined in */
787 sym->sect = get_section_fileindex_by_index(section);
789 /* track the initially allocated symbol number for use in future fix-ups */
790 sym->initial_snum = nsyms;
792 if (sym->sect == NO_SECT) {
794 /* remember symbol number of references to external
795 ** symbols, this works because every external symbol gets
796 ** its own section number allocated internally by nasm and
797 ** can so be used as a key */
798 extsyms = raa_write(extsyms, section, nsyms);
800 switch (is_global) {
801 case 1:
802 case 2:
803 /* there isn't actually a difference between global
804 ** and common symbols, both even have their size in
805 ** sym->value */
806 sym->type = N_EXT;
807 break;
809 default:
810 /* give an error on unfound section if it's not an
811 ** external or common symbol (assemble_file() does a
812 ** seg_alloc() on every call for them) */
813 nasm_error(ERR_PANIC, "in-file index for section %d not found",
814 section);
818 ++nsyms;
821 static void macho_sectalign(int32_t seg, unsigned int value)
823 struct section *s;
825 list_for_each(s, sects) {
826 if (s->index == seg)
827 break;
830 if (!s || !is_power2(value))
831 return;
833 value = alignlog2_32(value);
834 if (s->align < (int)value)
835 s->align = value;
838 static int32_t macho_segbase(int32_t section)
840 return section;
843 static void macho_filename(char *inname, char *outname)
845 standard_extension(inname, outname, ".o");
848 extern macros_t macho_stdmac[];
850 /* Comparison function for qsort symbol layout. */
851 static int layout_compare (const struct symbol **s1,
852 const struct symbol **s2)
854 return (strcmp ((*s1)->name, (*s2)->name));
857 /* The native assembler does a few things in a similar function
859 * Remove temporary labels
860 * Sort symbols according to local, external, undefined (by name)
861 * Order the string table
863 We do not remove temporary labels right now.
865 numsyms is the total number of symbols we have. strtabsize is the
866 number entries in the string table. */
868 static void macho_layout_symbols (uint32_t *numsyms,
869 uint32_t *strtabsize)
871 struct symbol *sym, **symp;
872 uint32_t i,j;
874 *numsyms = 0;
875 *strtabsize = sizeof (char);
877 symp = &syms;
879 while ((sym = *symp)) {
880 /* Undefined symbols are now external. */
881 if (sym->type == N_UNDF)
882 sym->type |= N_EXT;
884 if ((sym->type & N_EXT) == 0) {
885 sym->snum = *numsyms;
886 *numsyms = *numsyms + 1;
887 nlocalsym++;
889 else {
890 if ((sym->type & N_TYPE) != N_UNDF) {
891 nextdefsym++;
892 } else {
893 nundefsym++;
896 /* If we handle debug info we'll want
897 to check for it here instead of just
898 adding the symbol to the string table. */
899 sym->strx = *strtabsize;
900 saa_wbytes (strs, sym->name, (int32_t)(strlen(sym->name) + 1));
901 *strtabsize += strlen(sym->name) + 1;
903 symp = &(sym->next);
906 /* Next, sort the symbols. Most of this code is a direct translation from
907 the Apple cctools symbol layout. We need to keep compatibility with that. */
908 /* Set the indexes for symbol groups into the symbol table */
909 ilocalsym = 0;
910 iextdefsym = nlocalsym;
911 iundefsym = nlocalsym + nextdefsym;
913 /* allocate arrays for sorting externals by name */
914 extdefsyms = nasm_malloc(nextdefsym * sizeof(struct symbol *));
915 undefsyms = nasm_malloc(nundefsym * sizeof(struct symbol *));
917 i = 0;
918 j = 0;
920 symp = &syms;
922 while ((sym = *symp)) {
924 if((sym->type & N_EXT) == 0) {
925 sym->strx = *strtabsize;
926 saa_wbytes (strs, sym->name, (int32_t)(strlen (sym->name) + 1));
927 *strtabsize += strlen(sym->name) + 1;
929 else {
930 if((sym->type & N_TYPE) != N_UNDF) {
931 extdefsyms[i++] = sym;
932 } else {
933 undefsyms[j++] = sym;
936 symp = &(sym->next);
939 qsort(extdefsyms, nextdefsym, sizeof(struct symbol *),
940 (int (*)(const void *, const void *))layout_compare);
941 qsort(undefsyms, nundefsym, sizeof(struct symbol *),
942 (int (*)(const void *, const void *))layout_compare);
944 for(i = 0; i < nextdefsym; i++) {
945 extdefsyms[i]->snum = *numsyms;
946 *numsyms += 1;
948 for(j = 0; j < nundefsym; j++) {
949 undefsyms[j]->snum = *numsyms;
950 *numsyms += 1;
954 /* Calculate some values we'll need for writing later. */
956 static void macho_calculate_sizes (void)
958 struct section *s;
960 /* count sections and calculate in-memory and in-file offsets */
961 for (s = sects; s != NULL; s = s->next) {
962 uint64_t pad = 0;
964 /* zerofill sections aren't actually written to the file */
965 if ((s->flags & SECTION_TYPE) != S_ZEROFILL)
966 seg_filesize64 += s->size;
968 /* recalculate segment address based on alignment and vm size */
969 s->addr = seg_vmsize64;
970 /* we need section alignment to calculate final section address */
971 if (s->align == -1)
972 s->align = DEFAULT_SECTION_ALIGNMENT;
973 if(s->align) {
974 uint64_t newaddr = ALIGN(s->addr, 1 << s->align);
975 pad = newaddr - s->addr;
976 s->addr = newaddr;
979 seg_vmsize64 += s->size + pad;
980 ++seg_nsects64;
983 /* calculate size of all headers, load commands and sections to
984 ** get a pointer to the start of all the raw data */
985 if (seg_nsects64 > 0) {
986 ++head_ncmds64;
987 head_sizeofcmds64 +=
988 MACHO_SEGCMD64_SIZE + seg_nsects64 * MACHO_SECTCMD64_SIZE;
991 if (nsyms > 0) {
992 ++head_ncmds64;
993 head_sizeofcmds64 += MACHO_SYMCMD_SIZE;
997 /* Write out the header information for the file. */
999 static void macho_write_header (void)
1001 fwriteint32_t(MH_MAGIC_64, ofile); /* magic */
1002 fwriteint32_t(CPU_TYPE_X86_64, ofile); /* CPU type */
1003 fwriteint32_t(CPU_SUBTYPE_I386_ALL, ofile); /* CPU subtype */
1004 fwriteint32_t(MH_OBJECT, ofile); /* Mach-O file type */
1005 fwriteint32_t(head_ncmds64, ofile); /* number of load commands */
1006 fwriteint32_t(head_sizeofcmds64, ofile); /* size of load commands */
1007 fwriteint32_t(0, ofile); /* no flags */
1008 fwriteint32_t(0, ofile); /* reserved for future use */
1011 /* Write out the segment load command at offset. */
1013 static uint32_t macho_write_segment (uint64_t offset)
1015 uint64_t rel_base = alignint64_t (offset + seg_filesize64);
1016 uint32_t s_reloff = 0;
1017 struct section *s;
1019 fwriteint32_t(LC_SEGMENT_64, ofile); /* cmd == LC_SEGMENT_64 */
1021 /* size of load command including section load commands */
1022 fwriteint32_t(MACHO_SEGCMD64_SIZE + seg_nsects64 *
1023 MACHO_SECTCMD64_SIZE, ofile);
1025 /* in an MH_OBJECT file all sections are in one unnamed (name
1026 ** all zeros) segment */
1027 fwritezero(16, ofile);
1028 fwriteint64_t(0, ofile); /* in-memory offset */
1029 fwriteint64_t(seg_vmsize64, ofile); /* in-memory size */
1030 fwriteint64_t(offset, ofile); /* in-file offset to data */
1031 fwriteint64_t(seg_filesize64, ofile); /* in-file size */
1032 fwriteint32_t(VM_PROT_DEFAULT, ofile); /* maximum vm protection */
1033 fwriteint32_t(VM_PROT_DEFAULT, ofile); /* initial vm protection */
1034 fwriteint32_t(seg_nsects64, ofile); /* number of sections */
1035 fwriteint32_t(0, ofile); /* no flags */
1037 /* emit section headers */
1038 for (s = sects; s != NULL; s = s->next) {
1039 fwrite(s->sectname, sizeof(s->sectname), 1, ofile);
1040 fwrite(s->segname, sizeof(s->segname), 1, ofile);
1041 fwriteint64_t(s->addr, ofile);
1042 fwriteint64_t(s->size, ofile);
1044 /* dummy data for zerofill sections or proper values */
1045 if ((s->flags & SECTION_TYPE) != S_ZEROFILL) {
1046 fwriteint32_t(offset, ofile);
1047 /* Write out section alignment, as a power of two.
1048 e.g. 32-bit word alignment would be 2 (2^2 = 4). */
1049 if (s->align == -1)
1050 s->align = DEFAULT_SECTION_ALIGNMENT;
1051 fwriteint32_t(s->align, ofile);
1052 /* To be compatible with cctools as we emit
1053 a zero reloff if we have no relocations. */
1054 fwriteint32_t(s->nreloc ? rel_base + s_reloff : 0, ofile);
1055 fwriteint32_t(s->nreloc, ofile);
1057 offset += s->size;
1058 s_reloff += s->nreloc * MACHO_RELINFO64_SIZE;
1059 } else {
1060 fwriteint32_t(0, ofile);
1061 fwriteint32_t(0, ofile);
1062 fwriteint32_t(0, ofile);
1063 fwriteint32_t(0, ofile);
1066 if (s->nreloc) {
1067 s->flags |= S_ATTR_LOC_RELOC;
1068 if (s->extreloc)
1069 s->flags |= S_ATTR_EXT_RELOC;
1072 fwriteint32_t(s->flags, ofile); /* flags */
1073 fwriteint32_t(0, ofile); /* reserved */
1074 fwriteint32_t(0, ofile); /* reserved */
1076 fwriteint32_t(0, ofile); /* align */
1079 rel_padcnt64 = rel_base - offset;
1080 offset = rel_base + s_reloff;
1082 return offset;
1085 /* For a given chain of relocs r, write out the entire relocation
1086 chain to the object file. */
1088 static void macho_write_relocs (struct reloc *r)
1090 while (r) {
1091 uint32_t word2;
1093 fwriteint32_t(r->addr, ofile); /* reloc offset */
1095 word2 = r->snum;
1096 word2 |= r->pcrel << 24;
1097 word2 |= r->length << 25;
1098 word2 |= r->ext << 27;
1099 word2 |= r->type << 28;
1100 fwriteint32_t(word2, ofile); /* reloc data */
1101 r = r->next;
1105 /* Write out the section data. */
1106 static void macho_write_section (void)
1108 struct section *s, *s2;
1109 struct reloc *r;
1110 uint8_t fi, *p, *q, blk[8];
1111 int32_t len;
1112 int64_t l;
1114 for (s = sects; s != NULL; s = s->next) {
1115 if ((s->flags & SECTION_TYPE) == S_ZEROFILL)
1116 continue;
1118 /* no padding needs to be done to the sections */
1120 /* Like a.out Mach-O references things in the data or bss
1121 * sections by addresses which are actually relative to the
1122 * start of the _text_ section, in the _file_. See outaout.c
1123 * for more information. */
1124 saa_rewind(s->data);
1125 for (r = s->relocs; r != NULL; r = r->next) {
1126 len = (int32_t)r->length << 1;
1127 if(len > 4) len = 8;
1128 saa_fread(s->data, r->addr, blk, len);
1129 p = q = blk;
1130 l = *p++;
1132 /* get offset based on relocation type */
1133 if (r->length > 0) {
1134 l += ((int64_t)*p++) << 8;
1136 if (r->length > 1) {
1137 l += ((int64_t)*p++) << 16;
1138 l += ((int64_t)*p++) << 24;
1141 if (r->length > 2) {
1142 l += ((int64_t)*p++) << 32;
1143 l += ((int64_t)*p++) << 40;
1144 l += ((int64_t)*p++) << 48;
1145 l += ((int64_t)*p++) << 56;
1151 /* If the relocation is internal add to the current section
1152 offset. Otherwise the only value we need is the symbol
1153 offset which we already have. The linker takes care
1154 of the rest of the address. */
1155 if (!r->ext) {
1156 /* generate final address by section address and offset */
1157 for (s2 = sects, fi = 1;
1158 s2 != NULL; s2 = s2->next, fi++) {
1159 if (fi == r->snum) {
1160 l += s2->addr;
1161 break;
1166 /* write new offset back */
1167 if (r->length == 3)
1168 WRITEDLONG(q, l);
1169 else if (r->length == 2)
1170 WRITELONG(q, l);
1171 else if (r->length == 1)
1172 WRITESHORT(q, l);
1173 else
1174 *q++ = l & 0xFF;
1176 saa_fwrite(s->data, r->addr, blk, len);
1179 /* dump the section data to file */
1180 saa_fpwrite(s->data, ofile);
1183 /* pad last section up to reloc entries on int64_t boundary */
1184 fwritezero(rel_padcnt64, ofile);
1186 /* emit relocation entries */
1187 for (s = sects; s != NULL; s = s->next)
1188 macho_write_relocs (s->relocs);
1191 /* Write out the symbol table. We should already have sorted this
1192 before now. */
1193 static void macho_write_symtab (void)
1195 struct symbol *sym;
1196 struct section *s;
1197 int64_t fi;
1198 uint64_t i;
1200 /* we don't need to pad here since MACHO_RELINFO_SIZE == 8 */
1202 for (sym = syms; sym != NULL; sym = sym->next) {
1203 if ((sym->type & N_EXT) == 0) {
1204 fwriteint32_t(sym->strx, ofile); /* string table entry number */
1205 fwrite(&sym->type, 1, 1, ofile); /* symbol type */
1206 fwrite(&sym->sect, 1, 1, ofile); /* section */
1207 fwriteint16_t(sym->desc, ofile); /* description */
1209 /* Fix up the symbol value now that we know the final section
1210 sizes. */
1211 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1212 for (s = sects, fi = 1; s != NULL; s = s->next, fi++) {
1213 if (fi == sym->sect) {
1214 sym->value += s->addr;
1215 break;
1220 fwriteint64_t(sym->value, ofile); /* value (i.e. offset) */
1224 for (i = 0; i < nextdefsym; i++) {
1225 sym = extdefsyms[i];
1226 fwriteint32_t(sym->strx, ofile);
1227 fwrite(&sym->type, 1, 1, ofile); /* symbol type */
1228 fwrite(&sym->sect, 1, 1, ofile); /* section */
1229 fwriteint16_t(sym->desc, ofile); /* description */
1231 /* Fix up the symbol value now that we know the final section
1232 sizes. */
1233 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1234 for (s = sects, fi = 1;
1235 s != NULL && fi < sym->sect; s = s->next, ++fi)
1236 sym->value += s->size;
1239 fwriteint64_t(sym->value, ofile); /* value (i.e. offset) */
1242 for (i = 0; i < nundefsym; i++) {
1243 sym = undefsyms[i];
1244 fwriteint32_t(sym->strx, ofile);
1245 fwrite(&sym->type, 1, 1, ofile); /* symbol type */
1246 fwrite(&sym->sect, 1, 1, ofile); /* section */
1247 fwriteint16_t(sym->desc, ofile); /* description */
1249 // Fix up the symbol value now that we know the final section sizes.
1250 if (((sym->type & N_TYPE) == N_SECT) && (sym->sect != NO_SECT)) {
1251 for (s = sects, fi = 1;
1252 s != NULL && fi < sym->sect; s = s->next, ++fi)
1253 sym->value += s->size;
1256 fwriteint64_t(sym->value, ofile); // value (i.e. offset)
1261 /* Fixup the snum in the relocation entries, we should be
1262 doing this only for externally referenced symbols. */
1263 static void macho_fixup_relocs (struct reloc *r)
1265 struct symbol *sym;
1267 while (r != NULL) {
1268 if (r->ext) {
1269 for (sym = syms; sym != NULL; sym = sym->next) {
1270 if (sym->initial_snum == r->snum) {
1271 r->snum = sym->snum;
1272 break;
1276 r = r->next;
1280 /* Write out the object file. */
1282 static void macho_write (void)
1284 uint64_t offset = 0;
1286 /* mach-o object file structure:
1288 ** mach header
1289 ** uint32_t magic
1290 ** int cpu type
1291 ** int cpu subtype
1292 ** uint32_t mach file type
1293 ** uint32_t number of load commands
1294 ** uint32_t size of all load commands
1295 ** (includes section struct size of segment command)
1296 ** uint32_t flags
1298 ** segment command
1299 ** uint32_t command type == LC_SEGMENT_64
1300 ** uint32_t size of load command
1301 ** (including section load commands)
1302 ** char[16] segment name
1303 ** uint64_t in-memory offset
1304 ** uint64_t in-memory size
1305 ** uint64_t in-file offset to data area
1306 ** uint64_t in-file size
1307 ** (in-memory size excluding zerofill sections)
1308 ** int maximum vm protection
1309 ** int initial vm protection
1310 ** uint32_t number of sections
1311 ** uint32_t flags
1313 ** section commands
1314 ** char[16] section name
1315 ** char[16] segment name
1316 ** uint64_t in-memory offset
1317 ** uint64_t in-memory size
1318 ** uint32_t in-file offset
1319 ** uint32_t alignment
1320 ** (irrelevant in MH_OBJECT)
1321 ** uint32_t in-file offset of relocation entires
1322 ** uint32_t number of relocations
1323 ** uint32_t flags
1324 ** uint32_t reserved
1325 ** uint32_t reserved
1327 ** symbol table command
1328 ** uint32_t command type == LC_SYMTAB
1329 ** uint32_t size of load command
1330 ** uint32_t symbol table offset
1331 ** uint32_t number of symbol table entries
1332 ** uint32_t string table offset
1333 ** uint32_t string table size
1335 ** raw section data
1337 ** padding to int64_t boundary
1339 ** relocation data (struct reloc)
1340 ** int32_t offset
1341 ** uint data (symbolnum, pcrel, length, extern, type)
1343 ** symbol table data (struct nlist)
1344 ** int32_t string table entry number
1345 ** uint8_t type
1346 ** (extern, absolute, defined in section)
1347 ** uint8_t section
1348 ** (0 for global symbols, section number of definition (>= 1, <=
1349 ** 254) for local symbols, size of variable for common symbols
1350 ** [type == extern])
1351 ** int16_t description
1352 ** (for stab debugging format)
1353 ** uint64_t value (i.e. file offset) of symbol or stab offset
1355 ** string table data
1356 ** list of null-terminated strings
1359 /* Emit the Mach-O header. */
1360 macho_write_header();
1362 offset = MACHO_HEADER64_SIZE + head_sizeofcmds64;
1364 /* emit the segment load command */
1365 if (seg_nsects64 > 0)
1366 offset = macho_write_segment (offset);
1367 else
1368 nasm_error(ERR_WARNING, "no sections?");
1370 if (nsyms > 0) {
1371 /* write out symbol command */
1372 fwriteint32_t(LC_SYMTAB, ofile); /* cmd == LC_SYMTAB */
1373 fwriteint32_t(MACHO_SYMCMD_SIZE, ofile); /* size of load command */
1374 fwriteint32_t(offset, ofile); /* symbol table offset */
1375 fwriteint32_t(nsyms, ofile); /* number of symbol
1376 ** table entries */
1378 offset += nsyms * MACHO_NLIST64_SIZE;
1379 fwriteint32_t(offset, ofile); /* string table offset */
1380 fwriteint32_t(strslen, ofile); /* string table size */
1383 /* emit section data */
1384 if (seg_nsects64 > 0)
1385 macho_write_section ();
1387 /* emit symbol table if we have symbols */
1388 if (nsyms > 0)
1389 macho_write_symtab ();
1391 /* we don't need to pad here since MACHO_NLIST64_SIZE == 16 */
1393 /* emit string table */
1394 saa_fpwrite(strs, ofile);
1396 /* We do quite a bit here, starting with finalizing all of the data
1397 for the object file, writing, and then freeing all of the data from
1398 the file. */
1400 static void macho_cleanup(int debuginfo)
1402 struct section *s;
1403 struct reloc *r;
1404 struct symbol *sym;
1406 (void)debuginfo;
1408 /* Sort all symbols. */
1409 macho_layout_symbols (&nsyms, &strslen);
1411 /* Fixup relocation entries */
1412 for (s = sects; s != NULL; s = s->next) {
1413 macho_fixup_relocs (s->relocs);
1416 /* First calculate and finalize needed values. */
1417 macho_calculate_sizes();
1418 macho_write();
1420 /* free up everything */
1421 while (sects->next) {
1422 s = sects;
1423 sects = sects->next;
1425 saa_free(s->data);
1426 while (s->relocs != NULL) {
1427 r = s->relocs;
1428 s->relocs = s->relocs->next;
1429 nasm_free(r);
1432 nasm_free(s);
1435 saa_free(strs);
1436 raa_free(extsyms);
1438 if (syms) {
1439 while (syms->next) {
1440 sym = syms;
1441 syms = syms->next;
1443 nasm_free (sym);
1448 /* Debugging routines. */
1449 static void debug_reloc (struct reloc *r)
1451 fprintf (stdout, "reloc:\n");
1452 fprintf (stdout, "\taddr: %"PRId32"\n", r->addr);
1453 fprintf (stdout, "\tsnum: %d\n", r->snum);
1454 fprintf (stdout, "\tpcrel: %d\n", r->pcrel);
1455 fprintf (stdout, "\tlength: %d\n", r->length);
1456 fprintf (stdout, "\text: %d\n", r->ext);
1457 fprintf (stdout, "\ttype: %d\n", r->type);
1460 static void debug_section_relocs (struct section *s)
1462 struct reloc *r = s->relocs;
1464 fprintf (stdout, "relocs for section %s:\n\n", s->sectname);
1466 while (r != NULL) {
1467 debug_reloc (r);
1468 r = r->next;
1472 struct ofmt of_macho64 = {
1473 "NeXTstep/OpenStep/Rhapsody/Darwin/MacOS X (x86_64) object files",
1474 "macho64",
1476 null_debug_arr,
1477 &null_debug_form,
1478 macho_stdmac,
1479 macho_init,
1480 null_setinfo,
1481 macho_output,
1482 macho_symdef,
1483 macho_section,
1484 macho_sectalign,
1485 macho_segbase,
1486 null_directive,
1487 macho_filename,
1488 macho_cleanup
1491 #endif
1494 * Local Variables:
1495 * mode:c
1496 * c-basic-offset:4
1497 * End:
1499 * end of file */