gdb/testsuite: fix gdb.trace/signal.exp on x86
[binutils-gdb/blckswan.git] / gas / config / tc-vax.c
blobba7acaee45b667a922c1ef791db0bb03c6e2d6a6
1 /* tc-vax.c - vax-specific -
2 Copyright (C) 1987-2022 Free Software Foundation, Inc.
4 This file is part of GAS, the GNU Assembler.
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
21 #include "as.h"
23 #include "vax-inst.h"
24 #include "obstack.h" /* For FRAG_APPEND_1_CHAR macro in "frags.h" */
25 #include "subsegs.h"
26 #include "safe-ctype.h"
28 #ifdef OBJ_ELF
29 #include "elf/vax.h"
30 #endif
32 /* These chars start a comment anywhere in a source file (except inside
33 another comment */
34 const char comment_chars[] = "#";
36 /* These chars only start a comment at the beginning of a line. */
37 /* Note that for the VAX the are the same as comment_chars above. */
38 const char line_comment_chars[] = "#";
40 const char line_separator_chars[] = ";";
42 /* Chars that can be used to separate mant from exp in floating point nums. */
43 const char EXP_CHARS[] = "eE";
45 /* Chars that mean this number is a floating point constant
46 as in 0f123.456
47 or 0H1.234E-12 (see exp chars above). */
48 const char FLT_CHARS[] = "dDfFgGhH";
50 /* Also be aware that MAXIMUM_NUMBER_OF_CHARS_FOR_FLOAT may have to be
51 changed in read.c . Ideally it shouldn't have to know about it at all,
52 but nothing is ideal around here. */
54 /* Hold details of an operand expression. */
55 static expressionS exp_of_operand[VIT_MAX_OPERANDS];
56 static segT seg_of_operand[VIT_MAX_OPERANDS];
58 /* A vax instruction after decoding. */
59 static struct vit v;
61 /* Hold details of big operands. */
62 LITTLENUM_TYPE big_operand_bits[VIT_MAX_OPERANDS][SIZE_OF_LARGE_NUMBER];
63 FLONUM_TYPE float_operand[VIT_MAX_OPERANDS];
64 /* Above is made to point into big_operand_bits by md_begin(). */
66 #ifdef OBJ_ELF
67 #define GLOBAL_OFFSET_TABLE_NAME "_GLOBAL_OFFSET_TABLE_"
68 #define PROCEDURE_LINKAGE_TABLE_NAME "_PROCEDURE_LINKAGE_TABLE_"
69 symbolS *GOT_symbol; /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
70 symbolS *PLT_symbol; /* Pre-defined "_PROCEDURE_LINKAGE_TABLE_". */
71 #endif
73 int flag_hash_long_names; /* -+ */
74 int flag_one; /* -1 */
75 int flag_show_after_trunc; /* -H */
76 int flag_no_hash_mixed_case; /* -h NUM */
77 #ifdef OBJ_ELF
78 int flag_want_pic; /* -k */
79 #endif
81 /* For VAX, relative addresses of "just the right length" are easy.
82 The branch displacement is always the last operand, even in
83 synthetic instructions.
84 For VAX, we encode the relax_substateTs (in e.g. fr_substate) as:
86 4 3 2 1 0 bit number
87 ---/ /--+-------+-------+-------+-------+-------+
88 | what state ? | how long ? |
89 ---/ /--+-------+-------+-------+-------+-------+
91 The "how long" bits are 00=byte, 01=word, 10=long.
92 This is a Un*x convention.
93 Not all lengths are legit for a given value of (what state).
94 The "how long" refers merely to the displacement length.
95 The address usually has some constant bytes in it as well.
97 groups for VAX address relaxing.
99 1. "foo" pc-relative.
100 length of byte, word, long
102 2a. J<cond> where <cond> is a simple flag test.
103 length of byte, word, long.
104 VAX opcodes are: (Hex)
105 bneq/bnequ 12
106 beql/beqlu 13
107 bgtr 14
108 bleq 15
109 bgeq 18
110 blss 19
111 bgtru 1a
112 blequ 1b
113 bvc 1c
114 bvs 1d
115 bgequ/bcc 1e
116 blssu/bcs 1f
117 Always, you complement 0th bit to reverse condition.
118 Always, 1-byte opcode, then 1-byte displacement.
120 2b. J<cond> where cond tests a memory bit.
121 length of byte, word, long.
122 Vax opcodes are: (Hex)
123 bbs e0
124 bbc e1
125 bbss e2
126 bbcs e3
127 bbsc e4
128 bbcc e5
129 Always, you complement 0th bit to reverse condition.
130 Always, 1-byte opcode, longword-address, byte-address, 1-byte-displacement
132 2c. J<cond> where cond tests low-order memory bit
133 length of byte,word,long.
134 Vax opcodes are: (Hex)
135 blbs e8
136 blbc e9
137 Always, you complement 0th bit to reverse condition.
138 Always, 1-byte opcode, longword-address, 1-byte displacement.
140 3. Jbs/Jbr.
141 length of byte,word,long.
142 Vax opcodes are: (Hex)
143 bsbb 10
144 brb 11
145 These are like (2) but there is no condition to reverse.
146 Always, 1 byte opcode, then displacement/absolute.
148 4a. JacbX
149 length of word, long.
150 Vax opcodes are: (Hex)
151 acbw 3d
152 acbf 4f
153 acbd 6f
154 abcb 9d
155 acbl f1
156 acbg 4ffd
157 acbh 6ffd
158 Always, we cannot reverse the sense of the branch; we have a word
159 displacement.
160 The double-byte op-codes don't hurt: we never want to modify the
161 opcode, so we don't care how many bytes are between the opcode and
162 the operand.
164 4b. JXobXXX
165 length of long, long, byte.
166 Vax opcodes are: (Hex)
167 aoblss f2
168 aobleq f3
169 sobgeq f4
170 sobgtr f5
171 Always, we cannot reverse the sense of the branch; we have a byte
172 displacement.
174 The only time we need to modify the opcode is for class 2 instructions.
175 After relax() we may complement the lowest order bit of such instruction
176 to reverse sense of branch.
178 For class 2 instructions, we store context of "where is the opcode literal".
179 We can change an opcode's lowest order bit without breaking anything else.
181 We sometimes store context in the operand literal. This way we can figure out
182 after relax() what the original addressing mode was. */
184 /* These displacements are relative to the start address of the
185 displacement. The first letter is Byte, Word. 2nd letter is
186 Forward, Backward. */
187 #define BF (1+ 127)
188 #define BB (1+-128)
189 #define WF (2+ 32767)
190 #define WB (2+-32768)
191 /* Don't need LF, LB because they always reach. [They are coded as 0.] */
193 #define C(a,b) ENCODE_RELAX(a,b)
194 /* This macro has no side-effects. */
195 #define ENCODE_RELAX(what,length) (((what) << 2) + (length))
196 #define RELAX_STATE(s) ((s) >> 2)
197 #define RELAX_LENGTH(s) ((s) & 3)
199 const relax_typeS md_relax_table[] =
201 {1, 1, 0, 0}, /* error sentinel 0,0 */
202 {1, 1, 0, 0}, /* unused 0,1 */
203 {1, 1, 0, 0}, /* unused 0,2 */
204 {1, 1, 0, 0}, /* unused 0,3 */
206 {BF + 1, BB + 1, 2, C (1, 1)},/* B^"foo" 1,0 */
207 {WF + 1, WB + 1, 3, C (1, 2)},/* W^"foo" 1,1 */
208 {0, 0, 5, 0}, /* L^"foo" 1,2 */
209 {1, 1, 0, 0}, /* unused 1,3 */
211 {BF, BB, 1, C (2, 1)}, /* b<cond> B^"foo" 2,0 */
212 {WF + 2, WB + 2, 4, C (2, 2)},/* br.+? brw X 2,1 */
213 {0, 0, 7, 0}, /* br.+? jmp X 2,2 */
214 {1, 1, 0, 0}, /* unused 2,3 */
216 {BF, BB, 1, C (3, 1)}, /* brb B^foo 3,0 */
217 {WF, WB, 2, C (3, 2)}, /* brw W^foo 3,1 */
218 {0, 0, 5, 0}, /* Jmp L^foo 3,2 */
219 {1, 1, 0, 0}, /* unused 3,3 */
221 {1, 1, 0, 0}, /* unused 4,0 */
222 {WF, WB, 2, C (4, 2)}, /* acb_ ^Wfoo 4,1 */
223 {0, 0, 10, 0}, /* acb_,br,jmp L^foo4,2 */
224 {1, 1, 0, 0}, /* unused 4,3 */
226 {BF, BB, 1, C (5, 1)}, /* Xob___,,foo 5,0 */
227 {WF + 4, WB + 4, 6, C (5, 2)},/* Xob.+2,brb.+3,brw5,1 */
228 {0, 0, 9, 0}, /* Xob.+2,brb.+6,jmp5,2 */
229 {1, 1, 0, 0}, /* unused 5,3 */
232 #undef C
233 #undef BF
234 #undef BB
235 #undef WF
236 #undef WB
238 void float_cons (int);
239 int flonum_gen2vax (int, FLONUM_TYPE *, LITTLENUM_TYPE *);
241 const pseudo_typeS md_pseudo_table[] =
243 {"dfloat", float_cons, 'd'},
244 {"ffloat", float_cons, 'f'},
245 {"gfloat", float_cons, 'g'},
246 {"hfloat", float_cons, 'h'},
247 {"d_floating", float_cons, 'd'},
248 {"f_floating", float_cons, 'f'},
249 {"g_floating", float_cons, 'g'},
250 {"h_floating", float_cons, 'h'},
251 {NULL, NULL, 0},
254 #define STATE_PC_RELATIVE (1)
255 #define STATE_CONDITIONAL_BRANCH (2)
256 #define STATE_ALWAYS_BRANCH (3) /* includes BSB... */
257 #define STATE_COMPLEX_BRANCH (4)
258 #define STATE_COMPLEX_HOP (5)
260 #define STATE_BYTE (0)
261 #define STATE_WORD (1)
262 #define STATE_LONG (2)
263 #define STATE_UNDF (3) /* Symbol undefined in pass1. */
265 #define min(a, b) ((a) < (b) ? (a) : (b))
267 void
268 md_number_to_chars (char con[], valueT value, int nbytes)
270 number_to_chars_littleendian (con, value, nbytes);
273 /* Fix up some data or instructions after we find out the value of a symbol
274 that they reference. */
276 void /* Knows about order of bytes in address. */
277 md_apply_fix (fixS *fixP, valueT *valueP, segT seg ATTRIBUTE_UNUSED)
279 valueT value = * valueP;
281 if (fixP->fx_subsy != (symbolS *) NULL)
282 as_bad_subtract (fixP);
284 if (fixP->fx_addsy == NULL)
285 fixP->fx_done = 1;
287 if (fixP->fx_done)
288 number_to_chars_littleendian (fixP->fx_where + fixP->fx_frag->fr_literal,
289 value, fixP->fx_size);
290 else
291 /* Initialise the part of an instruction frag covered by the
292 relocation. (Many occurrences of frag_more followed by fix_new
293 lack any init of the frag.) Since VAX uses RELA relocs the
294 value we write into this field doesn't really matter. */
295 memset (fixP->fx_where + fixP->fx_frag->fr_literal, 0, fixP->fx_size);
298 /* Convert a number from VAX byte order (little endian)
299 into host byte order.
300 con is the buffer to convert,
301 nbytes is the length of the given buffer. */
302 static long
303 md_chars_to_number (unsigned char con[], int nbytes)
305 long retval;
307 for (retval = 0, con += nbytes - 1; nbytes--; con--)
309 retval <<= BITS_PER_CHAR;
310 retval |= *con;
312 return retval;
315 /* Copy a bignum from in to out.
316 If the output is shorter than the input, copy lower-order
317 littlenums. Return 0 or the number of significant littlenums
318 dropped. Assumes littlenum arrays are densely packed: no unused
319 chars between the littlenums. Uses memcpy() to move littlenums, and
320 wants to know length (in chars) of the input bignum. */
322 static int
323 bignum_copy (LITTLENUM_TYPE *in,
324 int in_length, /* in sizeof(littlenum)s */
325 LITTLENUM_TYPE *out,
326 int out_length /* in sizeof(littlenum)s */)
328 int significant_littlenums_dropped;
330 if (out_length < in_length)
332 LITTLENUM_TYPE *p; /* -> most significant (non-zero) input
333 littlenum. */
335 memcpy ((void *) out, (void *) in,
336 (unsigned int) out_length << LITTLENUM_SHIFT);
337 for (p = in + in_length - 1; p >= in; --p)
339 if (*p)
340 break;
342 significant_littlenums_dropped = p - in - in_length + 1;
344 if (significant_littlenums_dropped < 0)
345 significant_littlenums_dropped = 0;
347 else
349 memcpy ((char *) out, (char *) in,
350 (unsigned int) in_length << LITTLENUM_SHIFT);
352 if (out_length > in_length)
353 memset ((char *) (out + in_length), '\0',
354 (unsigned int) (out_length - in_length) << LITTLENUM_SHIFT);
356 significant_littlenums_dropped = 0;
359 return significant_littlenums_dropped;
362 /* md_estimate_size_before_relax(), called just before relax().
363 Any symbol that is now undefined will not become defined.
364 Return the correct fr_subtype in the frag and the growth beyond
365 fr_fix. */
367 md_estimate_size_before_relax (fragS *fragP, segT segment)
369 if (RELAX_LENGTH (fragP->fr_subtype) == STATE_UNDF)
371 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
372 #ifdef OBJ_ELF
373 || S_IS_WEAK (fragP->fr_symbol)
374 || S_IS_EXTERNAL (fragP->fr_symbol)
375 #endif
378 /* Non-relaxable cases. */
379 int reloc_type = NO_RELOC;
380 char *p;
381 int old_fr_fix;
383 old_fr_fix = fragP->fr_fix;
384 p = &fragP->fr_literal[0] + old_fr_fix;
385 #ifdef OBJ_ELF
386 /* If this is to an undefined symbol, then if it's an indirect
387 reference indicate that is can mutated into a GLOB_DAT or
388 JUMP_SLOT by the loader. We restrict ourselves to no offset
389 due to a limitation in the NetBSD linker. */
391 if (GOT_symbol == NULL)
392 GOT_symbol = symbol_find (GLOBAL_OFFSET_TABLE_NAME);
393 if (PLT_symbol == NULL)
394 PLT_symbol = symbol_find (PROCEDURE_LINKAGE_TABLE_NAME);
395 if ((GOT_symbol == NULL || fragP->fr_symbol != GOT_symbol)
396 && (PLT_symbol == NULL || fragP->fr_symbol != PLT_symbol)
397 && fragP->fr_symbol != NULL
398 && flag_want_pic
399 && (!S_IS_DEFINED (fragP->fr_symbol)
400 || S_IS_WEAK (fragP->fr_symbol)
401 || S_IS_EXTERNAL (fragP->fr_symbol)))
403 /* Indirect references cannot go through the GOT or PLT,
404 let's hope they'll become local in the final link. */
405 if ((ELF_ST_VISIBILITY (S_GET_OTHER (fragP->fr_symbol))
406 != STV_DEFAULT)
407 || (p[0] & 0x10))
408 reloc_type = BFD_RELOC_32_PCREL;
409 else if (((unsigned char *) fragP->fr_opcode)[0] == VAX_CALLS
410 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_CALLG
411 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_JSB
412 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_JMP
413 || S_IS_FUNCTION (fragP->fr_symbol))
414 reloc_type = BFD_RELOC_32_PLT_PCREL;
415 else
416 reloc_type = BFD_RELOC_32_GOT_PCREL;
418 #endif
419 switch (RELAX_STATE (fragP->fr_subtype))
421 case STATE_PC_RELATIVE:
422 p[0] |= VAX_PC_RELATIVE_MODE; /* Preserve @ bit. */
423 fragP->fr_fix += 1 + 4;
424 fix_new (fragP, old_fr_fix + 1, 4, fragP->fr_symbol,
425 fragP->fr_offset, 1, reloc_type);
426 break;
428 case STATE_CONDITIONAL_BRANCH:
429 *fragP->fr_opcode ^= 1; /* Reverse sense of branch. */
430 p[0] = 6;
431 p[1] = VAX_JMP;
432 p[2] = VAX_PC_RELATIVE_MODE; /* ...(PC) */
433 fragP->fr_fix += 1 + 1 + 1 + 4;
434 fix_new (fragP, old_fr_fix + 3, 4, fragP->fr_symbol,
435 fragP->fr_offset, 1, NO_RELOC);
436 break;
438 case STATE_COMPLEX_BRANCH:
439 p[0] = 2;
440 p[1] = 0;
441 p[2] = VAX_BRB;
442 p[3] = 6;
443 p[4] = VAX_JMP;
444 p[5] = VAX_PC_RELATIVE_MODE; /* ...(pc) */
445 fragP->fr_fix += 2 + 2 + 1 + 1 + 4;
446 fix_new (fragP, old_fr_fix + 6, 4, fragP->fr_symbol,
447 fragP->fr_offset, 1, NO_RELOC);
448 break;
450 case STATE_COMPLEX_HOP:
451 p[0] = 2;
452 p[1] = VAX_BRB;
453 p[2] = 6;
454 p[3] = VAX_JMP;
455 p[4] = VAX_PC_RELATIVE_MODE; /* ...(pc) */
456 fragP->fr_fix += 1 + 2 + 1 + 1 + 4;
457 fix_new (fragP, old_fr_fix + 5, 4, fragP->fr_symbol,
458 fragP->fr_offset, 1, NO_RELOC);
459 break;
461 case STATE_ALWAYS_BRANCH:
462 *fragP->fr_opcode += VAX_WIDEN_LONG;
463 p[0] = VAX_PC_RELATIVE_MODE; /* ...(PC) */
464 fragP->fr_fix += 1 + 4;
465 fix_new (fragP, old_fr_fix + 1, 4, fragP->fr_symbol,
466 fragP->fr_offset, 1, NO_RELOC);
467 break;
469 default:
470 abort ();
472 frag_wane (fragP);
474 /* Return the growth in the fixed part of the frag. */
475 return fragP->fr_fix - old_fr_fix;
478 /* Relaxable cases. Set up the initial guess for the variable
479 part of the frag. */
480 switch (RELAX_STATE (fragP->fr_subtype))
482 case STATE_PC_RELATIVE:
483 fragP->fr_subtype = ENCODE_RELAX (STATE_PC_RELATIVE, STATE_BYTE);
484 break;
485 case STATE_CONDITIONAL_BRANCH:
486 fragP->fr_subtype = ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_BYTE);
487 break;
488 case STATE_COMPLEX_BRANCH:
489 fragP->fr_subtype = ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_WORD);
490 break;
491 case STATE_COMPLEX_HOP:
492 fragP->fr_subtype = ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_BYTE);
493 break;
494 case STATE_ALWAYS_BRANCH:
495 fragP->fr_subtype = ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_BYTE);
496 break;
500 if (fragP->fr_subtype >= sizeof (md_relax_table) / sizeof (md_relax_table[0]))
501 abort ();
503 /* Return the size of the variable part of the frag. */
504 return md_relax_table[fragP->fr_subtype].rlx_length;
507 /* Called after relax() is finished.
508 In: Address of frag.
509 fr_type == rs_machine_dependent.
510 fr_subtype is what the address relaxed to.
512 Out: Any fixSs and constants are set up.
513 Caller will turn frag into a ".space 0". */
514 void
515 md_convert_frag (bfd *headers ATTRIBUTE_UNUSED,
516 segT seg ATTRIBUTE_UNUSED,
517 fragS *fragP)
519 char *addressP; /* -> _var to change. */
520 char *opcodeP; /* -> opcode char(s) to change. */
521 short int extension = 0; /* Size of relaxed address. */
522 /* Added to fr_fix: incl. ALL var chars. */
523 symbolS *symbolP;
524 long where;
526 know (fragP->fr_type == rs_machine_dependent);
527 where = fragP->fr_fix;
528 addressP = &fragP->fr_literal[0] + where;
529 opcodeP = fragP->fr_opcode;
530 symbolP = fragP->fr_symbol;
531 know (symbolP);
533 switch (fragP->fr_subtype)
535 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_BYTE):
536 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
537 addressP[0] |= 0xAF; /* Byte displacement. */
538 fix_new (fragP, fragP->fr_fix + 1, 1, fragP->fr_symbol,
539 fragP->fr_offset, 1, NO_RELOC);
540 extension = 2;
541 break;
543 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_WORD):
544 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
545 addressP[0] |= 0xCF; /* Word displacement. */
546 fix_new (fragP, fragP->fr_fix + 1, 2, fragP->fr_symbol,
547 fragP->fr_offset, 1, NO_RELOC);
548 extension = 3;
549 break;
551 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_LONG):
552 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
553 addressP[0] |= 0xEF; /* Long word displacement. */
554 fix_new (fragP, fragP->fr_fix + 1, 4, fragP->fr_symbol,
555 fragP->fr_offset, 1, NO_RELOC);
556 extension = 5;
557 break;
559 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_BYTE):
560 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
561 fragP->fr_offset, 1, NO_RELOC);
562 extension = 1;
563 break;
565 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_WORD):
566 opcodeP[0] ^= 1; /* Reverse sense of test. */
567 addressP[0] = 3;
568 addressP[1] = VAX_BRW;
569 fix_new (fragP, fragP->fr_fix + 2, 2, fragP->fr_symbol,
570 fragP->fr_offset, 1, NO_RELOC);
571 extension = 4;
572 break;
574 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_LONG):
575 opcodeP[0] ^= 1; /* Reverse sense of test. */
576 addressP[0] = 6;
577 addressP[1] = VAX_JMP;
578 addressP[2] = VAX_PC_RELATIVE_MODE;
579 fix_new (fragP, fragP->fr_fix + 3, 4, fragP->fr_symbol,
580 fragP->fr_offset, 1, NO_RELOC);
581 extension = 7;
582 break;
584 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_BYTE):
585 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
586 fragP->fr_offset, 1, NO_RELOC);
587 extension = 1;
588 break;
590 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_WORD):
591 opcodeP[0] += VAX_WIDEN_WORD; /* brb -> brw, bsbb -> bsbw */
592 fix_new (fragP, fragP->fr_fix, 2, fragP->fr_symbol, fragP->fr_offset,
593 1, NO_RELOC);
594 extension = 2;
595 break;
597 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_LONG):
598 opcodeP[0] += VAX_WIDEN_LONG; /* brb -> jmp, bsbb -> jsb */
599 addressP[0] = VAX_PC_RELATIVE_MODE;
600 fix_new (fragP, fragP->fr_fix + 1, 4, fragP->fr_symbol,
601 fragP->fr_offset, 1, NO_RELOC);
602 extension = 5;
603 break;
605 case ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_WORD):
606 fix_new (fragP, fragP->fr_fix, 2, fragP->fr_symbol,
607 fragP->fr_offset, 1, NO_RELOC);
608 extension = 2;
609 break;
611 case ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_LONG):
612 addressP[0] = 2;
613 addressP[1] = 0;
614 addressP[2] = VAX_BRB;
615 addressP[3] = 6;
616 addressP[4] = VAX_JMP;
617 addressP[5] = VAX_PC_RELATIVE_MODE;
618 fix_new (fragP, fragP->fr_fix + 6, 4, fragP->fr_symbol,
619 fragP->fr_offset, 1, NO_RELOC);
620 extension = 10;
621 break;
623 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_BYTE):
624 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
625 fragP->fr_offset, 1, NO_RELOC);
626 extension = 1;
627 break;
629 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_WORD):
630 addressP[0] = 2;
631 addressP[1] = VAX_BRB;
632 addressP[2] = 3;
633 addressP[3] = VAX_BRW;
634 fix_new (fragP, fragP->fr_fix + 4, 2, fragP->fr_symbol,
635 fragP->fr_offset, 1, NO_RELOC);
636 extension = 6;
637 break;
639 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_LONG):
640 addressP[0] = 2;
641 addressP[1] = VAX_BRB;
642 addressP[2] = 6;
643 addressP[3] = VAX_JMP;
644 addressP[4] = VAX_PC_RELATIVE_MODE;
645 fix_new (fragP, fragP->fr_fix + 5, 4, fragP->fr_symbol,
646 fragP->fr_offset, 1, NO_RELOC);
647 extension = 9;
648 break;
650 default:
651 BAD_CASE (fragP->fr_subtype);
652 break;
654 fragP->fr_fix += extension;
657 /* Translate internal format of relocation info into target format.
659 On vax: first 4 bytes are normal unsigned long, next three bytes
660 are symbolnum, least sig. byte first. Last byte is broken up with
661 the upper nibble as nuthin, bit 3 as extern, bits 2 & 1 as length, and
662 bit 0 as pcrel. */
663 #ifdef comment
664 void
665 md_ri_to_chars (char *the_bytes, struct reloc_info_generic ri)
667 /* This is easy. */
668 md_number_to_chars (the_bytes, ri.r_address, sizeof (ri.r_address));
669 /* Now the fun stuff. */
670 the_bytes[6] = (ri.r_symbolnum >> 16) & 0x0ff;
671 the_bytes[5] = (ri.r_symbolnum >> 8) & 0x0ff;
672 the_bytes[4] = ri.r_symbolnum & 0x0ff;
673 the_bytes[7] = (((ri.r_extern << 3) & 0x08) | ((ri.r_length << 1) & 0x06)
674 | ((ri.r_pcrel << 0) & 0x01)) & 0x0F;
677 #endif /* comment */
679 /* BUGS, GRIPES, APOLOGIA, etc.
681 The opcode table 'votstrs' needs to be sorted on opcode frequency.
682 That is, AFTER we hash it with hash_...(), we want most-used opcodes
683 to come out of the hash table faster.
685 I am sorry to inflict yet another VAX assembler on the world, but
686 RMS says we must do everything from scratch, to prevent pin-heads
687 restricting this software.
689 This is a vaguely modular set of routines in C to parse VAX
690 assembly code using DEC mnemonics. It is NOT un*x specific.
692 The idea here is that the assembler has taken care of all:
693 labels
694 macros
695 listing
696 pseudo-ops
697 line continuation
698 comments
699 condensing any whitespace down to exactly one space
700 and all we have to do is parse 1 line into a vax instruction
701 partially formed. We will accept a line, and deliver:
702 an error message (hopefully empty)
703 a skeleton VAX instruction (tree structure)
704 textual pointers to all the operand expressions
705 a warning message that notes a silly operand (hopefully empty)
707 E D I T H I S T O R Y
709 17may86 Dean Elsner. Bug if line ends immediately after opcode.
710 30apr86 Dean Elsner. New vip_op() uses arg block so change call.
711 6jan86 Dean Elsner. Crock vip_begin() to call vip_op_defaults().
712 2jan86 Dean Elsner. Invent synthetic opcodes.
713 Widen vax_opcodeT to 32 bits. Use a bit for VIT_OPCODE_SYNTHETIC,
714 which means this is not a real opcode, it is like a macro; it will
715 be relax()ed into 1 or more instructions.
716 Use another bit for VIT_OPCODE_SPECIAL if the op-code is not optimised
717 like a regular branch instruction. Option added to vip_begin():
718 exclude synthetic opcodes. Invent synthetic_votstrs[].
719 31dec85 Dean Elsner. Invent vit_opcode_nbytes.
720 Also make vit_opcode into a char[]. We now have n-byte vax opcodes,
721 so caller's don't have to know the difference between a 1-byte & a
722 2-byte op-code. Still need vax_opcodeT concept, so we know how
723 big an object must be to hold an op.code.
724 30dec85 Dean Elsner. Widen typedef vax_opcodeT in "vax-inst.h"
725 because vax opcodes may be 16 bits. Our crufty C compiler was
726 happily initialising 8-bit vot_codes with 16-bit numbers!
727 (Wouldn't the 'phone company like to compress data so easily!)
728 29dec85 Dean Elsner. New static table vax_operand_width_size[].
729 Invented so we know hw many bytes a "I^#42" needs in its immediate
730 operand. Revised struct vop in "vax-inst.h": explicitly include
731 byte length of each operand, and it's letter-code datum type.
732 17nov85 Dean Elsner. Name Change.
733 Due to ar(1) truncating names, we learned the hard way that
734 "vax-inst-parse.c" -> "vax-inst-parse." dropping the "o" off
735 the archived object name. SO... we shortened the name of this
736 source file, and changed the makefile. */
738 /* Handle of the OPCODE hash table. */
739 static htab_t op_hash;
741 /* In: 1 character, from "bdfghloqpw" being the data-type of an operand
742 of a vax instruction.
744 Out: the length of an operand of that type, in bytes.
745 Special branch operands types "-?!" have length 0. */
747 static const short int vax_operand_width_size[256] =
749 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
750 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
751 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
752 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
753 0, 0, 1, 0, 8, 0, 4, 8, 16, 0, 0, 0, 4, 0, 0,16, /* ..b.d.fgh...l..o */
754 0, 8, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, /* .q.....w........ */
755 0, 0, 1, 0, 8, 0, 4, 8, 16, 0, 0, 0, 4, 0, 0,16, /* ..b.d.fgh...l..o */
756 0, 8, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, /* .q.....w........ */
757 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
758 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
759 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
760 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
761 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
762 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
763 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
764 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
767 /* This perversion encodes all the vax opcodes as a bunch of strings.
768 RMS says we should build our hash-table at run-time. Hmm.
769 Please would someone arrange these in decreasing frequency of opcode?
770 Because of the way hash_...() works, the most frequently used opcode
771 should be textually first and so on.
773 Input for this table was 'vax.opcodes', awk(1)ed by 'vax.opcodes.c.awk' .
774 So change 'vax.opcodes', then re-generate this table. */
776 #include "opcode/vax.h"
778 /* This is a table of optional op-codes. All of them represent
779 'synthetic' instructions that seem popular.
781 Here we make some pseudo op-codes. Every code has a bit set to say
782 it is synthetic. This lets you catch them if you want to
783 ban these opcodes. They are mnemonics for "elastic" instructions
784 that are supposed to assemble into the fewest bytes needed to do a
785 branch, or to do a conditional branch, or whatever.
787 The opcode is in the usual place [low-order n*8 bits]. This means
788 that if you mask off the bucky bits, the usual rules apply about
789 how long the opcode is.
791 All VAX branch displacements come at the end of the instruction.
792 For simple branches (1-byte opcode + 1-byte displacement) the last
793 operand is coded 'b?' where the "data type" '?' is a clue that we
794 may reverse the sense of the branch (complement lowest order bit)
795 and branch around a jump. This is by far the most common case.
796 That is why the VIT_OPCODE_SYNTHETIC bit is set: it says this is
797 a 0-byte op-code followed by 2 or more bytes of operand address.
799 If the op-code has VIT_OPCODE_SPECIAL set, then we have a more unusual
800 case.
802 For JBSB & JBR the treatment is the similar, except (1) we have a 'bw'
803 option before (2) we can directly JSB/JMP because there is no condition.
804 These operands have 'b-' as their access/data type.
806 That leaves a bunch of random opcodes: JACBx, JxOBxxx. In these
807 cases, we do the same idea. JACBxxx are all marked with a 'b!'
808 JAOBxxx & JSOBxxx are marked with a 'b:'. */
809 #if (VIT_OPCODE_SYNTHETIC != 0x80000000)
810 #error "You have just broken the encoding below, which assumes the sign bit means 'I am an imaginary instruction'."
811 #endif
813 #if (VIT_OPCODE_SPECIAL != 0x40000000)
814 #error "You have just broken the encoding below, which assumes the 0x40 M bit means 'I am not to be "optimised" the way normal branches are'."
815 #endif
817 static const struct vot
818 synthetic_votstrs[] =
820 {"jbsb", {"b-", 0xC0000010}}, /* BSD 4.2 */
821 /* jsb used already */
822 {"jbr", {"b-", 0xC0000011}}, /* BSD 4.2 */
823 {"jr", {"b-", 0xC0000011}}, /* consistent */
824 {"jneq", {"b?", 0x80000012}},
825 {"jnequ", {"b?", 0x80000012}},
826 {"jeql", {"b?", 0x80000013}},
827 {"jeqlu", {"b?", 0x80000013}},
828 {"jgtr", {"b?", 0x80000014}},
829 {"jleq", {"b?", 0x80000015}},
830 /* un-used opcodes here */
831 {"jgeq", {"b?", 0x80000018}},
832 {"jlss", {"b?", 0x80000019}},
833 {"jgtru", {"b?", 0x8000001a}},
834 {"jlequ", {"b?", 0x8000001b}},
835 {"jvc", {"b?", 0x8000001c}},
836 {"jvs", {"b?", 0x8000001d}},
837 {"jgequ", {"b?", 0x8000001e}},
838 {"jcc", {"b?", 0x8000001e}},
839 {"jlssu", {"b?", 0x8000001f}},
840 {"jcs", {"b?", 0x8000001f}},
842 {"jacbw", {"rwrwmwb!", 0xC000003d}},
843 {"jacbf", {"rfrfmfb!", 0xC000004f}},
844 {"jacbd", {"rdrdmdb!", 0xC000006f}},
845 {"jacbb", {"rbrbmbb!", 0xC000009d}},
846 {"jacbl", {"rlrlmlb!", 0xC00000f1}},
847 {"jacbg", {"rgrgmgb!", 0xC0004ffd}},
848 {"jacbh", {"rhrhmhb!", 0xC0006ffd}},
850 {"jbs", {"rlvbb?", 0x800000e0}},
851 {"jbc", {"rlvbb?", 0x800000e1}},
852 {"jbss", {"rlvbb?", 0x800000e2}},
853 {"jbcs", {"rlvbb?", 0x800000e3}},
854 {"jbsc", {"rlvbb?", 0x800000e4}},
855 {"jbcc", {"rlvbb?", 0x800000e5}},
856 {"jbssi", {"rlvbb?", 0x800000e6}},
857 {"jbcci", {"rlvbb?", 0x800000e7}},
858 {"jlbs", {"rlb?", 0x800000e8}},
859 {"jlbc", {"rlb?", 0x800000e9}},
861 {"jaoblss", {"rlmlb:", 0xC00000f2}},
862 {"jaobleq", {"rlmlb:", 0xC00000f3}},
863 {"jsobgeq", {"mlb:", 0xC00000f4}},
864 {"jsobgtr", {"mlb:", 0xC00000f5}},
866 /* CASEx has no branch addresses in our conception of it. */
867 /* You should use ".word ..." statements after the "case ...". */
869 {"", {"", 0}} /* Empty is end sentinel. */
872 /* Because this module is useful for both VMS and UN*X style assemblers
873 and because of the variety of UN*X assemblers we must recognise
874 the different conventions for assembler operand notation. For example
875 VMS says "#42" for immediate mode, while most UN*X say "$42".
876 We permit arbitrary sets of (single) characters to represent the
877 3 concepts that DEC writes '#', '@', '^'. */
879 /* Character tests. */
880 #define VIP_IMMEDIATE 01 /* Character is like DEC # */
881 #define VIP_INDIRECT 02 /* Char is like DEC @ */
882 #define VIP_DISPLEN 04 /* Char is like DEC ^ */
884 #define IMMEDIATEP(c) (vip_metacharacters [(c) & 0xff] & VIP_IMMEDIATE)
885 #define INDIRECTP(c) (vip_metacharacters [(c) & 0xff] & VIP_INDIRECT)
886 #define DISPLENP(c) (vip_metacharacters [(c) & 0xff] & VIP_DISPLEN)
888 /* We assume 8 bits per byte. Use vip_op_defaults() to set these up BEFORE we
889 are ever called. */
891 #if defined(CONST_TABLE)
892 #define _ 0,
893 #define I VIP_IMMEDIATE,
894 #define S VIP_INDIRECT,
895 #define D VIP_DISPLEN,
896 static const char
897 vip_metacharacters[256] =
899 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /* ^@ ^A ^B ^C ^D ^E ^F ^G ^H ^I ^J ^K ^L ^M ^N ^O*/
900 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /* ^P ^Q ^R ^S ^T ^U ^V ^W ^X ^Y ^Z ^[ ^\ ^] ^^ ^_ */
901 _ _ _ _ I _ _ _ _ _ S _ _ _ _ _ /* sp ! " # $ % & ' ( ) * + , - . / */
902 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*0 1 2 3 4 5 6 7 8 9 : ; < = > ?*/
903 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*@ A B C D E F G H I J K L M N O*/
904 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*P Q R S T U V W X Y Z [ \ ] ^ _*/
905 D _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*` a b c d e f g h i j k l m n o*/
906 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*p q r s t u v w x y z { | } ~ ^?*/
908 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
909 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
910 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
911 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
912 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
913 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
914 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
915 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
917 #undef _
918 #undef I
919 #undef S
920 #undef D
922 #else
924 static char vip_metacharacters[256];
926 static void
927 vip_op_1 (int bit, const char *syms)
929 unsigned char t;
931 while ((t = *syms++) != 0)
932 vip_metacharacters[t] |= bit;
935 /* Can be called any time. More arguments may appear in future. */
936 static void
937 vip_op_defaults (const char *immediate, const char *indirect, const char *displen)
939 vip_op_1 (VIP_IMMEDIATE, immediate);
940 vip_op_1 (VIP_INDIRECT, indirect);
941 vip_op_1 (VIP_DISPLEN, displen);
944 #endif
946 /* Call me once before you decode any lines.
947 I decode votstrs into a hash table at op_hash (which I create).
948 I return an error text or null.
949 If you want, I will include the 'synthetic' jXXX instructions in the
950 instruction table.
951 You must nominate metacharacters for eg DEC's "#", "@", "^". */
953 static void
954 vip_begin (int synthetic_too, /* 1 means include jXXX op-codes. */
955 const char *immediate,
956 const char *indirect,
957 const char *displen)
959 const struct vot *vP; /* scan votstrs */
961 op_hash = str_htab_create ();
963 for (vP = votstrs; *vP->vot_name; vP++)
964 if (str_hash_insert (op_hash, vP->vot_name, &vP->vot_detail, 0) != NULL)
965 as_fatal (_("duplicate %s"), vP->vot_name);
967 if (synthetic_too)
968 for (vP = synthetic_votstrs; *vP->vot_name; vP++)
969 if (str_hash_insert (op_hash, vP->vot_name, &vP->vot_detail, 0) != NULL)
970 as_fatal (_("duplicate %s"), vP->vot_name);
972 #ifndef CONST_TABLE
973 vip_op_defaults (immediate, indirect, displen);
974 #endif
977 /* Take 3 char.s, the last of which may be `\0` (non-existent)
978 and return the VAX register number that they represent.
980 Return -1 if they don't form a register name. Good names return
981 a number from 0:15 inclusive.
983 Case is not important in a name.
985 Register names understood are:
999 R12 AP
1000 R13 FP
1001 R14 SP
1002 R15 PC */
1004 #define AP 12
1005 #define FP 13
1006 #define SP 14
1007 #define PC 15
1009 /* Returns the register number of something like '%r15' or 'ap', supplied
1010 in four single chars. Returns -1 if the register isn't recognized,
1011 0..15 otherwise. */
1012 static int
1013 vax_reg_parse (char c1, char c2, char c3, char c4)
1015 int retval = -1;
1017 #ifdef OBJ_ELF
1018 if (c1 != '%') /* Register prefixes are mandatory for ELF. */
1019 return retval;
1020 c1 = c2;
1021 c2 = c3;
1022 c3 = c4;
1023 #endif
1024 #ifdef OBJ_VMS
1025 if (c4 != 0) /* Register prefixes are not allowed under VMS. */
1026 return retval;
1027 #endif
1028 #ifdef OBJ_AOUT
1029 if (c1 == '%') /* Register prefixes are optional under a.out. */
1031 c1 = c2;
1032 c2 = c3;
1033 c3 = c4;
1035 else if (c3 && c4) /* Can't be 4 characters long. */
1036 return retval;
1037 #endif
1039 c1 = TOLOWER (c1);
1040 c2 = TOLOWER (c2);
1041 if (ISDIGIT (c2) && c1 == 'r')
1043 retval = c2 - '0';
1044 if (ISDIGIT (c3))
1046 retval = retval * 10 + c3 - '0';
1047 retval = (retval > 15) ? -1 : retval;
1048 /* clamp the register value to 1 hex digit */
1050 else if (c3)
1051 retval = -1; /* c3 must be '\0' or a digit. */
1053 else if (c3) /* There are no three letter regs. */
1054 retval = -1;
1055 else if (c2 == 'p')
1057 switch (c1)
1059 case 's':
1060 retval = SP;
1061 break;
1062 case 'f':
1063 retval = FP;
1064 break;
1065 case 'a':
1066 retval = AP;
1067 break;
1068 default:
1069 retval = -1;
1072 else if (c1 == 'p' && c2 == 'c')
1073 retval = PC;
1074 else
1075 retval = -1;
1076 return retval;
1079 /* Parse a vax operand in DEC assembler notation.
1080 For speed, expect a string of whitespace to be reduced to a single ' '.
1081 This is the case for GNU AS, and is easy for other DEC-compatible
1082 assemblers.
1084 Knowledge about DEC VAX assembler operand notation lives here.
1085 This doesn't even know what a register name is, except it believes
1086 all register names are 2 or 3 characters, and lets vax_reg_parse() say
1087 what number each name represents.
1088 It does, however, know that PC, SP etc are special registers so it can
1089 detect addressing modes that are silly for those registers.
1091 Where possible, it delivers 1 fatal or 1 warning message if the operand
1092 is suspect. Exactly what we test for is still evolving.
1095 Arg block.
1097 There were a number of 'mismatched argument type' bugs to vip_op.
1098 The most general solution is to typedef each (of many) arguments.
1099 We used instead a typedef'd argument block. This is less modular
1100 than using separate return pointers for each result, but runs faster
1101 on most engines, and seems to keep programmers happy. It will have
1102 to be done properly if we ever want to use vip_op as a general-purpose
1103 module (it was designed to be).
1107 Doesn't support DEC "G^" format operands. These always take 5 bytes
1108 to express, and code as modes 8F or 9F. Reason: "G^" deprives you of
1109 optimising to (say) a "B^" if you are lucky in the way you link.
1110 When someone builds a linker smart enough to convert "G^" to "B^", "W^"
1111 whenever possible, then we should implement it.
1112 If there is some other use for "G^", feel free to code it in!
1114 speed
1116 If I nested if()s more, I could avoid testing (*err) which would save
1117 time, space and page faults. I didn't nest all those if()s for clarity
1118 and because I think the mode testing can be re-arranged 1st to test the
1119 commoner constructs 1st. Does anybody have statistics on this?
1121 error messages
1123 In future, we should be able to 'compose' error messages in a scratch area
1124 and give the user MUCH more informative error messages. Although this takes
1125 a little more code at run-time, it will make this module much more self-
1126 documenting. As an example of what sucks now: most error messages have
1127 hardwired into them the DEC VAX metacharacters "#^@" which are nothing like
1128 the Un*x characters "$`*", that most users will expect from this AS.
1130 ----
1132 The input is a string, ending with '\0'.
1134 We also require a 'hint' of what kind of operand is expected: so
1135 we can remind caller not to write into literals for instance.
1137 The output is a skeletal instruction.
1139 The algorithm has two parts.
1140 1. extract the syntactic features (parse off all the @^#-()+[] mode crud);
1141 2. express the @^#-()+[] as some parameters suited to further analysis.
1143 2nd step is where we detect the googles of possible invalid combinations
1144 a human (or compiler) might write. Note that if we do a half-way
1145 decent assembler, we don't know how long to make (eg) displacement
1146 fields when we first meet them (because they may not have defined values).
1147 So we must wait until we know how many bits are needed for each address,
1148 then we can know both length and opcodes of instructions.
1149 For reason(s) above, we will pass to our caller a 'broken' instruction
1150 of these major components, from which our caller can generate instructions:
1151 - displacement length I^ S^ L^ B^ W^ unspecified
1152 - mode (many)
1153 - register R0-R15 or absent
1154 - index register R0-R15 or absent
1155 - expression text what we don't parse
1156 - error text(s) why we couldn't understand the operand
1158 ----
1160 To decode output of this, test errtxt. If errtxt[0] == '\0', then
1161 we had no errors that prevented parsing. Also, if we ever report
1162 an internal bug, errtxt[0] is set non-zero. So one test tells you
1163 if the other outputs are to be taken seriously.
1165 ----
1167 Dec defines the semantics of address modes (and values)
1168 by a two-letter code, explained here.
1170 letter 1: access type
1172 a address calculation - no data access, registers forbidden
1173 b branch displacement
1174 m read - let go of bus - write back "modify"
1175 r read
1176 v bit field address: like 'a' but registers are OK
1177 w write
1178 space no operator (eg ".long foo") [our convention]
1180 letter 2: data type (i.e. width, alignment)
1182 b byte
1183 d double precision floating point (D format)
1184 f single precision floating point (F format)
1185 g G format floating
1186 h H format floating
1187 l longword
1188 o octaword
1189 q quadword
1190 w word
1191 ? simple synthetic branch operand
1192 - unconditional synthetic JSB/JSR operand
1193 ! complex synthetic branch operand
1195 The '-?!' letter 2's are not for external consumption. They are used
1196 for various assemblers. Generally, all unknown widths are assumed 0.
1197 We don't limit your choice of width character.
1199 DEC operands are hard work to parse. For example, '@' as the first
1200 character means indirect (deferred) mode but elsewhere it is a shift
1201 operator.
1202 The long-winded explanation of how this is supposed to work is
1203 cancelled. Read a DEC vax manual.
1204 We try hard not to parse anything that MIGHT be part of the expression
1205 buried in that syntax. For example if we see @...(Rn) we don't check
1206 for '-' before the '(' because mode @-(Rn) does not exist.
1208 After parsing we have:
1210 at 1 if leading '@' (or Un*x '*')
1211 len takes one value from " bilsw". eg B^ -> 'b'.
1212 hash 1 if leading '#' (or Un*x '$')
1213 expr_begin, expr_end the expression we did not parse
1214 even though we don't interpret it, we make use
1215 of its presence or absence.
1216 sign -1: -(Rn) 0: absent +1: (Rn)+
1217 paren 1 if () are around register
1218 reg major register number 0:15 -1 means absent
1219 ndx index register number 0:15 -1 means absent
1221 Again, I dare not explain it: just trace ALL the code!
1223 Summary of vip_op outputs.
1225 mode reg len ndx
1226 (Rn) => @Rn
1227 {@}Rn 5+@ n ' ' optional
1228 branch operand 0 -1 ' ' -1
1229 S^#foo 0 -1 's' -1
1230 -(Rn) 7 n ' ' optional
1231 {@}(Rn)+ 8+@ n ' ' optional
1232 {@}#foo, no S^ 8+@ PC " i" optional
1233 {@}{q^}{(Rn)} 10+@+q option " bwl" optional */
1235 /* Dissect user-input 'optext' (which is something like "@B^foo@bar(AP)[FP]:")
1236 using the vop in vopP. vopP's vop_access and vop_width. We fill _ndx, _reg,
1237 _mode, _short, _warn, _error, _expr_begin, _expr_end and _nbytes. */
1239 static void
1240 vip_op (char *optext, struct vop *vopP)
1242 /* Track operand text forward. */
1243 char *p;
1244 /* Track operand text backward. */
1245 char *q;
1246 /* 1 if leading '@' ('*') seen. */
1247 int at;
1248 /* one of " bilsw" */
1249 char len;
1250 /* 1 if leading '#' ('$') seen. */
1251 int hash;
1252 /* -1, 0 or +1. */
1253 int sign = 0;
1254 /* 1 if () surround register. */
1255 int paren = 0;
1256 /* Register number, -1:absent. */
1257 int reg = 0;
1258 /* Index register number -1:absent. */
1259 int ndx = 0;
1260 /* Report illegal operand, ""==OK. */
1261 /* " " is a FAKE error: means we won. */
1262 /* ANY err that begins with ' ' is a fake. */
1263 /* " " is converted to "" before return. */
1264 const char *err;
1265 /* Warn about weird modes pf address. */
1266 const char *wrn;
1267 /* Preserve q in case we backup. */
1268 char *oldq = NULL;
1269 /* Build up 4-bit operand mode here. */
1270 /* Note: index mode is in ndx, this is. */
1271 /* The major mode of operand address. */
1272 int mode = 0;
1273 /* Notice how we move wrong-arg-type bugs INSIDE this module: if we
1274 get the types wrong below, we lose at compile time rather than at
1275 lint or run time. */
1276 char access_mode; /* vop_access. */
1278 access_mode = vopP->vop_access;
1279 /* None of our code bugs (yet), no user text errors, no warnings
1280 even. */
1281 err = wrn = 0;
1283 p = optext;
1285 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1286 p++; /* skip over whitespace */
1288 if ((at = INDIRECTP (*p)) != 0)
1289 { /* 1 if *p=='@'(or '*' for Un*x) */
1290 p++; /* at is determined */
1291 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1292 p++; /* skip over whitespace */
1295 /* This code is subtle. It tries to detect all legal (letter)'^'
1296 but it doesn't waste time explicitly testing for premature '\0' because
1297 this case is rejected as a mismatch against either (letter) or '^'. */
1299 char c;
1301 c = *p;
1302 c = TOLOWER (c);
1303 if (DISPLENP (p[1]) && strchr ("bilws", len = c))
1304 p += 2; /* Skip (letter) '^'. */
1305 else /* No (letter) '^' seen. */
1306 len = ' '; /* Len is determined. */
1309 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1310 p++;
1312 if ((hash = IMMEDIATEP (*p)) != 0) /* 1 if *p=='#' ('$' for Un*x) */
1313 p++; /* Hash is determined. */
1315 /* p points to what may be the beginning of an expression.
1316 We have peeled off the front all that is peelable.
1317 We know at, len, hash.
1319 Lets point q at the end of the text and parse that (backwards). */
1321 for (q = p; *q; q++)
1323 q--; /* Now q points at last char of text. */
1325 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1326 q--;
1328 /* Reverse over whitespace, but don't. */
1329 /* Run back over *p. */
1331 /* As a matter of policy here, we look for [Rn], although both Rn and S^#
1332 forbid [Rn]. This is because it is easy, and because only a sick
1333 cyborg would have [...] trailing an expression in a VAX-like assembler.
1334 A meticulous parser would first check for Rn followed by '(' or '['
1335 and not parse a trailing ']' if it found another. We just ban expressions
1336 ending in ']'. */
1337 if (*q == ']')
1339 while (q >= p && *q != '[')
1340 q--;
1341 /* Either q<p or we got matching '['. */
1342 if (q < p)
1343 err = _("no '[' to match ']'");
1344 else
1346 /* Confusers like "[]" will eventually lose with a bad register
1347 * name error. So again we don't need to check for early '\0'. */
1348 if (q[3] == ']')
1349 ndx = vax_reg_parse (q[1], q[2], 0, 0);
1350 else if (q[4] == ']')
1351 ndx = vax_reg_parse (q[1], q[2], q[3], 0);
1352 else if (q[5] == ']')
1353 ndx = vax_reg_parse (q[1], q[2], q[3], q[4]);
1354 else
1355 ndx = -1;
1356 /* Since we saw a ']' we will demand a register name in the [].
1357 * If luser hasn't given us one: be rude. */
1358 if (ndx < 0)
1359 err = _("bad register in []");
1360 else if (ndx == PC)
1361 err = _("[PC] index banned");
1362 else
1363 /* Point q just before "[...]". */
1364 q--;
1367 else
1368 /* No ']', so no iNDeX register. */
1369 ndx = -1;
1371 /* If err = "..." then we lost: run away.
1372 Otherwise ndx == -1 if there was no "[...]".
1373 Otherwise, ndx is index register number, and q points before "[...]". */
1375 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1376 q--;
1377 /* Reverse over whitespace, but don't. */
1378 /* Run back over *p. */
1379 if (!err || !*err)
1381 /* no ()+ or -() seen yet */
1382 sign = 0;
1384 if (q > p + 3 && *q == '+' && q[-1] == ')')
1386 sign = 1; /* we saw a ")+" */
1387 q--; /* q points to ')' */
1390 if (*q == ')' && q > p + 2)
1392 paren = 1; /* assume we have "(...)" */
1393 while (q >= p && *q != '(')
1394 q--;
1395 /* either q<p or we got matching '(' */
1396 if (q < p)
1397 err = _("no '(' to match ')'");
1398 else
1400 /* Confusers like "()" will eventually lose with a bad register
1401 name error. So again we don't need to check for early '\0'. */
1402 if (q[3] == ')')
1403 reg = vax_reg_parse (q[1], q[2], 0, 0);
1404 else if (q[4] == ')')
1405 reg = vax_reg_parse (q[1], q[2], q[3], 0);
1406 else if (q[5] == ')')
1407 reg = vax_reg_parse (q[1], q[2], q[3], q[4]);
1408 else
1409 reg = -1;
1410 /* Since we saw a ')' we will demand a register name in the ')'.
1411 This is nasty: why can't our hypothetical assembler permit
1412 parenthesised expressions? BECAUSE I AM LAZY! That is why.
1413 Abuse luser if we didn't spy a register name. */
1414 if (reg < 0)
1416 /* JF allow parenthesized expressions. I hope this works. */
1417 paren = 0;
1418 while (*q != ')')
1419 q++;
1420 /* err = "unknown register in ()"; */
1422 else
1423 q--; /* point just before '(' of "(...)" */
1424 /* If err == "..." then we lost. Run away.
1425 Otherwise if reg >= 0 then we saw (Rn). */
1427 /* If err == "..." then we lost.
1428 Otherwise paren==1 and reg = register in "()". */
1430 else
1431 paren = 0;
1432 /* If err == "..." then we lost.
1433 Otherwise, q points just before "(Rn)", if any.
1434 If there was a "(...)" then paren==1, and reg is the register. */
1436 /* We should only seek '-' of "-(...)" if:
1437 we saw "(...)" paren == 1
1438 we have no errors so far ! *err
1439 we did not see '+' of "(...)+" sign < 1
1440 We don't check len. We want a specific error message later if
1441 user tries "x^...-(Rn)". This is a feature not a bug. */
1442 if (!err || !*err)
1444 if (paren && sign < 1)/* !sign is adequate test */
1446 if (*q == '-')
1448 sign = -1;
1449 q--;
1452 /* We have back-tracked over most
1453 of the crud at the end of an operand.
1454 Unless err, we know: sign, paren. If paren, we know reg.
1455 The last case is of an expression "Rn".
1456 This is worth hunting for if !err, !paren.
1457 We wouldn't be here if err.
1458 We remember to save q, in case we didn't want "Rn" anyway. */
1459 if (!paren)
1461 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1462 q--;
1463 /* Reverse over whitespace, but don't. */
1464 /* Run back over *p. */
1465 /* Room for Rn or Rnn (include prefix) exactly? */
1466 if (q > p && q < p + 4)
1467 reg = vax_reg_parse (p[0], p[1],
1468 q < p + 2 ? 0 : p[2],
1469 q < p + 3 ? 0 : p[3]);
1470 else
1471 reg = -1; /* Always comes here if no register at all. */
1472 /* Here with a definitive reg value. */
1473 if (reg >= 0)
1475 oldq = q;
1476 q = p - 1;
1481 /* have reg. -1:absent; else 0:15. */
1483 /* We have: err, at, len, hash, ndx, sign, paren, reg.
1484 Also, any remaining expression is from *p through *q inclusive.
1485 Should there be no expression, q==p-1. So expression length = q-p+1.
1486 This completes the first part: parsing the operand text. */
1488 /* We now want to boil the data down, checking consistency on the way.
1489 We want: len, mode, reg, ndx, err, p, q, wrn, bug.
1490 We will deliver a 4-bit reg, and a 4-bit mode. */
1492 /* Case of branch operand. Different. No L^B^W^I^S^ allowed for instance.
1494 in: at ?
1495 len ?
1496 hash ?
1497 p:q ?
1498 sign ?
1499 paren ?
1500 reg ?
1501 ndx ?
1503 out: mode 0
1504 reg -1
1505 len ' '
1506 p:q whatever was input
1507 ndx -1
1508 err " " or error message, and other outputs trashed. */
1509 /* Branch operands have restricted forms. */
1510 if ((!err || !*err) && access_mode == 'b')
1512 if (at || hash || sign || paren || ndx >= 0 || reg >= 0 || len != ' ')
1513 err = _("invalid branch operand");
1514 else
1515 err = " ";
1518 /* Since nobody seems to use it: comment this 'feature'(?) out for now. */
1519 #ifdef NEVER
1520 /* Case of stand-alone operand. e.g. ".long foo"
1522 in: at ?
1523 len ?
1524 hash ?
1525 p:q ?
1526 sign ?
1527 paren ?
1528 reg ?
1529 ndx ?
1531 out: mode 0
1532 reg -1
1533 len ' '
1534 p:q whatever was input
1535 ndx -1
1536 err " " or error message, and other outputs trashed. */
1537 if ((!err || !*err) && access_mode == ' ')
1539 if (at)
1540 err = _("address prohibits @");
1541 else if (hash)
1542 err = _("address prohibits #");
1543 else if (sign)
1545 if (sign < 0)
1546 err = _("address prohibits -()");
1547 else
1548 err = _("address prohibits ()+");
1550 else if (paren)
1551 err = _("address prohibits ()");
1552 else if (ndx >= 0)
1553 err = _("address prohibits []");
1554 else if (reg >= 0)
1555 err = _("address prohibits register");
1556 else if (len != ' ')
1557 err = _("address prohibits displacement length specifier");
1558 else
1560 err = " "; /* succeed */
1561 mode = 0;
1564 #endif
1566 /* Case of S^#.
1568 in: at 0
1569 len 's' definition
1570 hash 1 demand
1571 p:q demand not empty
1572 sign 0 by paren==0
1573 paren 0 by "()" scan logic because "S^" seen
1574 reg -1 or nn by mistake
1575 ndx -1
1577 out: mode 0
1578 reg -1
1579 len 's'
1581 ndx -1 */
1582 if ((!err || !*err) && len == 's')
1584 if (!hash || paren || at || ndx >= 0)
1585 err = _("invalid operand of S^#");
1586 else
1588 if (reg >= 0)
1590 /* Darn! we saw S^#Rnn ! put the Rnn back in
1591 expression. KLUDGE! Use oldq so we don't
1592 need to know exact length of reg name. */
1593 q = oldq;
1594 reg = 0;
1596 /* We have all the expression we will ever get. */
1597 if (p > q)
1598 err = _("S^# needs expression");
1599 else if (access_mode == 'r')
1601 err = " "; /* WIN! */
1602 mode = 0;
1604 else
1605 err = _("S^# may only read-access");
1609 /* Case of -(Rn), which is weird case.
1611 in: at 0
1612 len '
1613 hash 0
1614 p:q q<p
1615 sign -1 by definition
1616 paren 1 by definition
1617 reg present by definition
1618 ndx optional
1620 out: mode 7
1621 reg present
1622 len ' '
1623 exp "" enforce empty expression
1624 ndx optional warn if same as reg. */
1625 if ((!err || !*err) && sign < 0)
1627 if (len != ' ' || hash || at || p <= q)
1628 err = _("invalid operand of -()");
1629 else
1631 err = " "; /* win */
1632 mode = 7;
1633 if (reg == PC)
1634 wrn = _("-(PC) unpredictable");
1635 else if (reg == ndx)
1636 wrn = _("[]index same as -()register: unpredictable");
1640 /* We convert "(Rn)" to "@Rn" for our convenience.
1641 (I hope this is convenient: has someone got a better way to parse this?)
1642 A side-effect of this is that "@Rn" is a valid operand. */
1643 if (paren && !sign && !hash && !at && len == ' ' && p > q)
1645 at = 1;
1646 paren = 0;
1649 /* Case of (Rn)+, which is slightly different.
1651 in: at
1652 len ' '
1653 hash 0
1654 p:q q<p
1655 sign +1 by definition
1656 paren 1 by definition
1657 reg present by definition
1658 ndx optional
1660 out: mode 8+@
1661 reg present
1662 len ' '
1663 exp "" enforce empty expression
1664 ndx optional warn if same as reg. */
1665 if ((!err || !*err) && sign > 0)
1667 if (len != ' ' || hash || p <= q)
1668 err = _("invalid operand of ()+");
1669 else
1671 err = " "; /* win */
1672 mode = 8 + (at ? 1 : 0);
1673 if (reg == PC)
1674 wrn = _("(PC)+ unpredictable");
1675 else if (reg == ndx)
1676 wrn = _("[]index same as ()+register: unpredictable");
1680 /* Case of #, without S^.
1682 in: at
1683 len ' ' or 'i'
1684 hash 1 by definition
1686 sign 0
1687 paren 0
1688 reg absent
1689 ndx optional
1691 out: mode 8+@
1692 reg PC
1693 len ' ' or 'i'
1695 ndx optional. */
1696 if ((!err || !*err) && hash)
1698 if (len != 'i' && len != ' ')
1699 err = _("# conflicts length");
1700 else if (paren)
1701 err = _("# bars register");
1702 else
1704 if (reg >= 0)
1706 /* Darn! we saw #Rnn! Put the Rnn back into the expression.
1707 By using oldq, we don't need to know how long Rnn was.
1708 KLUDGE! */
1709 q = oldq;
1710 reg = -1; /* No register any more. */
1712 err = " "; /* Win. */
1714 /* JF a bugfix, I think! */
1715 if (at && access_mode == 'a')
1716 vopP->vop_nbytes = 4;
1718 mode = (at ? 9 : 8);
1719 reg = PC;
1720 if ((access_mode == 'm' || access_mode == 'w') && !at)
1721 wrn = _("writing or modifying # is unpredictable");
1724 /* If !*err, then sign == 0
1725 hash == 0 */
1727 /* Case of Rn. We separate this one because it has a few special
1728 errors the remaining modes lack.
1730 in: at optional
1731 len ' '
1732 hash 0 by program logic
1733 p:q empty
1734 sign 0 by program logic
1735 paren 0 by definition
1736 reg present by definition
1737 ndx optional
1739 out: mode 5+@
1740 reg present
1741 len ' ' enforce no length
1742 exp "" enforce empty expression
1743 ndx optional warn if same as reg. */
1744 if ((!err || !*err) && !paren && reg >= 0)
1746 if (len != ' ')
1747 err = _("length not needed");
1748 else if (at)
1750 err = " "; /* win */
1751 mode = 6; /* @Rn */
1753 else if (ndx >= 0)
1754 err = _("can't []index a register, because it has no address");
1755 else if (access_mode == 'a')
1756 err = _("a register has no address");
1757 else
1759 /* Idea here is to detect from length of datum
1760 and from register number if we will touch PC.
1761 Warn if we do.
1762 vop_nbytes is number of bytes in operand.
1763 Compute highest byte affected, compare to PC0. */
1764 if ((vopP->vop_nbytes + reg * 4) > 60)
1765 wrn = _("PC part of operand unpredictable");
1766 err = " "; /* win */
1767 mode = 5; /* Rn */
1770 /* If !*err, sign == 0
1771 hash == 0
1772 paren == 1 OR reg==-1 */
1774 /* Rest of cases fit into one bunch.
1776 in: at optional
1777 len ' ' or 'b' or 'w' or 'l'
1778 hash 0 by program logic
1779 p:q expected (empty is not an error)
1780 sign 0 by program logic
1781 paren optional
1782 reg optional
1783 ndx optional
1785 out: mode 10 + @ + len
1786 reg optional
1787 len ' ' or 'b' or 'w' or 'l'
1788 exp maybe empty
1789 ndx optional warn if same as reg. */
1790 if (!err || !*err)
1792 err = " "; /* win (always) */
1793 mode = 10 + (at ? 1 : 0);
1794 switch (len)
1796 case 'l':
1797 mode += 2;
1798 /* Fall through. */
1799 case 'w':
1800 mode += 2;
1801 /* Fall through. */
1802 case ' ': /* Assumed B^ until our caller changes it. */
1803 case 'b':
1804 break;
1808 /* here with completely specified mode
1811 expression p,q
1812 ndx. */
1814 if (*err == ' ')
1815 err = 0; /* " " is no longer an error. */
1817 vopP->vop_mode = mode;
1818 vopP->vop_reg = reg;
1819 vopP->vop_short = len;
1820 vopP->vop_expr_begin = p;
1821 vopP->vop_expr_end = q;
1822 vopP->vop_ndx = ndx;
1823 vopP->vop_error = err;
1824 vopP->vop_warn = wrn;
1827 /* This converts a string into a vax instruction.
1828 The string must be a bare single instruction in dec-vax (with BSD4 frobs)
1829 format.
1830 It provides some error messages: at most one fatal error message (which
1831 stops the scan) and at most one warning message for each operand.
1832 The vax instruction is returned in exploded form, since we have no
1833 knowledge of how you parse (or evaluate) your expressions.
1834 We do however strip off and decode addressing modes and operation
1835 mnemonic.
1837 The exploded instruction is returned to a struct vit of your choice.
1838 #include "vax-inst.h" to know what a struct vit is.
1840 This function's value is a string. If it is not "" then an internal
1841 logic error was found: read this code to assign meaning to the string.
1842 No argument string should generate such an error string:
1843 it means a bug in our code, not in the user's text.
1845 You MUST have called vip_begin() once before using this function. */
1847 static void
1848 vip (struct vit *vitP, /* We build an exploded instruction here. */
1849 char *instring) /* Text of a vax instruction: we modify. */
1851 /* How to bit-encode this opcode. */
1852 struct vot_wot *vwP;
1853 /* 1/skip whitespace.2/scan vot_how */
1854 char *p;
1855 char *q;
1856 /* counts number of operands seen */
1857 unsigned char count;
1858 /* scan operands in struct vit */
1859 struct vop *operandp;
1860 /* error over all operands */
1861 const char *alloperr;
1862 /* Remember char, (we clobber it with '\0' temporarily). */
1863 char c;
1864 /* Op-code of this instruction. */
1865 vax_opcodeT oc;
1867 if (*instring == ' ')
1868 ++instring;
1870 /* MUST end in end-of-string or exactly 1 space. */
1871 for (p = instring; *p && *p != ' '; p++)
1874 /* Scanned up to end of operation-code. */
1875 /* Operation-code is ended with whitespace. */
1876 if (p - instring == 0)
1878 vitP->vit_error = _("No operator");
1879 count = 0;
1880 memset (vitP->vit_opcode, '\0', sizeof (vitP->vit_opcode));
1882 else
1884 c = *p;
1885 *p = '\0';
1886 /* Here with instring pointing to what better be an op-name, and p
1887 pointing to character just past that.
1888 We trust instring points to an op-name, with no whitespace. */
1889 vwP = (struct vot_wot *) str_hash_find (op_hash, instring);
1890 /* Restore char after op-code. */
1891 *p = c;
1892 if (vwP == 0)
1894 vitP->vit_error = _("Unknown operator");
1895 count = 0;
1896 memset (vitP->vit_opcode, '\0', sizeof (vitP->vit_opcode));
1898 else
1900 /* We found a match! So let's pick up as many operands as the
1901 instruction wants, and even gripe if there are too many.
1902 We expect comma to separate each operand.
1903 We let instring track the text, while p tracks a part of the
1904 struct vot. */
1905 const char *howp;
1906 /* The lines below know about 2-byte opcodes starting FD,FE or FF.
1907 They also understand synthetic opcodes. Note:
1908 we return 32 bits of opcode, including bucky bits, BUT
1909 an opcode length is either 8 or 16 bits for vit_opcode_nbytes. */
1910 oc = vwP->vot_code; /* The op-code. */
1911 vitP->vit_opcode_nbytes = (oc & 0xFF) >= 0xFD ? 2 : 1;
1912 md_number_to_chars (vitP->vit_opcode, oc, 4);
1913 count = 0; /* No operands seen yet. */
1914 instring = p; /* Point just past operation code. */
1915 alloperr = "";
1916 for (howp = vwP->vot_how, operandp = vitP->vit_operand;
1917 !(alloperr && *alloperr) && *howp;
1918 operandp++, howp += 2)
1920 /* Here to parse one operand. Leave instring pointing just
1921 past any one ',' that marks the end of this operand. */
1922 if (!howp[1])
1923 as_fatal (_("odd number of bytes in operand description"));
1924 else if (*instring)
1926 for (q = instring; (c = *q) && c != ','; q++)
1928 /* Q points to ',' or '\0' that ends argument. C is that
1929 character. */
1930 *q = 0;
1931 operandp->vop_width = howp[1];
1932 operandp->vop_nbytes = vax_operand_width_size[(unsigned) howp[1]];
1933 operandp->vop_access = howp[0];
1934 vip_op (instring, operandp);
1935 *q = c; /* Restore input text. */
1936 if (operandp->vop_error)
1937 alloperr = _("Bad operand");
1938 instring = q + (c ? 1 : 0); /* Next operand (if any). */
1939 count++; /* Won another argument, may have an operr. */
1941 else
1942 alloperr = _("Not enough operands");
1944 if (!*alloperr)
1946 if (*instring == ' ')
1947 instring++;
1948 if (*instring)
1949 alloperr = _("Too many operands");
1951 vitP->vit_error = alloperr;
1954 vitP->vit_operands = count;
1957 #ifdef test
1959 /* Test program for above. */
1961 struct vit myvit; /* Build an exploded vax instruction here. */
1962 char answer[100]; /* Human types a line of vax assembler here. */
1963 char *mybug; /* "" or an internal logic diagnostic. */
1964 int mycount; /* Number of operands. */
1965 struct vop *myvop; /* Scan operands from myvit. */
1966 int mysynth; /* 1 means want synthetic opcodes. */
1967 char my_immediate[200];
1968 char my_indirect[200];
1969 char my_displen[200];
1972 main (void)
1974 char *p;
1976 printf ("0 means no synthetic instructions. ");
1977 printf ("Value for vip_begin? ");
1978 gets (answer);
1979 sscanf (answer, "%d", &mysynth);
1980 printf ("Synthetic opcodes %s be included.\n", mysynth ? "will" : "will not");
1981 printf ("enter immediate symbols eg enter # ");
1982 gets (my_immediate);
1983 printf ("enter indirect symbols eg enter @ ");
1984 gets (my_indirect);
1985 printf ("enter displen symbols eg enter ^ ");
1986 gets (my_displen);
1988 vip_begin (mysynth, my_immediate, my_indirect, my_displen)
1990 printf ("An empty input line will quit you from the vax instruction parser\n");
1991 for (;;)
1993 printf ("vax instruction: ");
1994 fflush (stdout);
1995 gets (answer);
1996 if (!*answer)
1997 break; /* Out of for each input text loop. */
1999 vip (& myvit, answer);
2000 if (*myvit.vit_error)
2001 printf ("ERR:\"%s\"\n", myvit.vit_error);
2003 printf ("opcode=");
2004 for (mycount = myvit.vit_opcode_nbytes, p = myvit.vit_opcode;
2005 mycount;
2006 mycount--, p++)
2007 printf ("%02x ", *p & 0xFF);
2009 printf (" operand count=%d.\n", mycount = myvit.vit_operands);
2010 for (myvop = myvit.vit_operand; mycount; mycount--, myvop++)
2012 printf ("mode=%xx reg=%xx ndx=%xx len='%c'=%c%c%d. expr=\"",
2013 myvop->vop_mode, myvop->vop_reg, myvop->vop_ndx,
2014 myvop->vop_short, myvop->vop_access, myvop->vop_width,
2015 myvop->vop_nbytes);
2016 for (p = myvop->vop_expr_begin; p <= myvop->vop_expr_end; p++)
2017 putchar (*p);
2019 printf ("\"\n");
2020 if (myvop->vop_error)
2021 printf (" err:\"%s\"\n", myvop->vop_error);
2023 if (myvop->vop_warn)
2024 printf (" wrn:\"%s\"\n", myvop->vop_warn);
2027 vip_end ();
2028 exit (EXIT_SUCCESS);
2031 #endif
2033 #ifdef TEST /* #Define to use this testbed. */
2035 /* Follows a test program for this function.
2036 We declare arrays non-local in case some of our tiny-minded machines
2037 default to small stacks. Also, helps with some debuggers. */
2039 char answer[100]; /* Human types into here. */
2040 char *p; /* */
2041 char *myerr;
2042 char *mywrn;
2043 char *mybug;
2044 char myaccess;
2045 char mywidth;
2046 char mymode;
2047 char myreg;
2048 char mylen;
2049 char *myleft;
2050 char *myright;
2051 char myndx;
2052 int my_operand_length;
2053 char my_immediate[200];
2054 char my_indirect[200];
2055 char my_displen[200];
2058 main (void)
2060 printf ("enter immediate symbols eg enter # ");
2061 gets (my_immediate);
2062 printf ("enter indirect symbols eg enter @ ");
2063 gets (my_indirect);
2064 printf ("enter displen symbols eg enter ^ ");
2065 gets (my_displen);
2066 vip_op_defaults (my_immediate, my_indirect, my_displen);
2068 for (;;)
2070 printf ("access,width (eg 'ab' or 'wh') [empty line to quit] : ");
2071 fflush (stdout);
2072 gets (answer);
2073 if (!answer[0])
2074 exit (EXIT_SUCCESS);
2075 myaccess = answer[0];
2076 mywidth = answer[1];
2077 switch (mywidth)
2079 case 'b':
2080 my_operand_length = 1;
2081 break;
2082 case 'd':
2083 my_operand_length = 8;
2084 break;
2085 case 'f':
2086 my_operand_length = 4;
2087 break;
2088 case 'g':
2089 my_operand_length = 16;
2090 break;
2091 case 'h':
2092 my_operand_length = 32;
2093 break;
2094 case 'l':
2095 my_operand_length = 4;
2096 break;
2097 case 'o':
2098 my_operand_length = 16;
2099 break;
2100 case 'q':
2101 my_operand_length = 8;
2102 break;
2103 case 'w':
2104 my_operand_length = 2;
2105 break;
2106 case '!':
2107 case '?':
2108 case '-':
2109 my_operand_length = 0;
2110 break;
2112 default:
2113 my_operand_length = 2;
2114 printf ("I don't understand access width %c\n", mywidth);
2115 break;
2117 printf ("VAX assembler instruction operand: ");
2118 fflush (stdout);
2119 gets (answer);
2120 mybug = vip_op (answer, myaccess, mywidth, my_operand_length,
2121 &mymode, &myreg, &mylen, &myleft, &myright, &myndx,
2122 &myerr, &mywrn);
2123 if (*myerr)
2125 printf ("error: \"%s\"\n", myerr);
2126 if (*mybug)
2127 printf (" bug: \"%s\"\n", mybug);
2129 else
2131 if (*mywrn)
2132 printf ("warning: \"%s\"\n", mywrn);
2133 mumble ("mode", mymode);
2134 mumble ("register", myreg);
2135 mumble ("index", myndx);
2136 printf ("width:'%c' ", mylen);
2137 printf ("expression: \"");
2138 while (myleft <= myright)
2139 putchar (*myleft++);
2140 printf ("\"\n");
2145 void
2146 mumble (char *text, int value)
2148 printf ("%s:", text);
2149 if (value >= 0)
2150 printf ("%xx", value);
2151 else
2152 printf ("ABSENT");
2153 printf (" ");
2156 #endif
2158 int md_short_jump_size = 3;
2159 int md_long_jump_size = 6;
2161 void
2162 md_create_short_jump (char *ptr,
2163 addressT from_addr,
2164 addressT to_addr ATTRIBUTE_UNUSED,
2165 fragS *frag ATTRIBUTE_UNUSED,
2166 symbolS *to_symbol ATTRIBUTE_UNUSED)
2168 valueT offset;
2170 /* This former calculation was off by two:
2171 offset = to_addr - (from_addr + 1);
2172 We need to account for the one byte instruction and also its
2173 two byte operand. */
2174 offset = to_addr - (from_addr + 1 + 2);
2175 *ptr++ = VAX_BRW; /* Branch with word (16 bit) offset. */
2176 md_number_to_chars (ptr, offset, 2);
2179 void
2180 md_create_long_jump (char *ptr,
2181 addressT from_addr ATTRIBUTE_UNUSED,
2182 addressT to_addr,
2183 fragS *frag,
2184 symbolS *to_symbol)
2186 valueT offset;
2188 offset = to_addr - S_GET_VALUE (to_symbol);
2189 *ptr++ = VAX_JMP; /* Arbitrary jump. */
2190 *ptr++ = VAX_ABSOLUTE_MODE;
2191 md_number_to_chars (ptr, offset, 4);
2192 fix_new (frag, ptr - frag->fr_literal, 4, to_symbol, (long) 0, 0, NO_RELOC);
2195 #ifdef OBJ_VMS
2196 const char *md_shortopts = "d:STt:V+1h:Hv::";
2197 #elif defined(OBJ_ELF)
2198 const char *md_shortopts = "d:STt:VkKQ:";
2199 #else
2200 const char *md_shortopts = "d:STt:V";
2201 #endif
2202 struct option md_longopts[] =
2204 #ifdef OBJ_ELF
2205 #define OPTION_PIC (OPTION_MD_BASE)
2206 { "pic", no_argument, NULL, OPTION_PIC },
2207 #endif
2208 { NULL, no_argument, NULL, 0 }
2210 size_t md_longopts_size = sizeof (md_longopts);
2213 md_parse_option (int c, const char *arg)
2215 switch (c)
2217 case 'S':
2218 as_warn (_("SYMBOL TABLE not implemented"));
2219 break;
2221 case 'T':
2222 as_warn (_("TOKEN TRACE not implemented"));
2223 break;
2225 case 'd':
2226 as_warn (_("Displacement length %s ignored!"), arg);
2227 break;
2229 case 't':
2230 as_warn (_("I don't need or use temp. file \"%s\"."), arg);
2231 break;
2233 case 'V':
2234 as_warn (_("I don't use an interpass file! -V ignored"));
2235 break;
2237 #ifdef OBJ_VMS
2238 case '+': /* For g++. Hash any name > 31 chars long. */
2239 flag_hash_long_names = 1;
2240 break;
2242 case '1': /* For backward compatibility. */
2243 flag_one = 1;
2244 break;
2246 case 'H': /* Show new symbol after hash truncation. */
2247 flag_show_after_trunc = 1;
2248 break;
2250 case 'h': /* No hashing of mixed-case names. */
2252 extern char vms_name_mapping;
2253 vms_name_mapping = atoi (arg);
2254 flag_no_hash_mixed_case = 1;
2256 break;
2258 case 'v':
2260 extern char *compiler_version_string;
2262 if (!arg || !*arg || access (arg, 0) == 0)
2263 return 0; /* Have caller show the assembler version. */
2264 compiler_version_string = arg;
2266 break;
2267 #endif
2269 #ifdef OBJ_ELF
2270 case OPTION_PIC:
2271 case 'k':
2272 flag_want_pic = 1;
2273 break; /* -pic, Position Independent Code. */
2275 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment
2276 section should be emitted or not. FIXME: Not implemented. */
2277 case 'Q':
2278 break;
2279 #endif
2281 default:
2282 return 0;
2285 return 1;
2288 void
2289 md_show_usage (FILE *stream)
2291 fprintf (stream, _("\
2292 VAX options:\n\
2293 -d LENGTH ignored\n\
2294 -J ignored\n\
2295 -S ignored\n\
2296 -t FILE ignored\n\
2297 -T ignored\n\
2298 -V ignored\n"));
2299 #ifdef OBJ_VMS
2300 fprintf (stream, _("\
2301 VMS options:\n\
2302 -+ hash encode names longer than 31 characters\n\
2303 -1 `const' handling compatible with gcc 1.x\n\
2304 -H show new symbol after hash truncation\n\
2305 -h NUM don't hash mixed-case names, and adjust case:\n\
2306 0 = upper, 2 = lower, 3 = preserve case\n\
2307 -v\"VERSION\" code being assembled was produced by compiler \"VERSION\"\n"));
2308 #endif
2311 /* We have no need to default values of symbols. */
2313 symbolS *
2314 md_undefined_symbol (char *name ATTRIBUTE_UNUSED)
2316 return NULL;
2319 /* Round up a section size to the appropriate boundary. */
2320 valueT
2321 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
2323 /* Byte alignment is fine */
2324 return size;
2327 /* Exactly what point is a PC-relative offset relative TO?
2328 On the vax, they're relative to the address of the offset, plus
2329 its size. */
2330 long
2331 md_pcrel_from (fixS *fixP)
2333 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
2336 arelent *
2337 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
2339 arelent *reloc;
2340 bfd_reloc_code_real_type code;
2342 if (fixp->fx_tcbit)
2343 abort ();
2345 if (fixp->fx_r_type != NO_RELOC)
2347 code = fixp->fx_r_type;
2349 if (fixp->fx_pcrel)
2351 switch (code)
2353 case BFD_RELOC_8_PCREL:
2354 case BFD_RELOC_16_PCREL:
2355 case BFD_RELOC_32_PCREL:
2356 #ifdef OBJ_ELF
2357 case BFD_RELOC_8_GOT_PCREL:
2358 case BFD_RELOC_16_GOT_PCREL:
2359 case BFD_RELOC_32_GOT_PCREL:
2360 case BFD_RELOC_8_PLT_PCREL:
2361 case BFD_RELOC_16_PLT_PCREL:
2362 case BFD_RELOC_32_PLT_PCREL:
2363 #endif
2364 break;
2365 default:
2366 as_bad_where (fixp->fx_file, fixp->fx_line,
2367 _("Cannot make %s relocation PC relative"),
2368 bfd_get_reloc_code_name (code));
2372 else
2374 #define F(SZ,PCREL) (((SZ) << 1) + (PCREL))
2375 switch (F (fixp->fx_size, fixp->fx_pcrel))
2377 #define MAP(SZ,PCREL,TYPE) case F(SZ,PCREL): code = (TYPE); break
2378 MAP (1, 0, BFD_RELOC_8);
2379 MAP (2, 0, BFD_RELOC_16);
2380 MAP (4, 0, BFD_RELOC_32);
2381 MAP (1, 1, BFD_RELOC_8_PCREL);
2382 MAP (2, 1, BFD_RELOC_16_PCREL);
2383 MAP (4, 1, BFD_RELOC_32_PCREL);
2384 default:
2385 abort ();
2388 #undef F
2389 #undef MAP
2391 reloc = XNEW (arelent);
2392 reloc->sym_ptr_ptr = XNEW (asymbol *);
2393 *reloc->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
2394 reloc->address = fixp->fx_frag->fr_address + fixp->fx_where;
2395 #ifndef OBJ_ELF
2396 if (fixp->fx_pcrel)
2397 reloc->addend = fixp->fx_addnumber;
2398 else
2399 reloc->addend = 0;
2400 #else
2401 reloc->addend = fixp->fx_offset;
2402 #endif
2404 reloc->howto = bfd_reloc_type_lookup (stdoutput, code);
2405 gas_assert (reloc->howto != 0);
2407 return reloc;
2410 /* vax:md_assemble() emit frags for 1 instruction given in textual form. */
2411 void
2412 md_assemble (char *instruction_string)
2414 /* Non-zero if operand expression's segment is not known yet. */
2415 int is_undefined;
2416 /* Non-zero if operand expression's segment is absolute. */
2417 int is_absolute;
2418 int length_code;
2419 char *p;
2420 /* An operand. Scans all operands. */
2421 struct vop *operandP;
2422 char *save_input_line_pointer;
2423 /* What used to live after an expression. */
2424 char c_save;
2425 /* 1: instruction_string bad for all passes. */
2426 int goofed;
2427 /* Points to slot just after last operand. */
2428 struct vop *end_operandP;
2429 /* Points to expression values for this operand. */
2430 expressionS *expP;
2431 segT *segP;
2433 /* These refer to an instruction operand expression. */
2434 /* Target segment of the address. */
2435 segT to_seg;
2436 valueT this_add_number;
2437 /* Positive (minuend) symbol. */
2438 symbolS *this_add_symbol;
2439 /* As a number. */
2440 long opcode_as_number;
2441 /* Least significant byte 1st. */
2442 char *opcode_as_chars;
2443 /* As an array of characters. */
2444 /* Least significant byte 1st */
2445 char *opcode_low_byteP;
2446 /* length (bytes) meant by vop_short. */
2447 int length;
2448 /* 0, or 1 if '@' is in addressing mode. */
2449 int at;
2450 /* From vop_nbytes: vax_operand_width (in bytes) */
2451 int nbytes;
2452 FLONUM_TYPE *floatP;
2453 LITTLENUM_TYPE literal_float[8];
2454 /* Big enough for any floating point literal. */
2456 vip (&v, instruction_string);
2458 /* Now we try to find as many as_warn()s as we can. If we do any as_warn()s
2459 then goofed=1. Notice that we don't make any frags yet.
2460 Should goofed be 1, then this instruction will wedge in any pass,
2461 and we can safely flush it, without causing interpass symbol phase
2462 errors. That is, without changing label values in different passes. */
2463 if ((goofed = (*v.vit_error)) != 0)
2465 as_fatal (_("Ignoring statement due to \"%s\""), v.vit_error);
2467 /* We need to use expression() and friends, which require us to diddle
2468 input_line_pointer. So we save it and restore it later. */
2469 save_input_line_pointer = input_line_pointer;
2470 for (operandP = v.vit_operand,
2471 expP = exp_of_operand,
2472 segP = seg_of_operand,
2473 floatP = float_operand,
2474 end_operandP = v.vit_operand + v.vit_operands;
2476 operandP < end_operandP;
2478 operandP++, expP++, segP++, floatP++)
2480 if (operandP->vop_error)
2482 as_fatal (_("Aborting because statement has \"%s\""), operandP->vop_error);
2483 goofed = 1;
2485 else
2487 /* Statement has no syntax goofs: let's sniff the expression. */
2488 int can_be_short = 0; /* 1 if a bignum can be reduced to a short literal. */
2490 input_line_pointer = operandP->vop_expr_begin;
2491 c_save = operandP->vop_expr_end[1];
2492 operandP->vop_expr_end[1] = '\0';
2493 /* If to_seg == SEG_PASS1, expression() will have set need_pass_2 = 1. */
2494 *segP = expression (expP);
2495 switch (expP->X_op)
2497 case O_absent:
2498 /* for BSD4.2 compatibility, missing expression is absolute 0 */
2499 expP->X_op = O_constant;
2500 expP->X_add_number = 0;
2501 /* For SEG_ABSOLUTE, we shouldn't need to set X_op_symbol,
2502 X_add_symbol to any particular value. But, we will program
2503 defensively. Since this situation occurs rarely so it costs
2504 us little to do, and stops Dean worrying about the origin of
2505 random bits in expressionS's. */
2506 expP->X_add_symbol = NULL;
2507 expP->X_op_symbol = NULL;
2508 break;
2510 case O_symbol:
2511 case O_constant:
2512 break;
2514 default:
2515 /* Major bug. We can't handle the case of a
2516 SEG_OP expression in a VIT_OPCODE_SYNTHETIC
2517 variable-length instruction.
2518 We don't have a frag type that is smart enough to
2519 relax a SEG_OP, and so we just force all
2520 SEG_OPs to behave like SEG_PASS1s.
2521 Clearly, if there is a demand we can invent a new or
2522 modified frag type and then coding up a frag for this
2523 case will be easy. SEG_OP was invented for the
2524 .words after a CASE opcode, and was never intended for
2525 instruction operands. */
2526 need_pass_2 = 1;
2527 as_fatal (_("Can't relocate expression"));
2528 break;
2530 case O_big:
2531 /* Preserve the bits. */
2532 if (expP->X_add_number > 0)
2534 bignum_copy (generic_bignum, expP->X_add_number,
2535 floatP->low, SIZE_OF_LARGE_NUMBER);
2537 else
2539 know (expP->X_add_number < 0);
2540 flonum_copy (&generic_floating_point_number,
2541 floatP);
2542 if (strchr ("s i", operandP->vop_short))
2544 /* Could possibly become S^# */
2545 flonum_gen2vax (-expP->X_add_number, floatP, literal_float);
2546 switch (-expP->X_add_number)
2548 case 'f':
2549 can_be_short =
2550 (literal_float[0] & 0xFC0F) == 0x4000
2551 && literal_float[1] == 0;
2552 break;
2554 case 'd':
2555 can_be_short =
2556 (literal_float[0] & 0xFC0F) == 0x4000
2557 && literal_float[1] == 0
2558 && literal_float[2] == 0
2559 && literal_float[3] == 0;
2560 break;
2562 case 'g':
2563 can_be_short =
2564 (literal_float[0] & 0xFF81) == 0x4000
2565 && literal_float[1] == 0
2566 && literal_float[2] == 0
2567 && literal_float[3] == 0;
2568 break;
2570 case 'h':
2571 can_be_short = ((literal_float[0] & 0xFFF8) == 0x4000
2572 && (literal_float[1] & 0xE000) == 0
2573 && literal_float[2] == 0
2574 && literal_float[3] == 0
2575 && literal_float[4] == 0
2576 && literal_float[5] == 0
2577 && literal_float[6] == 0
2578 && literal_float[7] == 0);
2579 break;
2581 default:
2582 BAD_CASE (-expP->X_add_number);
2583 break;
2588 if (operandP->vop_short == 's'
2589 || operandP->vop_short == 'i'
2590 || (operandP->vop_short == ' '
2591 && operandP->vop_reg == 0xF
2592 && (operandP->vop_mode & 0xE) == 0x8))
2594 /* Saw a '#'. */
2595 if (operandP->vop_short == ' ')
2597 /* We must chose S^ or I^. */
2598 if (expP->X_add_number > 0)
2600 /* Bignum: Short literal impossible. */
2601 operandP->vop_short = 'i';
2602 operandP->vop_mode = 8;
2603 operandP->vop_reg = 0xF; /* VAX PC. */
2605 else
2607 /* Flonum: Try to do it. */
2608 if (can_be_short)
2610 operandP->vop_short = 's';
2611 operandP->vop_mode = 0;
2612 operandP->vop_ndx = -1;
2613 operandP->vop_reg = -1;
2614 expP->X_op = O_constant;
2616 else
2618 operandP->vop_short = 'i';
2619 operandP->vop_mode = 8;
2620 operandP->vop_reg = 0xF; /* VAX PC */
2622 } /* bignum or flonum ? */
2623 } /* if #, but no S^ or I^ seen. */
2624 /* No more ' ' case: either 's' or 'i'. */
2625 if (operandP->vop_short == 's')
2627 /* Wants to be a short literal. */
2628 if (expP->X_add_number > 0)
2630 as_warn (_("Bignum not permitted in short literal. Immediate mode assumed."));
2631 operandP->vop_short = 'i';
2632 operandP->vop_mode = 8;
2633 operandP->vop_reg = 0xF; /* VAX PC. */
2635 else
2637 if (!can_be_short)
2639 as_warn (_("Can't do flonum short literal: immediate mode used."));
2640 operandP->vop_short = 'i';
2641 operandP->vop_mode = 8;
2642 operandP->vop_reg = 0xF; /* VAX PC. */
2644 else
2646 /* Encode short literal now. */
2647 int temp = 0;
2649 switch (-expP->X_add_number)
2651 case 'f':
2652 case 'd':
2653 temp = literal_float[0] >> 4;
2654 break;
2656 case 'g':
2657 temp = literal_float[0] >> 1;
2658 break;
2660 case 'h':
2661 temp = ((literal_float[0] << 3) & 070)
2662 | ((literal_float[1] >> 13) & 07);
2663 break;
2665 default:
2666 BAD_CASE (-expP->X_add_number);
2667 break;
2670 floatP->low[0] = temp & 077;
2671 floatP->low[1] = 0;
2675 else
2677 /* I^# seen: set it up if float. */
2678 if (expP->X_add_number < 0)
2680 memcpy (floatP->low, literal_float, sizeof (literal_float));
2682 } /* if S^# seen. */
2684 else
2686 as_warn (_("A bignum/flonum may not be a displacement: 0x%lx used"),
2687 (expP->X_add_number = 0x80000000L));
2688 /* Chosen so luser gets the most offset bits to patch later. */
2690 expP->X_add_number = floatP->low[0]
2691 | ((LITTLENUM_MASK & (floatP->low[1])) << LITTLENUM_NUMBER_OF_BITS);
2693 /* For the O_big case we have:
2694 If vop_short == 's' then a short floating literal is in the
2695 lowest 6 bits of floatP -> low [0], which is
2696 big_operand_bits [---] [0].
2697 If vop_short == 'i' then the appropriate number of elements
2698 of big_operand_bits [---] [...] are set up with the correct
2699 bits.
2700 Also, just in case width is byte word or long, we copy the lowest
2701 32 bits of the number to X_add_number. */
2702 break;
2704 if (input_line_pointer != operandP->vop_expr_end + 1)
2706 as_fatal ("Junk at end of expression \"%s\"", input_line_pointer);
2707 goofed = 1;
2709 operandP->vop_expr_end[1] = c_save;
2713 input_line_pointer = save_input_line_pointer;
2715 if (need_pass_2 || goofed)
2716 return;
2718 dwarf2_emit_insn (0);
2719 /* Emit op-code. */
2720 /* Remember where it is, in case we want to modify the op-code later. */
2721 opcode_low_byteP = frag_more (v.vit_opcode_nbytes);
2722 memcpy (opcode_low_byteP, v.vit_opcode, v.vit_opcode_nbytes);
2723 opcode_as_chars = v.vit_opcode;
2724 opcode_as_number = md_chars_to_number ((unsigned char *) opcode_as_chars, 4);
2725 for (operandP = v.vit_operand,
2726 expP = exp_of_operand,
2727 segP = seg_of_operand,
2728 floatP = float_operand,
2729 end_operandP = v.vit_operand + v.vit_operands;
2731 operandP < end_operandP;
2733 operandP++,
2734 floatP++,
2735 segP++,
2736 expP++)
2738 if (operandP->vop_ndx >= 0)
2740 /* Indexed addressing byte. */
2741 /* Legality of indexed mode already checked: it is OK. */
2742 FRAG_APPEND_1_CHAR (0x40 + operandP->vop_ndx);
2743 } /* if(vop_ndx>=0) */
2745 /* Here to make main operand frag(s). */
2746 this_add_number = expP->X_add_number;
2747 this_add_symbol = expP->X_add_symbol;
2748 to_seg = *segP;
2749 is_undefined = (to_seg == undefined_section);
2750 is_absolute = (to_seg == absolute_section);
2751 at = operandP->vop_mode & 1;
2752 length = (operandP->vop_short == 'b'
2753 ? 1 : (operandP->vop_short == 'w'
2754 ? 2 : (operandP->vop_short == 'l'
2755 ? 4 : 0)));
2756 nbytes = operandP->vop_nbytes;
2757 if (operandP->vop_access == 'b')
2759 if (to_seg == now_seg || is_undefined)
2761 /* If is_undefined, then it might BECOME now_seg. */
2762 if (nbytes)
2764 p = frag_more (nbytes);
2765 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2766 this_add_symbol, this_add_number, 1, NO_RELOC);
2768 else
2770 /* to_seg==now_seg || to_seg == SEG_UNKNOWN */
2771 /* nbytes==0 */
2772 length_code = is_undefined ? STATE_UNDF : STATE_BYTE;
2773 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2775 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2777 /* br or jsb */
2778 frag_var (rs_machine_dependent, 5, 1,
2779 ENCODE_RELAX (STATE_ALWAYS_BRANCH, length_code),
2780 this_add_symbol, this_add_number,
2781 opcode_low_byteP);
2783 else
2785 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2787 length_code = STATE_WORD;
2788 /* JF: There is no state_byte for this one! */
2789 frag_var (rs_machine_dependent, 10, 2,
2790 ENCODE_RELAX (STATE_COMPLEX_BRANCH, length_code),
2791 this_add_symbol, this_add_number,
2792 opcode_low_byteP);
2794 else
2796 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2797 frag_var (rs_machine_dependent, 9, 1,
2798 ENCODE_RELAX (STATE_COMPLEX_HOP, length_code),
2799 this_add_symbol, this_add_number,
2800 opcode_low_byteP);
2804 else
2806 know (operandP->vop_width == VAX_WIDTH_CONDITIONAL_JUMP);
2807 frag_var (rs_machine_dependent, 7, 1,
2808 ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, length_code),
2809 this_add_symbol, this_add_number,
2810 opcode_low_byteP);
2814 else
2816 /* to_seg != now_seg && to_seg != SEG_UNKNOWN */
2817 /* --- SEG FLOAT MAY APPEAR HERE --- */
2818 if (is_absolute)
2820 if (nbytes)
2822 know (!(opcode_as_number & VIT_OPCODE_SYNTHETIC));
2823 p = frag_more (nbytes);
2824 /* Conventional relocation. */
2825 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2826 section_symbol (absolute_section),
2827 this_add_number, 1, NO_RELOC);
2829 else
2831 know (opcode_as_number & VIT_OPCODE_SYNTHETIC);
2832 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2834 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2836 /* br or jsb */
2837 *opcode_low_byteP = opcode_as_chars[0] + VAX_WIDEN_LONG;
2838 know (opcode_as_chars[1] == 0);
2839 p = frag_more (5);
2840 p[0] = VAX_ABSOLUTE_MODE; /* @#... */
2841 md_number_to_chars (p + 1, this_add_number, 4);
2842 /* Now (eg) JMP @#foo or JSB @#foo. */
2844 else
2846 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2848 p = frag_more (10);
2849 p[0] = 2;
2850 p[1] = 0;
2851 p[2] = VAX_BRB;
2852 p[3] = 6;
2853 p[4] = VAX_JMP;
2854 p[5] = VAX_ABSOLUTE_MODE; /* @#... */
2855 md_number_to_chars (p + 6, this_add_number, 4);
2856 /* Now (eg) ACBx 1f
2857 BRB 2f
2858 1: JMP @#foo
2859 2: */
2861 else
2863 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2864 p = frag_more (9);
2865 p[0] = 2;
2866 p[1] = VAX_BRB;
2867 p[2] = 6;
2868 p[3] = VAX_JMP;
2869 p[4] = VAX_ABSOLUTE_MODE; /* @#... */
2870 md_number_to_chars (p + 5, this_add_number, 4);
2871 /* Now (eg) xOBxxx 1f
2872 BRB 2f
2873 1: JMP @#foo
2874 2: */
2878 else
2880 /* b<cond> */
2881 *opcode_low_byteP ^= 1;
2882 /* To reverse the condition in a VAX branch,
2883 complement the lowest order bit. */
2884 p = frag_more (7);
2885 p[0] = 6;
2886 p[1] = VAX_JMP;
2887 p[2] = VAX_ABSOLUTE_MODE; /* @#... */
2888 md_number_to_chars (p + 3, this_add_number, 4);
2889 /* Now (eg) BLEQ 1f
2890 JMP @#foo
2891 1: */
2895 else
2897 /* to_seg != now_seg && !is_undefinfed && !is_absolute */
2898 if (nbytes > 0)
2900 /* Pc-relative. Conventional relocation. */
2901 know (!(opcode_as_number & VIT_OPCODE_SYNTHETIC));
2902 p = frag_more (nbytes);
2903 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2904 section_symbol (absolute_section),
2905 this_add_number, 1, NO_RELOC);
2907 else
2909 know (opcode_as_number & VIT_OPCODE_SYNTHETIC);
2910 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2912 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2914 /* br or jsb */
2915 know (opcode_as_chars[1] == 0);
2916 *opcode_low_byteP = opcode_as_chars[0] + VAX_WIDEN_LONG;
2917 p = frag_more (5);
2918 p[0] = VAX_PC_RELATIVE_MODE;
2919 fix_new (frag_now,
2920 p + 1 - frag_now->fr_literal, 4,
2921 this_add_symbol,
2922 this_add_number, 1, NO_RELOC);
2923 /* Now eg JMP foo or JSB foo. */
2925 else
2927 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2929 p = frag_more (10);
2930 p[0] = 0;
2931 p[1] = 2;
2932 p[2] = VAX_BRB;
2933 p[3] = 6;
2934 p[4] = VAX_JMP;
2935 p[5] = VAX_PC_RELATIVE_MODE;
2936 fix_new (frag_now,
2937 p + 6 - frag_now->fr_literal, 4,
2938 this_add_symbol,
2939 this_add_number, 1, NO_RELOC);
2940 /* Now (eg) ACBx 1f
2941 BRB 2f
2942 1: JMP foo
2943 2: */
2945 else
2947 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2948 p = frag_more (10);
2949 p[0] = 2;
2950 p[1] = VAX_BRB;
2951 p[2] = 6;
2952 p[3] = VAX_JMP;
2953 p[4] = VAX_PC_RELATIVE_MODE;
2954 fix_new (frag_now,
2955 p + 5 - frag_now->fr_literal,
2956 4, this_add_symbol,
2957 this_add_number, 1, NO_RELOC);
2958 /* Now (eg) xOBxxx 1f
2959 BRB 2f
2960 1: JMP foo
2961 2: */
2965 else
2967 know (operandP->vop_width == VAX_WIDTH_CONDITIONAL_JUMP);
2968 *opcode_low_byteP ^= 1; /* Reverse branch condition. */
2969 p = frag_more (7);
2970 p[0] = 6;
2971 p[1] = VAX_JMP;
2972 p[2] = VAX_PC_RELATIVE_MODE;
2973 fix_new (frag_now, p + 3 - frag_now->fr_literal,
2974 4, this_add_symbol,
2975 this_add_number, 1, NO_RELOC);
2981 else
2983 /* So it is ordinary operand. */
2984 know (operandP->vop_access != 'b');
2985 /* ' ' target-independent: elsewhere. */
2986 know (operandP->vop_access != ' ');
2987 know (operandP->vop_access == 'a'
2988 || operandP->vop_access == 'm'
2989 || operandP->vop_access == 'r'
2990 || operandP->vop_access == 'v'
2991 || operandP->vop_access == 'w');
2992 if (operandP->vop_short == 's')
2994 if (is_absolute)
2996 if (this_add_number >= 64)
2998 as_warn (_("Short literal overflow(%ld.), immediate mode assumed."),
2999 (long) this_add_number);
3000 operandP->vop_short = 'i';
3001 operandP->vop_mode = 8;
3002 operandP->vop_reg = 0xF;
3005 else
3007 as_warn (_("Forced short literal to immediate mode. now_seg=%s to_seg=%s"),
3008 segment_name (now_seg), segment_name (to_seg));
3009 operandP->vop_short = 'i';
3010 operandP->vop_mode = 8;
3011 operandP->vop_reg = 0xF;
3014 if (operandP->vop_reg >= 0 && (operandP->vop_mode < 8
3015 || (operandP->vop_reg != 0xF && operandP->vop_mode < 10)))
3017 /* One byte operand. */
3018 know (operandP->vop_mode > 3);
3019 FRAG_APPEND_1_CHAR (operandP->vop_mode << 4 | operandP->vop_reg);
3020 /* All 1-bytes except S^# happen here. */
3022 else
3024 /* {@}{q^}foo{(Rn)} or S^#foo */
3025 if (operandP->vop_reg == -1 && operandP->vop_short != 's')
3027 /* "{@}{q^}foo" */
3028 if (to_seg == now_seg)
3030 if (length == 0)
3032 know (operandP->vop_short == ' ');
3033 length_code = STATE_BYTE;
3034 #ifdef OBJ_ELF
3035 if (S_IS_EXTERNAL (this_add_symbol)
3036 || S_IS_WEAK (this_add_symbol))
3037 length_code = STATE_UNDF;
3038 #endif
3039 p = frag_var (rs_machine_dependent, 10, 2,
3040 ENCODE_RELAX (STATE_PC_RELATIVE, length_code),
3041 this_add_symbol, this_add_number,
3042 opcode_low_byteP);
3043 know (operandP->vop_mode == 10 + at);
3044 *p = at << 4;
3045 /* At is the only context we need to carry
3046 to other side of relax() process. Must
3047 be in the correct bit position of VAX
3048 operand spec. byte. */
3050 else
3052 know (length);
3053 know (operandP->vop_short != ' ');
3054 p = frag_more (length + 1);
3055 p[0] = 0xF | ((at + "?\12\14?\16"[length]) << 4);
3056 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3057 length, this_add_symbol,
3058 this_add_number, 1, NO_RELOC);
3061 else
3063 /* to_seg != now_seg */
3064 if (this_add_symbol == NULL)
3066 know (is_absolute);
3067 /* Do @#foo: simpler relocation than foo-.(pc) anyway. */
3068 p = frag_more (5);
3069 p[0] = VAX_ABSOLUTE_MODE; /* @#... */
3070 md_number_to_chars (p + 1, this_add_number, 4);
3071 if (length && length != 4)
3072 as_warn (_("Length specification ignored. Address mode 9F used"));
3074 else
3076 /* {@}{q^}other_seg */
3077 know ((length == 0 && operandP->vop_short == ' ')
3078 || (length > 0 && operandP->vop_short != ' '));
3079 if (is_undefined
3080 #ifdef OBJ_ELF
3081 || S_IS_WEAK(this_add_symbol)
3082 || S_IS_EXTERNAL(this_add_symbol)
3083 #endif
3086 switch (length)
3088 default: length_code = STATE_UNDF; break;
3089 case 1: length_code = STATE_BYTE; break;
3090 case 2: length_code = STATE_WORD; break;
3091 case 4: length_code = STATE_LONG; break;
3093 /* We have a SEG_UNKNOWN symbol. It might
3094 turn out to be in the same segment as
3095 the instruction, permitting relaxation. */
3096 p = frag_var (rs_machine_dependent, 5, 2,
3097 ENCODE_RELAX (STATE_PC_RELATIVE, length_code),
3098 this_add_symbol, this_add_number,
3099 opcode_low_byteP);
3100 p[0] = at << 4;
3102 else
3104 if (length == 0)
3106 know (operandP->vop_short == ' ');
3107 length = 4; /* Longest possible. */
3109 p = frag_more (length + 1);
3110 p[0] = 0xF | ((at + "?\12\14?\16"[length]) << 4);
3111 md_number_to_chars (p + 1, this_add_number, length);
3112 fix_new (frag_now,
3113 p + 1 - frag_now->fr_literal,
3114 length, this_add_symbol,
3115 this_add_number, 1, NO_RELOC);
3120 else
3122 /* {@}{q^}foo(Rn) or S^# or I^# or # */
3123 if (operandP->vop_mode < 0xA)
3125 /* # or S^# or I^# */
3126 if (operandP->vop_access == 'v'
3127 || operandP->vop_access == 'a')
3129 if (operandP->vop_access == 'v')
3130 as_warn (_("Invalid operand: immediate value used as base address."));
3131 else
3132 as_warn (_("Invalid operand: immediate value used as address."));
3133 /* gcc 2.6.3 is known to generate these in at least
3134 one case. */
3136 if (length == 0
3137 && is_absolute && (expP->X_op != O_big)
3138 && operandP->vop_mode == 8 /* No '@'. */
3139 && this_add_number < 64)
3141 operandP->vop_short = 's';
3143 if (operandP->vop_short == 's')
3145 FRAG_APPEND_1_CHAR (this_add_number);
3147 else
3149 /* I^#... */
3150 know (nbytes);
3151 p = frag_more (nbytes + 1);
3152 know (operandP->vop_reg == 0xF);
3153 #ifdef OBJ_ELF
3154 if (flag_want_pic && operandP->vop_mode == 8
3155 && this_add_symbol != NULL)
3157 as_warn (_("Symbol %s used as immediate operand in PIC mode."),
3158 S_GET_NAME (this_add_symbol));
3160 #endif
3161 p[0] = (operandP->vop_mode << 4) | 0xF;
3162 if ((is_absolute) && (expP->X_op != O_big))
3164 /* If nbytes > 4, then we are scrod. We
3165 don't know if the high order bytes
3166 are to be 0xFF or 0x00. BSD4.2 & RMS
3167 say use 0x00. OK --- but this
3168 assembler needs ANOTHER rewrite to
3169 cope properly with this bug. */
3170 md_number_to_chars (p + 1, this_add_number,
3171 min (sizeof (valueT),
3172 (size_t) nbytes));
3173 if ((size_t) nbytes > sizeof (valueT))
3174 memset (p + 1 + sizeof (valueT),
3175 '\0', nbytes - sizeof (valueT));
3177 else
3179 if (expP->X_op == O_big)
3181 /* Problem here is to get the bytes
3182 in the right order. We stored
3183 our constant as LITTLENUMs, not
3184 bytes. */
3185 LITTLENUM_TYPE *lP;
3187 lP = floatP->low;
3188 if (nbytes & 1)
3190 know (nbytes == 1);
3191 p[1] = *lP;
3193 else
3195 for (p++; nbytes; nbytes -= 2, p += 2, lP++)
3196 md_number_to_chars (p, *lP, 2);
3199 else
3201 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3202 nbytes, this_add_symbol,
3203 this_add_number, 0, NO_RELOC);
3208 else
3210 /* {@}{q^}foo(Rn) */
3211 know ((length == 0 && operandP->vop_short == ' ')
3212 || (length > 0 && operandP->vop_short != ' '));
3213 if (length == 0)
3215 if (is_absolute)
3217 long test;
3219 test = this_add_number;
3221 if (test < 0)
3222 test = ~test;
3224 length = test & 0xffff8000 ? 4
3225 : test & 0xffffff80 ? 2
3226 : 1;
3228 else
3230 length = 4;
3233 p = frag_more (1 + length);
3234 know (operandP->vop_reg >= 0);
3235 p[0] = operandP->vop_reg
3236 | ((at | "?\12\14?\16"[length]) << 4);
3237 if (is_absolute)
3239 md_number_to_chars (p + 1, this_add_number, length);
3241 else
3243 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3244 length, this_add_symbol,
3245 this_add_number, 0, NO_RELOC);
3254 void
3255 md_begin (void)
3257 FLONUM_TYPE *fP;
3258 int i;
3260 vip_begin (1, "$", "*", "`");
3262 for (i = 0, fP = float_operand;
3263 fP < float_operand + VIT_MAX_OPERANDS;
3264 i++, fP++)
3266 fP->low = &big_operand_bits[i][0];
3267 fP->high = &big_operand_bits[i][SIZE_OF_LARGE_NUMBER - 1];
3271 bfd_reloc_code_real_type
3272 vax_cons (expressionS *exp, int size)
3274 char *save;
3275 const char *vax_cons_special_reloc;
3277 SKIP_WHITESPACE ();
3278 vax_cons_special_reloc = NULL;
3279 save = input_line_pointer;
3280 if (input_line_pointer[0] == '%')
3282 if (startswith (input_line_pointer + 1, "pcrel"))
3284 input_line_pointer += 6;
3285 vax_cons_special_reloc = "pcrel";
3287 if (vax_cons_special_reloc)
3289 int bad = 0;
3291 switch (size)
3293 case 1:
3294 if (*input_line_pointer != '8')
3295 bad = 1;
3296 input_line_pointer--;
3297 break;
3298 case 2:
3299 if (input_line_pointer[0] != '1' || input_line_pointer[1] != '6')
3300 bad = 1;
3301 break;
3302 case 4:
3303 if (input_line_pointer[0] != '3' || input_line_pointer[1] != '2')
3304 bad = 1;
3305 break;
3306 default:
3307 bad = 1;
3308 break;
3311 if (bad)
3313 as_bad (_("Illegal operands: Only %%r_%s%d allowed in %d-byte data fields"),
3314 vax_cons_special_reloc, size * 8, size);
3316 else
3318 input_line_pointer += 2;
3319 if (*input_line_pointer != '(')
3321 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3322 vax_cons_special_reloc, size * 8);
3323 bad = 1;
3327 if (bad)
3329 input_line_pointer = save;
3330 vax_cons_special_reloc = NULL;
3332 else
3334 int c;
3335 char *end = ++input_line_pointer;
3336 int npar = 0;
3338 while (! is_end_of_line[(c = *end)])
3340 if (c == '(')
3341 npar++;
3342 else if (c == ')')
3344 if (!npar)
3345 break;
3346 npar--;
3348 end++;
3351 if (c != ')')
3352 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3353 vax_cons_special_reloc, size * 8);
3354 else
3356 *end = '\0';
3357 expression (exp);
3358 *end = c;
3359 if (input_line_pointer != end)
3361 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3362 vax_cons_special_reloc, size * 8);
3364 else
3366 input_line_pointer++;
3367 SKIP_WHITESPACE ();
3368 c = *input_line_pointer;
3369 if (! is_end_of_line[c] && c != ',')
3370 as_bad (_("Illegal operands: garbage after %%r_%s%d()"),
3371 vax_cons_special_reloc, size * 8);
3377 if (vax_cons_special_reloc == NULL)
3378 expression (exp);
3379 else
3380 switch (size)
3382 case 1: return BFD_RELOC_8_PCREL;
3383 case 2: return BFD_RELOC_16_PCREL;
3384 case 4: return BFD_RELOC_32_PCREL;
3386 return NO_RELOC;
3389 /* This is called by emit_expr via TC_CONS_FIX_NEW when creating a
3390 reloc for a cons. */
3392 void
3393 vax_cons_fix_new (fragS *frag, int where, unsigned int nbytes, expressionS *exp,
3394 bfd_reloc_code_real_type r)
3396 if (r == NO_RELOC)
3397 r = (nbytes == 1 ? BFD_RELOC_8
3398 : nbytes == 2 ? BFD_RELOC_16
3399 : BFD_RELOC_32);
3401 fix_new_exp (frag, where, (int) nbytes, exp, 0, r);
3404 const char *
3405 md_atof (int type, char * litP, int * sizeP)
3407 return vax_md_atof (type, litP, sizeP);