[gdb/build] Fix enum param_types odr violation
[binutils-gdb.git] / gas / config / tc-vax.c
blob8450bc11257082f3c9d9ee9ce79d7a91471bd44d
1 /* tc-vax.c - vax-specific -
2 Copyright (C) 1987-2023 Free Software Foundation, Inc.
4 This file is part of GAS, the GNU Assembler.
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
21 #include "as.h"
23 #include "vax-inst.h"
24 #include "obstack.h" /* For FRAG_APPEND_1_CHAR macro in "frags.h" */
25 #include "subsegs.h"
26 #include "safe-ctype.h"
28 #ifdef OBJ_ELF
29 #include "elf/vax.h"
30 #endif
32 /* These chars start a comment anywhere in a source file (except inside
33 another comment */
34 const char comment_chars[] = "#";
36 /* These chars only start a comment at the beginning of a line. */
37 /* Note that for the VAX the are the same as comment_chars above. */
38 const char line_comment_chars[] = "#";
40 const char line_separator_chars[] = ";";
42 /* Chars that can be used to separate mant from exp in floating point nums. */
43 const char EXP_CHARS[] = "eE";
45 /* Chars that mean this number is a floating point constant
46 as in 0f123.456
47 or 0H1.234E-12 (see exp chars above). */
48 const char FLT_CHARS[] = "dDfFgGhH";
50 /* Also be aware that MAXIMUM_NUMBER_OF_CHARS_FOR_FLOAT may have to be
51 changed in read.c . Ideally it shouldn't have to know about it at all,
52 but nothing is ideal around here. */
54 /* Hold details of an operand expression. */
55 static expressionS exp_of_operand[VIT_MAX_OPERANDS];
56 static segT seg_of_operand[VIT_MAX_OPERANDS];
58 /* A vax instruction after decoding. */
59 static struct vit v;
61 /* Hold details of big operands. */
62 LITTLENUM_TYPE big_operand_bits[VIT_MAX_OPERANDS][SIZE_OF_LARGE_NUMBER];
63 FLONUM_TYPE float_operand[VIT_MAX_OPERANDS];
64 /* Above is made to point into big_operand_bits by md_begin(). */
66 #ifdef OBJ_ELF
67 #define GLOBAL_OFFSET_TABLE_NAME "_GLOBAL_OFFSET_TABLE_"
68 #define PROCEDURE_LINKAGE_TABLE_NAME "_PROCEDURE_LINKAGE_TABLE_"
69 symbolS *GOT_symbol; /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
70 symbolS *PLT_symbol; /* Pre-defined "_PROCEDURE_LINKAGE_TABLE_". */
71 #endif
73 int flag_hash_long_names; /* -+ */
74 int flag_one; /* -1 */
75 int flag_show_after_trunc; /* -H */
76 int flag_no_hash_mixed_case; /* -h NUM */
77 #ifdef OBJ_ELF
78 int flag_want_pic; /* -k */
79 #endif
81 /* For VAX, relative addresses of "just the right length" are easy.
82 The branch displacement is always the last operand, even in
83 synthetic instructions.
84 For VAX, we encode the relax_substateTs (in e.g. fr_substate) as:
86 4 3 2 1 0 bit number
87 ---/ /--+-------+-------+-------+-------+-------+
88 | what state ? | how long ? |
89 ---/ /--+-------+-------+-------+-------+-------+
91 The "how long" bits are 00=byte, 01=word, 10=long.
92 This is a Un*x convention.
93 Not all lengths are legit for a given value of (what state).
94 The "how long" refers merely to the displacement length.
95 The address usually has some constant bytes in it as well.
97 groups for VAX address relaxing.
99 1. "foo" pc-relative.
100 length of byte, word, long
102 2a. J<cond> where <cond> is a simple flag test.
103 length of byte, word, long.
104 VAX opcodes are: (Hex)
105 bneq/bnequ 12
106 beql/beqlu 13
107 bgtr 14
108 bleq 15
109 bgeq 18
110 blss 19
111 bgtru 1a
112 blequ 1b
113 bvc 1c
114 bvs 1d
115 bgequ/bcc 1e
116 blssu/bcs 1f
117 Always, you complement 0th bit to reverse condition.
118 Always, 1-byte opcode, then 1-byte displacement.
120 2b. J<cond> where cond tests a memory bit.
121 length of byte, word, long.
122 Vax opcodes are: (Hex)
123 bbs e0
124 bbc e1
125 bbss e2
126 bbcs e3
127 bbsc e4
128 bbcc e5
129 Always, you complement 0th bit to reverse condition.
130 Always, 1-byte opcode, longword-address, byte-address, 1-byte-displacement
132 2c. J<cond> where cond tests low-order memory bit
133 length of byte,word,long.
134 Vax opcodes are: (Hex)
135 blbs e8
136 blbc e9
137 Always, you complement 0th bit to reverse condition.
138 Always, 1-byte opcode, longword-address, 1-byte displacement.
140 3. Jbs/Jbr.
141 length of byte,word,long.
142 Vax opcodes are: (Hex)
143 bsbb 10
144 brb 11
145 These are like (2) but there is no condition to reverse.
146 Always, 1 byte opcode, then displacement/absolute.
148 4a. JacbX
149 length of word, long.
150 Vax opcodes are: (Hex)
151 acbw 3d
152 acbf 4f
153 acbd 6f
154 abcb 9d
155 acbl f1
156 acbg 4ffd
157 acbh 6ffd
158 Always, we cannot reverse the sense of the branch; we have a word
159 displacement.
160 The double-byte op-codes don't hurt: we never want to modify the
161 opcode, so we don't care how many bytes are between the opcode and
162 the operand.
164 4b. JXobXXX
165 length of long, long, byte.
166 Vax opcodes are: (Hex)
167 aoblss f2
168 aobleq f3
169 sobgeq f4
170 sobgtr f5
171 Always, we cannot reverse the sense of the branch; we have a byte
172 displacement.
174 The only time we need to modify the opcode is for class 2 instructions.
175 After relax() we may complement the lowest order bit of such instruction
176 to reverse sense of branch.
178 For class 2 instructions, we store context of "where is the opcode literal".
179 We can change an opcode's lowest order bit without breaking anything else.
181 We sometimes store context in the operand literal. This way we can figure out
182 after relax() what the original addressing mode was. */
184 /* These displacements are relative to the start address of the
185 displacement. The first letter is Byte, Word. 2nd letter is
186 Forward, Backward. */
187 #define BF (1+ 127)
188 #define BB (1+-128)
189 #define WF (2+ 32767)
190 #define WB (2+-32768)
191 /* Don't need LF, LB because they always reach. [They are coded as 0.] */
193 #define C(a,b) ENCODE_RELAX(a,b)
194 /* This macro has no side-effects. */
195 #define ENCODE_RELAX(what,length) (((what) << 2) + (length))
196 #define RELAX_STATE(s) ((s) >> 2)
197 #define RELAX_LENGTH(s) ((s) & 3)
199 const relax_typeS md_relax_table[] =
201 {1, 1, 0, 0}, /* error sentinel 0,0 */
202 {1, 1, 0, 0}, /* unused 0,1 */
203 {1, 1, 0, 0}, /* unused 0,2 */
204 {1, 1, 0, 0}, /* unused 0,3 */
206 {BF + 1, BB + 1, 2, C (1, 1)},/* B^"foo" 1,0 */
207 {WF + 1, WB + 1, 3, C (1, 2)},/* W^"foo" 1,1 */
208 {0, 0, 5, 0}, /* L^"foo" 1,2 */
209 {1, 1, 0, 0}, /* unused 1,3 */
211 {BF, BB, 1, C (2, 1)}, /* b<cond> B^"foo" 2,0 */
212 {WF + 2, WB + 2, 4, C (2, 2)},/* br.+? brw X 2,1 */
213 {0, 0, 7, 0}, /* br.+? jmp X 2,2 */
214 {1, 1, 0, 0}, /* unused 2,3 */
216 {BF, BB, 1, C (3, 1)}, /* brb B^foo 3,0 */
217 {WF, WB, 2, C (3, 2)}, /* brw W^foo 3,1 */
218 {0, 0, 5, 0}, /* Jmp L^foo 3,2 */
219 {1, 1, 0, 0}, /* unused 3,3 */
221 {1, 1, 0, 0}, /* unused 4,0 */
222 {WF, WB, 2, C (4, 2)}, /* acb_ ^Wfoo 4,1 */
223 {0, 0, 10, 0}, /* acb_,br,jmp L^foo4,2 */
224 {1, 1, 0, 0}, /* unused 4,3 */
226 {BF, BB, 1, C (5, 1)}, /* Xob___,,foo 5,0 */
227 {WF + 4, WB + 4, 6, C (5, 2)},/* Xob.+2,brb.+3,brw5,1 */
228 {0, 0, 9, 0}, /* Xob.+2,brb.+6,jmp5,2 */
229 {1, 1, 0, 0}, /* unused 5,3 */
232 #undef C
233 #undef BF
234 #undef BB
235 #undef WF
236 #undef WB
238 void float_cons (int);
239 int flonum_gen2vax (int, FLONUM_TYPE *, LITTLENUM_TYPE *);
241 const pseudo_typeS md_pseudo_table[] =
243 {"dfloat", float_cons, 'd'},
244 {"ffloat", float_cons, 'f'},
245 {"gfloat", float_cons, 'g'},
246 {"hfloat", float_cons, 'h'},
247 {"d_floating", float_cons, 'd'},
248 {"f_floating", float_cons, 'f'},
249 {"g_floating", float_cons, 'g'},
250 {"h_floating", float_cons, 'h'},
251 {NULL, NULL, 0},
254 #define STATE_PC_RELATIVE (1)
255 #define STATE_CONDITIONAL_BRANCH (2)
256 #define STATE_ALWAYS_BRANCH (3) /* includes BSB... */
257 #define STATE_COMPLEX_BRANCH (4)
258 #define STATE_COMPLEX_HOP (5)
260 #define STATE_BYTE (0)
261 #define STATE_WORD (1)
262 #define STATE_LONG (2)
263 #define STATE_UNDF (3) /* Symbol undefined in pass1. */
265 #define min(a, b) ((a) < (b) ? (a) : (b))
267 void
268 md_number_to_chars (char con[], valueT value, int nbytes)
270 number_to_chars_littleendian (con, value, nbytes);
273 /* Fix up some data or instructions after we find out the value of a symbol
274 that they reference. */
276 void /* Knows about order of bytes in address. */
277 md_apply_fix (fixS *fixP, valueT *valueP, segT seg ATTRIBUTE_UNUSED)
279 valueT value = * valueP;
281 if (fixP->fx_subsy != (symbolS *) NULL)
282 as_bad_subtract (fixP);
284 if (fixP->fx_addsy == NULL)
285 fixP->fx_done = 1;
287 if (fixP->fx_done)
288 number_to_chars_littleendian (fixP->fx_where + fixP->fx_frag->fr_literal,
289 value, fixP->fx_size);
290 else
291 /* Initialise the part of an instruction frag covered by the
292 relocation. (Many occurrences of frag_more followed by fix_new
293 lack any init of the frag.) Since VAX uses RELA relocs the
294 value we write into this field doesn't really matter. */
295 memset (fixP->fx_where + fixP->fx_frag->fr_literal, 0, fixP->fx_size);
298 /* Convert a number from VAX byte order (little endian)
299 into host byte order.
300 con is the buffer to convert,
301 nbytes is the length of the given buffer. */
302 static long
303 md_chars_to_number (unsigned char con[], int nbytes)
305 long retval;
307 for (retval = 0, con += nbytes - 1; nbytes--; con--)
309 retval <<= BITS_PER_CHAR;
310 retval |= *con;
312 return retval;
315 /* Copy a bignum from in to out.
316 If the output is shorter than the input, copy lower-order
317 littlenums. Return 0 or the number of significant littlenums
318 dropped. Assumes littlenum arrays are densely packed: no unused
319 chars between the littlenums. Uses memcpy() to move littlenums, and
320 wants to know length (in chars) of the input bignum. */
322 static int
323 bignum_copy (LITTLENUM_TYPE *in,
324 int in_length, /* in sizeof(littlenum)s */
325 LITTLENUM_TYPE *out,
326 int out_length /* in sizeof(littlenum)s */)
328 int significant_littlenums_dropped;
330 if (out_length < in_length)
332 LITTLENUM_TYPE *p; /* -> most significant (non-zero) input
333 littlenum. */
335 memcpy ((void *) out, (void *) in,
336 (unsigned int) out_length << LITTLENUM_SHIFT);
337 for (p = in + in_length - 1; p >= in; --p)
339 if (*p)
340 break;
342 significant_littlenums_dropped = p - in - in_length + 1;
344 if (significant_littlenums_dropped < 0)
345 significant_littlenums_dropped = 0;
347 else
349 memcpy ((char *) out, (char *) in,
350 (unsigned int) in_length << LITTLENUM_SHIFT);
352 if (out_length > in_length)
353 memset ((char *) (out + in_length), '\0',
354 (unsigned int) (out_length - in_length) << LITTLENUM_SHIFT);
356 significant_littlenums_dropped = 0;
359 return significant_littlenums_dropped;
362 /* md_estimate_size_before_relax(), called just before relax().
363 Any symbol that is now undefined will not become defined.
364 Return the correct fr_subtype in the frag and the growth beyond
365 fr_fix. */
367 md_estimate_size_before_relax (fragS *fragP, segT segment)
369 if (RELAX_LENGTH (fragP->fr_subtype) == STATE_UNDF)
371 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
372 #ifdef OBJ_ELF
373 || S_IS_WEAK (fragP->fr_symbol)
374 || S_IS_EXTERNAL (fragP->fr_symbol)
375 #endif
378 /* Non-relaxable cases. */
379 int reloc_type = NO_RELOC;
380 char *p;
381 int old_fr_fix;
383 old_fr_fix = fragP->fr_fix;
384 p = &fragP->fr_literal[0] + old_fr_fix;
385 #ifdef OBJ_ELF
386 /* If this is to an undefined symbol, then if it's an indirect
387 reference indicate that is can mutated into a GLOB_DAT or
388 JUMP_SLOT by the loader. We restrict ourselves to no offset
389 due to a limitation in the NetBSD linker. */
391 if (GOT_symbol == NULL)
392 GOT_symbol = symbol_find (GLOBAL_OFFSET_TABLE_NAME);
393 if (PLT_symbol == NULL)
394 PLT_symbol = symbol_find (PROCEDURE_LINKAGE_TABLE_NAME);
395 if ((GOT_symbol == NULL || fragP->fr_symbol != GOT_symbol)
396 && (PLT_symbol == NULL || fragP->fr_symbol != PLT_symbol)
397 && fragP->fr_symbol != NULL
398 && flag_want_pic
399 && (!S_IS_DEFINED (fragP->fr_symbol)
400 || S_IS_WEAK (fragP->fr_symbol)
401 || S_IS_EXTERNAL (fragP->fr_symbol)))
403 /* Indirect references cannot go through the GOT or PLT,
404 let's hope they'll become local in the final link. */
405 if ((ELF_ST_VISIBILITY (S_GET_OTHER (fragP->fr_symbol))
406 != STV_DEFAULT)
407 || (p[0] & 0x10))
408 reloc_type = BFD_RELOC_32_PCREL;
409 else if (((unsigned char *) fragP->fr_opcode)[0] == VAX_CALLS
410 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_CALLG
411 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_JSB
412 || ((unsigned char *) fragP->fr_opcode)[0] == VAX_JMP
413 || S_IS_FUNCTION (fragP->fr_symbol))
414 reloc_type = BFD_RELOC_32_PLT_PCREL;
415 else
416 reloc_type = BFD_RELOC_32_GOT_PCREL;
418 #endif
419 switch (RELAX_STATE (fragP->fr_subtype))
421 case STATE_PC_RELATIVE:
422 p[0] |= VAX_PC_RELATIVE_MODE; /* Preserve @ bit. */
423 fragP->fr_fix += 1 + 4;
424 fix_new (fragP, old_fr_fix + 1, 4, fragP->fr_symbol,
425 fragP->fr_offset, 1, reloc_type);
426 break;
428 case STATE_CONDITIONAL_BRANCH:
429 *fragP->fr_opcode ^= 1; /* Reverse sense of branch. */
430 p[0] = 6;
431 p[1] = VAX_JMP;
432 p[2] = VAX_PC_RELATIVE_MODE; /* ...(PC) */
433 fragP->fr_fix += 1 + 1 + 1 + 4;
434 fix_new (fragP, old_fr_fix + 3, 4, fragP->fr_symbol,
435 fragP->fr_offset, 1, NO_RELOC);
436 break;
438 case STATE_COMPLEX_BRANCH:
439 p[0] = 2;
440 p[1] = 0;
441 p[2] = VAX_BRB;
442 p[3] = 6;
443 p[4] = VAX_JMP;
444 p[5] = VAX_PC_RELATIVE_MODE; /* ...(pc) */
445 fragP->fr_fix += 2 + 2 + 1 + 1 + 4;
446 fix_new (fragP, old_fr_fix + 6, 4, fragP->fr_symbol,
447 fragP->fr_offset, 1, NO_RELOC);
448 break;
450 case STATE_COMPLEX_HOP:
451 p[0] = 2;
452 p[1] = VAX_BRB;
453 p[2] = 6;
454 p[3] = VAX_JMP;
455 p[4] = VAX_PC_RELATIVE_MODE; /* ...(pc) */
456 fragP->fr_fix += 1 + 2 + 1 + 1 + 4;
457 fix_new (fragP, old_fr_fix + 5, 4, fragP->fr_symbol,
458 fragP->fr_offset, 1, NO_RELOC);
459 break;
461 case STATE_ALWAYS_BRANCH:
462 *fragP->fr_opcode += VAX_WIDEN_LONG;
463 p[0] = VAX_PC_RELATIVE_MODE; /* ...(PC) */
464 fragP->fr_fix += 1 + 4;
465 fix_new (fragP, old_fr_fix + 1, 4, fragP->fr_symbol,
466 fragP->fr_offset, 1, NO_RELOC);
467 break;
469 default:
470 abort ();
472 frag_wane (fragP);
474 /* Return the growth in the fixed part of the frag. */
475 return fragP->fr_fix - old_fr_fix;
478 /* Relaxable cases. Set up the initial guess for the variable
479 part of the frag. */
480 switch (RELAX_STATE (fragP->fr_subtype))
482 case STATE_PC_RELATIVE:
483 fragP->fr_subtype = ENCODE_RELAX (STATE_PC_RELATIVE, STATE_BYTE);
484 break;
485 case STATE_CONDITIONAL_BRANCH:
486 fragP->fr_subtype = ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_BYTE);
487 break;
488 case STATE_COMPLEX_BRANCH:
489 fragP->fr_subtype = ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_WORD);
490 break;
491 case STATE_COMPLEX_HOP:
492 fragP->fr_subtype = ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_BYTE);
493 break;
494 case STATE_ALWAYS_BRANCH:
495 fragP->fr_subtype = ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_BYTE);
496 break;
500 if (fragP->fr_subtype >= sizeof (md_relax_table) / sizeof (md_relax_table[0]))
501 abort ();
503 /* Return the size of the variable part of the frag. */
504 return md_relax_table[fragP->fr_subtype].rlx_length;
507 /* Called after relax() is finished.
508 In: Address of frag.
509 fr_type == rs_machine_dependent.
510 fr_subtype is what the address relaxed to.
512 Out: Any fixSs and constants are set up.
513 Caller will turn frag into a ".space 0". */
514 void
515 md_convert_frag (bfd *headers ATTRIBUTE_UNUSED,
516 segT seg ATTRIBUTE_UNUSED,
517 fragS *fragP)
519 char *addressP; /* -> _var to change. */
520 char *opcodeP; /* -> opcode char(s) to change. */
521 short int extension = 0; /* Size of relaxed address. */
522 /* Added to fr_fix: incl. ALL var chars. */
523 symbolS *symbolP;
524 long where;
526 know (fragP->fr_type == rs_machine_dependent);
527 where = fragP->fr_fix;
528 addressP = &fragP->fr_literal[0] + where;
529 opcodeP = fragP->fr_opcode;
530 symbolP = fragP->fr_symbol;
531 know (symbolP);
533 switch (fragP->fr_subtype)
535 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_BYTE):
536 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
537 addressP[0] |= 0xAF; /* Byte displacement. */
538 fix_new (fragP, fragP->fr_fix + 1, 1, fragP->fr_symbol,
539 fragP->fr_offset, 1, NO_RELOC);
540 extension = 2;
541 break;
543 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_WORD):
544 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
545 addressP[0] |= 0xCF; /* Word displacement. */
546 fix_new (fragP, fragP->fr_fix + 1, 2, fragP->fr_symbol,
547 fragP->fr_offset, 1, NO_RELOC);
548 extension = 3;
549 break;
551 case ENCODE_RELAX (STATE_PC_RELATIVE, STATE_LONG):
552 know (*addressP == 0 || *addressP == 0x10); /* '@' bit. */
553 addressP[0] |= 0xEF; /* Long word displacement. */
554 fix_new (fragP, fragP->fr_fix + 1, 4, fragP->fr_symbol,
555 fragP->fr_offset, 1, NO_RELOC);
556 extension = 5;
557 break;
559 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_BYTE):
560 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
561 fragP->fr_offset, 1, NO_RELOC);
562 extension = 1;
563 break;
565 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_WORD):
566 opcodeP[0] ^= 1; /* Reverse sense of test. */
567 addressP[0] = 3;
568 addressP[1] = VAX_BRW;
569 fix_new (fragP, fragP->fr_fix + 2, 2, fragP->fr_symbol,
570 fragP->fr_offset, 1, NO_RELOC);
571 extension = 4;
572 break;
574 case ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, STATE_LONG):
575 opcodeP[0] ^= 1; /* Reverse sense of test. */
576 addressP[0] = 6;
577 addressP[1] = VAX_JMP;
578 addressP[2] = VAX_PC_RELATIVE_MODE;
579 fix_new (fragP, fragP->fr_fix + 3, 4, fragP->fr_symbol,
580 fragP->fr_offset, 1, NO_RELOC);
581 extension = 7;
582 break;
584 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_BYTE):
585 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
586 fragP->fr_offset, 1, NO_RELOC);
587 extension = 1;
588 break;
590 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_WORD):
591 opcodeP[0] += VAX_WIDEN_WORD; /* brb -> brw, bsbb -> bsbw */
592 fix_new (fragP, fragP->fr_fix, 2, fragP->fr_symbol, fragP->fr_offset,
593 1, NO_RELOC);
594 extension = 2;
595 break;
597 case ENCODE_RELAX (STATE_ALWAYS_BRANCH, STATE_LONG):
598 opcodeP[0] += VAX_WIDEN_LONG; /* brb -> jmp, bsbb -> jsb */
599 addressP[0] = VAX_PC_RELATIVE_MODE;
600 fix_new (fragP, fragP->fr_fix + 1, 4, fragP->fr_symbol,
601 fragP->fr_offset, 1, NO_RELOC);
602 extension = 5;
603 break;
605 case ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_WORD):
606 fix_new (fragP, fragP->fr_fix, 2, fragP->fr_symbol,
607 fragP->fr_offset, 1, NO_RELOC);
608 extension = 2;
609 break;
611 case ENCODE_RELAX (STATE_COMPLEX_BRANCH, STATE_LONG):
612 addressP[0] = 2;
613 addressP[1] = 0;
614 addressP[2] = VAX_BRB;
615 addressP[3] = 6;
616 addressP[4] = VAX_JMP;
617 addressP[5] = VAX_PC_RELATIVE_MODE;
618 fix_new (fragP, fragP->fr_fix + 6, 4, fragP->fr_symbol,
619 fragP->fr_offset, 1, NO_RELOC);
620 extension = 10;
621 break;
623 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_BYTE):
624 fix_new (fragP, fragP->fr_fix, 1, fragP->fr_symbol,
625 fragP->fr_offset, 1, NO_RELOC);
626 extension = 1;
627 break;
629 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_WORD):
630 addressP[0] = 2;
631 addressP[1] = VAX_BRB;
632 addressP[2] = 3;
633 addressP[3] = VAX_BRW;
634 fix_new (fragP, fragP->fr_fix + 4, 2, fragP->fr_symbol,
635 fragP->fr_offset, 1, NO_RELOC);
636 extension = 6;
637 break;
639 case ENCODE_RELAX (STATE_COMPLEX_HOP, STATE_LONG):
640 addressP[0] = 2;
641 addressP[1] = VAX_BRB;
642 addressP[2] = 6;
643 addressP[3] = VAX_JMP;
644 addressP[4] = VAX_PC_RELATIVE_MODE;
645 fix_new (fragP, fragP->fr_fix + 5, 4, fragP->fr_symbol,
646 fragP->fr_offset, 1, NO_RELOC);
647 extension = 9;
648 break;
650 default:
651 BAD_CASE (fragP->fr_subtype);
652 break;
654 fragP->fr_fix += extension;
657 /* Translate internal format of relocation info into target format.
659 On vax: first 4 bytes are normal unsigned long, next three bytes
660 are symbolnum, least sig. byte first. Last byte is broken up with
661 the upper nibble as nuthin, bit 3 as extern, bits 2 & 1 as length, and
662 bit 0 as pcrel. */
663 #ifdef comment
664 void
665 md_ri_to_chars (char *the_bytes, struct reloc_info_generic ri)
667 /* This is easy. */
668 md_number_to_chars (the_bytes, ri.r_address, sizeof (ri.r_address));
669 /* Now the fun stuff. */
670 the_bytes[6] = (ri.r_symbolnum >> 16) & 0x0ff;
671 the_bytes[5] = (ri.r_symbolnum >> 8) & 0x0ff;
672 the_bytes[4] = ri.r_symbolnum & 0x0ff;
673 the_bytes[7] = (((ri.r_extern << 3) & 0x08) | ((ri.r_length << 1) & 0x06)
674 | ((ri.r_pcrel << 0) & 0x01)) & 0x0F;
677 #endif /* comment */
679 /* BUGS, GRIPES, APOLOGIA, etc.
681 The opcode table 'votstrs' needs to be sorted on opcode frequency.
682 That is, AFTER we hash it with hash_...(), we want most-used opcodes
683 to come out of the hash table faster.
685 I am sorry to inflict yet another VAX assembler on the world, but
686 RMS says we must do everything from scratch, to prevent pin-heads
687 restricting this software.
689 This is a vaguely modular set of routines in C to parse VAX
690 assembly code using DEC mnemonics. It is NOT un*x specific.
692 The idea here is that the assembler has taken care of all:
693 labels
694 macros
695 listing
696 pseudo-ops
697 line continuation
698 comments
699 condensing any whitespace down to exactly one space
700 and all we have to do is parse 1 line into a vax instruction
701 partially formed. We will accept a line, and deliver:
702 an error message (hopefully empty)
703 a skeleton VAX instruction (tree structure)
704 textual pointers to all the operand expressions
705 a warning message that notes a silly operand (hopefully empty)
707 E D I T H I S T O R Y
709 17may86 Dean Elsner. Bug if line ends immediately after opcode.
710 30apr86 Dean Elsner. New vip_op() uses arg block so change call.
711 6jan86 Dean Elsner. Crock vip_begin() to call vip_op_defaults().
712 2jan86 Dean Elsner. Invent synthetic opcodes.
713 Widen vax_opcodeT to 32 bits. Use a bit for VIT_OPCODE_SYNTHETIC,
714 which means this is not a real opcode, it is like a macro; it will
715 be relax()ed into 1 or more instructions.
716 Use another bit for VIT_OPCODE_SPECIAL if the op-code is not optimised
717 like a regular branch instruction. Option added to vip_begin():
718 exclude synthetic opcodes. Invent synthetic_votstrs[].
719 31dec85 Dean Elsner. Invent vit_opcode_nbytes.
720 Also make vit_opcode into a char[]. We now have n-byte vax opcodes,
721 so caller's don't have to know the difference between a 1-byte & a
722 2-byte op-code. Still need vax_opcodeT concept, so we know how
723 big an object must be to hold an op.code.
724 30dec85 Dean Elsner. Widen typedef vax_opcodeT in "vax-inst.h"
725 because vax opcodes may be 16 bits. Our crufty C compiler was
726 happily initialising 8-bit vot_codes with 16-bit numbers!
727 (Wouldn't the 'phone company like to compress data so easily!)
728 29dec85 Dean Elsner. New static table vax_operand_width_size[].
729 Invented so we know hw many bytes a "I^#42" needs in its immediate
730 operand. Revised struct vop in "vax-inst.h": explicitly include
731 byte length of each operand, and it's letter-code datum type.
732 17nov85 Dean Elsner. Name Change.
733 Due to ar(1) truncating names, we learned the hard way that
734 "vax-inst-parse.c" -> "vax-inst-parse." dropping the "o" off
735 the archived object name. SO... we shortened the name of this
736 source file, and changed the makefile. */
738 /* Handle of the OPCODE hash table. */
739 static htab_t op_hash;
741 /* In: 1 character, from "bdfghloqpw" being the data-type of an operand
742 of a vax instruction.
744 Out: the length of an operand of that type, in bytes.
745 Special branch operands types "-?!" have length 0. */
747 static const short int vax_operand_width_size[256] =
749 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
750 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
751 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
752 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
753 0, 0, 1, 0, 8, 0, 4, 8, 16, 0, 0, 0, 4, 0, 0,16, /* ..b.d.fgh...l..o */
754 0, 8, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, /* .q.....w........ */
755 0, 0, 1, 0, 8, 0, 4, 8, 16, 0, 0, 0, 4, 0, 0,16, /* ..b.d.fgh...l..o */
756 0, 8, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, /* .q.....w........ */
757 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
758 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
759 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
760 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
761 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
762 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
763 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
764 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
767 /* This perversion encodes all the vax opcodes as a bunch of strings.
768 RMS says we should build our hash-table at run-time. Hmm.
769 Please would someone arrange these in decreasing frequency of opcode?
770 Because of the way hash_...() works, the most frequently used opcode
771 should be textually first and so on.
773 Input for this table was 'vax.opcodes', awk(1)ed by 'vax.opcodes.c.awk' .
774 So change 'vax.opcodes', then re-generate this table. */
776 #include "opcode/vax.h"
778 /* This is a table of optional op-codes. All of them represent
779 'synthetic' instructions that seem popular.
781 Here we make some pseudo op-codes. Every code has a bit set to say
782 it is synthetic. This lets you catch them if you want to
783 ban these opcodes. They are mnemonics for "elastic" instructions
784 that are supposed to assemble into the fewest bytes needed to do a
785 branch, or to do a conditional branch, or whatever.
787 The opcode is in the usual place [low-order n*8 bits]. This means
788 that if you mask off the bucky bits, the usual rules apply about
789 how long the opcode is.
791 All VAX branch displacements come at the end of the instruction.
792 For simple branches (1-byte opcode + 1-byte displacement) the last
793 operand is coded 'b?' where the "data type" '?' is a clue that we
794 may reverse the sense of the branch (complement lowest order bit)
795 and branch around a jump. This is by far the most common case.
796 That is why the VIT_OPCODE_SYNTHETIC bit is set: it says this is
797 a 0-byte op-code followed by 2 or more bytes of operand address.
799 If the op-code has VIT_OPCODE_SPECIAL set, then we have a more unusual
800 case.
802 For JBSB & JBR the treatment is the similar, except (1) we have a 'bw'
803 option before (2) we can directly JSB/JMP because there is no condition.
804 These operands have 'b-' as their access/data type.
806 That leaves a bunch of random opcodes: JACBx, JxOBxxx. In these
807 cases, we do the same idea. JACBxxx are all marked with a 'b!'
808 JAOBxxx & JSOBxxx are marked with a 'b:'. */
809 #if (VIT_OPCODE_SYNTHETIC != 0x80000000)
810 #error "You have just broken the encoding below, which assumes the sign bit means 'I am an imaginary instruction'."
811 #endif
813 #if (VIT_OPCODE_SPECIAL != 0x40000000)
814 #error "You have just broken the encoding below, which assumes the 0x40 M bit means 'I am not to be "optimised" the way normal branches are'."
815 #endif
817 static const struct vot
818 synthetic_votstrs[] =
820 {"jbsb", {"b-", 0xC0000010}}, /* BSD 4.2 */
821 /* jsb used already */
822 {"jbr", {"b-", 0xC0000011}}, /* BSD 4.2 */
823 {"jr", {"b-", 0xC0000011}}, /* consistent */
824 {"jneq", {"b?", 0x80000012}},
825 {"jnequ", {"b?", 0x80000012}},
826 {"jeql", {"b?", 0x80000013}},
827 {"jeqlu", {"b?", 0x80000013}},
828 {"jgtr", {"b?", 0x80000014}},
829 {"jleq", {"b?", 0x80000015}},
830 /* un-used opcodes here */
831 {"jgeq", {"b?", 0x80000018}},
832 {"jlss", {"b?", 0x80000019}},
833 {"jgtru", {"b?", 0x8000001a}},
834 {"jlequ", {"b?", 0x8000001b}},
835 {"jvc", {"b?", 0x8000001c}},
836 {"jvs", {"b?", 0x8000001d}},
837 {"jgequ", {"b?", 0x8000001e}},
838 {"jcc", {"b?", 0x8000001e}},
839 {"jlssu", {"b?", 0x8000001f}},
840 {"jcs", {"b?", 0x8000001f}},
842 {"jacbw", {"rwrwmwb!", 0xC000003d}},
843 {"jacbf", {"rfrfmfb!", 0xC000004f}},
844 {"jacbd", {"rdrdmdb!", 0xC000006f}},
845 {"jacbb", {"rbrbmbb!", 0xC000009d}},
846 {"jacbl", {"rlrlmlb!", 0xC00000f1}},
847 {"jacbg", {"rgrgmgb!", 0xC0004ffd}},
848 {"jacbh", {"rhrhmhb!", 0xC0006ffd}},
850 {"jbs", {"rlvbb?", 0x800000e0}},
851 {"jbc", {"rlvbb?", 0x800000e1}},
852 {"jbss", {"rlvbb?", 0x800000e2}},
853 {"jbcs", {"rlvbb?", 0x800000e3}},
854 {"jbsc", {"rlvbb?", 0x800000e4}},
855 {"jbcc", {"rlvbb?", 0x800000e5}},
856 {"jbssi", {"rlvbb?", 0x800000e6}},
857 {"jbcci", {"rlvbb?", 0x800000e7}},
858 {"jlbs", {"rlb?", 0x800000e8}},
859 {"jlbc", {"rlb?", 0x800000e9}},
861 {"jaoblss", {"rlmlb:", 0xC00000f2}},
862 {"jaobleq", {"rlmlb:", 0xC00000f3}},
863 {"jsobgeq", {"mlb:", 0xC00000f4}},
864 {"jsobgtr", {"mlb:", 0xC00000f5}},
866 /* CASEx has no branch addresses in our conception of it. */
867 /* You should use ".word ..." statements after the "case ...". */
869 {"", {"", 0}} /* Empty is end sentinel. */
872 /* Because this module is useful for both VMS and UN*X style assemblers
873 and because of the variety of UN*X assemblers we must recognise
874 the different conventions for assembler operand notation. For example
875 VMS says "#42" for immediate mode, while most UN*X say "$42".
876 We permit arbitrary sets of (single) characters to represent the
877 3 concepts that DEC writes '#', '@', '^'. */
879 /* Character tests. */
880 #define VIP_IMMEDIATE 01 /* Character is like DEC # */
881 #define VIP_INDIRECT 02 /* Char is like DEC @ */
882 #define VIP_DISPLEN 04 /* Char is like DEC ^ */
884 #define IMMEDIATEP(c) (vip_metacharacters [(c) & 0xff] & VIP_IMMEDIATE)
885 #define INDIRECTP(c) (vip_metacharacters [(c) & 0xff] & VIP_INDIRECT)
886 #define DISPLENP(c) (vip_metacharacters [(c) & 0xff] & VIP_DISPLEN)
888 /* We assume 8 bits per byte. Use vip_op_defaults() to set these up BEFORE we
889 are ever called. */
891 #if defined(CONST_TABLE)
892 #define _ 0,
893 #define I VIP_IMMEDIATE,
894 #define S VIP_INDIRECT,
895 #define D VIP_DISPLEN,
896 static const char
897 vip_metacharacters[256] =
899 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /* ^@ ^A ^B ^C ^D ^E ^F ^G ^H ^I ^J ^K ^L ^M ^N ^O*/
900 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /* ^P ^Q ^R ^S ^T ^U ^V ^W ^X ^Y ^Z ^[ ^\ ^] ^^ ^_ */
901 _ _ _ _ I _ _ _ _ _ S _ _ _ _ _ /* sp ! " # $ % & ' ( ) * + , - . / */
902 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*0 1 2 3 4 5 6 7 8 9 : ; < = > ?*/
903 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*@ A B C D E F G H I J K L M N O*/
904 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*P Q R S T U V W X Y Z [ \ ] ^ _*/
905 D _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*` a b c d e f g h i j k l m n o*/
906 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ /*p q r s t u v w x y z { | } ~ ^?*/
908 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
909 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
910 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
911 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
912 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
913 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
914 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
915 _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
917 #undef _
918 #undef I
919 #undef S
920 #undef D
922 #else
924 static char vip_metacharacters[256];
926 static void
927 vip_op_1 (int bit, const char *syms)
929 unsigned char t;
931 while ((t = *syms++) != 0)
932 vip_metacharacters[t] |= bit;
935 /* Can be called any time. More arguments may appear in future. */
936 static void
937 vip_op_defaults (const char *immediate, const char *indirect, const char *displen)
939 vip_op_1 (VIP_IMMEDIATE, immediate);
940 vip_op_1 (VIP_INDIRECT, indirect);
941 vip_op_1 (VIP_DISPLEN, displen);
944 #endif
946 /* Call me once before you decode any lines.
947 I decode votstrs into a hash table at op_hash (which I create).
948 I return an error text or null.
949 If you want, I will include the 'synthetic' jXXX instructions in the
950 instruction table.
951 You must nominate metacharacters for eg DEC's "#", "@", "^". */
953 static void
954 vip_begin (int synthetic_too, /* 1 means include jXXX op-codes. */
955 const char *immediate,
956 const char *indirect,
957 const char *displen)
959 const struct vot *vP; /* scan votstrs */
961 op_hash = str_htab_create ();
963 for (vP = votstrs; *vP->vot_name; vP++)
964 if (str_hash_insert (op_hash, vP->vot_name, &vP->vot_detail, 0) != NULL)
965 as_fatal (_("duplicate %s"), vP->vot_name);
967 if (synthetic_too)
968 for (vP = synthetic_votstrs; *vP->vot_name; vP++)
969 if (str_hash_insert (op_hash, vP->vot_name, &vP->vot_detail, 0) != NULL)
970 as_fatal (_("duplicate %s"), vP->vot_name);
972 #ifndef CONST_TABLE
973 vip_op_defaults (immediate, indirect, displen);
974 #endif
977 /* Take 3 char.s, the last of which may be `\0` (non-existent)
978 and return the VAX register number that they represent.
980 Return -1 if they don't form a register name. Good names return
981 a number from 0:15 inclusive.
983 Case is not important in a name.
985 Register names understood are:
999 R12 AP
1000 R13 FP
1001 R14 SP
1002 R15 PC */
1004 #define AP 12
1005 #define FP 13
1006 #define SP 14
1007 #define PC 15
1009 /* Returns the register number of something like '%r15' or 'ap', supplied
1010 in four single chars. Returns -1 if the register isn't recognized,
1011 0..15 otherwise. */
1012 static int
1013 vax_reg_parse (char c1, char c2, char c3, char c4)
1015 int retval = -1;
1017 #ifdef OBJ_ELF
1018 if (c1 != '%') /* Register prefixes are mandatory for ELF. */
1019 return retval;
1020 c1 = c2;
1021 c2 = c3;
1022 c3 = c4;
1023 #endif
1024 #ifdef OBJ_VMS
1025 if (c4 != 0) /* Register prefixes are not allowed under VMS. */
1026 return retval;
1027 #endif
1028 #ifdef OBJ_AOUT
1029 if (c1 == '%') /* Register prefixes are optional under a.out. */
1031 c1 = c2;
1032 c2 = c3;
1033 c3 = c4;
1035 else if (c3 && c4) /* Can't be 4 characters long. */
1036 return retval;
1037 #endif
1039 c1 = TOLOWER (c1);
1040 c2 = TOLOWER (c2);
1041 if (ISDIGIT (c2) && c1 == 'r')
1043 retval = c2 - '0';
1044 if (ISDIGIT (c3))
1046 retval = retval * 10 + c3 - '0';
1047 retval = (retval > 15) ? -1 : retval;
1048 /* clamp the register value to 1 hex digit */
1050 else if (c3)
1051 retval = -1; /* c3 must be '\0' or a digit. */
1053 else if (c3) /* There are no three letter regs. */
1054 retval = -1;
1055 else if (c2 == 'p')
1057 switch (c1)
1059 case 's':
1060 retval = SP;
1061 break;
1062 case 'f':
1063 retval = FP;
1064 break;
1065 case 'a':
1066 retval = AP;
1067 break;
1068 default:
1069 retval = -1;
1072 else if (c1 == 'p' && c2 == 'c')
1073 retval = PC;
1074 else
1075 retval = -1;
1076 return retval;
1079 /* Parse a vax operand in DEC assembler notation.
1080 For speed, expect a string of whitespace to be reduced to a single ' '.
1081 This is the case for GNU AS, and is easy for other DEC-compatible
1082 assemblers.
1084 Knowledge about DEC VAX assembler operand notation lives here.
1085 This doesn't even know what a register name is, except it believes
1086 all register names are 2 or 3 characters, and lets vax_reg_parse() say
1087 what number each name represents.
1088 It does, however, know that PC, SP etc are special registers so it can
1089 detect addressing modes that are silly for those registers.
1091 Where possible, it delivers 1 fatal or 1 warning message if the operand
1092 is suspect. Exactly what we test for is still evolving.
1095 Arg block.
1097 There were a number of 'mismatched argument type' bugs to vip_op.
1098 The most general solution is to typedef each (of many) arguments.
1099 We used instead a typedef'd argument block. This is less modular
1100 than using separate return pointers for each result, but runs faster
1101 on most engines, and seems to keep programmers happy. It will have
1102 to be done properly if we ever want to use vip_op as a general-purpose
1103 module (it was designed to be).
1107 Doesn't support DEC "G^" format operands. These always take 5 bytes
1108 to express, and code as modes 8F or 9F. Reason: "G^" deprives you of
1109 optimising to (say) a "B^" if you are lucky in the way you link.
1110 When someone builds a linker smart enough to convert "G^" to "B^", "W^"
1111 whenever possible, then we should implement it.
1112 If there is some other use for "G^", feel free to code it in!
1114 speed
1116 If I nested if()s more, I could avoid testing (*err) which would save
1117 time, space and page faults. I didn't nest all those if()s for clarity
1118 and because I think the mode testing can be re-arranged 1st to test the
1119 commoner constructs 1st. Does anybody have statistics on this?
1121 error messages
1123 In future, we should be able to 'compose' error messages in a scratch area
1124 and give the user MUCH more informative error messages. Although this takes
1125 a little more code at run-time, it will make this module much more self-
1126 documenting. As an example of what sucks now: most error messages have
1127 hardwired into them the DEC VAX metacharacters "#^@" which are nothing like
1128 the Un*x characters "$`*", that most users will expect from this AS.
1130 ----
1132 The input is a string, ending with '\0'.
1134 We also require a 'hint' of what kind of operand is expected: so
1135 we can remind caller not to write into literals for instance.
1137 The output is a skeletal instruction.
1139 The algorithm has two parts.
1140 1. extract the syntactic features (parse off all the @^#-()+[] mode crud);
1141 2. express the @^#-()+[] as some parameters suited to further analysis.
1143 2nd step is where we detect the googles of possible invalid combinations
1144 a human (or compiler) might write. Note that if we do a half-way
1145 decent assembler, we don't know how long to make (eg) displacement
1146 fields when we first meet them (because they may not have defined values).
1147 So we must wait until we know how many bits are needed for each address,
1148 then we can know both length and opcodes of instructions.
1149 For reason(s) above, we will pass to our caller a 'broken' instruction
1150 of these major components, from which our caller can generate instructions:
1151 - displacement length I^ S^ L^ B^ W^ unspecified
1152 - mode (many)
1153 - register R0-R15 or absent
1154 - index register R0-R15 or absent
1155 - expression text what we don't parse
1156 - error text(s) why we couldn't understand the operand
1158 ----
1160 To decode output of this, test errtxt. If errtxt[0] == '\0', then
1161 we had no errors that prevented parsing. Also, if we ever report
1162 an internal bug, errtxt[0] is set non-zero. So one test tells you
1163 if the other outputs are to be taken seriously.
1165 ----
1167 Dec defines the semantics of address modes (and values)
1168 by a two-letter code, explained here.
1170 letter 1: access type
1172 a address calculation - no data access, registers forbidden
1173 b branch displacement
1174 m read - let go of bus - write back "modify"
1175 r read
1176 v bit field address: like 'a' but registers are OK
1177 w write
1178 space no operator (eg ".long foo") [our convention]
1180 letter 2: data type (i.e. width, alignment)
1182 b byte
1183 d double precision floating point (D format)
1184 f single precision floating point (F format)
1185 g G format floating
1186 h H format floating
1187 l longword
1188 o octaword
1189 q quadword
1190 w word
1191 ? simple synthetic branch operand
1192 - unconditional synthetic JSB/JSR operand
1193 ! complex synthetic branch operand
1195 The '-?!' letter 2's are not for external consumption. They are used
1196 for various assemblers. Generally, all unknown widths are assumed 0.
1197 We don't limit your choice of width character.
1199 DEC operands are hard work to parse. For example, '@' as the first
1200 character means indirect (deferred) mode but elsewhere it is a shift
1201 operator.
1202 The long-winded explanation of how this is supposed to work is
1203 cancelled. Read a DEC vax manual.
1204 We try hard not to parse anything that MIGHT be part of the expression
1205 buried in that syntax. For example if we see @...(Rn) we don't check
1206 for '-' before the '(' because mode @-(Rn) does not exist.
1208 After parsing we have:
1210 at 1 if leading '@' (or Un*x '*')
1211 len takes one value from " bilsw". eg B^ -> 'b'.
1212 hash 1 if leading '#' (or Un*x '$')
1213 expr_begin, expr_end the expression we did not parse
1214 even though we don't interpret it, we make use
1215 of its presence or absence.
1216 sign -1: -(Rn) 0: absent +1: (Rn)+
1217 paren 1 if () are around register
1218 reg major register number 0:15 -1 means absent
1219 ndx index register number 0:15 -1 means absent
1221 Again, I dare not explain it: just trace ALL the code!
1223 Summary of vip_op outputs.
1225 mode reg len ndx
1226 (Rn) => @Rn
1227 {@}Rn 5+@ n ' ' optional
1228 branch operand 0 -1 ' ' -1
1229 S^#foo 0 -1 's' -1
1230 -(Rn) 7 n ' ' optional
1231 {@}(Rn)+ 8+@ n ' ' optional
1232 {@}#foo, no S^ 8+@ PC " i" optional
1233 {@}{q^}{(Rn)} 10+@+q option " bwl" optional */
1235 /* Dissect user-input 'optext' (which is something like "@B^foo@bar(AP)[FP]:")
1236 using the vop in vopP. vopP's vop_access and vop_width. We fill _ndx, _reg,
1237 _mode, _short, _warn, _error, _expr_begin, _expr_end and _nbytes. */
1239 static void
1240 vip_op (char *optext, struct vop *vopP)
1242 /* Track operand text forward. */
1243 char *p;
1244 /* Track operand text backward. */
1245 char *q;
1246 /* 1 if leading '@' ('*') seen. */
1247 int at;
1248 /* one of " bilsw" */
1249 char len;
1250 /* 1 if leading '#' ('$') seen. */
1251 int hash;
1252 /* -1, 0 or +1. */
1253 int sign = 0;
1254 /* 1 if () surround register. */
1255 int paren = 0;
1256 /* Register number, -1:absent. */
1257 int reg = 0;
1258 /* Index register number -1:absent. */
1259 int ndx = 0;
1260 /* Report illegal operand, ""==OK. */
1261 /* " " is a FAKE error: means we won. */
1262 /* ANY err that begins with ' ' is a fake. */
1263 /* " " is converted to "" before return. */
1264 const char *err;
1265 /* Warn about weird modes pf address. */
1266 const char *wrn;
1267 /* Preserve q in case we backup. */
1268 char *oldq = NULL;
1269 /* Build up 4-bit operand mode here. */
1270 /* Note: index mode is in ndx, this is. */
1271 /* The major mode of operand address. */
1272 int mode = 0;
1273 /* Notice how we move wrong-arg-type bugs INSIDE this module: if we
1274 get the types wrong below, we lose at compile time rather than at
1275 lint or run time. */
1276 char access_mode; /* vop_access. */
1278 access_mode = vopP->vop_access;
1279 /* None of our code bugs (yet), no user text errors, no warnings
1280 even. */
1281 err = wrn = 0;
1283 p = optext;
1285 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1286 p++; /* skip over whitespace */
1288 if ((at = INDIRECTP (*p)) != 0)
1289 { /* 1 if *p=='@'(or '*' for Un*x) */
1290 p++; /* at is determined */
1291 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1292 p++; /* skip over whitespace */
1295 /* This code is subtle. It tries to detect all legal (letter)'^'
1296 but it doesn't waste time explicitly testing for premature '\0' because
1297 this case is rejected as a mismatch against either (letter) or '^'. */
1299 char c;
1301 c = *p;
1302 c = TOLOWER (c);
1303 if (DISPLENP (p[1]) && strchr ("bilws", len = c))
1304 p += 2; /* Skip (letter) '^'. */
1305 else /* No (letter) '^' seen. */
1306 len = ' '; /* Len is determined. */
1309 if (*p == ' ') /* Expect all whitespace reduced to ' '. */
1310 p++;
1312 if ((hash = IMMEDIATEP (*p)) != 0) /* 1 if *p=='#' ('$' for Un*x) */
1313 p++; /* Hash is determined. */
1315 /* p points to what may be the beginning of an expression.
1316 We have peeled off the front all that is peelable.
1317 We know at, len, hash.
1319 Lets point q at the end of the text and parse that (backwards). */
1321 for (q = p; *q; q++)
1323 q--; /* Now q points at last char of text. */
1325 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1326 q--;
1328 /* Reverse over whitespace, but don't. */
1329 /* Run back over *p. */
1331 /* As a matter of policy here, we look for [Rn], although both Rn and S^#
1332 forbid [Rn]. This is because it is easy, and because only a sick
1333 cyborg would have [...] trailing an expression in a VAX-like assembler.
1334 A meticulous parser would first check for Rn followed by '(' or '['
1335 and not parse a trailing ']' if it found another. We just ban expressions
1336 ending in ']'. */
1337 if (*q == ']')
1339 while (q >= p && *q != '[')
1340 q--;
1341 /* Either q<p or we got matching '['. */
1342 if (q < p)
1343 err = _("no '[' to match ']'");
1344 else
1346 /* Confusers like "[]" will eventually lose with a bad register
1347 * name error. So again we don't need to check for early '\0'. */
1348 if (q[3] == ']')
1349 ndx = vax_reg_parse (q[1], q[2], 0, 0);
1350 else if (q[4] == ']')
1351 ndx = vax_reg_parse (q[1], q[2], q[3], 0);
1352 else if (q[5] == ']')
1353 ndx = vax_reg_parse (q[1], q[2], q[3], q[4]);
1354 else
1355 ndx = -1;
1356 /* Since we saw a ']' we will demand a register name in the [].
1357 * If luser hasn't given us one: be rude. */
1358 if (ndx < 0)
1359 err = _("bad register in []");
1360 else if (ndx == PC)
1361 err = _("[PC] index banned");
1362 else
1363 /* Point q just before "[...]". */
1364 q--;
1367 else
1368 /* No ']', so no iNDeX register. */
1369 ndx = -1;
1371 /* If err = "..." then we lost: run away.
1372 Otherwise ndx == -1 if there was no "[...]".
1373 Otherwise, ndx is index register number, and q points before "[...]". */
1375 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1376 q--;
1377 /* Reverse over whitespace, but don't. */
1378 /* Run back over *p. */
1379 if (!err || !*err)
1381 /* no ()+ or -() seen yet */
1382 sign = 0;
1384 if (q > p + 3 && *q == '+' && q[-1] == ')')
1386 sign = 1; /* we saw a ")+" */
1387 q--; /* q points to ')' */
1390 if (*q == ')' && q > p + 2)
1392 paren = 1; /* assume we have "(...)" */
1393 while (q >= p && *q != '(')
1394 q--;
1395 /* either q<p or we got matching '(' */
1396 if (q < p)
1397 err = _("no '(' to match ')'");
1398 else
1400 /* Confusers like "()" will eventually lose with a bad register
1401 name error. So again we don't need to check for early '\0'. */
1402 if (q[3] == ')')
1403 reg = vax_reg_parse (q[1], q[2], 0, 0);
1404 else if (q[4] == ')')
1405 reg = vax_reg_parse (q[1], q[2], q[3], 0);
1406 else if (q[5] == ')')
1407 reg = vax_reg_parse (q[1], q[2], q[3], q[4]);
1408 else
1409 reg = -1;
1410 /* Since we saw a ')' we will demand a register name in the ')'.
1411 This is nasty: why can't our hypothetical assembler permit
1412 parenthesised expressions? BECAUSE I AM LAZY! That is why.
1413 Abuse luser if we didn't spy a register name. */
1414 if (reg < 0)
1416 /* JF allow parenthesized expressions. I hope this works. */
1417 paren = 0;
1418 while (*q != ')')
1419 q++;
1420 /* err = "unknown register in ()"; */
1422 else
1423 q--; /* point just before '(' of "(...)" */
1424 /* If err == "..." then we lost. Run away.
1425 Otherwise if reg >= 0 then we saw (Rn). */
1427 /* If err == "..." then we lost.
1428 Otherwise paren==1 and reg = register in "()". */
1430 else
1431 paren = 0;
1432 /* If err == "..." then we lost.
1433 Otherwise, q points just before "(Rn)", if any.
1434 If there was a "(...)" then paren==1, and reg is the register. */
1436 /* We should only seek '-' of "-(...)" if:
1437 we saw "(...)" paren == 1
1438 we have no errors so far ! *err
1439 we did not see '+' of "(...)+" sign < 1
1440 We don't check len. We want a specific error message later if
1441 user tries "x^...-(Rn)". This is a feature not a bug. */
1442 if (!err || !*err)
1444 if (paren && sign < 1)/* !sign is adequate test */
1446 if (*q == '-')
1448 sign = -1;
1449 q--;
1452 /* We have back-tracked over most
1453 of the crud at the end of an operand.
1454 Unless err, we know: sign, paren. If paren, we know reg.
1455 The last case is of an expression "Rn".
1456 This is worth hunting for if !err, !paren.
1457 We wouldn't be here if err.
1458 We remember to save q, in case we didn't want "Rn" anyway. */
1459 if (!paren)
1461 if (*q == ' ' && q >= p) /* Expect all whitespace reduced to ' '. */
1462 q--;
1463 /* Reverse over whitespace, but don't. */
1464 /* Run back over *p. */
1465 /* Room for Rn or Rnn (include prefix) exactly? */
1466 if (q > p && q < p + 4)
1467 reg = vax_reg_parse (p[0], p[1],
1468 q < p + 2 ? 0 : p[2],
1469 q < p + 3 ? 0 : p[3]);
1470 else
1471 reg = -1; /* Always comes here if no register at all. */
1472 /* Here with a definitive reg value. */
1473 if (reg >= 0)
1475 oldq = q;
1476 q = p - 1;
1481 /* have reg. -1:absent; else 0:15. */
1483 /* We have: err, at, len, hash, ndx, sign, paren, reg.
1484 Also, any remaining expression is from *p through *q inclusive.
1485 Should there be no expression, q==p-1. So expression length = q-p+1.
1486 This completes the first part: parsing the operand text. */
1488 /* We now want to boil the data down, checking consistency on the way.
1489 We want: len, mode, reg, ndx, err, p, q, wrn, bug.
1490 We will deliver a 4-bit reg, and a 4-bit mode. */
1492 /* Case of branch operand. Different. No L^B^W^I^S^ allowed for instance.
1494 in: at ?
1495 len ?
1496 hash ?
1497 p:q ?
1498 sign ?
1499 paren ?
1500 reg ?
1501 ndx ?
1503 out: mode 0
1504 reg -1
1505 len ' '
1506 p:q whatever was input
1507 ndx -1
1508 err " " or error message, and other outputs trashed. */
1509 /* Branch operands have restricted forms. */
1510 if ((!err || !*err) && access_mode == 'b')
1512 if (at || hash || sign || paren || ndx >= 0 || reg >= 0 || len != ' ')
1513 err = _("invalid branch operand");
1514 else
1515 err = " ";
1518 /* Since nobody seems to use it: comment this 'feature'(?) out for now. */
1519 #ifdef NEVER
1520 /* Case of stand-alone operand. e.g. ".long foo"
1522 in: at ?
1523 len ?
1524 hash ?
1525 p:q ?
1526 sign ?
1527 paren ?
1528 reg ?
1529 ndx ?
1531 out: mode 0
1532 reg -1
1533 len ' '
1534 p:q whatever was input
1535 ndx -1
1536 err " " or error message, and other outputs trashed. */
1537 if ((!err || !*err) && access_mode == ' ')
1539 if (at)
1540 err = _("address prohibits @");
1541 else if (hash)
1542 err = _("address prohibits #");
1543 else if (sign)
1545 if (sign < 0)
1546 err = _("address prohibits -()");
1547 else
1548 err = _("address prohibits ()+");
1550 else if (paren)
1551 err = _("address prohibits ()");
1552 else if (ndx >= 0)
1553 err = _("address prohibits []");
1554 else if (reg >= 0)
1555 err = _("address prohibits register");
1556 else if (len != ' ')
1557 err = _("address prohibits displacement length specifier");
1558 else
1560 err = " "; /* succeed */
1561 mode = 0;
1564 #endif
1566 /* Case of S^#.
1568 in: at 0
1569 len 's' definition
1570 hash 1 demand
1571 p:q demand not empty
1572 sign 0 by paren==0
1573 paren 0 by "()" scan logic because "S^" seen
1574 reg -1 or nn by mistake
1575 ndx -1
1577 out: mode 0
1578 reg -1
1579 len 's'
1581 ndx -1 */
1582 if ((!err || !*err) && len == 's')
1584 if (!hash || paren || at || ndx >= 0)
1585 err = _("invalid operand of S^#");
1586 else
1588 if (reg >= 0)
1590 /* Darn! we saw S^#Rnn ! put the Rnn back in
1591 expression. KLUDGE! Use oldq so we don't
1592 need to know exact length of reg name. */
1593 q = oldq;
1594 reg = 0;
1596 /* We have all the expression we will ever get. */
1597 if (p > q)
1598 err = _("S^# needs expression");
1599 else if (access_mode == 'r')
1601 err = " "; /* WIN! */
1602 mode = 0;
1604 else
1605 err = _("S^# may only read-access");
1609 /* Case of -(Rn), which is weird case.
1611 in: at 0
1612 len '
1613 hash 0
1614 p:q q<p
1615 sign -1 by definition
1616 paren 1 by definition
1617 reg present by definition
1618 ndx optional
1620 out: mode 7
1621 reg present
1622 len ' '
1623 exp "" enforce empty expression
1624 ndx optional warn if same as reg. */
1625 if ((!err || !*err) && sign < 0)
1627 if (len != ' ' || hash || at || p <= q)
1628 err = _("invalid operand of -()");
1629 else
1631 err = " "; /* win */
1632 mode = 7;
1633 if (reg == PC)
1634 wrn = _("-(PC) unpredictable");
1635 else if (reg == ndx)
1636 wrn = _("[]index same as -()register: unpredictable");
1640 /* We convert "(Rn)" to "@Rn" for our convenience.
1641 (I hope this is convenient: has someone got a better way to parse this?)
1642 A side-effect of this is that "@Rn" is a valid operand. */
1643 if (paren && !sign && !hash && !at && len == ' ' && p > q)
1645 at = 1;
1646 paren = 0;
1649 /* Case of (Rn)+, which is slightly different.
1651 in: at
1652 len ' '
1653 hash 0
1654 p:q q<p
1655 sign +1 by definition
1656 paren 1 by definition
1657 reg present by definition
1658 ndx optional
1660 out: mode 8+@
1661 reg present
1662 len ' '
1663 exp "" enforce empty expression
1664 ndx optional warn if same as reg. */
1665 if ((!err || !*err) && sign > 0)
1667 if (len != ' ' || hash || p <= q)
1668 err = _("invalid operand of ()+");
1669 else
1671 err = " "; /* win */
1672 mode = 8 + (at ? 1 : 0);
1673 if (reg == PC)
1674 wrn = _("(PC)+ unpredictable");
1675 else if (reg == ndx)
1676 wrn = _("[]index same as ()+register: unpredictable");
1680 /* Case of #, without S^.
1682 in: at
1683 len ' ' or 'i'
1684 hash 1 by definition
1686 sign 0
1687 paren 0
1688 reg absent
1689 ndx optional
1691 out: mode 8+@
1692 reg PC
1693 len ' ' or 'i'
1695 ndx optional. */
1696 if ((!err || !*err) && hash)
1698 if (len != 'i' && len != ' ')
1699 err = _("# conflicts length");
1700 else if (paren)
1701 err = _("# bars register");
1702 else
1704 if (reg >= 0)
1706 /* Darn! we saw #Rnn! Put the Rnn back into the expression.
1707 By using oldq, we don't need to know how long Rnn was.
1708 KLUDGE! */
1709 q = oldq;
1710 reg = -1; /* No register any more. */
1712 err = " "; /* Win. */
1714 /* JF a bugfix, I think! */
1715 if (at && access_mode == 'a')
1716 vopP->vop_nbytes = 4;
1718 mode = (at ? 9 : 8);
1719 reg = PC;
1720 if ((access_mode == 'm' || access_mode == 'w') && !at)
1721 wrn = _("writing or modifying # is unpredictable");
1724 /* If !*err, then sign == 0
1725 hash == 0 */
1727 /* Case of Rn. We separate this one because it has a few special
1728 errors the remaining modes lack.
1730 in: at optional
1731 len ' '
1732 hash 0 by program logic
1733 p:q empty
1734 sign 0 by program logic
1735 paren 0 by definition
1736 reg present by definition
1737 ndx optional
1739 out: mode 5+@
1740 reg present
1741 len ' ' enforce no length
1742 exp "" enforce empty expression
1743 ndx optional warn if same as reg. */
1744 if ((!err || !*err) && !paren && reg >= 0)
1746 if (len != ' ')
1747 err = _("length not needed");
1748 else if (at)
1750 err = " "; /* win */
1751 mode = 6; /* @Rn */
1753 else if (ndx >= 0)
1754 err = _("can't []index a register, because it has no address");
1755 else if (access_mode == 'a')
1756 err = _("a register has no address");
1757 else
1759 /* Idea here is to detect from length of datum
1760 and from register number if we will touch PC.
1761 Warn if we do.
1762 vop_nbytes is number of bytes in operand.
1763 Compute highest byte affected, compare to PC0. */
1764 if ((vopP->vop_nbytes + reg * 4) > 60)
1765 wrn = _("PC part of operand unpredictable");
1766 err = " "; /* win */
1767 mode = 5; /* Rn */
1770 /* If !*err, sign == 0
1771 hash == 0
1772 paren == 1 OR reg==-1 */
1774 /* Rest of cases fit into one bunch.
1776 in: at optional
1777 len ' ' or 'b' or 'w' or 'l'
1778 hash 0 by program logic
1779 p:q expected (empty is not an error)
1780 sign 0 by program logic
1781 paren optional
1782 reg optional
1783 ndx optional
1785 out: mode 10 + @ + len
1786 reg optional
1787 len ' ' or 'b' or 'w' or 'l'
1788 exp maybe empty
1789 ndx optional warn if same as reg. */
1790 if (!err || !*err)
1792 err = " "; /* win (always) */
1793 mode = 10 + (at ? 1 : 0);
1794 switch (len)
1796 case 'l':
1797 mode += 2;
1798 /* Fall through. */
1799 case 'w':
1800 mode += 2;
1801 /* Fall through. */
1802 case ' ': /* Assumed B^ until our caller changes it. */
1803 case 'b':
1804 break;
1808 /* here with completely specified mode
1811 expression p,q
1812 ndx. */
1814 if (*err == ' ')
1815 err = 0; /* " " is no longer an error. */
1817 vopP->vop_mode = mode;
1818 vopP->vop_reg = reg;
1819 vopP->vop_short = len;
1820 vopP->vop_expr_begin = p;
1821 vopP->vop_expr_end = q;
1822 vopP->vop_ndx = ndx;
1823 vopP->vop_error = err;
1824 vopP->vop_warn = wrn;
1827 /* This converts a string into a vax instruction.
1828 The string must be a bare single instruction in dec-vax (with BSD4 frobs)
1829 format.
1830 It provides some error messages: at most one fatal error message (which
1831 stops the scan) and at most one warning message for each operand.
1832 The vax instruction is returned in exploded form, since we have no
1833 knowledge of how you parse (or evaluate) your expressions.
1834 We do however strip off and decode addressing modes and operation
1835 mnemonic.
1837 The exploded instruction is returned to a struct vit of your choice.
1838 #include "vax-inst.h" to know what a struct vit is.
1840 This function's value is a string. If it is not "" then an internal
1841 logic error was found: read this code to assign meaning to the string.
1842 No argument string should generate such an error string:
1843 it means a bug in our code, not in the user's text.
1845 You MUST have called vip_begin() once before using this function. */
1847 static void
1848 vip (struct vit *vitP, /* We build an exploded instruction here. */
1849 char *instring) /* Text of a vax instruction: we modify. */
1851 /* How to bit-encode this opcode. */
1852 struct vot_wot *vwP;
1853 /* 1/skip whitespace.2/scan vot_how */
1854 char *p;
1855 char *q;
1856 /* counts number of operands seen */
1857 unsigned char count;
1858 /* scan operands in struct vit */
1859 struct vop *operandp;
1860 /* error over all operands */
1861 const char *alloperr;
1862 /* Remember char, (we clobber it with '\0' temporarily). */
1863 char c;
1864 /* Op-code of this instruction. */
1865 vax_opcodeT oc;
1867 if (*instring == ' ')
1868 ++instring;
1870 /* MUST end in end-of-string or exactly 1 space. */
1871 for (p = instring; *p && *p != ' '; p++)
1874 /* Scanned up to end of operation-code. */
1875 /* Operation-code is ended with whitespace. */
1876 if (p - instring == 0)
1878 vitP->vit_error = _("No operator");
1879 count = 0;
1880 memset (vitP->vit_opcode, '\0', sizeof (vitP->vit_opcode));
1882 else
1884 c = *p;
1885 *p = '\0';
1886 /* Here with instring pointing to what better be an op-name, and p
1887 pointing to character just past that.
1888 We trust instring points to an op-name, with no whitespace. */
1889 vwP = (struct vot_wot *) str_hash_find (op_hash, instring);
1890 /* Restore char after op-code. */
1891 *p = c;
1892 if (vwP == 0)
1894 vitP->vit_error = _("Unknown operator");
1895 count = 0;
1896 memset (vitP->vit_opcode, '\0', sizeof (vitP->vit_opcode));
1898 else
1900 /* We found a match! So let's pick up as many operands as the
1901 instruction wants, and even gripe if there are too many.
1902 We expect comma to separate each operand.
1903 We let instring track the text, while p tracks a part of the
1904 struct vot. */
1905 const char *howp;
1906 /* The lines below know about 2-byte opcodes starting FD,FE or FF.
1907 They also understand synthetic opcodes. Note:
1908 we return 32 bits of opcode, including bucky bits, BUT
1909 an opcode length is either 8 or 16 bits for vit_opcode_nbytes. */
1910 oc = vwP->vot_code; /* The op-code. */
1911 vitP->vit_opcode_nbytes = (oc & 0xFF) >= 0xFD ? 2 : 1;
1912 md_number_to_chars (vitP->vit_opcode, oc, 4);
1913 count = 0; /* No operands seen yet. */
1914 instring = p; /* Point just past operation code. */
1915 alloperr = "";
1916 for (howp = vwP->vot_how, operandp = vitP->vit_operand;
1917 !(alloperr && *alloperr) && *howp;
1918 operandp++, howp += 2)
1920 /* Here to parse one operand. Leave instring pointing just
1921 past any one ',' that marks the end of this operand. */
1922 if (!howp[1])
1923 as_fatal (_("odd number of bytes in operand description"));
1924 else if (*instring)
1926 for (q = instring; (c = *q) && c != ','; q++)
1928 /* Q points to ',' or '\0' that ends argument. C is that
1929 character. */
1930 *q = 0;
1931 operandp->vop_width = howp[1];
1932 operandp->vop_nbytes = vax_operand_width_size[(unsigned) howp[1]];
1933 operandp->vop_access = howp[0];
1934 vip_op (instring, operandp);
1935 *q = c; /* Restore input text. */
1936 if (operandp->vop_error)
1937 alloperr = _("Bad operand");
1938 instring = q + (c ? 1 : 0); /* Next operand (if any). */
1939 count++; /* Won another argument, may have an operr. */
1941 else
1942 alloperr = _("Not enough operands");
1944 if (!*alloperr)
1946 if (*instring == ' ')
1947 instring++;
1948 if (*instring)
1949 alloperr = _("Too many operands");
1951 vitP->vit_error = alloperr;
1954 vitP->vit_operands = count;
1957 #ifdef test
1959 /* Test program for above. */
1961 struct vit myvit; /* Build an exploded vax instruction here. */
1962 char answer[100]; /* Human types a line of vax assembler here. */
1963 char *mybug; /* "" or an internal logic diagnostic. */
1964 int mycount; /* Number of operands. */
1965 struct vop *myvop; /* Scan operands from myvit. */
1966 int mysynth; /* 1 means want synthetic opcodes. */
1967 char my_immediate[200];
1968 char my_indirect[200];
1969 char my_displen[200];
1972 main (void)
1974 char *p;
1976 printf ("0 means no synthetic instructions. ");
1977 printf ("Value for vip_begin? ");
1978 gets (answer);
1979 sscanf (answer, "%d", &mysynth);
1980 printf ("Synthetic opcodes %s be included.\n", mysynth ? "will" : "will not");
1981 printf ("enter immediate symbols eg enter # ");
1982 gets (my_immediate);
1983 printf ("enter indirect symbols eg enter @ ");
1984 gets (my_indirect);
1985 printf ("enter displen symbols eg enter ^ ");
1986 gets (my_displen);
1988 vip_begin (mysynth, my_immediate, my_indirect, my_displen)
1990 printf ("An empty input line will quit you from the vax instruction parser\n");
1991 for (;;)
1993 printf ("vax instruction: ");
1994 fflush (stdout);
1995 gets (answer);
1996 if (!*answer)
1997 break; /* Out of for each input text loop. */
1999 vip (& myvit, answer);
2000 if (*myvit.vit_error)
2001 printf ("ERR:\"%s\"\n", myvit.vit_error);
2003 printf ("opcode=");
2004 for (mycount = myvit.vit_opcode_nbytes, p = myvit.vit_opcode;
2005 mycount;
2006 mycount--, p++)
2007 printf ("%02x ", *p & 0xFF);
2009 printf (" operand count=%d.\n", mycount = myvit.vit_operands);
2010 for (myvop = myvit.vit_operand; mycount; mycount--, myvop++)
2012 printf ("mode=%xx reg=%xx ndx=%xx len='%c'=%c%c%d. expr=\"",
2013 myvop->vop_mode, myvop->vop_reg, myvop->vop_ndx,
2014 myvop->vop_short, myvop->vop_access, myvop->vop_width,
2015 myvop->vop_nbytes);
2016 for (p = myvop->vop_expr_begin; p <= myvop->vop_expr_end; p++)
2017 putchar (*p);
2019 printf ("\"\n");
2020 if (myvop->vop_error)
2021 printf (" err:\"%s\"\n", myvop->vop_error);
2023 if (myvop->vop_warn)
2024 printf (" wrn:\"%s\"\n", myvop->vop_warn);
2027 vip_end ();
2028 exit (EXIT_SUCCESS);
2031 #endif
2033 #ifdef TEST /* #Define to use this testbed. */
2035 /* Follows a test program for this function.
2036 We declare arrays non-local in case some of our tiny-minded machines
2037 default to small stacks. Also, helps with some debuggers. */
2039 char answer[100]; /* Human types into here. */
2040 char *p; /* */
2041 char *myerr;
2042 char *mywrn;
2043 char *mybug;
2044 char myaccess;
2045 char mywidth;
2046 char mymode;
2047 char myreg;
2048 char mylen;
2049 char *myleft;
2050 char *myright;
2051 char myndx;
2052 int my_operand_length;
2053 char my_immediate[200];
2054 char my_indirect[200];
2055 char my_displen[200];
2058 main (void)
2060 printf ("enter immediate symbols eg enter # ");
2061 gets (my_immediate);
2062 printf ("enter indirect symbols eg enter @ ");
2063 gets (my_indirect);
2064 printf ("enter displen symbols eg enter ^ ");
2065 gets (my_displen);
2066 vip_op_defaults (my_immediate, my_indirect, my_displen);
2068 for (;;)
2070 printf ("access,width (eg 'ab' or 'wh') [empty line to quit] : ");
2071 fflush (stdout);
2072 gets (answer);
2073 if (!answer[0])
2074 exit (EXIT_SUCCESS);
2075 myaccess = answer[0];
2076 mywidth = answer[1];
2077 switch (mywidth)
2079 case 'b':
2080 my_operand_length = 1;
2081 break;
2082 case 'd':
2083 my_operand_length = 8;
2084 break;
2085 case 'f':
2086 my_operand_length = 4;
2087 break;
2088 case 'g':
2089 my_operand_length = 16;
2090 break;
2091 case 'h':
2092 my_operand_length = 32;
2093 break;
2094 case 'l':
2095 my_operand_length = 4;
2096 break;
2097 case 'o':
2098 my_operand_length = 16;
2099 break;
2100 case 'q':
2101 my_operand_length = 8;
2102 break;
2103 case 'w':
2104 my_operand_length = 2;
2105 break;
2106 case '!':
2107 case '?':
2108 case '-':
2109 my_operand_length = 0;
2110 break;
2112 default:
2113 my_operand_length = 2;
2114 printf ("I don't understand access width %c\n", mywidth);
2115 break;
2117 printf ("VAX assembler instruction operand: ");
2118 fflush (stdout);
2119 gets (answer);
2120 mybug = vip_op (answer, myaccess, mywidth, my_operand_length,
2121 &mymode, &myreg, &mylen, &myleft, &myright, &myndx,
2122 &myerr, &mywrn);
2123 if (*myerr)
2125 printf ("error: \"%s\"\n", myerr);
2126 if (*mybug)
2127 printf (" bug: \"%s\"\n", mybug);
2129 else
2131 if (*mywrn)
2132 printf ("warning: \"%s\"\n", mywrn);
2133 mumble ("mode", mymode);
2134 mumble ("register", myreg);
2135 mumble ("index", myndx);
2136 printf ("width:'%c' ", mylen);
2137 printf ("expression: \"");
2138 while (myleft <= myright)
2139 putchar (*myleft++);
2140 printf ("\"\n");
2145 void
2146 mumble (char *text, int value)
2148 printf ("%s:", text);
2149 if (value >= 0)
2150 printf ("%xx", value);
2151 else
2152 printf ("ABSENT");
2153 printf (" ");
2156 #endif
2158 int md_short_jump_size = 3;
2159 int md_long_jump_size = 6;
2161 void
2162 md_create_short_jump (char *ptr,
2163 addressT from_addr,
2164 addressT to_addr ATTRIBUTE_UNUSED,
2165 fragS *frag ATTRIBUTE_UNUSED,
2166 symbolS *to_symbol ATTRIBUTE_UNUSED)
2168 valueT offset;
2170 /* This former calculation was off by two:
2171 offset = to_addr - (from_addr + 1);
2172 We need to account for the one byte instruction and also its
2173 two byte operand. */
2174 offset = to_addr - (from_addr + 1 + 2);
2175 *ptr++ = VAX_BRW; /* Branch with word (16 bit) offset. */
2176 md_number_to_chars (ptr, offset, 2);
2179 void
2180 md_create_long_jump (char *ptr,
2181 addressT from_addr,
2182 addressT to_addr,
2183 fragS *frag ATTRIBUTE_UNUSED,
2184 symbolS *to_symbol ATTRIBUTE_UNUSED)
2186 valueT offset;
2188 /* Account for 1 byte instruction, 1 byte of address specifier and
2189 4 bytes of offset from PC. */
2190 offset = to_addr - (from_addr + 1 + 1 + 4);
2191 *ptr++ = VAX_JMP;
2192 *ptr++ = VAX_PC_RELATIVE_MODE;
2193 md_number_to_chars (ptr, offset, 4);
2196 #ifdef OBJ_VMS
2197 const char *md_shortopts = "d:STt:V+1h:Hv::";
2198 #elif defined(OBJ_ELF)
2199 const char *md_shortopts = "d:STt:VkKQ:";
2200 #else
2201 const char *md_shortopts = "d:STt:V";
2202 #endif
2203 struct option md_longopts[] =
2205 #ifdef OBJ_ELF
2206 #define OPTION_PIC (OPTION_MD_BASE)
2207 { "pic", no_argument, NULL, OPTION_PIC },
2208 #endif
2209 { NULL, no_argument, NULL, 0 }
2211 size_t md_longopts_size = sizeof (md_longopts);
2214 md_parse_option (int c, const char *arg)
2216 switch (c)
2218 case 'S':
2219 as_warn (_("SYMBOL TABLE not implemented"));
2220 break;
2222 case 'T':
2223 as_warn (_("TOKEN TRACE not implemented"));
2224 break;
2226 case 'd':
2227 as_warn (_("Displacement length %s ignored!"), arg);
2228 break;
2230 case 't':
2231 as_warn (_("I don't need or use temp. file \"%s\"."), arg);
2232 break;
2234 case 'V':
2235 as_warn (_("I don't use an interpass file! -V ignored"));
2236 break;
2238 #ifdef OBJ_VMS
2239 case '+': /* For g++. Hash any name > 31 chars long. */
2240 flag_hash_long_names = 1;
2241 break;
2243 case '1': /* For backward compatibility. */
2244 flag_one = 1;
2245 break;
2247 case 'H': /* Show new symbol after hash truncation. */
2248 flag_show_after_trunc = 1;
2249 break;
2251 case 'h': /* No hashing of mixed-case names. */
2253 extern char vms_name_mapping;
2254 vms_name_mapping = atoi (arg);
2255 flag_no_hash_mixed_case = 1;
2257 break;
2259 case 'v':
2261 extern char *compiler_version_string;
2263 if (!arg || !*arg || access (arg, 0) == 0)
2264 return 0; /* Have caller show the assembler version. */
2265 compiler_version_string = arg;
2267 break;
2268 #endif
2270 #ifdef OBJ_ELF
2271 case OPTION_PIC:
2272 case 'k':
2273 flag_want_pic = 1;
2274 break; /* -pic, Position Independent Code. */
2276 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment
2277 section should be emitted or not. FIXME: Not implemented. */
2278 case 'Q':
2279 break;
2280 #endif
2282 default:
2283 return 0;
2286 return 1;
2289 void
2290 md_show_usage (FILE *stream)
2292 fprintf (stream, _("\
2293 VAX options:\n\
2294 -d LENGTH ignored\n\
2295 -J ignored\n\
2296 -S ignored\n\
2297 -t FILE ignored\n\
2298 -T ignored\n\
2299 -V ignored\n"));
2300 #ifdef OBJ_VMS
2301 fprintf (stream, _("\
2302 VMS options:\n\
2303 -+ hash encode names longer than 31 characters\n\
2304 -1 `const' handling compatible with gcc 1.x\n\
2305 -H show new symbol after hash truncation\n\
2306 -h NUM don't hash mixed-case names, and adjust case:\n\
2307 0 = upper, 2 = lower, 3 = preserve case\n\
2308 -v\"VERSION\" code being assembled was produced by compiler \"VERSION\"\n"));
2309 #endif
2312 /* We have no need to default values of symbols. */
2314 symbolS *
2315 md_undefined_symbol (char *name ATTRIBUTE_UNUSED)
2317 return NULL;
2320 /* Round up a section size to the appropriate boundary. */
2321 valueT
2322 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
2324 /* Byte alignment is fine */
2325 return size;
2328 /* Exactly what point is a PC-relative offset relative TO?
2329 On the vax, they're relative to the address of the offset, plus
2330 its size. */
2331 long
2332 md_pcrel_from (fixS *fixP)
2334 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
2337 arelent *
2338 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
2340 arelent *reloc;
2341 bfd_reloc_code_real_type code;
2343 if (fixp->fx_tcbit)
2344 abort ();
2346 if (fixp->fx_r_type != NO_RELOC)
2348 code = fixp->fx_r_type;
2350 if (fixp->fx_pcrel)
2352 switch (code)
2354 case BFD_RELOC_8_PCREL:
2355 case BFD_RELOC_16_PCREL:
2356 case BFD_RELOC_32_PCREL:
2357 #ifdef OBJ_ELF
2358 case BFD_RELOC_8_GOT_PCREL:
2359 case BFD_RELOC_16_GOT_PCREL:
2360 case BFD_RELOC_32_GOT_PCREL:
2361 case BFD_RELOC_8_PLT_PCREL:
2362 case BFD_RELOC_16_PLT_PCREL:
2363 case BFD_RELOC_32_PLT_PCREL:
2364 #endif
2365 break;
2366 default:
2367 as_bad_where (fixp->fx_file, fixp->fx_line,
2368 _("Cannot make %s relocation PC relative"),
2369 bfd_get_reloc_code_name (code));
2373 else
2375 #define F(SZ,PCREL) (((SZ) << 1) + (PCREL))
2376 switch (F (fixp->fx_size, fixp->fx_pcrel))
2378 #define MAP(SZ,PCREL,TYPE) case F(SZ,PCREL): code = (TYPE); break
2379 MAP (1, 0, BFD_RELOC_8);
2380 MAP (2, 0, BFD_RELOC_16);
2381 MAP (4, 0, BFD_RELOC_32);
2382 MAP (1, 1, BFD_RELOC_8_PCREL);
2383 MAP (2, 1, BFD_RELOC_16_PCREL);
2384 MAP (4, 1, BFD_RELOC_32_PCREL);
2385 default:
2386 abort ();
2389 #undef F
2390 #undef MAP
2392 reloc = XNEW (arelent);
2393 reloc->sym_ptr_ptr = XNEW (asymbol *);
2394 *reloc->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
2395 reloc->address = fixp->fx_frag->fr_address + fixp->fx_where;
2396 #ifndef OBJ_ELF
2397 if (fixp->fx_pcrel)
2398 reloc->addend = fixp->fx_addnumber;
2399 else
2400 reloc->addend = 0;
2401 #else
2402 reloc->addend = fixp->fx_offset;
2403 #endif
2405 reloc->howto = bfd_reloc_type_lookup (stdoutput, code);
2406 gas_assert (reloc->howto != 0);
2408 return reloc;
2411 /* vax:md_assemble() emit frags for 1 instruction given in textual form. */
2412 void
2413 md_assemble (char *instruction_string)
2415 /* Non-zero if operand expression's segment is not known yet. */
2416 int is_undefined;
2417 /* Non-zero if operand expression's segment is absolute. */
2418 int is_absolute;
2419 int length_code;
2420 char *p;
2421 /* An operand. Scans all operands. */
2422 struct vop *operandP;
2423 char *save_input_line_pointer;
2424 /* What used to live after an expression. */
2425 char c_save;
2426 /* 1: instruction_string bad for all passes. */
2427 int goofed;
2428 /* Points to slot just after last operand. */
2429 struct vop *end_operandP;
2430 /* Points to expression values for this operand. */
2431 expressionS *expP;
2432 segT *segP;
2434 /* These refer to an instruction operand expression. */
2435 /* Target segment of the address. */
2436 segT to_seg;
2437 valueT this_add_number;
2438 /* Positive (minuend) symbol. */
2439 symbolS *this_add_symbol;
2440 /* As a number. */
2441 long opcode_as_number;
2442 /* Least significant byte 1st. */
2443 char *opcode_as_chars;
2444 /* As an array of characters. */
2445 /* Least significant byte 1st */
2446 char *opcode_low_byteP;
2447 /* length (bytes) meant by vop_short. */
2448 int length;
2449 /* 0, or 1 if '@' is in addressing mode. */
2450 int at;
2451 /* From vop_nbytes: vax_operand_width (in bytes) */
2452 int nbytes;
2453 FLONUM_TYPE *floatP;
2454 LITTLENUM_TYPE literal_float[8];
2455 /* Big enough for any floating point literal. */
2457 vip (&v, instruction_string);
2459 /* Now we try to find as many as_warn()s as we can. If we do any as_warn()s
2460 then goofed=1. Notice that we don't make any frags yet.
2461 Should goofed be 1, then this instruction will wedge in any pass,
2462 and we can safely flush it, without causing interpass symbol phase
2463 errors. That is, without changing label values in different passes. */
2464 if ((goofed = (*v.vit_error)) != 0)
2466 as_fatal (_("Ignoring statement due to \"%s\""), v.vit_error);
2468 /* We need to use expression() and friends, which require us to diddle
2469 input_line_pointer. So we save it and restore it later. */
2470 save_input_line_pointer = input_line_pointer;
2471 for (operandP = v.vit_operand,
2472 expP = exp_of_operand,
2473 segP = seg_of_operand,
2474 floatP = float_operand,
2475 end_operandP = v.vit_operand + v.vit_operands;
2477 operandP < end_operandP;
2479 operandP++, expP++, segP++, floatP++)
2481 if (operandP->vop_error)
2483 as_fatal (_("Aborting because statement has \"%s\""), operandP->vop_error);
2484 goofed = 1;
2486 else
2488 /* Statement has no syntax goofs: let's sniff the expression. */
2489 int can_be_short = 0; /* 1 if a bignum can be reduced to a short literal. */
2491 input_line_pointer = operandP->vop_expr_begin;
2492 c_save = operandP->vop_expr_end[1];
2493 operandP->vop_expr_end[1] = '\0';
2494 /* If to_seg == SEG_PASS1, expression() will have set need_pass_2 = 1. */
2495 *segP = expression (expP);
2496 switch (expP->X_op)
2498 case O_absent:
2499 /* for BSD4.2 compatibility, missing expression is absolute 0 */
2500 expP->X_op = O_constant;
2501 expP->X_add_number = 0;
2502 /* For SEG_ABSOLUTE, we shouldn't need to set X_op_symbol,
2503 X_add_symbol to any particular value. But, we will program
2504 defensively. Since this situation occurs rarely so it costs
2505 us little to do, and stops Dean worrying about the origin of
2506 random bits in expressionS's. */
2507 expP->X_add_symbol = NULL;
2508 expP->X_op_symbol = NULL;
2509 break;
2511 case O_symbol:
2512 case O_constant:
2513 break;
2515 default:
2516 /* Major bug. We can't handle the case of a
2517 SEG_OP expression in a VIT_OPCODE_SYNTHETIC
2518 variable-length instruction.
2519 We don't have a frag type that is smart enough to
2520 relax a SEG_OP, and so we just force all
2521 SEG_OPs to behave like SEG_PASS1s.
2522 Clearly, if there is a demand we can invent a new or
2523 modified frag type and then coding up a frag for this
2524 case will be easy. SEG_OP was invented for the
2525 .words after a CASE opcode, and was never intended for
2526 instruction operands. */
2527 need_pass_2 = 1;
2528 as_fatal (_("Can't relocate expression"));
2529 break;
2531 case O_big:
2532 /* Preserve the bits. */
2533 if (expP->X_add_number > 0)
2535 bignum_copy (generic_bignum, expP->X_add_number,
2536 floatP->low, SIZE_OF_LARGE_NUMBER);
2538 else
2540 know (expP->X_add_number < 0);
2541 flonum_copy (&generic_floating_point_number,
2542 floatP);
2543 if (strchr ("s i", operandP->vop_short))
2545 /* Could possibly become S^# */
2546 flonum_gen2vax (-expP->X_add_number, floatP, literal_float);
2547 switch (-expP->X_add_number)
2549 case 'f':
2550 can_be_short =
2551 (literal_float[0] & 0xFC0F) == 0x4000
2552 && literal_float[1] == 0;
2553 break;
2555 case 'd':
2556 can_be_short =
2557 (literal_float[0] & 0xFC0F) == 0x4000
2558 && literal_float[1] == 0
2559 && literal_float[2] == 0
2560 && literal_float[3] == 0;
2561 break;
2563 case 'g':
2564 can_be_short =
2565 (literal_float[0] & 0xFF81) == 0x4000
2566 && literal_float[1] == 0
2567 && literal_float[2] == 0
2568 && literal_float[3] == 0;
2569 break;
2571 case 'h':
2572 can_be_short = ((literal_float[0] & 0xFFF8) == 0x4000
2573 && (literal_float[1] & 0xE000) == 0
2574 && literal_float[2] == 0
2575 && literal_float[3] == 0
2576 && literal_float[4] == 0
2577 && literal_float[5] == 0
2578 && literal_float[6] == 0
2579 && literal_float[7] == 0);
2580 break;
2582 default:
2583 BAD_CASE (-expP->X_add_number);
2584 break;
2589 if (operandP->vop_short == 's'
2590 || operandP->vop_short == 'i'
2591 || (operandP->vop_short == ' '
2592 && operandP->vop_reg == 0xF
2593 && (operandP->vop_mode & 0xE) == 0x8))
2595 /* Saw a '#'. */
2596 if (operandP->vop_short == ' ')
2598 /* We must chose S^ or I^. */
2599 if (expP->X_add_number > 0)
2601 /* Bignum: Short literal impossible. */
2602 operandP->vop_short = 'i';
2603 operandP->vop_mode = 8;
2604 operandP->vop_reg = 0xF; /* VAX PC. */
2606 else
2608 /* Flonum: Try to do it. */
2609 if (can_be_short)
2611 operandP->vop_short = 's';
2612 operandP->vop_mode = 0;
2613 operandP->vop_ndx = -1;
2614 operandP->vop_reg = -1;
2615 expP->X_op = O_constant;
2617 else
2619 operandP->vop_short = 'i';
2620 operandP->vop_mode = 8;
2621 operandP->vop_reg = 0xF; /* VAX PC */
2623 } /* bignum or flonum ? */
2624 } /* if #, but no S^ or I^ seen. */
2625 /* No more ' ' case: either 's' or 'i'. */
2626 if (operandP->vop_short == 's')
2628 /* Wants to be a short literal. */
2629 if (expP->X_add_number > 0)
2631 as_warn (_("Bignum not permitted in short literal. Immediate mode assumed."));
2632 operandP->vop_short = 'i';
2633 operandP->vop_mode = 8;
2634 operandP->vop_reg = 0xF; /* VAX PC. */
2636 else
2638 if (!can_be_short)
2640 as_warn (_("Can't do flonum short literal: immediate mode used."));
2641 operandP->vop_short = 'i';
2642 operandP->vop_mode = 8;
2643 operandP->vop_reg = 0xF; /* VAX PC. */
2645 else
2647 /* Encode short literal now. */
2648 int temp = 0;
2650 switch (-expP->X_add_number)
2652 case 'f':
2653 case 'd':
2654 temp = literal_float[0] >> 4;
2655 break;
2657 case 'g':
2658 temp = literal_float[0] >> 1;
2659 break;
2661 case 'h':
2662 temp = ((literal_float[0] << 3) & 070)
2663 | ((literal_float[1] >> 13) & 07);
2664 break;
2666 default:
2667 BAD_CASE (-expP->X_add_number);
2668 break;
2671 floatP->low[0] = temp & 077;
2672 floatP->low[1] = 0;
2676 else
2678 /* I^# seen: set it up if float. */
2679 if (expP->X_add_number < 0)
2681 memcpy (floatP->low, literal_float, sizeof (literal_float));
2683 } /* if S^# seen. */
2685 else
2687 as_warn (_("A bignum/flonum may not be a displacement: 0x%"
2688 PRIx64 " used"),
2689 (uint64_t) (expP->X_add_number = 0x80000000L));
2690 /* Chosen so luser gets the most offset bits to patch later. */
2692 expP->X_add_number = floatP->low[0]
2693 | ((LITTLENUM_MASK & (floatP->low[1])) << LITTLENUM_NUMBER_OF_BITS);
2695 /* For the O_big case we have:
2696 If vop_short == 's' then a short floating literal is in the
2697 lowest 6 bits of floatP -> low [0], which is
2698 big_operand_bits [---] [0].
2699 If vop_short == 'i' then the appropriate number of elements
2700 of big_operand_bits [---] [...] are set up with the correct
2701 bits.
2702 Also, just in case width is byte word or long, we copy the lowest
2703 32 bits of the number to X_add_number. */
2704 break;
2706 if (input_line_pointer != operandP->vop_expr_end + 1)
2708 as_fatal ("Junk at end of expression \"%s\"", input_line_pointer);
2709 goofed = 1;
2711 operandP->vop_expr_end[1] = c_save;
2715 input_line_pointer = save_input_line_pointer;
2717 if (need_pass_2 || goofed)
2718 return;
2720 dwarf2_emit_insn (0);
2721 /* Emit op-code. */
2722 /* Remember where it is, in case we want to modify the op-code later. */
2723 opcode_low_byteP = frag_more (v.vit_opcode_nbytes);
2724 memcpy (opcode_low_byteP, v.vit_opcode, v.vit_opcode_nbytes);
2725 opcode_as_chars = v.vit_opcode;
2726 opcode_as_number = md_chars_to_number ((unsigned char *) opcode_as_chars, 4);
2727 for (operandP = v.vit_operand,
2728 expP = exp_of_operand,
2729 segP = seg_of_operand,
2730 floatP = float_operand,
2731 end_operandP = v.vit_operand + v.vit_operands;
2733 operandP < end_operandP;
2735 operandP++,
2736 floatP++,
2737 segP++,
2738 expP++)
2740 if (operandP->vop_ndx >= 0)
2742 /* Indexed addressing byte. */
2743 /* Legality of indexed mode already checked: it is OK. */
2744 FRAG_APPEND_1_CHAR (0x40 + operandP->vop_ndx);
2745 } /* if(vop_ndx>=0) */
2747 /* Here to make main operand frag(s). */
2748 this_add_number = expP->X_add_number;
2749 this_add_symbol = expP->X_add_symbol;
2750 to_seg = *segP;
2751 is_undefined = (to_seg == undefined_section);
2752 is_absolute = (to_seg == absolute_section);
2753 at = operandP->vop_mode & 1;
2754 length = (operandP->vop_short == 'b'
2755 ? 1 : (operandP->vop_short == 'w'
2756 ? 2 : (operandP->vop_short == 'l'
2757 ? 4 : 0)));
2758 nbytes = operandP->vop_nbytes;
2759 if (operandP->vop_access == 'b')
2761 if (to_seg == now_seg || is_undefined)
2763 /* If is_undefined, then it might BECOME now_seg. */
2764 if (nbytes)
2766 p = frag_more (nbytes);
2767 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2768 this_add_symbol, this_add_number, 1, NO_RELOC);
2770 else
2772 /* to_seg==now_seg || to_seg == SEG_UNKNOWN */
2773 /* nbytes==0 */
2774 length_code = is_undefined ? STATE_UNDF : STATE_BYTE;
2775 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2777 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2779 /* br or jsb */
2780 frag_var (rs_machine_dependent, 5, 1,
2781 ENCODE_RELAX (STATE_ALWAYS_BRANCH, length_code),
2782 this_add_symbol, this_add_number,
2783 opcode_low_byteP);
2785 else
2787 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2789 length_code = STATE_WORD;
2790 /* JF: There is no state_byte for this one! */
2791 frag_var (rs_machine_dependent, 10, 2,
2792 ENCODE_RELAX (STATE_COMPLEX_BRANCH, length_code),
2793 this_add_symbol, this_add_number,
2794 opcode_low_byteP);
2796 else
2798 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2799 frag_var (rs_machine_dependent, 9, 1,
2800 ENCODE_RELAX (STATE_COMPLEX_HOP, length_code),
2801 this_add_symbol, this_add_number,
2802 opcode_low_byteP);
2806 else
2808 know (operandP->vop_width == VAX_WIDTH_CONDITIONAL_JUMP);
2809 frag_var (rs_machine_dependent, 7, 1,
2810 ENCODE_RELAX (STATE_CONDITIONAL_BRANCH, length_code),
2811 this_add_symbol, this_add_number,
2812 opcode_low_byteP);
2816 else
2818 /* to_seg != now_seg && to_seg != SEG_UNKNOWN */
2819 /* --- SEG FLOAT MAY APPEAR HERE --- */
2820 if (is_absolute)
2822 if (nbytes)
2824 know (!(opcode_as_number & VIT_OPCODE_SYNTHETIC));
2825 p = frag_more (nbytes);
2826 /* Conventional relocation. */
2827 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2828 section_symbol (absolute_section),
2829 this_add_number, 1, NO_RELOC);
2831 else
2833 know (opcode_as_number & VIT_OPCODE_SYNTHETIC);
2834 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2836 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2838 /* br or jsb */
2839 *opcode_low_byteP = opcode_as_chars[0] + VAX_WIDEN_LONG;
2840 know (opcode_as_chars[1] == 0);
2841 p = frag_more (5);
2842 p[0] = VAX_ABSOLUTE_MODE; /* @#... */
2843 md_number_to_chars (p + 1, this_add_number, 4);
2844 /* Now (eg) JMP @#foo or JSB @#foo. */
2846 else
2848 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2850 p = frag_more (10);
2851 p[0] = 2;
2852 p[1] = 0;
2853 p[2] = VAX_BRB;
2854 p[3] = 6;
2855 p[4] = VAX_JMP;
2856 p[5] = VAX_ABSOLUTE_MODE; /* @#... */
2857 md_number_to_chars (p + 6, this_add_number, 4);
2858 /* Now (eg) ACBx 1f
2859 BRB 2f
2860 1: JMP @#foo
2861 2: */
2863 else
2865 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2866 p = frag_more (9);
2867 p[0] = 2;
2868 p[1] = VAX_BRB;
2869 p[2] = 6;
2870 p[3] = VAX_JMP;
2871 p[4] = VAX_ABSOLUTE_MODE; /* @#... */
2872 md_number_to_chars (p + 5, this_add_number, 4);
2873 /* Now (eg) xOBxxx 1f
2874 BRB 2f
2875 1: JMP @#foo
2876 2: */
2880 else
2882 /* b<cond> */
2883 *opcode_low_byteP ^= 1;
2884 /* To reverse the condition in a VAX branch,
2885 complement the lowest order bit. */
2886 p = frag_more (7);
2887 p[0] = 6;
2888 p[1] = VAX_JMP;
2889 p[2] = VAX_ABSOLUTE_MODE; /* @#... */
2890 md_number_to_chars (p + 3, this_add_number, 4);
2891 /* Now (eg) BLEQ 1f
2892 JMP @#foo
2893 1: */
2897 else
2899 /* to_seg != now_seg && !is_undefinfed && !is_absolute */
2900 if (nbytes > 0)
2902 /* Pc-relative. Conventional relocation. */
2903 know (!(opcode_as_number & VIT_OPCODE_SYNTHETIC));
2904 p = frag_more (nbytes);
2905 fix_new (frag_now, p - frag_now->fr_literal, nbytes,
2906 section_symbol (absolute_section),
2907 this_add_number, 1, NO_RELOC);
2909 else
2911 know (opcode_as_number & VIT_OPCODE_SYNTHETIC);
2912 if (opcode_as_number & VIT_OPCODE_SPECIAL)
2914 if (operandP->vop_width == VAX_WIDTH_UNCONDITIONAL_JUMP)
2916 /* br or jsb */
2917 know (opcode_as_chars[1] == 0);
2918 *opcode_low_byteP = opcode_as_chars[0] + VAX_WIDEN_LONG;
2919 p = frag_more (5);
2920 p[0] = VAX_PC_RELATIVE_MODE;
2921 fix_new (frag_now,
2922 p + 1 - frag_now->fr_literal, 4,
2923 this_add_symbol,
2924 this_add_number, 1, NO_RELOC);
2925 /* Now eg JMP foo or JSB foo. */
2927 else
2929 if (operandP->vop_width == VAX_WIDTH_WORD_JUMP)
2931 p = frag_more (10);
2932 p[0] = 0;
2933 p[1] = 2;
2934 p[2] = VAX_BRB;
2935 p[3] = 6;
2936 p[4] = VAX_JMP;
2937 p[5] = VAX_PC_RELATIVE_MODE;
2938 fix_new (frag_now,
2939 p + 6 - frag_now->fr_literal, 4,
2940 this_add_symbol,
2941 this_add_number, 1, NO_RELOC);
2942 /* Now (eg) ACBx 1f
2943 BRB 2f
2944 1: JMP foo
2945 2: */
2947 else
2949 know (operandP->vop_width == VAX_WIDTH_BYTE_JUMP);
2950 p = frag_more (10);
2951 p[0] = 2;
2952 p[1] = VAX_BRB;
2953 p[2] = 6;
2954 p[3] = VAX_JMP;
2955 p[4] = VAX_PC_RELATIVE_MODE;
2956 fix_new (frag_now,
2957 p + 5 - frag_now->fr_literal,
2958 4, this_add_symbol,
2959 this_add_number, 1, NO_RELOC);
2960 /* Now (eg) xOBxxx 1f
2961 BRB 2f
2962 1: JMP foo
2963 2: */
2967 else
2969 know (operandP->vop_width == VAX_WIDTH_CONDITIONAL_JUMP);
2970 *opcode_low_byteP ^= 1; /* Reverse branch condition. */
2971 p = frag_more (7);
2972 p[0] = 6;
2973 p[1] = VAX_JMP;
2974 p[2] = VAX_PC_RELATIVE_MODE;
2975 fix_new (frag_now, p + 3 - frag_now->fr_literal,
2976 4, this_add_symbol,
2977 this_add_number, 1, NO_RELOC);
2983 else
2985 /* So it is ordinary operand. */
2986 know (operandP->vop_access != 'b');
2987 /* ' ' target-independent: elsewhere. */
2988 know (operandP->vop_access != ' ');
2989 know (operandP->vop_access == 'a'
2990 || operandP->vop_access == 'm'
2991 || operandP->vop_access == 'r'
2992 || operandP->vop_access == 'v'
2993 || operandP->vop_access == 'w');
2994 if (operandP->vop_short == 's')
2996 if (is_absolute)
2998 if (this_add_number >= 64)
3000 as_warn (_("Short literal overflow(%ld.), immediate mode assumed."),
3001 (long) this_add_number);
3002 operandP->vop_short = 'i';
3003 operandP->vop_mode = 8;
3004 operandP->vop_reg = 0xF;
3007 else
3009 as_warn (_("Forced short literal to immediate mode. now_seg=%s to_seg=%s"),
3010 segment_name (now_seg), segment_name (to_seg));
3011 operandP->vop_short = 'i';
3012 operandP->vop_mode = 8;
3013 operandP->vop_reg = 0xF;
3016 if (operandP->vop_reg >= 0 && (operandP->vop_mode < 8
3017 || (operandP->vop_reg != 0xF && operandP->vop_mode < 10)))
3019 /* One byte operand. */
3020 know (operandP->vop_mode > 3);
3021 FRAG_APPEND_1_CHAR (operandP->vop_mode << 4 | operandP->vop_reg);
3022 /* All 1-bytes except S^# happen here. */
3024 else
3026 /* {@}{q^}foo{(Rn)} or S^#foo */
3027 if (operandP->vop_reg == -1 && operandP->vop_short != 's')
3029 /* "{@}{q^}foo" */
3030 if (to_seg == now_seg)
3032 if (length == 0)
3034 know (operandP->vop_short == ' ');
3035 length_code = STATE_BYTE;
3036 #ifdef OBJ_ELF
3037 if (S_IS_EXTERNAL (this_add_symbol)
3038 || S_IS_WEAK (this_add_symbol))
3039 length_code = STATE_UNDF;
3040 #endif
3041 p = frag_var (rs_machine_dependent, 10, 2,
3042 ENCODE_RELAX (STATE_PC_RELATIVE, length_code),
3043 this_add_symbol, this_add_number,
3044 opcode_low_byteP);
3045 know (operandP->vop_mode == 10 + at);
3046 *p = at << 4;
3047 /* At is the only context we need to carry
3048 to other side of relax() process. Must
3049 be in the correct bit position of VAX
3050 operand spec. byte. */
3052 else
3054 know (length);
3055 know (operandP->vop_short != ' ');
3056 p = frag_more (length + 1);
3057 p[0] = 0xF | ((at + "?\12\14?\16"[length]) << 4);
3058 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3059 length, this_add_symbol,
3060 this_add_number, 1, NO_RELOC);
3063 else
3065 /* to_seg != now_seg */
3066 if (this_add_symbol == NULL)
3068 know (is_absolute);
3069 /* Do @#foo: simpler relocation than foo-.(pc) anyway. */
3070 p = frag_more (5);
3071 p[0] = VAX_ABSOLUTE_MODE; /* @#... */
3072 md_number_to_chars (p + 1, this_add_number, 4);
3073 if (length && length != 4)
3074 as_warn (_("Length specification ignored. Address mode 9F used"));
3076 else
3078 /* {@}{q^}other_seg */
3079 know ((length == 0 && operandP->vop_short == ' ')
3080 || (length > 0 && operandP->vop_short != ' '));
3081 if (is_undefined
3082 #ifdef OBJ_ELF
3083 || S_IS_WEAK(this_add_symbol)
3084 || S_IS_EXTERNAL(this_add_symbol)
3085 #endif
3088 switch (length)
3090 default: length_code = STATE_UNDF; break;
3091 case 1: length_code = STATE_BYTE; break;
3092 case 2: length_code = STATE_WORD; break;
3093 case 4: length_code = STATE_LONG; break;
3095 /* We have a SEG_UNKNOWN symbol. It might
3096 turn out to be in the same segment as
3097 the instruction, permitting relaxation. */
3098 p = frag_var (rs_machine_dependent, 5, 2,
3099 ENCODE_RELAX (STATE_PC_RELATIVE, length_code),
3100 this_add_symbol, this_add_number,
3101 opcode_low_byteP);
3102 p[0] = at << 4;
3104 else
3106 if (length == 0)
3108 know (operandP->vop_short == ' ');
3109 length = 4; /* Longest possible. */
3111 p = frag_more (length + 1);
3112 p[0] = 0xF | ((at + "?\12\14?\16"[length]) << 4);
3113 md_number_to_chars (p + 1, this_add_number, length);
3114 fix_new (frag_now,
3115 p + 1 - frag_now->fr_literal,
3116 length, this_add_symbol,
3117 this_add_number, 1, NO_RELOC);
3122 else
3124 /* {@}{q^}foo(Rn) or S^# or I^# or # */
3125 if (operandP->vop_mode < 0xA)
3127 /* # or S^# or I^# */
3128 if (operandP->vop_access == 'v'
3129 || operandP->vop_access == 'a')
3131 if (operandP->vop_access == 'v')
3132 as_warn (_("Invalid operand: immediate value used as base address."));
3133 else
3134 as_warn (_("Invalid operand: immediate value used as address."));
3135 /* gcc 2.6.3 is known to generate these in at least
3136 one case. */
3138 if (length == 0
3139 && is_absolute && (expP->X_op != O_big)
3140 && operandP->vop_mode == 8 /* No '@'. */
3141 && this_add_number < 64)
3143 operandP->vop_short = 's';
3145 if (operandP->vop_short == 's')
3147 FRAG_APPEND_1_CHAR (this_add_number);
3149 else
3151 /* I^#... */
3152 know (nbytes);
3153 p = frag_more (nbytes + 1);
3154 know (operandP->vop_reg == 0xF);
3155 #ifdef OBJ_ELF
3156 if (flag_want_pic && operandP->vop_mode == 8
3157 && this_add_symbol != NULL)
3159 as_warn (_("Symbol %s used as immediate operand in PIC mode."),
3160 S_GET_NAME (this_add_symbol));
3162 #endif
3163 p[0] = (operandP->vop_mode << 4) | 0xF;
3164 if ((is_absolute) && (expP->X_op != O_big))
3166 /* If nbytes > 4, then we are scrod. We
3167 don't know if the high order bytes
3168 are to be 0xFF or 0x00. BSD4.2 & RMS
3169 say use 0x00. OK --- but this
3170 assembler needs ANOTHER rewrite to
3171 cope properly with this bug. */
3172 md_number_to_chars (p + 1, this_add_number,
3173 min (sizeof (valueT),
3174 (size_t) nbytes));
3175 if ((size_t) nbytes > sizeof (valueT))
3176 memset (p + 1 + sizeof (valueT),
3177 '\0', nbytes - sizeof (valueT));
3179 else
3181 if (expP->X_op == O_big)
3183 /* Problem here is to get the bytes
3184 in the right order. We stored
3185 our constant as LITTLENUMs, not
3186 bytes. */
3187 LITTLENUM_TYPE *lP;
3189 lP = floatP->low;
3190 if (nbytes & 1)
3192 know (nbytes == 1);
3193 p[1] = *lP;
3195 else
3197 for (p++; nbytes; nbytes -= 2, p += 2, lP++)
3198 md_number_to_chars (p, *lP, 2);
3201 else
3203 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3204 nbytes, this_add_symbol,
3205 this_add_number, 0, NO_RELOC);
3210 else
3212 /* {@}{q^}foo(Rn) */
3213 know ((length == 0 && operandP->vop_short == ' ')
3214 || (length > 0 && operandP->vop_short != ' '));
3215 if (length == 0)
3217 if (is_absolute)
3219 long test;
3221 test = this_add_number;
3223 if (test < 0)
3224 test = ~test;
3226 length = test & 0xffff8000 ? 4
3227 : test & 0xffffff80 ? 2
3228 : 1;
3230 else
3232 length = 4;
3235 p = frag_more (1 + length);
3236 know (operandP->vop_reg >= 0);
3237 p[0] = operandP->vop_reg
3238 | ((at | "?\12\14?\16"[length]) << 4);
3239 if (is_absolute)
3241 md_number_to_chars (p + 1, this_add_number, length);
3243 else
3245 fix_new (frag_now, p + 1 - frag_now->fr_literal,
3246 length, this_add_symbol,
3247 this_add_number, 0, NO_RELOC);
3256 void
3257 md_begin (void)
3259 FLONUM_TYPE *fP;
3260 int i;
3262 vip_begin (1, "$", "*", "`");
3264 for (i = 0, fP = float_operand;
3265 fP < float_operand + VIT_MAX_OPERANDS;
3266 i++, fP++)
3268 fP->low = &big_operand_bits[i][0];
3269 fP->high = &big_operand_bits[i][SIZE_OF_LARGE_NUMBER - 1];
3273 bfd_reloc_code_real_type
3274 vax_cons (expressionS *exp, int size)
3276 char *save;
3277 const char *vax_cons_special_reloc;
3279 SKIP_WHITESPACE ();
3280 vax_cons_special_reloc = NULL;
3281 save = input_line_pointer;
3282 if (input_line_pointer[0] == '%')
3284 if (startswith (input_line_pointer + 1, "pcrel"))
3286 input_line_pointer += 6;
3287 vax_cons_special_reloc = "pcrel";
3289 if (vax_cons_special_reloc)
3291 int bad = 0;
3293 switch (size)
3295 case 1:
3296 if (*input_line_pointer != '8')
3297 bad = 1;
3298 input_line_pointer--;
3299 break;
3300 case 2:
3301 if (input_line_pointer[0] != '1' || input_line_pointer[1] != '6')
3302 bad = 1;
3303 break;
3304 case 4:
3305 if (input_line_pointer[0] != '3' || input_line_pointer[1] != '2')
3306 bad = 1;
3307 break;
3308 default:
3309 bad = 1;
3310 break;
3313 if (bad)
3315 as_bad (_("Illegal operands: Only %%r_%s%d allowed in %d-byte data fields"),
3316 vax_cons_special_reloc, size * 8, size);
3318 else
3320 input_line_pointer += 2;
3321 if (*input_line_pointer != '(')
3323 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3324 vax_cons_special_reloc, size * 8);
3325 bad = 1;
3329 if (bad)
3331 input_line_pointer = save;
3332 vax_cons_special_reloc = NULL;
3334 else
3336 int c;
3337 char *end = ++input_line_pointer;
3338 int npar = 0;
3340 while (! is_end_of_line[(c = *end)])
3342 if (c == '(')
3343 npar++;
3344 else if (c == ')')
3346 if (!npar)
3347 break;
3348 npar--;
3350 end++;
3353 if (c != ')')
3354 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3355 vax_cons_special_reloc, size * 8);
3356 else
3358 *end = '\0';
3359 expression (exp);
3360 *end = c;
3361 if (input_line_pointer != end)
3363 as_bad (_("Illegal operands: %%r_%s%d requires arguments in ()"),
3364 vax_cons_special_reloc, size * 8);
3366 else
3368 input_line_pointer++;
3369 SKIP_WHITESPACE ();
3370 c = *input_line_pointer;
3371 if (! is_end_of_line[c] && c != ',')
3372 as_bad (_("Illegal operands: garbage after %%r_%s%d()"),
3373 vax_cons_special_reloc, size * 8);
3379 if (vax_cons_special_reloc == NULL)
3380 expression (exp);
3381 else
3382 switch (size)
3384 case 1: return BFD_RELOC_8_PCREL;
3385 case 2: return BFD_RELOC_16_PCREL;
3386 case 4: return BFD_RELOC_32_PCREL;
3388 return NO_RELOC;
3391 /* This is called by emit_expr via TC_CONS_FIX_NEW when creating a
3392 reloc for a cons. */
3394 void
3395 vax_cons_fix_new (fragS *frag, int where, unsigned int nbytes, expressionS *exp,
3396 bfd_reloc_code_real_type r)
3398 if (r == NO_RELOC)
3399 r = (nbytes == 1 ? BFD_RELOC_8
3400 : nbytes == 2 ? BFD_RELOC_16
3401 : BFD_RELOC_32);
3403 fix_new_exp (frag, where, (int) nbytes, exp, 0, r);
3406 const char *
3407 md_atof (int type, char * litP, int * sizeP)
3409 return vax_md_atof (type, litP, sizeP);