gas/
[binutils.git] / gas / config / tc-i386.c
blob514ff4bff8d8d79957c47753af78f94bba9eb299
1 /* i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005
4 Free Software Foundation, Inc.
6 This file is part of GAS, the GNU Assembler.
8 GAS is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
13 GAS is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GAS; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 /* Intel 80386 machine specific gas.
24 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
25 x86_64 support by Jan Hubicka (jh@suse.cz)
26 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
27 Bugs & suggestions are completely welcome. This is free software.
28 Please help us make it better. */
30 #include "as.h"
31 #include "safe-ctype.h"
32 #include "subsegs.h"
33 #include "dwarf2dbg.h"
34 #include "dw2gencfi.h"
35 #include "opcode/i386.h"
36 #include "elf/x86-64.h"
38 #ifndef REGISTER_WARNINGS
39 #define REGISTER_WARNINGS 1
40 #endif
42 #ifndef INFER_ADDR_PREFIX
43 #define INFER_ADDR_PREFIX 1
44 #endif
46 #ifndef SCALE1_WHEN_NO_INDEX
47 /* Specifying a scale factor besides 1 when there is no index is
48 futile. eg. `mov (%ebx,2),%al' does exactly the same as
49 `mov (%ebx),%al'. To slavishly follow what the programmer
50 specified, set SCALE1_WHEN_NO_INDEX to 0. */
51 #define SCALE1_WHEN_NO_INDEX 1
52 #endif
54 #ifndef DEFAULT_ARCH
55 #define DEFAULT_ARCH "i386"
56 #endif
58 #ifndef INLINE
59 #if __GNUC__ >= 2
60 #define INLINE __inline__
61 #else
62 #define INLINE
63 #endif
64 #endif
66 static INLINE unsigned int mode_from_disp_size PARAMS ((unsigned int));
67 static INLINE int fits_in_signed_byte PARAMS ((offsetT));
68 static INLINE int fits_in_unsigned_byte PARAMS ((offsetT));
69 static INLINE int fits_in_unsigned_word PARAMS ((offsetT));
70 static INLINE int fits_in_signed_word PARAMS ((offsetT));
71 static INLINE int fits_in_unsigned_long PARAMS ((offsetT));
72 static INLINE int fits_in_signed_long PARAMS ((offsetT));
73 static int smallest_imm_type PARAMS ((offsetT));
74 static offsetT offset_in_range PARAMS ((offsetT, int));
75 static int add_prefix PARAMS ((unsigned int));
76 static void set_code_flag PARAMS ((int));
77 static void set_16bit_gcc_code_flag PARAMS ((int));
78 static void set_intel_syntax PARAMS ((int));
79 static void set_cpu_arch PARAMS ((int));
80 #ifdef TE_PE
81 static void pe_directive_secrel PARAMS ((int));
82 #endif
83 static char *output_invalid PARAMS ((int c));
84 static int i386_operand PARAMS ((char *operand_string));
85 static int i386_intel_operand PARAMS ((char *operand_string, int got_a_float));
86 static const reg_entry *parse_register PARAMS ((char *reg_string,
87 char **end_op));
88 static char *parse_insn PARAMS ((char *, char *));
89 static char *parse_operands PARAMS ((char *, const char *));
90 static void swap_operands PARAMS ((void));
91 static void optimize_imm PARAMS ((void));
92 static void optimize_disp PARAMS ((void));
93 static int match_template PARAMS ((void));
94 static int check_string PARAMS ((void));
95 static int process_suffix PARAMS ((void));
96 static int check_byte_reg PARAMS ((void));
97 static int check_long_reg PARAMS ((void));
98 static int check_qword_reg PARAMS ((void));
99 static int check_word_reg PARAMS ((void));
100 static int finalize_imm PARAMS ((void));
101 static int process_operands PARAMS ((void));
102 static const seg_entry *build_modrm_byte PARAMS ((void));
103 static void output_insn PARAMS ((void));
104 static void output_branch PARAMS ((void));
105 static void output_jump PARAMS ((void));
106 static void output_interseg_jump PARAMS ((void));
107 static void output_imm PARAMS ((fragS *insn_start_frag,
108 offsetT insn_start_off));
109 static void output_disp PARAMS ((fragS *insn_start_frag,
110 offsetT insn_start_off));
111 #ifndef I386COFF
112 static void s_bss PARAMS ((int));
113 #endif
115 static const char *default_arch = DEFAULT_ARCH;
117 /* 'md_assemble ()' gathers together information and puts it into a
118 i386_insn. */
120 union i386_op
122 expressionS *disps;
123 expressionS *imms;
124 const reg_entry *regs;
127 struct _i386_insn
129 /* TM holds the template for the insn were currently assembling. */
130 template tm;
132 /* SUFFIX holds the instruction mnemonic suffix if given.
133 (e.g. 'l' for 'movl') */
134 char suffix;
136 /* OPERANDS gives the number of given operands. */
137 unsigned int operands;
139 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
140 of given register, displacement, memory operands and immediate
141 operands. */
142 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
144 /* TYPES [i] is the type (see above #defines) which tells us how to
145 use OP[i] for the corresponding operand. */
146 unsigned int types[MAX_OPERANDS];
148 /* Displacement expression, immediate expression, or register for each
149 operand. */
150 union i386_op op[MAX_OPERANDS];
152 /* Flags for operands. */
153 unsigned int flags[MAX_OPERANDS];
154 #define Operand_PCrel 1
156 /* Relocation type for operand */
157 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
159 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
160 the base index byte below. */
161 const reg_entry *base_reg;
162 const reg_entry *index_reg;
163 unsigned int log2_scale_factor;
165 /* SEG gives the seg_entries of this insn. They are zero unless
166 explicit segment overrides are given. */
167 const seg_entry *seg[2];
169 /* PREFIX holds all the given prefix opcodes (usually null).
170 PREFIXES is the number of prefix opcodes. */
171 unsigned int prefixes;
172 unsigned char prefix[MAX_PREFIXES];
174 /* RM and SIB are the modrm byte and the sib byte where the
175 addressing modes of this insn are encoded. */
177 modrm_byte rm;
178 rex_byte rex;
179 sib_byte sib;
182 typedef struct _i386_insn i386_insn;
184 /* List of chars besides those in app.c:symbol_chars that can start an
185 operand. Used to prevent the scrubber eating vital white-space. */
186 const char extra_symbol_chars[] = "*%-(["
187 #ifdef LEX_AT
189 #endif
190 #ifdef LEX_QM
192 #endif
195 #if (defined (TE_I386AIX) \
196 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
197 && !defined (TE_LINUX) \
198 && !defined (TE_NETWARE) \
199 && !defined (TE_FreeBSD) \
200 && !defined (TE_NetBSD)))
201 /* This array holds the chars that always start a comment. If the
202 pre-processor is disabled, these aren't very useful. */
203 const char comment_chars[] = "#/";
204 #define PREFIX_SEPARATOR '\\'
206 /* This array holds the chars that only start a comment at the beginning of
207 a line. If the line seems to have the form '# 123 filename'
208 .line and .file directives will appear in the pre-processed output.
209 Note that input_file.c hand checks for '#' at the beginning of the
210 first line of the input file. This is because the compiler outputs
211 #NO_APP at the beginning of its output.
212 Also note that comments started like this one will always work if
213 '/' isn't otherwise defined. */
214 const char line_comment_chars[] = "#";
216 #else
217 /* Putting '/' here makes it impossible to use the divide operator.
218 However, we need it for compatibility with SVR4 systems. */
219 const char comment_chars[] = "#";
220 #define PREFIX_SEPARATOR '/'
222 const char line_comment_chars[] = "/#";
223 #endif
225 const char line_separator_chars[] = ";";
227 /* Chars that can be used to separate mant from exp in floating point
228 nums. */
229 const char EXP_CHARS[] = "eE";
231 /* Chars that mean this number is a floating point constant
232 As in 0f12.456
233 or 0d1.2345e12. */
234 const char FLT_CHARS[] = "fFdDxX";
236 /* Tables for lexical analysis. */
237 static char mnemonic_chars[256];
238 static char register_chars[256];
239 static char operand_chars[256];
240 static char identifier_chars[256];
241 static char digit_chars[256];
243 /* Lexical macros. */
244 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
245 #define is_operand_char(x) (operand_chars[(unsigned char) x])
246 #define is_register_char(x) (register_chars[(unsigned char) x])
247 #define is_space_char(x) ((x) == ' ')
248 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
249 #define is_digit_char(x) (digit_chars[(unsigned char) x])
251 /* All non-digit non-letter characters that may occur in an operand. */
252 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
254 /* md_assemble() always leaves the strings it's passed unaltered. To
255 effect this we maintain a stack of saved characters that we've smashed
256 with '\0's (indicating end of strings for various sub-fields of the
257 assembler instruction). */
258 static char save_stack[32];
259 static char *save_stack_p;
260 #define END_STRING_AND_SAVE(s) \
261 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
262 #define RESTORE_END_STRING(s) \
263 do { *(s) = *--save_stack_p; } while (0)
265 /* The instruction we're assembling. */
266 static i386_insn i;
268 /* Possible templates for current insn. */
269 static const templates *current_templates;
271 /* Per instruction expressionS buffers: 2 displacements & 2 immediate max. */
272 static expressionS disp_expressions[2], im_expressions[2];
274 /* Current operand we are working on. */
275 static int this_operand;
277 /* We support four different modes. FLAG_CODE variable is used to distinguish
278 these. */
280 enum flag_code {
281 CODE_32BIT,
282 CODE_16BIT,
283 CODE_64BIT };
284 #define NUM_FLAG_CODE ((int) CODE_64BIT + 1)
286 static enum flag_code flag_code;
287 static int use_rela_relocations = 0;
289 /* The names used to print error messages. */
290 static const char *flag_code_names[] =
292 "32",
293 "16",
294 "64"
297 /* 1 for intel syntax,
298 0 if att syntax. */
299 static int intel_syntax = 0;
301 /* 1 if register prefix % not required. */
302 static int allow_naked_reg = 0;
304 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
305 leave, push, and pop instructions so that gcc has the same stack
306 frame as in 32 bit mode. */
307 static char stackop_size = '\0';
309 /* Non-zero to optimize code alignment. */
310 int optimize_align_code = 1;
312 /* Non-zero to quieten some warnings. */
313 static int quiet_warnings = 0;
315 /* CPU name. */
316 static const char *cpu_arch_name = NULL;
317 static const char *cpu_sub_arch_name = NULL;
319 /* CPU feature flags. */
320 static unsigned int cpu_arch_flags = CpuUnknownFlags | CpuNo64;
322 /* If set, conditional jumps are not automatically promoted to handle
323 larger than a byte offset. */
324 static unsigned int no_cond_jump_promotion = 0;
326 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
327 static symbolS *GOT_symbol;
329 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
330 unsigned int x86_dwarf2_return_column;
332 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
333 int x86_cie_data_alignment;
335 /* Interface to relax_segment.
336 There are 3 major relax states for 386 jump insns because the
337 different types of jumps add different sizes to frags when we're
338 figuring out what sort of jump to choose to reach a given label. */
340 /* Types. */
341 #define UNCOND_JUMP 0
342 #define COND_JUMP 1
343 #define COND_JUMP86 2
345 /* Sizes. */
346 #define CODE16 1
347 #define SMALL 0
348 #define SMALL16 (SMALL | CODE16)
349 #define BIG 2
350 #define BIG16 (BIG | CODE16)
352 #ifndef INLINE
353 #ifdef __GNUC__
354 #define INLINE __inline__
355 #else
356 #define INLINE
357 #endif
358 #endif
360 #define ENCODE_RELAX_STATE(type, size) \
361 ((relax_substateT) (((type) << 2) | (size)))
362 #define TYPE_FROM_RELAX_STATE(s) \
363 ((s) >> 2)
364 #define DISP_SIZE_FROM_RELAX_STATE(s) \
365 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
367 /* This table is used by relax_frag to promote short jumps to long
368 ones where necessary. SMALL (short) jumps may be promoted to BIG
369 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
370 don't allow a short jump in a 32 bit code segment to be promoted to
371 a 16 bit offset jump because it's slower (requires data size
372 prefix), and doesn't work, unless the destination is in the bottom
373 64k of the code segment (The top 16 bits of eip are zeroed). */
375 const relax_typeS md_relax_table[] =
377 /* The fields are:
378 1) most positive reach of this state,
379 2) most negative reach of this state,
380 3) how many bytes this mode will have in the variable part of the frag
381 4) which index into the table to try if we can't fit into this one. */
383 /* UNCOND_JUMP states. */
384 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
385 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
386 /* dword jmp adds 4 bytes to frag:
387 0 extra opcode bytes, 4 displacement bytes. */
388 {0, 0, 4, 0},
389 /* word jmp adds 2 byte2 to frag:
390 0 extra opcode bytes, 2 displacement bytes. */
391 {0, 0, 2, 0},
393 /* COND_JUMP states. */
394 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
395 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
396 /* dword conditionals adds 5 bytes to frag:
397 1 extra opcode byte, 4 displacement bytes. */
398 {0, 0, 5, 0},
399 /* word conditionals add 3 bytes to frag:
400 1 extra opcode byte, 2 displacement bytes. */
401 {0, 0, 3, 0},
403 /* COND_JUMP86 states. */
404 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
405 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
406 /* dword conditionals adds 5 bytes to frag:
407 1 extra opcode byte, 4 displacement bytes. */
408 {0, 0, 5, 0},
409 /* word conditionals add 4 bytes to frag:
410 1 displacement byte and a 3 byte long branch insn. */
411 {0, 0, 4, 0}
414 static const arch_entry cpu_arch[] = {
415 {"i8086", Cpu086 },
416 {"i186", Cpu086|Cpu186 },
417 {"i286", Cpu086|Cpu186|Cpu286 },
418 {"i386", Cpu086|Cpu186|Cpu286|Cpu386 },
419 {"i486", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486 },
420 {"i586", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
421 {"i686", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
422 {"pentium", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
423 {"pentiumpro",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
424 {"pentiumii", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX },
425 {"pentiumiii",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX|CpuMMX2|CpuSSE },
426 {"pentium4", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
427 {"prescott", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuPNI },
428 {"k6", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX },
429 {"k6_2", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX|Cpu3dnow },
430 {"athlon", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
431 {"sledgehammer",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
432 {"opteron", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
433 {".mmx", CpuMMX },
434 {".sse", CpuMMX|CpuMMX2|CpuSSE },
435 {".sse2", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
436 {".sse3", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuSSE3 },
437 {".3dnow", CpuMMX|Cpu3dnow },
438 {".3dnowa", CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
439 {".padlock", CpuPadLock },
440 {".pacifica", CpuSVME },
441 {".svme", CpuSVME },
442 {NULL, 0 }
445 const pseudo_typeS md_pseudo_table[] =
447 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
448 {"align", s_align_bytes, 0},
449 #else
450 {"align", s_align_ptwo, 0},
451 #endif
452 {"arch", set_cpu_arch, 0},
453 #ifndef I386COFF
454 {"bss", s_bss, 0},
455 #endif
456 {"ffloat", float_cons, 'f'},
457 {"dfloat", float_cons, 'd'},
458 {"tfloat", float_cons, 'x'},
459 {"value", cons, 2},
460 {"noopt", s_ignore, 0},
461 {"optim", s_ignore, 0},
462 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
463 {"code16", set_code_flag, CODE_16BIT},
464 {"code32", set_code_flag, CODE_32BIT},
465 {"code64", set_code_flag, CODE_64BIT},
466 {"intel_syntax", set_intel_syntax, 1},
467 {"att_syntax", set_intel_syntax, 0},
468 {"file", (void (*) PARAMS ((int))) dwarf2_directive_file, 0},
469 {"loc", dwarf2_directive_loc, 0},
470 #ifdef TE_PE
471 {"secrel32", pe_directive_secrel, 0},
472 #endif
473 {0, 0, 0}
476 /* For interface with expression (). */
477 extern char *input_line_pointer;
479 /* Hash table for instruction mnemonic lookup. */
480 static struct hash_control *op_hash;
482 /* Hash table for register lookup. */
483 static struct hash_control *reg_hash;
485 void
486 i386_align_code (fragP, count)
487 fragS *fragP;
488 int count;
490 /* Various efficient no-op patterns for aligning code labels.
491 Note: Don't try to assemble the instructions in the comments.
492 0L and 0w are not legal. */
493 static const char f32_1[] =
494 {0x90}; /* nop */
495 static const char f32_2[] =
496 {0x89,0xf6}; /* movl %esi,%esi */
497 static const char f32_3[] =
498 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
499 static const char f32_4[] =
500 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
501 static const char f32_5[] =
502 {0x90, /* nop */
503 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
504 static const char f32_6[] =
505 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
506 static const char f32_7[] =
507 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
508 static const char f32_8[] =
509 {0x90, /* nop */
510 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
511 static const char f32_9[] =
512 {0x89,0xf6, /* movl %esi,%esi */
513 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
514 static const char f32_10[] =
515 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
516 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
517 static const char f32_11[] =
518 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
519 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
520 static const char f32_12[] =
521 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
522 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
523 static const char f32_13[] =
524 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
525 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
526 static const char f32_14[] =
527 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
528 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
529 static const char f32_15[] =
530 {0xeb,0x0d,0x90,0x90,0x90,0x90,0x90, /* jmp .+15; lotsa nops */
531 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
532 static const char f16_3[] =
533 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
534 static const char f16_4[] =
535 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
536 static const char f16_5[] =
537 {0x90, /* nop */
538 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
539 static const char f16_6[] =
540 {0x89,0xf6, /* mov %si,%si */
541 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
542 static const char f16_7[] =
543 {0x8d,0x74,0x00, /* lea 0(%si),%si */
544 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
545 static const char f16_8[] =
546 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
547 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
548 static const char *const f32_patt[] = {
549 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
550 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14, f32_15
552 static const char *const f16_patt[] = {
553 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8,
554 f32_15, f32_15, f32_15, f32_15, f32_15, f32_15, f32_15
557 if (count <= 0 || count > 15)
558 return;
560 /* The recommended way to pad 64bit code is to use NOPs preceded by
561 maximally four 0x66 prefixes. Balance the size of nops. */
562 if (flag_code == CODE_64BIT)
564 int i;
565 int nnops = (count + 3) / 4;
566 int len = count / nnops;
567 int remains = count - nnops * len;
568 int pos = 0;
570 for (i = 0; i < remains; i++)
572 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len);
573 fragP->fr_literal[fragP->fr_fix + pos + len] = 0x90;
574 pos += len + 1;
576 for (; i < nnops; i++)
578 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len - 1);
579 fragP->fr_literal[fragP->fr_fix + pos + len - 1] = 0x90;
580 pos += len;
583 else
584 if (flag_code == CODE_16BIT)
586 memcpy (fragP->fr_literal + fragP->fr_fix,
587 f16_patt[count - 1], count);
588 if (count > 8)
589 /* Adjust jump offset. */
590 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
592 else
593 memcpy (fragP->fr_literal + fragP->fr_fix,
594 f32_patt[count - 1], count);
595 fragP->fr_var = count;
598 static INLINE unsigned int
599 mode_from_disp_size (t)
600 unsigned int t;
602 return (t & Disp8) ? 1 : (t & (Disp16 | Disp32 | Disp32S)) ? 2 : 0;
605 static INLINE int
606 fits_in_signed_byte (num)
607 offsetT num;
609 return (num >= -128) && (num <= 127);
612 static INLINE int
613 fits_in_unsigned_byte (num)
614 offsetT num;
616 return (num & 0xff) == num;
619 static INLINE int
620 fits_in_unsigned_word (num)
621 offsetT num;
623 return (num & 0xffff) == num;
626 static INLINE int
627 fits_in_signed_word (num)
628 offsetT num;
630 return (-32768 <= num) && (num <= 32767);
632 static INLINE int
633 fits_in_signed_long (num)
634 offsetT num ATTRIBUTE_UNUSED;
636 #ifndef BFD64
637 return 1;
638 #else
639 return (!(((offsetT) -1 << 31) & num)
640 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
641 #endif
642 } /* fits_in_signed_long() */
643 static INLINE int
644 fits_in_unsigned_long (num)
645 offsetT num ATTRIBUTE_UNUSED;
647 #ifndef BFD64
648 return 1;
649 #else
650 return (num & (((offsetT) 2 << 31) - 1)) == num;
651 #endif
652 } /* fits_in_unsigned_long() */
654 static int
655 smallest_imm_type (num)
656 offsetT num;
658 if (cpu_arch_flags != (Cpu086 | Cpu186 | Cpu286 | Cpu386 | Cpu486 | CpuNo64))
660 /* This code is disabled on the 486 because all the Imm1 forms
661 in the opcode table are slower on the i486. They're the
662 versions with the implicitly specified single-position
663 displacement, which has another syntax if you really want to
664 use that form. */
665 if (num == 1)
666 return Imm1 | Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64;
668 return (fits_in_signed_byte (num)
669 ? (Imm8S | Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
670 : fits_in_unsigned_byte (num)
671 ? (Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
672 : (fits_in_signed_word (num) || fits_in_unsigned_word (num))
673 ? (Imm16 | Imm32 | Imm32S | Imm64)
674 : fits_in_signed_long (num)
675 ? (Imm32 | Imm32S | Imm64)
676 : fits_in_unsigned_long (num)
677 ? (Imm32 | Imm64)
678 : Imm64);
681 static offsetT
682 offset_in_range (val, size)
683 offsetT val;
684 int size;
686 addressT mask;
688 switch (size)
690 case 1: mask = ((addressT) 1 << 8) - 1; break;
691 case 2: mask = ((addressT) 1 << 16) - 1; break;
692 case 4: mask = ((addressT) 2 << 31) - 1; break;
693 #ifdef BFD64
694 case 8: mask = ((addressT) 2 << 63) - 1; break;
695 #endif
696 default: abort ();
699 /* If BFD64, sign extend val. */
700 if (!use_rela_relocations)
701 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
702 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
704 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
706 char buf1[40], buf2[40];
708 sprint_value (buf1, val);
709 sprint_value (buf2, val & mask);
710 as_warn (_("%s shortened to %s"), buf1, buf2);
712 return val & mask;
715 /* Returns 0 if attempting to add a prefix where one from the same
716 class already exists, 1 if non rep/repne added, 2 if rep/repne
717 added. */
718 static int
719 add_prefix (prefix)
720 unsigned int prefix;
722 int ret = 1;
723 int q;
725 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
726 && flag_code == CODE_64BIT)
727 q = REX_PREFIX;
728 else
729 switch (prefix)
731 default:
732 abort ();
734 case CS_PREFIX_OPCODE:
735 case DS_PREFIX_OPCODE:
736 case ES_PREFIX_OPCODE:
737 case FS_PREFIX_OPCODE:
738 case GS_PREFIX_OPCODE:
739 case SS_PREFIX_OPCODE:
740 q = SEG_PREFIX;
741 break;
743 case REPNE_PREFIX_OPCODE:
744 case REPE_PREFIX_OPCODE:
745 ret = 2;
746 /* fall thru */
747 case LOCK_PREFIX_OPCODE:
748 q = LOCKREP_PREFIX;
749 break;
751 case FWAIT_OPCODE:
752 q = WAIT_PREFIX;
753 break;
755 case ADDR_PREFIX_OPCODE:
756 q = ADDR_PREFIX;
757 break;
759 case DATA_PREFIX_OPCODE:
760 q = DATA_PREFIX;
761 break;
764 if (i.prefix[q] != 0)
766 as_bad (_("same type of prefix used twice"));
767 return 0;
770 i.prefixes += 1;
771 i.prefix[q] = prefix;
772 return ret;
775 static void
776 set_code_flag (value)
777 int value;
779 flag_code = value;
780 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
781 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
782 if (value == CODE_64BIT && !(cpu_arch_flags & CpuSledgehammer))
784 as_bad (_("64bit mode not supported on this CPU."));
786 if (value == CODE_32BIT && !(cpu_arch_flags & Cpu386))
788 as_bad (_("32bit mode not supported on this CPU."));
790 stackop_size = '\0';
793 static void
794 set_16bit_gcc_code_flag (new_code_flag)
795 int new_code_flag;
797 flag_code = new_code_flag;
798 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
799 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
800 stackop_size = LONG_MNEM_SUFFIX;
803 static void
804 set_intel_syntax (syntax_flag)
805 int syntax_flag;
807 /* Find out if register prefixing is specified. */
808 int ask_naked_reg = 0;
810 SKIP_WHITESPACE ();
811 if (!is_end_of_line[(unsigned char) *input_line_pointer])
813 char *string = input_line_pointer;
814 int e = get_symbol_end ();
816 if (strcmp (string, "prefix") == 0)
817 ask_naked_reg = 1;
818 else if (strcmp (string, "noprefix") == 0)
819 ask_naked_reg = -1;
820 else
821 as_bad (_("bad argument to syntax directive."));
822 *input_line_pointer = e;
824 demand_empty_rest_of_line ();
826 intel_syntax = syntax_flag;
828 if (ask_naked_reg == 0)
829 allow_naked_reg = (intel_syntax
830 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
831 else
832 allow_naked_reg = (ask_naked_reg < 0);
834 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
835 identifier_chars['$'] = intel_syntax ? '$' : 0;
838 static void
839 set_cpu_arch (dummy)
840 int dummy ATTRIBUTE_UNUSED;
842 SKIP_WHITESPACE ();
844 if (!is_end_of_line[(unsigned char) *input_line_pointer])
846 char *string = input_line_pointer;
847 int e = get_symbol_end ();
848 int i;
850 for (i = 0; cpu_arch[i].name; i++)
852 if (strcmp (string, cpu_arch[i].name) == 0)
854 if (*string != '.')
856 cpu_arch_name = cpu_arch[i].name;
857 cpu_sub_arch_name = NULL;
858 cpu_arch_flags = (cpu_arch[i].flags
859 | (flag_code == CODE_64BIT ? Cpu64 : CpuNo64));
860 break;
862 if ((cpu_arch_flags | cpu_arch[i].flags) != cpu_arch_flags)
864 cpu_sub_arch_name = cpu_arch[i].name;
865 cpu_arch_flags |= cpu_arch[i].flags;
867 *input_line_pointer = e;
868 demand_empty_rest_of_line ();
869 return;
872 if (!cpu_arch[i].name)
873 as_bad (_("no such architecture: `%s'"), string);
875 *input_line_pointer = e;
877 else
878 as_bad (_("missing cpu architecture"));
880 no_cond_jump_promotion = 0;
881 if (*input_line_pointer == ','
882 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
884 char *string = ++input_line_pointer;
885 int e = get_symbol_end ();
887 if (strcmp (string, "nojumps") == 0)
888 no_cond_jump_promotion = 1;
889 else if (strcmp (string, "jumps") == 0)
891 else
892 as_bad (_("no such architecture modifier: `%s'"), string);
894 *input_line_pointer = e;
897 demand_empty_rest_of_line ();
900 unsigned long
901 i386_mach ()
903 if (!strcmp (default_arch, "x86_64"))
904 return bfd_mach_x86_64;
905 else if (!strcmp (default_arch, "i386"))
906 return bfd_mach_i386_i386;
907 else
908 as_fatal (_("Unknown architecture"));
911 void
912 md_begin ()
914 const char *hash_err;
916 /* Initialize op_hash hash table. */
917 op_hash = hash_new ();
920 const template *optab;
921 templates *core_optab;
923 /* Setup for loop. */
924 optab = i386_optab;
925 core_optab = (templates *) xmalloc (sizeof (templates));
926 core_optab->start = optab;
928 while (1)
930 ++optab;
931 if (optab->name == NULL
932 || strcmp (optab->name, (optab - 1)->name) != 0)
934 /* different name --> ship out current template list;
935 add to hash table; & begin anew. */
936 core_optab->end = optab;
937 hash_err = hash_insert (op_hash,
938 (optab - 1)->name,
939 (PTR) core_optab);
940 if (hash_err)
942 as_fatal (_("Internal Error: Can't hash %s: %s"),
943 (optab - 1)->name,
944 hash_err);
946 if (optab->name == NULL)
947 break;
948 core_optab = (templates *) xmalloc (sizeof (templates));
949 core_optab->start = optab;
954 /* Initialize reg_hash hash table. */
955 reg_hash = hash_new ();
957 const reg_entry *regtab;
959 for (regtab = i386_regtab;
960 regtab < i386_regtab + sizeof (i386_regtab) / sizeof (i386_regtab[0]);
961 regtab++)
963 hash_err = hash_insert (reg_hash, regtab->reg_name, (PTR) regtab);
964 if (hash_err)
965 as_fatal (_("Internal Error: Can't hash %s: %s"),
966 regtab->reg_name,
967 hash_err);
971 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
973 int c;
974 char *p;
976 for (c = 0; c < 256; c++)
978 if (ISDIGIT (c))
980 digit_chars[c] = c;
981 mnemonic_chars[c] = c;
982 register_chars[c] = c;
983 operand_chars[c] = c;
985 else if (ISLOWER (c))
987 mnemonic_chars[c] = c;
988 register_chars[c] = c;
989 operand_chars[c] = c;
991 else if (ISUPPER (c))
993 mnemonic_chars[c] = TOLOWER (c);
994 register_chars[c] = mnemonic_chars[c];
995 operand_chars[c] = c;
998 if (ISALPHA (c) || ISDIGIT (c))
999 identifier_chars[c] = c;
1000 else if (c >= 128)
1002 identifier_chars[c] = c;
1003 operand_chars[c] = c;
1007 #ifdef LEX_AT
1008 identifier_chars['@'] = '@';
1009 #endif
1010 #ifdef LEX_QM
1011 identifier_chars['?'] = '?';
1012 operand_chars['?'] = '?';
1013 #endif
1014 digit_chars['-'] = '-';
1015 mnemonic_chars['-'] = '-';
1016 identifier_chars['_'] = '_';
1017 identifier_chars['.'] = '.';
1019 for (p = operand_special_chars; *p != '\0'; p++)
1020 operand_chars[(unsigned char) *p] = *p;
1023 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1024 if (IS_ELF)
1026 record_alignment (text_section, 2);
1027 record_alignment (data_section, 2);
1028 record_alignment (bss_section, 2);
1030 #endif
1032 if (flag_code == CODE_64BIT)
1034 x86_dwarf2_return_column = 16;
1035 x86_cie_data_alignment = -8;
1037 else
1039 x86_dwarf2_return_column = 8;
1040 x86_cie_data_alignment = -4;
1044 void
1045 i386_print_statistics (file)
1046 FILE *file;
1048 hash_print_statistics (file, "i386 opcode", op_hash);
1049 hash_print_statistics (file, "i386 register", reg_hash);
1052 #ifdef DEBUG386
1054 /* Debugging routines for md_assemble. */
1055 static void pi PARAMS ((char *, i386_insn *));
1056 static void pte PARAMS ((template *));
1057 static void pt PARAMS ((unsigned int));
1058 static void pe PARAMS ((expressionS *));
1059 static void ps PARAMS ((symbolS *));
1061 static void
1062 pi (line, x)
1063 char *line;
1064 i386_insn *x;
1066 unsigned int i;
1068 fprintf (stdout, "%s: template ", line);
1069 pte (&x->tm);
1070 fprintf (stdout, " address: base %s index %s scale %x\n",
1071 x->base_reg ? x->base_reg->reg_name : "none",
1072 x->index_reg ? x->index_reg->reg_name : "none",
1073 x->log2_scale_factor);
1074 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
1075 x->rm.mode, x->rm.reg, x->rm.regmem);
1076 fprintf (stdout, " sib: base %x index %x scale %x\n",
1077 x->sib.base, x->sib.index, x->sib.scale);
1078 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
1079 (x->rex & REX_MODE64) != 0,
1080 (x->rex & REX_EXTX) != 0,
1081 (x->rex & REX_EXTY) != 0,
1082 (x->rex & REX_EXTZ) != 0);
1083 for (i = 0; i < x->operands; i++)
1085 fprintf (stdout, " #%d: ", i + 1);
1086 pt (x->types[i]);
1087 fprintf (stdout, "\n");
1088 if (x->types[i]
1089 & (Reg | SReg2 | SReg3 | Control | Debug | Test | RegMMX | RegXMM))
1090 fprintf (stdout, "%s\n", x->op[i].regs->reg_name);
1091 if (x->types[i] & Imm)
1092 pe (x->op[i].imms);
1093 if (x->types[i] & Disp)
1094 pe (x->op[i].disps);
1098 static void
1099 pte (t)
1100 template *t;
1102 unsigned int i;
1103 fprintf (stdout, " %d operands ", t->operands);
1104 fprintf (stdout, "opcode %x ", t->base_opcode);
1105 if (t->extension_opcode != None)
1106 fprintf (stdout, "ext %x ", t->extension_opcode);
1107 if (t->opcode_modifier & D)
1108 fprintf (stdout, "D");
1109 if (t->opcode_modifier & W)
1110 fprintf (stdout, "W");
1111 fprintf (stdout, "\n");
1112 for (i = 0; i < t->operands; i++)
1114 fprintf (stdout, " #%d type ", i + 1);
1115 pt (t->operand_types[i]);
1116 fprintf (stdout, "\n");
1120 static void
1121 pe (e)
1122 expressionS *e;
1124 fprintf (stdout, " operation %d\n", e->X_op);
1125 fprintf (stdout, " add_number %ld (%lx)\n",
1126 (long) e->X_add_number, (long) e->X_add_number);
1127 if (e->X_add_symbol)
1129 fprintf (stdout, " add_symbol ");
1130 ps (e->X_add_symbol);
1131 fprintf (stdout, "\n");
1133 if (e->X_op_symbol)
1135 fprintf (stdout, " op_symbol ");
1136 ps (e->X_op_symbol);
1137 fprintf (stdout, "\n");
1141 static void
1142 ps (s)
1143 symbolS *s;
1145 fprintf (stdout, "%s type %s%s",
1146 S_GET_NAME (s),
1147 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
1148 segment_name (S_GET_SEGMENT (s)));
1151 struct type_name
1153 unsigned int mask;
1154 char *tname;
1157 static const type_names[] =
1159 { Reg8, "r8" },
1160 { Reg16, "r16" },
1161 { Reg32, "r32" },
1162 { Reg64, "r64" },
1163 { Imm8, "i8" },
1164 { Imm8S, "i8s" },
1165 { Imm16, "i16" },
1166 { Imm32, "i32" },
1167 { Imm32S, "i32s" },
1168 { Imm64, "i64" },
1169 { Imm1, "i1" },
1170 { BaseIndex, "BaseIndex" },
1171 { Disp8, "d8" },
1172 { Disp16, "d16" },
1173 { Disp32, "d32" },
1174 { Disp32S, "d32s" },
1175 { Disp64, "d64" },
1176 { InOutPortReg, "InOutPortReg" },
1177 { ShiftCount, "ShiftCount" },
1178 { Control, "control reg" },
1179 { Test, "test reg" },
1180 { Debug, "debug reg" },
1181 { FloatReg, "FReg" },
1182 { FloatAcc, "FAcc" },
1183 { SReg2, "SReg2" },
1184 { SReg3, "SReg3" },
1185 { Acc, "Acc" },
1186 { JumpAbsolute, "Jump Absolute" },
1187 { RegMMX, "rMMX" },
1188 { RegXMM, "rXMM" },
1189 { EsSeg, "es" },
1190 { 0, "" }
1193 static void
1194 pt (t)
1195 unsigned int t;
1197 const struct type_name *ty;
1199 for (ty = type_names; ty->mask; ty++)
1200 if (t & ty->mask)
1201 fprintf (stdout, "%s, ", ty->tname);
1202 fflush (stdout);
1205 #endif /* DEBUG386 */
1207 static bfd_reloc_code_real_type
1208 reloc (unsigned int size,
1209 int pcrel,
1210 int sign,
1211 bfd_reloc_code_real_type other)
1213 if (other != NO_RELOC)
1215 reloc_howto_type *reloc;
1217 if (size == 8)
1218 switch (other)
1220 case BFD_RELOC_X86_64_TPOFF32:
1221 other = BFD_RELOC_X86_64_TPOFF64;
1222 break;
1223 case BFD_RELOC_X86_64_DTPOFF32:
1224 other = BFD_RELOC_X86_64_DTPOFF64;
1225 break;
1226 default:
1227 break;
1229 reloc = bfd_reloc_type_lookup (stdoutput, other);
1230 if (!reloc)
1231 as_bad (_("unknown relocation (%u)"), other);
1232 else if (size != bfd_get_reloc_size (reloc))
1233 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
1234 bfd_get_reloc_size (reloc),
1235 size);
1236 else if (pcrel && !reloc->pc_relative)
1237 as_bad (_("non-pc-relative relocation for pc-relative field"));
1238 else if ((reloc->complain_on_overflow == complain_overflow_signed
1239 && !sign)
1240 || (reloc->complain_on_overflow == complain_overflow_unsigned
1241 && sign > 0))
1242 as_bad (_("relocated field and relocation type differ in signedness"));
1243 else
1244 return other;
1245 return NO_RELOC;
1248 if (pcrel)
1250 if (!sign)
1251 as_bad (_("there are no unsigned pc-relative relocations"));
1252 switch (size)
1254 case 1: return BFD_RELOC_8_PCREL;
1255 case 2: return BFD_RELOC_16_PCREL;
1256 case 4: return BFD_RELOC_32_PCREL;
1257 case 8: return BFD_RELOC_64_PCREL;
1259 as_bad (_("cannot do %u byte pc-relative relocation"), size);
1261 else
1263 if (sign > 0)
1264 switch (size)
1266 case 4: return BFD_RELOC_X86_64_32S;
1268 else
1269 switch (size)
1271 case 1: return BFD_RELOC_8;
1272 case 2: return BFD_RELOC_16;
1273 case 4: return BFD_RELOC_32;
1274 case 8: return BFD_RELOC_64;
1276 as_bad (_("cannot do %s %u byte relocation"),
1277 sign > 0 ? "signed" : "unsigned", size);
1280 abort ();
1281 return BFD_RELOC_NONE;
1284 /* Here we decide which fixups can be adjusted to make them relative to
1285 the beginning of the section instead of the symbol. Basically we need
1286 to make sure that the dynamic relocations are done correctly, so in
1287 some cases we force the original symbol to be used. */
1290 tc_i386_fix_adjustable (fixP)
1291 fixS *fixP ATTRIBUTE_UNUSED;
1293 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1294 if (!IS_ELF)
1295 return 1;
1297 /* Don't adjust pc-relative references to merge sections in 64-bit
1298 mode. */
1299 if (use_rela_relocations
1300 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
1301 && fixP->fx_pcrel)
1302 return 0;
1304 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
1305 and changed later by validate_fix. */
1306 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
1307 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
1308 return 0;
1310 /* adjust_reloc_syms doesn't know about the GOT. */
1311 if (fixP->fx_r_type == BFD_RELOC_386_GOTOFF
1312 || fixP->fx_r_type == BFD_RELOC_386_PLT32
1313 || fixP->fx_r_type == BFD_RELOC_386_GOT32
1314 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
1315 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
1316 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
1317 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
1318 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
1319 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
1320 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
1321 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
1322 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
1323 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
1324 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
1325 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
1326 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
1327 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
1328 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
1329 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
1330 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
1331 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
1332 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
1333 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
1334 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
1335 return 0;
1336 #endif
1337 return 1;
1340 static int intel_float_operand PARAMS ((const char *mnemonic));
1342 static int
1343 intel_float_operand (mnemonic)
1344 const char *mnemonic;
1346 /* Note that the value returned is meaningful only for opcodes with (memory)
1347 operands, hence the code here is free to improperly handle opcodes that
1348 have no operands (for better performance and smaller code). */
1350 if (mnemonic[0] != 'f')
1351 return 0; /* non-math */
1353 switch (mnemonic[1])
1355 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
1356 the fs segment override prefix not currently handled because no
1357 call path can make opcodes without operands get here */
1358 case 'i':
1359 return 2 /* integer op */;
1360 case 'l':
1361 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
1362 return 3; /* fldcw/fldenv */
1363 break;
1364 case 'n':
1365 if (mnemonic[2] != 'o' /* fnop */)
1366 return 3; /* non-waiting control op */
1367 break;
1368 case 'r':
1369 if (mnemonic[2] == 's')
1370 return 3; /* frstor/frstpm */
1371 break;
1372 case 's':
1373 if (mnemonic[2] == 'a')
1374 return 3; /* fsave */
1375 if (mnemonic[2] == 't')
1377 switch (mnemonic[3])
1379 case 'c': /* fstcw */
1380 case 'd': /* fstdw */
1381 case 'e': /* fstenv */
1382 case 's': /* fsts[gw] */
1383 return 3;
1386 break;
1387 case 'x':
1388 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
1389 return 0; /* fxsave/fxrstor are not really math ops */
1390 break;
1393 return 1;
1396 /* This is the guts of the machine-dependent assembler. LINE points to a
1397 machine dependent instruction. This function is supposed to emit
1398 the frags/bytes it assembles to. */
1400 void
1401 md_assemble (line)
1402 char *line;
1404 int j;
1405 char mnemonic[MAX_MNEM_SIZE];
1407 /* Initialize globals. */
1408 memset (&i, '\0', sizeof (i));
1409 for (j = 0; j < MAX_OPERANDS; j++)
1410 i.reloc[j] = NO_RELOC;
1411 memset (disp_expressions, '\0', sizeof (disp_expressions));
1412 memset (im_expressions, '\0', sizeof (im_expressions));
1413 save_stack_p = save_stack;
1415 /* First parse an instruction mnemonic & call i386_operand for the operands.
1416 We assume that the scrubber has arranged it so that line[0] is the valid
1417 start of a (possibly prefixed) mnemonic. */
1419 line = parse_insn (line, mnemonic);
1420 if (line == NULL)
1421 return;
1423 line = parse_operands (line, mnemonic);
1424 if (line == NULL)
1425 return;
1427 /* Now we've parsed the mnemonic into a set of templates, and have the
1428 operands at hand. */
1430 /* All intel opcodes have reversed operands except for "bound" and
1431 "enter". We also don't reverse intersegment "jmp" and "call"
1432 instructions with 2 immediate operands so that the immediate segment
1433 precedes the offset, as it does when in AT&T mode. "enter" and the
1434 intersegment "jmp" and "call" instructions are the only ones that
1435 have two immediate operands. */
1436 if (intel_syntax && i.operands > 1
1437 && (strcmp (mnemonic, "bound") != 0)
1438 && (strcmp (mnemonic, "invlpga") != 0)
1439 && !((i.types[0] & Imm) && (i.types[1] & Imm)))
1440 swap_operands ();
1442 if (i.imm_operands)
1443 optimize_imm ();
1445 /* Don't optimize displacement for movabs since it only takes 64bit
1446 displacement. */
1447 if (i.disp_operands
1448 && (flag_code != CODE_64BIT
1449 || strcmp (mnemonic, "movabs") != 0))
1450 optimize_disp ();
1452 /* Next, we find a template that matches the given insn,
1453 making sure the overlap of the given operands types is consistent
1454 with the template operand types. */
1456 if (!match_template ())
1457 return;
1459 if (intel_syntax)
1461 /* Undo SYSV386_COMPAT brokenness when in Intel mode. See i386.h */
1462 if (SYSV386_COMPAT
1463 && (i.tm.base_opcode & 0xfffffde0) == 0xdce0)
1464 i.tm.base_opcode ^= FloatR;
1466 /* Zap movzx and movsx suffix. The suffix may have been set from
1467 "word ptr" or "byte ptr" on the source operand, but we'll use
1468 the suffix later to choose the destination register. */
1469 if ((i.tm.base_opcode & ~9) == 0x0fb6)
1471 if (i.reg_operands < 2
1472 && !i.suffix
1473 && (~i.tm.opcode_modifier
1474 & (No_bSuf
1475 | No_wSuf
1476 | No_lSuf
1477 | No_sSuf
1478 | No_xSuf
1479 | No_qSuf)))
1480 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
1482 i.suffix = 0;
1486 if (i.tm.opcode_modifier & FWait)
1487 if (!add_prefix (FWAIT_OPCODE))
1488 return;
1490 /* Check string instruction segment overrides. */
1491 if ((i.tm.opcode_modifier & IsString) != 0 && i.mem_operands != 0)
1493 if (!check_string ())
1494 return;
1497 if (!process_suffix ())
1498 return;
1500 /* Make still unresolved immediate matches conform to size of immediate
1501 given in i.suffix. */
1502 if (!finalize_imm ())
1503 return;
1505 if (i.types[0] & Imm1)
1506 i.imm_operands = 0; /* kludge for shift insns. */
1507 if (i.types[0] & ImplicitRegister)
1508 i.reg_operands--;
1509 if (i.types[1] & ImplicitRegister)
1510 i.reg_operands--;
1511 if (i.types[2] & ImplicitRegister)
1512 i.reg_operands--;
1514 if (i.tm.opcode_modifier & ImmExt)
1516 expressionS *exp;
1518 if ((i.tm.cpu_flags & CpuPNI) && i.operands > 0)
1520 /* These Intel Prescott New Instructions have the fixed
1521 operands with an opcode suffix which is coded in the same
1522 place as an 8-bit immediate field would be. Here we check
1523 those operands and remove them afterwards. */
1524 unsigned int x;
1526 for (x = 0; x < i.operands; x++)
1527 if (i.op[x].regs->reg_num != x)
1528 as_bad (_("can't use register '%%%s' as operand %d in '%s'."),
1529 i.op[x].regs->reg_name, x + 1, i.tm.name);
1530 i.operands = 0;
1533 /* These AMD 3DNow! and Intel Katmai New Instructions have an
1534 opcode suffix which is coded in the same place as an 8-bit
1535 immediate field would be. Here we fake an 8-bit immediate
1536 operand from the opcode suffix stored in tm.extension_opcode. */
1538 assert (i.imm_operands == 0 && i.operands <= 2 && 2 < MAX_OPERANDS);
1540 exp = &im_expressions[i.imm_operands++];
1541 i.op[i.operands].imms = exp;
1542 i.types[i.operands++] = Imm8;
1543 exp->X_op = O_constant;
1544 exp->X_add_number = i.tm.extension_opcode;
1545 i.tm.extension_opcode = None;
1548 /* For insns with operands there are more diddles to do to the opcode. */
1549 if (i.operands)
1551 if (!process_operands ())
1552 return;
1554 else if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
1556 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
1557 as_warn (_("translating to `%sp'"), i.tm.name);
1560 /* Handle conversion of 'int $3' --> special int3 insn. */
1561 if (i.tm.base_opcode == INT_OPCODE && i.op[0].imms->X_add_number == 3)
1563 i.tm.base_opcode = INT3_OPCODE;
1564 i.imm_operands = 0;
1567 if ((i.tm.opcode_modifier & (Jump | JumpByte | JumpDword))
1568 && i.op[0].disps->X_op == O_constant)
1570 /* Convert "jmp constant" (and "call constant") to a jump (call) to
1571 the absolute address given by the constant. Since ix86 jumps and
1572 calls are pc relative, we need to generate a reloc. */
1573 i.op[0].disps->X_add_symbol = &abs_symbol;
1574 i.op[0].disps->X_op = O_symbol;
1577 if ((i.tm.opcode_modifier & Rex64) != 0)
1578 i.rex |= REX_MODE64;
1580 /* For 8 bit registers we need an empty rex prefix. Also if the
1581 instruction already has a prefix, we need to convert old
1582 registers to new ones. */
1584 if (((i.types[0] & Reg8) != 0
1585 && (i.op[0].regs->reg_flags & RegRex64) != 0)
1586 || ((i.types[1] & Reg8) != 0
1587 && (i.op[1].regs->reg_flags & RegRex64) != 0)
1588 || (((i.types[0] & Reg8) != 0 || (i.types[1] & Reg8) != 0)
1589 && i.rex != 0))
1591 int x;
1593 i.rex |= REX_OPCODE;
1594 for (x = 0; x < 2; x++)
1596 /* Look for 8 bit operand that uses old registers. */
1597 if ((i.types[x] & Reg8) != 0
1598 && (i.op[x].regs->reg_flags & RegRex64) == 0)
1600 /* In case it is "hi" register, give up. */
1601 if (i.op[x].regs->reg_num > 3)
1602 as_bad (_("can't encode register '%%%s' in an instruction requiring REX prefix."),
1603 i.op[x].regs->reg_name);
1605 /* Otherwise it is equivalent to the extended register.
1606 Since the encoding doesn't change this is merely
1607 cosmetic cleanup for debug output. */
1609 i.op[x].regs = i.op[x].regs + 8;
1614 if (i.rex != 0)
1615 add_prefix (REX_OPCODE | i.rex);
1617 /* We are ready to output the insn. */
1618 output_insn ();
1621 static char *
1622 parse_insn (line, mnemonic)
1623 char *line;
1624 char *mnemonic;
1626 char *l = line;
1627 char *token_start = l;
1628 char *mnem_p;
1629 int supported;
1630 const template *t;
1632 /* Non-zero if we found a prefix only acceptable with string insns. */
1633 const char *expecting_string_instruction = NULL;
1635 while (1)
1637 mnem_p = mnemonic;
1638 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
1640 mnem_p++;
1641 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
1643 as_bad (_("no such instruction: `%s'"), token_start);
1644 return NULL;
1646 l++;
1648 if (!is_space_char (*l)
1649 && *l != END_OF_INSN
1650 && (intel_syntax
1651 || (*l != PREFIX_SEPARATOR
1652 && *l != ',')))
1654 as_bad (_("invalid character %s in mnemonic"),
1655 output_invalid (*l));
1656 return NULL;
1658 if (token_start == l)
1660 if (!intel_syntax && *l == PREFIX_SEPARATOR)
1661 as_bad (_("expecting prefix; got nothing"));
1662 else
1663 as_bad (_("expecting mnemonic; got nothing"));
1664 return NULL;
1667 /* Look up instruction (or prefix) via hash table. */
1668 current_templates = hash_find (op_hash, mnemonic);
1670 if (*l != END_OF_INSN
1671 && (!is_space_char (*l) || l[1] != END_OF_INSN)
1672 && current_templates
1673 && (current_templates->start->opcode_modifier & IsPrefix))
1675 if (current_templates->start->cpu_flags
1676 & (flag_code != CODE_64BIT ? Cpu64 : CpuNo64))
1678 as_bad ((flag_code != CODE_64BIT
1679 ? _("`%s' is only supported in 64-bit mode")
1680 : _("`%s' is not supported in 64-bit mode")),
1681 current_templates->start->name);
1682 return NULL;
1684 /* If we are in 16-bit mode, do not allow addr16 or data16.
1685 Similarly, in 32-bit mode, do not allow addr32 or data32. */
1686 if ((current_templates->start->opcode_modifier & (Size16 | Size32))
1687 && flag_code != CODE_64BIT
1688 && (((current_templates->start->opcode_modifier & Size32) != 0)
1689 ^ (flag_code == CODE_16BIT)))
1691 as_bad (_("redundant %s prefix"),
1692 current_templates->start->name);
1693 return NULL;
1695 /* Add prefix, checking for repeated prefixes. */
1696 switch (add_prefix (current_templates->start->base_opcode))
1698 case 0:
1699 return NULL;
1700 case 2:
1701 expecting_string_instruction = current_templates->start->name;
1702 break;
1704 /* Skip past PREFIX_SEPARATOR and reset token_start. */
1705 token_start = ++l;
1707 else
1708 break;
1711 if (!current_templates)
1713 /* See if we can get a match by trimming off a suffix. */
1714 switch (mnem_p[-1])
1716 case WORD_MNEM_SUFFIX:
1717 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
1718 i.suffix = SHORT_MNEM_SUFFIX;
1719 else
1720 case BYTE_MNEM_SUFFIX:
1721 case QWORD_MNEM_SUFFIX:
1722 i.suffix = mnem_p[-1];
1723 mnem_p[-1] = '\0';
1724 current_templates = hash_find (op_hash, mnemonic);
1725 break;
1726 case SHORT_MNEM_SUFFIX:
1727 case LONG_MNEM_SUFFIX:
1728 if (!intel_syntax)
1730 i.suffix = mnem_p[-1];
1731 mnem_p[-1] = '\0';
1732 current_templates = hash_find (op_hash, mnemonic);
1734 break;
1736 /* Intel Syntax. */
1737 case 'd':
1738 if (intel_syntax)
1740 if (intel_float_operand (mnemonic) == 1)
1741 i.suffix = SHORT_MNEM_SUFFIX;
1742 else
1743 i.suffix = LONG_MNEM_SUFFIX;
1744 mnem_p[-1] = '\0';
1745 current_templates = hash_find (op_hash, mnemonic);
1747 break;
1749 if (!current_templates)
1751 as_bad (_("no such instruction: `%s'"), token_start);
1752 return NULL;
1756 if (current_templates->start->opcode_modifier & (Jump | JumpByte))
1758 /* Check for a branch hint. We allow ",pt" and ",pn" for
1759 predict taken and predict not taken respectively.
1760 I'm not sure that branch hints actually do anything on loop
1761 and jcxz insns (JumpByte) for current Pentium4 chips. They
1762 may work in the future and it doesn't hurt to accept them
1763 now. */
1764 if (l[0] == ',' && l[1] == 'p')
1766 if (l[2] == 't')
1768 if (!add_prefix (DS_PREFIX_OPCODE))
1769 return NULL;
1770 l += 3;
1772 else if (l[2] == 'n')
1774 if (!add_prefix (CS_PREFIX_OPCODE))
1775 return NULL;
1776 l += 3;
1780 /* Any other comma loses. */
1781 if (*l == ',')
1783 as_bad (_("invalid character %s in mnemonic"),
1784 output_invalid (*l));
1785 return NULL;
1788 /* Check if instruction is supported on specified architecture. */
1789 supported = 0;
1790 for (t = current_templates->start; t < current_templates->end; ++t)
1792 if (!((t->cpu_flags & ~(Cpu64 | CpuNo64))
1793 & ~(cpu_arch_flags & ~(Cpu64 | CpuNo64))))
1794 supported |= 1;
1795 if (!(t->cpu_flags & (flag_code == CODE_64BIT ? CpuNo64 : Cpu64)))
1796 supported |= 2;
1798 if (!(supported & 2))
1800 as_bad (flag_code == CODE_64BIT
1801 ? _("`%s' is not supported in 64-bit mode")
1802 : _("`%s' is only supported in 64-bit mode"),
1803 current_templates->start->name);
1804 return NULL;
1806 if (!(supported & 1))
1808 as_warn (_("`%s' is not supported on `%s%s'"),
1809 current_templates->start->name,
1810 cpu_arch_name,
1811 cpu_sub_arch_name ? cpu_sub_arch_name : "");
1813 else if ((Cpu386 & ~cpu_arch_flags) && (flag_code != CODE_16BIT))
1815 as_warn (_("use .code16 to ensure correct addressing mode"));
1818 /* Check for rep/repne without a string instruction. */
1819 if (expecting_string_instruction)
1821 static templates override;
1823 for (t = current_templates->start; t < current_templates->end; ++t)
1824 if (t->opcode_modifier & IsString)
1825 break;
1826 if (t >= current_templates->end)
1828 as_bad (_("expecting string instruction after `%s'"),
1829 expecting_string_instruction);
1830 return NULL;
1832 for (override.start = t; t < current_templates->end; ++t)
1833 if (!(t->opcode_modifier & IsString))
1834 break;
1835 override.end = t;
1836 current_templates = &override;
1839 return l;
1842 static char *
1843 parse_operands (l, mnemonic)
1844 char *l;
1845 const char *mnemonic;
1847 char *token_start;
1849 /* 1 if operand is pending after ','. */
1850 unsigned int expecting_operand = 0;
1852 /* Non-zero if operand parens not balanced. */
1853 unsigned int paren_not_balanced;
1855 while (*l != END_OF_INSN)
1857 /* Skip optional white space before operand. */
1858 if (is_space_char (*l))
1859 ++l;
1860 if (!is_operand_char (*l) && *l != END_OF_INSN)
1862 as_bad (_("invalid character %s before operand %d"),
1863 output_invalid (*l),
1864 i.operands + 1);
1865 return NULL;
1867 token_start = l; /* after white space */
1868 paren_not_balanced = 0;
1869 while (paren_not_balanced || *l != ',')
1871 if (*l == END_OF_INSN)
1873 if (paren_not_balanced)
1875 if (!intel_syntax)
1876 as_bad (_("unbalanced parenthesis in operand %d."),
1877 i.operands + 1);
1878 else
1879 as_bad (_("unbalanced brackets in operand %d."),
1880 i.operands + 1);
1881 return NULL;
1883 else
1884 break; /* we are done */
1886 else if (!is_operand_char (*l) && !is_space_char (*l))
1888 as_bad (_("invalid character %s in operand %d"),
1889 output_invalid (*l),
1890 i.operands + 1);
1891 return NULL;
1893 if (!intel_syntax)
1895 if (*l == '(')
1896 ++paren_not_balanced;
1897 if (*l == ')')
1898 --paren_not_balanced;
1900 else
1902 if (*l == '[')
1903 ++paren_not_balanced;
1904 if (*l == ']')
1905 --paren_not_balanced;
1907 l++;
1909 if (l != token_start)
1910 { /* Yes, we've read in another operand. */
1911 unsigned int operand_ok;
1912 this_operand = i.operands++;
1913 if (i.operands > MAX_OPERANDS)
1915 as_bad (_("spurious operands; (%d operands/instruction max)"),
1916 MAX_OPERANDS);
1917 return NULL;
1919 /* Now parse operand adding info to 'i' as we go along. */
1920 END_STRING_AND_SAVE (l);
1922 if (intel_syntax)
1923 operand_ok =
1924 i386_intel_operand (token_start,
1925 intel_float_operand (mnemonic));
1926 else
1927 operand_ok = i386_operand (token_start);
1929 RESTORE_END_STRING (l);
1930 if (!operand_ok)
1931 return NULL;
1933 else
1935 if (expecting_operand)
1937 expecting_operand_after_comma:
1938 as_bad (_("expecting operand after ','; got nothing"));
1939 return NULL;
1941 if (*l == ',')
1943 as_bad (_("expecting operand before ','; got nothing"));
1944 return NULL;
1948 /* Now *l must be either ',' or END_OF_INSN. */
1949 if (*l == ',')
1951 if (*++l == END_OF_INSN)
1953 /* Just skip it, if it's \n complain. */
1954 goto expecting_operand_after_comma;
1956 expecting_operand = 1;
1959 return l;
1962 static void
1963 swap_operands ()
1965 union i386_op temp_op;
1966 unsigned int temp_type;
1967 enum bfd_reloc_code_real temp_reloc;
1968 int xchg1 = 0;
1969 int xchg2 = 0;
1971 if (i.operands == 2)
1973 xchg1 = 0;
1974 xchg2 = 1;
1976 else if (i.operands == 3)
1978 xchg1 = 0;
1979 xchg2 = 2;
1981 temp_type = i.types[xchg2];
1982 i.types[xchg2] = i.types[xchg1];
1983 i.types[xchg1] = temp_type;
1984 temp_op = i.op[xchg2];
1985 i.op[xchg2] = i.op[xchg1];
1986 i.op[xchg1] = temp_op;
1987 temp_reloc = i.reloc[xchg2];
1988 i.reloc[xchg2] = i.reloc[xchg1];
1989 i.reloc[xchg1] = temp_reloc;
1991 if (i.mem_operands == 2)
1993 const seg_entry *temp_seg;
1994 temp_seg = i.seg[0];
1995 i.seg[0] = i.seg[1];
1996 i.seg[1] = temp_seg;
2000 /* Try to ensure constant immediates are represented in the smallest
2001 opcode possible. */
2002 static void
2003 optimize_imm ()
2005 char guess_suffix = 0;
2006 int op;
2008 if (i.suffix)
2009 guess_suffix = i.suffix;
2010 else if (i.reg_operands)
2012 /* Figure out a suffix from the last register operand specified.
2013 We can't do this properly yet, ie. excluding InOutPortReg,
2014 but the following works for instructions with immediates.
2015 In any case, we can't set i.suffix yet. */
2016 for (op = i.operands; --op >= 0;)
2017 if (i.types[op] & Reg)
2019 if (i.types[op] & Reg8)
2020 guess_suffix = BYTE_MNEM_SUFFIX;
2021 else if (i.types[op] & Reg16)
2022 guess_suffix = WORD_MNEM_SUFFIX;
2023 else if (i.types[op] & Reg32)
2024 guess_suffix = LONG_MNEM_SUFFIX;
2025 else if (i.types[op] & Reg64)
2026 guess_suffix = QWORD_MNEM_SUFFIX;
2027 break;
2030 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
2031 guess_suffix = WORD_MNEM_SUFFIX;
2033 for (op = i.operands; --op >= 0;)
2034 if (i.types[op] & Imm)
2036 switch (i.op[op].imms->X_op)
2038 case O_constant:
2039 /* If a suffix is given, this operand may be shortened. */
2040 switch (guess_suffix)
2042 case LONG_MNEM_SUFFIX:
2043 i.types[op] |= Imm32 | Imm64;
2044 break;
2045 case WORD_MNEM_SUFFIX:
2046 i.types[op] |= Imm16 | Imm32S | Imm32 | Imm64;
2047 break;
2048 case BYTE_MNEM_SUFFIX:
2049 i.types[op] |= Imm16 | Imm8 | Imm8S | Imm32S | Imm32 | Imm64;
2050 break;
2053 /* If this operand is at most 16 bits, convert it
2054 to a signed 16 bit number before trying to see
2055 whether it will fit in an even smaller size.
2056 This allows a 16-bit operand such as $0xffe0 to
2057 be recognised as within Imm8S range. */
2058 if ((i.types[op] & Imm16)
2059 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
2061 i.op[op].imms->X_add_number =
2062 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
2064 if ((i.types[op] & Imm32)
2065 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
2066 == 0))
2068 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
2069 ^ ((offsetT) 1 << 31))
2070 - ((offsetT) 1 << 31));
2072 i.types[op] |= smallest_imm_type (i.op[op].imms->X_add_number);
2074 /* We must avoid matching of Imm32 templates when 64bit
2075 only immediate is available. */
2076 if (guess_suffix == QWORD_MNEM_SUFFIX)
2077 i.types[op] &= ~Imm32;
2078 break;
2080 case O_absent:
2081 case O_register:
2082 abort ();
2084 /* Symbols and expressions. */
2085 default:
2086 /* Convert symbolic operand to proper sizes for matching. */
2087 switch (guess_suffix)
2089 case QWORD_MNEM_SUFFIX:
2090 i.types[op] &= Imm64 | Imm32S;
2091 break;
2092 case LONG_MNEM_SUFFIX:
2093 i.types[op] &= Imm32;
2094 break;
2095 case WORD_MNEM_SUFFIX:
2096 i.types[op] &= Imm16;
2097 break;
2098 case BYTE_MNEM_SUFFIX:
2099 i.types[op] &= Imm8 | Imm8S;
2100 break;
2102 break;
2107 /* Try to use the smallest displacement type too. */
2108 static void
2109 optimize_disp ()
2111 int op;
2113 for (op = i.operands; --op >= 0;)
2114 if (i.types[op] & Disp)
2116 if (i.op[op].disps->X_op == O_constant)
2118 offsetT disp = i.op[op].disps->X_add_number;
2120 if ((i.types[op] & Disp16)
2121 && (disp & ~(offsetT) 0xffff) == 0)
2123 /* If this operand is at most 16 bits, convert
2124 to a signed 16 bit number and don't use 64bit
2125 displacement. */
2126 disp = (((disp & 0xffff) ^ 0x8000) - 0x8000);
2127 i.types[op] &= ~Disp64;
2129 if ((i.types[op] & Disp32)
2130 && (disp & ~(((offsetT) 2 << 31) - 1)) == 0)
2132 /* If this operand is at most 32 bits, convert
2133 to a signed 32 bit number and don't use 64bit
2134 displacement. */
2135 disp &= (((offsetT) 2 << 31) - 1);
2136 disp = (disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
2137 i.types[op] &= ~Disp64;
2139 if (!disp && (i.types[op] & BaseIndex))
2141 i.types[op] &= ~Disp;
2142 i.op[op].disps = 0;
2143 i.disp_operands--;
2145 else if (flag_code == CODE_64BIT)
2147 if (fits_in_signed_long (disp))
2149 i.types[op] &= ~Disp64;
2150 i.types[op] |= Disp32S;
2152 if (fits_in_unsigned_long (disp))
2153 i.types[op] |= Disp32;
2155 if ((i.types[op] & (Disp32 | Disp32S | Disp16))
2156 && fits_in_signed_byte (disp))
2157 i.types[op] |= Disp8;
2159 else
2160 /* We only support 64bit displacement on constants. */
2161 i.types[op] &= ~Disp64;
2165 static int
2166 match_template ()
2168 /* Points to template once we've found it. */
2169 const template *t;
2170 unsigned int overlap0, overlap1, overlap2;
2171 unsigned int found_reverse_match;
2172 int suffix_check;
2174 #define MATCH(overlap, given, template) \
2175 ((overlap & ~JumpAbsolute) \
2176 && (((given) & (BaseIndex | JumpAbsolute)) \
2177 == ((overlap) & (BaseIndex | JumpAbsolute))))
2179 /* If given types r0 and r1 are registers they must be of the same type
2180 unless the expected operand type register overlap is null.
2181 Note that Acc in a template matches every size of reg. */
2182 #define CONSISTENT_REGISTER_MATCH(m0, g0, t0, m1, g1, t1) \
2183 (((g0) & Reg) == 0 || ((g1) & Reg) == 0 \
2184 || ((g0) & Reg) == ((g1) & Reg) \
2185 || ((((m0) & Acc) ? Reg : (t0)) & (((m1) & Acc) ? Reg : (t1)) & Reg) == 0 )
2187 overlap0 = 0;
2188 overlap1 = 0;
2189 overlap2 = 0;
2190 found_reverse_match = 0;
2191 suffix_check = (i.suffix == BYTE_MNEM_SUFFIX
2192 ? No_bSuf
2193 : (i.suffix == WORD_MNEM_SUFFIX
2194 ? No_wSuf
2195 : (i.suffix == SHORT_MNEM_SUFFIX
2196 ? No_sSuf
2197 : (i.suffix == LONG_MNEM_SUFFIX
2198 ? No_lSuf
2199 : (i.suffix == QWORD_MNEM_SUFFIX
2200 ? No_qSuf
2201 : (i.suffix == LONG_DOUBLE_MNEM_SUFFIX
2202 ? No_xSuf : 0))))));
2204 t = current_templates->start;
2205 if (i.suffix == QWORD_MNEM_SUFFIX
2206 && flag_code != CODE_64BIT
2207 && (intel_syntax
2208 ? !(t->opcode_modifier & IgnoreSize)
2209 && !intel_float_operand (t->name)
2210 : intel_float_operand (t->name) != 2)
2211 && (!(t->operand_types[0] & (RegMMX | RegXMM))
2212 || !(t->operand_types[t->operands > 1] & (RegMMX | RegXMM)))
2213 && (t->base_opcode != 0x0fc7
2214 || t->extension_opcode != 1 /* cmpxchg8b */))
2215 t = current_templates->end;
2216 for (; t < current_templates->end; t++)
2218 /* Must have right number of operands. */
2219 if (i.operands != t->operands)
2220 continue;
2222 /* Check the suffix, except for some instructions in intel mode. */
2223 if ((t->opcode_modifier & suffix_check)
2224 && !(intel_syntax
2225 && (t->opcode_modifier & IgnoreSize)))
2226 continue;
2228 /* Do not verify operands when there are none. */
2229 else if (!t->operands)
2231 if (t->cpu_flags & ~cpu_arch_flags)
2232 continue;
2233 /* We've found a match; break out of loop. */
2234 break;
2237 overlap0 = i.types[0] & t->operand_types[0];
2238 switch (t->operands)
2240 case 1:
2241 if (!MATCH (overlap0, i.types[0], t->operand_types[0]))
2242 continue;
2243 break;
2244 case 2:
2245 case 3:
2246 overlap1 = i.types[1] & t->operand_types[1];
2247 if (!MATCH (overlap0, i.types[0], t->operand_types[0])
2248 || !MATCH (overlap1, i.types[1], t->operand_types[1])
2249 || !CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2250 t->operand_types[0],
2251 overlap1, i.types[1],
2252 t->operand_types[1]))
2254 /* Check if other direction is valid ... */
2255 if ((t->opcode_modifier & (D | FloatD)) == 0)
2256 continue;
2258 /* Try reversing direction of operands. */
2259 overlap0 = i.types[0] & t->operand_types[1];
2260 overlap1 = i.types[1] & t->operand_types[0];
2261 if (!MATCH (overlap0, i.types[0], t->operand_types[1])
2262 || !MATCH (overlap1, i.types[1], t->operand_types[0])
2263 || !CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2264 t->operand_types[1],
2265 overlap1, i.types[1],
2266 t->operand_types[0]))
2268 /* Does not match either direction. */
2269 continue;
2271 /* found_reverse_match holds which of D or FloatDR
2272 we've found. */
2273 found_reverse_match = t->opcode_modifier & (D | FloatDR);
2275 /* Found a forward 2 operand match here. */
2276 else if (t->operands == 3)
2278 /* Here we make use of the fact that there are no
2279 reverse match 3 operand instructions, and all 3
2280 operand instructions only need to be checked for
2281 register consistency between operands 2 and 3. */
2282 overlap2 = i.types[2] & t->operand_types[2];
2283 if (!MATCH (overlap2, i.types[2], t->operand_types[2])
2284 || !CONSISTENT_REGISTER_MATCH (overlap1, i.types[1],
2285 t->operand_types[1],
2286 overlap2, i.types[2],
2287 t->operand_types[2]))
2289 continue;
2291 /* Found either forward/reverse 2 or 3 operand match here:
2292 slip through to break. */
2294 if (t->cpu_flags & ~cpu_arch_flags)
2296 found_reverse_match = 0;
2297 continue;
2299 /* We've found a match; break out of loop. */
2300 break;
2303 if (t == current_templates->end)
2305 /* We found no match. */
2306 as_bad (_("suffix or operands invalid for `%s'"),
2307 current_templates->start->name);
2308 return 0;
2311 if (!quiet_warnings)
2313 if (!intel_syntax
2314 && ((i.types[0] & JumpAbsolute)
2315 != (t->operand_types[0] & JumpAbsolute)))
2317 as_warn (_("indirect %s without `*'"), t->name);
2320 if ((t->opcode_modifier & (IsPrefix | IgnoreSize))
2321 == (IsPrefix | IgnoreSize))
2323 /* Warn them that a data or address size prefix doesn't
2324 affect assembly of the next line of code. */
2325 as_warn (_("stand-alone `%s' prefix"), t->name);
2329 /* Copy the template we found. */
2330 i.tm = *t;
2331 if (found_reverse_match)
2333 /* If we found a reverse match we must alter the opcode
2334 direction bit. found_reverse_match holds bits to change
2335 (different for int & float insns). */
2337 i.tm.base_opcode ^= found_reverse_match;
2339 i.tm.operand_types[0] = t->operand_types[1];
2340 i.tm.operand_types[1] = t->operand_types[0];
2343 return 1;
2346 static int
2347 check_string ()
2349 int mem_op = (i.types[0] & AnyMem) ? 0 : 1;
2350 if ((i.tm.operand_types[mem_op] & EsSeg) != 0)
2352 if (i.seg[0] != NULL && i.seg[0] != &es)
2354 as_bad (_("`%s' operand %d must use `%%es' segment"),
2355 i.tm.name,
2356 mem_op + 1);
2357 return 0;
2359 /* There's only ever one segment override allowed per instruction.
2360 This instruction possibly has a legal segment override on the
2361 second operand, so copy the segment to where non-string
2362 instructions store it, allowing common code. */
2363 i.seg[0] = i.seg[1];
2365 else if ((i.tm.operand_types[mem_op + 1] & EsSeg) != 0)
2367 if (i.seg[1] != NULL && i.seg[1] != &es)
2369 as_bad (_("`%s' operand %d must use `%%es' segment"),
2370 i.tm.name,
2371 mem_op + 2);
2372 return 0;
2375 return 1;
2378 static int
2379 process_suffix (void)
2381 /* If matched instruction specifies an explicit instruction mnemonic
2382 suffix, use it. */
2383 if (i.tm.opcode_modifier & (Size16 | Size32 | Size64))
2385 if (i.tm.opcode_modifier & Size16)
2386 i.suffix = WORD_MNEM_SUFFIX;
2387 else if (i.tm.opcode_modifier & Size64)
2388 i.suffix = QWORD_MNEM_SUFFIX;
2389 else
2390 i.suffix = LONG_MNEM_SUFFIX;
2392 else if (i.reg_operands)
2394 /* If there's no instruction mnemonic suffix we try to invent one
2395 based on register operands. */
2396 if (!i.suffix)
2398 /* We take i.suffix from the last register operand specified,
2399 Destination register type is more significant than source
2400 register type. */
2401 int op;
2403 for (op = i.operands; --op >= 0;)
2404 if ((i.types[op] & Reg)
2405 && !(i.tm.operand_types[op] & InOutPortReg))
2407 i.suffix = ((i.types[op] & Reg8) ? BYTE_MNEM_SUFFIX :
2408 (i.types[op] & Reg16) ? WORD_MNEM_SUFFIX :
2409 (i.types[op] & Reg64) ? QWORD_MNEM_SUFFIX :
2410 LONG_MNEM_SUFFIX);
2411 break;
2414 else if (i.suffix == BYTE_MNEM_SUFFIX)
2416 if (!check_byte_reg ())
2417 return 0;
2419 else if (i.suffix == LONG_MNEM_SUFFIX)
2421 if (!check_long_reg ())
2422 return 0;
2424 else if (i.suffix == QWORD_MNEM_SUFFIX)
2426 if (!check_qword_reg ())
2427 return 0;
2429 else if (i.suffix == WORD_MNEM_SUFFIX)
2431 if (!check_word_reg ())
2432 return 0;
2434 else if (intel_syntax && (i.tm.opcode_modifier & IgnoreSize))
2435 /* Do nothing if the instruction is going to ignore the prefix. */
2437 else
2438 abort ();
2440 else if ((i.tm.opcode_modifier & DefaultSize)
2441 && !i.suffix
2442 /* exclude fldenv/frstor/fsave/fstenv */
2443 && (i.tm.opcode_modifier & No_sSuf))
2445 i.suffix = stackop_size;
2447 else if (intel_syntax
2448 && !i.suffix
2449 && ((i.tm.operand_types[0] & JumpAbsolute)
2450 || (i.tm.opcode_modifier & (JumpByte|JumpInterSegment))
2451 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
2452 && i.tm.extension_opcode <= 3)))
2454 switch (flag_code)
2456 case CODE_64BIT:
2457 if (!(i.tm.opcode_modifier & No_qSuf))
2459 i.suffix = QWORD_MNEM_SUFFIX;
2460 break;
2462 case CODE_32BIT:
2463 if (!(i.tm.opcode_modifier & No_lSuf))
2464 i.suffix = LONG_MNEM_SUFFIX;
2465 break;
2466 case CODE_16BIT:
2467 if (!(i.tm.opcode_modifier & No_wSuf))
2468 i.suffix = WORD_MNEM_SUFFIX;
2469 break;
2473 if (!i.suffix)
2475 if (!intel_syntax)
2477 if (i.tm.opcode_modifier & W)
2479 as_bad (_("no instruction mnemonic suffix given and no register operands; can't size instruction"));
2480 return 0;
2483 else
2485 unsigned int suffixes = ~i.tm.opcode_modifier
2486 & (No_bSuf
2487 | No_wSuf
2488 | No_lSuf
2489 | No_sSuf
2490 | No_xSuf
2491 | No_qSuf);
2493 if ((i.tm.opcode_modifier & W)
2494 || ((suffixes & (suffixes - 1))
2495 && !(i.tm.opcode_modifier & (DefaultSize | IgnoreSize))))
2497 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
2498 return 0;
2503 /* Change the opcode based on the operand size given by i.suffix;
2504 We don't need to change things for byte insns. */
2506 if (i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
2508 /* It's not a byte, select word/dword operation. */
2509 if (i.tm.opcode_modifier & W)
2511 if (i.tm.opcode_modifier & ShortForm)
2512 i.tm.base_opcode |= 8;
2513 else
2514 i.tm.base_opcode |= 1;
2517 /* Now select between word & dword operations via the operand
2518 size prefix, except for instructions that will ignore this
2519 prefix anyway. */
2520 if (i.suffix != QWORD_MNEM_SUFFIX
2521 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
2522 && !(i.tm.opcode_modifier & (IgnoreSize | FloatMF))
2523 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
2524 || (flag_code == CODE_64BIT
2525 && (i.tm.opcode_modifier & JumpByte))))
2527 unsigned int prefix = DATA_PREFIX_OPCODE;
2529 if (i.tm.opcode_modifier & JumpByte) /* jcxz, loop */
2530 prefix = ADDR_PREFIX_OPCODE;
2532 if (!add_prefix (prefix))
2533 return 0;
2536 /* Set mode64 for an operand. */
2537 if (i.suffix == QWORD_MNEM_SUFFIX
2538 && flag_code == CODE_64BIT
2539 && (i.tm.opcode_modifier & NoRex64) == 0)
2540 i.rex |= REX_MODE64;
2542 /* Size floating point instruction. */
2543 if (i.suffix == LONG_MNEM_SUFFIX)
2544 if (i.tm.opcode_modifier & FloatMF)
2545 i.tm.base_opcode ^= 4;
2548 return 1;
2551 static int
2552 check_byte_reg (void)
2554 int op;
2556 for (op = i.operands; --op >= 0;)
2558 /* If this is an eight bit register, it's OK. If it's the 16 or
2559 32 bit version of an eight bit register, we will just use the
2560 low portion, and that's OK too. */
2561 if (i.types[op] & Reg8)
2562 continue;
2564 /* movzx and movsx should not generate this warning. */
2565 if (intel_syntax
2566 && (i.tm.base_opcode == 0xfb7
2567 || i.tm.base_opcode == 0xfb6
2568 || i.tm.base_opcode == 0x63
2569 || i.tm.base_opcode == 0xfbe
2570 || i.tm.base_opcode == 0xfbf))
2571 continue;
2573 if ((i.types[op] & WordReg) && i.op[op].regs->reg_num < 4)
2575 /* Prohibit these changes in the 64bit mode, since the
2576 lowering is more complicated. */
2577 if (flag_code == CODE_64BIT
2578 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2580 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2581 i.op[op].regs->reg_name,
2582 i.suffix);
2583 return 0;
2585 #if REGISTER_WARNINGS
2586 if (!quiet_warnings
2587 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2588 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2589 (i.op[op].regs + (i.types[op] & Reg16
2590 ? REGNAM_AL - REGNAM_AX
2591 : REGNAM_AL - REGNAM_EAX))->reg_name,
2592 i.op[op].regs->reg_name,
2593 i.suffix);
2594 #endif
2595 continue;
2597 /* Any other register is bad. */
2598 if (i.types[op] & (Reg | RegMMX | RegXMM
2599 | SReg2 | SReg3
2600 | Control | Debug | Test
2601 | FloatReg | FloatAcc))
2603 as_bad (_("`%%%s' not allowed with `%s%c'"),
2604 i.op[op].regs->reg_name,
2605 i.tm.name,
2606 i.suffix);
2607 return 0;
2610 return 1;
2613 static int
2614 check_long_reg ()
2616 int op;
2618 for (op = i.operands; --op >= 0;)
2619 /* Reject eight bit registers, except where the template requires
2620 them. (eg. movzb) */
2621 if ((i.types[op] & Reg8) != 0
2622 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2624 as_bad (_("`%%%s' not allowed with `%s%c'"),
2625 i.op[op].regs->reg_name,
2626 i.tm.name,
2627 i.suffix);
2628 return 0;
2630 /* Warn if the e prefix on a general reg is missing. */
2631 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2632 && (i.types[op] & Reg16) != 0
2633 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2635 /* Prohibit these changes in the 64bit mode, since the
2636 lowering is more complicated. */
2637 if (flag_code == CODE_64BIT)
2639 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2640 i.op[op].regs->reg_name,
2641 i.suffix);
2642 return 0;
2644 #if REGISTER_WARNINGS
2645 else
2646 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2647 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
2648 i.op[op].regs->reg_name,
2649 i.suffix);
2650 #endif
2652 /* Warn if the r prefix on a general reg is missing. */
2653 else if ((i.types[op] & Reg64) != 0
2654 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2656 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2657 i.op[op].regs->reg_name,
2658 i.suffix);
2659 return 0;
2661 return 1;
2664 static int
2665 check_qword_reg ()
2667 int op;
2669 for (op = i.operands; --op >= 0; )
2670 /* Reject eight bit registers, except where the template requires
2671 them. (eg. movzb) */
2672 if ((i.types[op] & Reg8) != 0
2673 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2675 as_bad (_("`%%%s' not allowed with `%s%c'"),
2676 i.op[op].regs->reg_name,
2677 i.tm.name,
2678 i.suffix);
2679 return 0;
2681 /* Warn if the e prefix on a general reg is missing. */
2682 else if (((i.types[op] & Reg16) != 0
2683 || (i.types[op] & Reg32) != 0)
2684 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2686 /* Prohibit these changes in the 64bit mode, since the
2687 lowering is more complicated. */
2688 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2689 i.op[op].regs->reg_name,
2690 i.suffix);
2691 return 0;
2693 return 1;
2696 static int
2697 check_word_reg ()
2699 int op;
2700 for (op = i.operands; --op >= 0;)
2701 /* Reject eight bit registers, except where the template requires
2702 them. (eg. movzb) */
2703 if ((i.types[op] & Reg8) != 0
2704 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2706 as_bad (_("`%%%s' not allowed with `%s%c'"),
2707 i.op[op].regs->reg_name,
2708 i.tm.name,
2709 i.suffix);
2710 return 0;
2712 /* Warn if the e prefix on a general reg is present. */
2713 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2714 && (i.types[op] & Reg32) != 0
2715 && (i.tm.operand_types[op] & (Reg16 | Acc)) != 0)
2717 /* Prohibit these changes in the 64bit mode, since the
2718 lowering is more complicated. */
2719 if (flag_code == CODE_64BIT)
2721 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2722 i.op[op].regs->reg_name,
2723 i.suffix);
2724 return 0;
2726 else
2727 #if REGISTER_WARNINGS
2728 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2729 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
2730 i.op[op].regs->reg_name,
2731 i.suffix);
2732 #endif
2734 return 1;
2737 static int
2738 finalize_imm ()
2740 unsigned int overlap0, overlap1, overlap2;
2742 overlap0 = i.types[0] & i.tm.operand_types[0];
2743 if ((overlap0 & (Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64))
2744 && overlap0 != Imm8 && overlap0 != Imm8S
2745 && overlap0 != Imm16 && overlap0 != Imm32S
2746 && overlap0 != Imm32 && overlap0 != Imm64)
2748 if (i.suffix)
2750 overlap0 &= (i.suffix == BYTE_MNEM_SUFFIX
2751 ? Imm8 | Imm8S
2752 : (i.suffix == WORD_MNEM_SUFFIX
2753 ? Imm16
2754 : (i.suffix == QWORD_MNEM_SUFFIX
2755 ? Imm64 | Imm32S
2756 : Imm32)));
2758 else if (overlap0 == (Imm16 | Imm32S | Imm32)
2759 || overlap0 == (Imm16 | Imm32)
2760 || overlap0 == (Imm16 | Imm32S))
2762 overlap0 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2763 ? Imm16 : Imm32S);
2765 if (overlap0 != Imm8 && overlap0 != Imm8S
2766 && overlap0 != Imm16 && overlap0 != Imm32S
2767 && overlap0 != Imm32 && overlap0 != Imm64)
2769 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size"));
2770 return 0;
2773 i.types[0] = overlap0;
2775 overlap1 = i.types[1] & i.tm.operand_types[1];
2776 if ((overlap1 & (Imm8 | Imm8S | Imm16 | Imm32S | Imm32 | Imm64))
2777 && overlap1 != Imm8 && overlap1 != Imm8S
2778 && overlap1 != Imm16 && overlap1 != Imm32S
2779 && overlap1 != Imm32 && overlap1 != Imm64)
2781 if (i.suffix)
2783 overlap1 &= (i.suffix == BYTE_MNEM_SUFFIX
2784 ? Imm8 | Imm8S
2785 : (i.suffix == WORD_MNEM_SUFFIX
2786 ? Imm16
2787 : (i.suffix == QWORD_MNEM_SUFFIX
2788 ? Imm64 | Imm32S
2789 : Imm32)));
2791 else if (overlap1 == (Imm16 | Imm32 | Imm32S)
2792 || overlap1 == (Imm16 | Imm32)
2793 || overlap1 == (Imm16 | Imm32S))
2795 overlap1 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2796 ? Imm16 : Imm32S);
2798 if (overlap1 != Imm8 && overlap1 != Imm8S
2799 && overlap1 != Imm16 && overlap1 != Imm32S
2800 && overlap1 != Imm32 && overlap1 != Imm64)
2802 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size %x %c"),overlap1, i.suffix);
2803 return 0;
2806 i.types[1] = overlap1;
2808 overlap2 = i.types[2] & i.tm.operand_types[2];
2809 assert ((overlap2 & Imm) == 0);
2810 i.types[2] = overlap2;
2812 return 1;
2815 static int
2816 process_operands ()
2818 /* Default segment register this instruction will use for memory
2819 accesses. 0 means unknown. This is only for optimizing out
2820 unnecessary segment overrides. */
2821 const seg_entry *default_seg = 0;
2823 /* The imul $imm, %reg instruction is converted into
2824 imul $imm, %reg, %reg, and the clr %reg instruction
2825 is converted into xor %reg, %reg. */
2826 if (i.tm.opcode_modifier & regKludge)
2828 unsigned int first_reg_op = (i.types[0] & Reg) ? 0 : 1;
2829 /* Pretend we saw the extra register operand. */
2830 assert (i.op[first_reg_op + 1].regs == 0);
2831 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
2832 i.types[first_reg_op + 1] = i.types[first_reg_op];
2833 i.reg_operands = 2;
2836 if (i.tm.opcode_modifier & ShortForm)
2838 /* The register or float register operand is in operand 0 or 1. */
2839 unsigned int op = (i.types[0] & (Reg | FloatReg)) ? 0 : 1;
2840 /* Register goes in low 3 bits of opcode. */
2841 i.tm.base_opcode |= i.op[op].regs->reg_num;
2842 if ((i.op[op].regs->reg_flags & RegRex) != 0)
2843 i.rex |= REX_EXTZ;
2844 if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
2846 /* Warn about some common errors, but press on regardless.
2847 The first case can be generated by gcc (<= 2.8.1). */
2848 if (i.operands == 2)
2850 /* Reversed arguments on faddp, fsubp, etc. */
2851 as_warn (_("translating to `%s %%%s,%%%s'"), i.tm.name,
2852 i.op[1].regs->reg_name,
2853 i.op[0].regs->reg_name);
2855 else
2857 /* Extraneous `l' suffix on fp insn. */
2858 as_warn (_("translating to `%s %%%s'"), i.tm.name,
2859 i.op[0].regs->reg_name);
2863 else if (i.tm.opcode_modifier & Modrm)
2865 /* The opcode is completed (modulo i.tm.extension_opcode which
2866 must be put into the modrm byte). Now, we make the modrm and
2867 index base bytes based on all the info we've collected. */
2869 default_seg = build_modrm_byte ();
2871 else if (i.tm.opcode_modifier & (Seg2ShortForm | Seg3ShortForm))
2873 if (i.tm.base_opcode == POP_SEG_SHORT
2874 && i.op[0].regs->reg_num == 1)
2876 as_bad (_("you can't `pop %%cs'"));
2877 return 0;
2879 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
2880 if ((i.op[0].regs->reg_flags & RegRex) != 0)
2881 i.rex |= REX_EXTZ;
2883 else if ((i.tm.base_opcode & ~(D | W)) == MOV_AX_DISP32)
2885 default_seg = &ds;
2887 else if ((i.tm.opcode_modifier & IsString) != 0)
2889 /* For the string instructions that allow a segment override
2890 on one of their operands, the default segment is ds. */
2891 default_seg = &ds;
2894 if ((i.tm.base_opcode == 0x8d /* lea */
2895 || (i.tm.cpu_flags & CpuSVME))
2896 && i.seg[0] && !quiet_warnings)
2897 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
2899 /* If a segment was explicitly specified, and the specified segment
2900 is not the default, use an opcode prefix to select it. If we
2901 never figured out what the default segment is, then default_seg
2902 will be zero at this point, and the specified segment prefix will
2903 always be used. */
2904 if ((i.seg[0]) && (i.seg[0] != default_seg))
2906 if (!add_prefix (i.seg[0]->seg_prefix))
2907 return 0;
2909 return 1;
2912 static const seg_entry *
2913 build_modrm_byte ()
2915 const seg_entry *default_seg = 0;
2917 /* i.reg_operands MUST be the number of real register operands;
2918 implicit registers do not count. */
2919 if (i.reg_operands == 2)
2921 unsigned int source, dest;
2922 source = ((i.types[0]
2923 & (Reg | RegMMX | RegXMM
2924 | SReg2 | SReg3
2925 | Control | Debug | Test))
2926 ? 0 : 1);
2927 dest = source + 1;
2929 i.rm.mode = 3;
2930 /* One of the register operands will be encoded in the i.tm.reg
2931 field, the other in the combined i.tm.mode and i.tm.regmem
2932 fields. If no form of this instruction supports a memory
2933 destination operand, then we assume the source operand may
2934 sometimes be a memory operand and so we need to store the
2935 destination in the i.rm.reg field. */
2936 if ((i.tm.operand_types[dest] & AnyMem) == 0)
2938 i.rm.reg = i.op[dest].regs->reg_num;
2939 i.rm.regmem = i.op[source].regs->reg_num;
2940 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
2941 i.rex |= REX_EXTX;
2942 if ((i.op[source].regs->reg_flags & RegRex) != 0)
2943 i.rex |= REX_EXTZ;
2945 else
2947 i.rm.reg = i.op[source].regs->reg_num;
2948 i.rm.regmem = i.op[dest].regs->reg_num;
2949 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
2950 i.rex |= REX_EXTZ;
2951 if ((i.op[source].regs->reg_flags & RegRex) != 0)
2952 i.rex |= REX_EXTX;
2954 if (flag_code != CODE_64BIT && (i.rex & (REX_EXTX | REX_EXTZ)))
2956 if (!((i.types[0] | i.types[1]) & Control))
2957 abort ();
2958 i.rex &= ~(REX_EXTX | REX_EXTZ);
2959 add_prefix (LOCK_PREFIX_OPCODE);
2962 else
2963 { /* If it's not 2 reg operands... */
2964 if (i.mem_operands)
2966 unsigned int fake_zero_displacement = 0;
2967 unsigned int op = ((i.types[0] & AnyMem)
2969 : (i.types[1] & AnyMem) ? 1 : 2);
2971 default_seg = &ds;
2973 if (i.base_reg == 0)
2975 i.rm.mode = 0;
2976 if (!i.disp_operands)
2977 fake_zero_displacement = 1;
2978 if (i.index_reg == 0)
2980 /* Operand is just <disp> */
2981 if (flag_code == CODE_64BIT)
2983 /* 64bit mode overwrites the 32bit absolute
2984 addressing by RIP relative addressing and
2985 absolute addressing is encoded by one of the
2986 redundant SIB forms. */
2987 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
2988 i.sib.base = NO_BASE_REGISTER;
2989 i.sib.index = NO_INDEX_REGISTER;
2990 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0) ? Disp32S : Disp32);
2992 else if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
2994 i.rm.regmem = NO_BASE_REGISTER_16;
2995 i.types[op] = Disp16;
2997 else
2999 i.rm.regmem = NO_BASE_REGISTER;
3000 i.types[op] = Disp32;
3003 else /* !i.base_reg && i.index_reg */
3005 i.sib.index = i.index_reg->reg_num;
3006 i.sib.base = NO_BASE_REGISTER;
3007 i.sib.scale = i.log2_scale_factor;
3008 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3009 i.types[op] &= ~Disp;
3010 if (flag_code != CODE_64BIT)
3011 i.types[op] |= Disp32; /* Must be 32 bit */
3012 else
3013 i.types[op] |= Disp32S;
3014 if ((i.index_reg->reg_flags & RegRex) != 0)
3015 i.rex |= REX_EXTY;
3018 /* RIP addressing for 64bit mode. */
3019 else if (i.base_reg->reg_type == BaseIndex)
3021 i.rm.regmem = NO_BASE_REGISTER;
3022 i.types[op] &= ~ Disp;
3023 i.types[op] |= Disp32S;
3024 i.flags[op] = Operand_PCrel;
3025 if (! i.disp_operands)
3026 fake_zero_displacement = 1;
3028 else if (i.base_reg->reg_type & Reg16)
3030 switch (i.base_reg->reg_num)
3032 case 3: /* (%bx) */
3033 if (i.index_reg == 0)
3034 i.rm.regmem = 7;
3035 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
3036 i.rm.regmem = i.index_reg->reg_num - 6;
3037 break;
3038 case 5: /* (%bp) */
3039 default_seg = &ss;
3040 if (i.index_reg == 0)
3042 i.rm.regmem = 6;
3043 if ((i.types[op] & Disp) == 0)
3045 /* fake (%bp) into 0(%bp) */
3046 i.types[op] |= Disp8;
3047 fake_zero_displacement = 1;
3050 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
3051 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
3052 break;
3053 default: /* (%si) -> 4 or (%di) -> 5 */
3054 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
3056 i.rm.mode = mode_from_disp_size (i.types[op]);
3058 else /* i.base_reg and 32/64 bit mode */
3060 if (flag_code == CODE_64BIT
3061 && (i.types[op] & Disp))
3062 i.types[op] = (i.types[op] & Disp8) | (i.prefix[ADDR_PREFIX] == 0 ? Disp32S : Disp32);
3064 i.rm.regmem = i.base_reg->reg_num;
3065 if ((i.base_reg->reg_flags & RegRex) != 0)
3066 i.rex |= REX_EXTZ;
3067 i.sib.base = i.base_reg->reg_num;
3068 /* x86-64 ignores REX prefix bit here to avoid decoder
3069 complications. */
3070 if ((i.base_reg->reg_num & 7) == EBP_REG_NUM)
3072 default_seg = &ss;
3073 if (i.disp_operands == 0)
3075 fake_zero_displacement = 1;
3076 i.types[op] |= Disp8;
3079 else if (i.base_reg->reg_num == ESP_REG_NUM)
3081 default_seg = &ss;
3083 i.sib.scale = i.log2_scale_factor;
3084 if (i.index_reg == 0)
3086 /* <disp>(%esp) becomes two byte modrm with no index
3087 register. We've already stored the code for esp
3088 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
3089 Any base register besides %esp will not use the
3090 extra modrm byte. */
3091 i.sib.index = NO_INDEX_REGISTER;
3092 #if !SCALE1_WHEN_NO_INDEX
3093 /* Another case where we force the second modrm byte. */
3094 if (i.log2_scale_factor)
3095 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3096 #endif
3098 else
3100 i.sib.index = i.index_reg->reg_num;
3101 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3102 if ((i.index_reg->reg_flags & RegRex) != 0)
3103 i.rex |= REX_EXTY;
3105 i.rm.mode = mode_from_disp_size (i.types[op]);
3108 if (fake_zero_displacement)
3110 /* Fakes a zero displacement assuming that i.types[op]
3111 holds the correct displacement size. */
3112 expressionS *exp;
3114 assert (i.op[op].disps == 0);
3115 exp = &disp_expressions[i.disp_operands++];
3116 i.op[op].disps = exp;
3117 exp->X_op = O_constant;
3118 exp->X_add_number = 0;
3119 exp->X_add_symbol = (symbolS *) 0;
3120 exp->X_op_symbol = (symbolS *) 0;
3124 /* Fill in i.rm.reg or i.rm.regmem field with register operand
3125 (if any) based on i.tm.extension_opcode. Again, we must be
3126 careful to make sure that segment/control/debug/test/MMX
3127 registers are coded into the i.rm.reg field. */
3128 if (i.reg_operands)
3130 unsigned int op =
3131 ((i.types[0]
3132 & (Reg | RegMMX | RegXMM
3133 | SReg2 | SReg3
3134 | Control | Debug | Test))
3136 : ((i.types[1]
3137 & (Reg | RegMMX | RegXMM
3138 | SReg2 | SReg3
3139 | Control | Debug | Test))
3141 : 2));
3142 /* If there is an extension opcode to put here, the register
3143 number must be put into the regmem field. */
3144 if (i.tm.extension_opcode != None)
3146 i.rm.regmem = i.op[op].regs->reg_num;
3147 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3148 i.rex |= REX_EXTZ;
3150 else
3152 i.rm.reg = i.op[op].regs->reg_num;
3153 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3154 i.rex |= REX_EXTX;
3157 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
3158 must set it to 3 to indicate this is a register operand
3159 in the regmem field. */
3160 if (!i.mem_operands)
3161 i.rm.mode = 3;
3164 /* Fill in i.rm.reg field with extension opcode (if any). */
3165 if (i.tm.extension_opcode != None)
3166 i.rm.reg = i.tm.extension_opcode;
3168 return default_seg;
3171 static void
3172 output_branch ()
3174 char *p;
3175 int code16;
3176 int prefix;
3177 relax_substateT subtype;
3178 symbolS *sym;
3179 offsetT off;
3181 code16 = 0;
3182 if (flag_code == CODE_16BIT)
3183 code16 = CODE16;
3185 prefix = 0;
3186 if (i.prefix[DATA_PREFIX] != 0)
3188 prefix = 1;
3189 i.prefixes -= 1;
3190 code16 ^= CODE16;
3192 /* Pentium4 branch hints. */
3193 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3194 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3196 prefix++;
3197 i.prefixes--;
3199 if (i.prefix[REX_PREFIX] != 0)
3201 prefix++;
3202 i.prefixes--;
3205 if (i.prefixes != 0 && !intel_syntax)
3206 as_warn (_("skipping prefixes on this instruction"));
3208 /* It's always a symbol; End frag & setup for relax.
3209 Make sure there is enough room in this frag for the largest
3210 instruction we may generate in md_convert_frag. This is 2
3211 bytes for the opcode and room for the prefix and largest
3212 displacement. */
3213 frag_grow (prefix + 2 + 4);
3214 /* Prefix and 1 opcode byte go in fr_fix. */
3215 p = frag_more (prefix + 1);
3216 if (i.prefix[DATA_PREFIX] != 0)
3217 *p++ = DATA_PREFIX_OPCODE;
3218 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
3219 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
3220 *p++ = i.prefix[SEG_PREFIX];
3221 if (i.prefix[REX_PREFIX] != 0)
3222 *p++ = i.prefix[REX_PREFIX];
3223 *p = i.tm.base_opcode;
3225 if ((unsigned char) *p == JUMP_PC_RELATIVE)
3226 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, SMALL);
3227 else if ((cpu_arch_flags & Cpu386) != 0)
3228 subtype = ENCODE_RELAX_STATE (COND_JUMP, SMALL);
3229 else
3230 subtype = ENCODE_RELAX_STATE (COND_JUMP86, SMALL);
3231 subtype |= code16;
3233 sym = i.op[0].disps->X_add_symbol;
3234 off = i.op[0].disps->X_add_number;
3236 if (i.op[0].disps->X_op != O_constant
3237 && i.op[0].disps->X_op != O_symbol)
3239 /* Handle complex expressions. */
3240 sym = make_expr_symbol (i.op[0].disps);
3241 off = 0;
3244 /* 1 possible extra opcode + 4 byte displacement go in var part.
3245 Pass reloc in fr_var. */
3246 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
3249 static void
3250 output_jump ()
3252 char *p;
3253 int size;
3254 fixS *fixP;
3256 if (i.tm.opcode_modifier & JumpByte)
3258 /* This is a loop or jecxz type instruction. */
3259 size = 1;
3260 if (i.prefix[ADDR_PREFIX] != 0)
3262 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
3263 i.prefixes -= 1;
3265 /* Pentium4 branch hints. */
3266 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3267 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3269 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
3270 i.prefixes--;
3273 else
3275 int code16;
3277 code16 = 0;
3278 if (flag_code == CODE_16BIT)
3279 code16 = CODE16;
3281 if (i.prefix[DATA_PREFIX] != 0)
3283 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
3284 i.prefixes -= 1;
3285 code16 ^= CODE16;
3288 size = 4;
3289 if (code16)
3290 size = 2;
3293 if (i.prefix[REX_PREFIX] != 0)
3295 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
3296 i.prefixes -= 1;
3299 if (i.prefixes != 0 && !intel_syntax)
3300 as_warn (_("skipping prefixes on this instruction"));
3302 p = frag_more (1 + size);
3303 *p++ = i.tm.base_opcode;
3305 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3306 i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
3308 /* All jumps handled here are signed, but don't use a signed limit
3309 check for 32 and 16 bit jumps as we want to allow wrap around at
3310 4G and 64k respectively. */
3311 if (size == 1)
3312 fixP->fx_signed = 1;
3315 static void
3316 output_interseg_jump ()
3318 char *p;
3319 int size;
3320 int prefix;
3321 int code16;
3323 code16 = 0;
3324 if (flag_code == CODE_16BIT)
3325 code16 = CODE16;
3327 prefix = 0;
3328 if (i.prefix[DATA_PREFIX] != 0)
3330 prefix = 1;
3331 i.prefixes -= 1;
3332 code16 ^= CODE16;
3334 if (i.prefix[REX_PREFIX] != 0)
3336 prefix++;
3337 i.prefixes -= 1;
3340 size = 4;
3341 if (code16)
3342 size = 2;
3344 if (i.prefixes != 0 && !intel_syntax)
3345 as_warn (_("skipping prefixes on this instruction"));
3347 /* 1 opcode; 2 segment; offset */
3348 p = frag_more (prefix + 1 + 2 + size);
3350 if (i.prefix[DATA_PREFIX] != 0)
3351 *p++ = DATA_PREFIX_OPCODE;
3353 if (i.prefix[REX_PREFIX] != 0)
3354 *p++ = i.prefix[REX_PREFIX];
3356 *p++ = i.tm.base_opcode;
3357 if (i.op[1].imms->X_op == O_constant)
3359 offsetT n = i.op[1].imms->X_add_number;
3361 if (size == 2
3362 && !fits_in_unsigned_word (n)
3363 && !fits_in_signed_word (n))
3365 as_bad (_("16-bit jump out of range"));
3366 return;
3368 md_number_to_chars (p, n, size);
3370 else
3371 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3372 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
3373 if (i.op[0].imms->X_op != O_constant)
3374 as_bad (_("can't handle non absolute segment in `%s'"),
3375 i.tm.name);
3376 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
3379 static void
3380 output_insn ()
3382 fragS *insn_start_frag;
3383 offsetT insn_start_off;
3385 /* Tie dwarf2 debug info to the address at the start of the insn.
3386 We can't do this after the insn has been output as the current
3387 frag may have been closed off. eg. by frag_var. */
3388 dwarf2_emit_insn (0);
3390 insn_start_frag = frag_now;
3391 insn_start_off = frag_now_fix ();
3393 /* Output jumps. */
3394 if (i.tm.opcode_modifier & Jump)
3395 output_branch ();
3396 else if (i.tm.opcode_modifier & (JumpByte | JumpDword))
3397 output_jump ();
3398 else if (i.tm.opcode_modifier & JumpInterSegment)
3399 output_interseg_jump ();
3400 else
3402 /* Output normal instructions here. */
3403 char *p;
3404 unsigned char *q;
3406 /* All opcodes on i386 have either 1 or 2 bytes. We may use one
3407 more higher byte to specify a prefix the instruction
3408 requires. */
3409 if ((i.tm.base_opcode & 0xff0000) != 0)
3411 if ((i.tm.cpu_flags & CpuPadLock) != 0)
3413 unsigned int prefix;
3414 prefix = (i.tm.base_opcode >> 16) & 0xff;
3416 if (prefix != REPE_PREFIX_OPCODE
3417 || i.prefix[LOCKREP_PREFIX] != REPE_PREFIX_OPCODE)
3418 add_prefix (prefix);
3420 else
3421 add_prefix ((i.tm.base_opcode >> 16) & 0xff);
3424 /* The prefix bytes. */
3425 for (q = i.prefix;
3426 q < i.prefix + sizeof (i.prefix) / sizeof (i.prefix[0]);
3427 q++)
3429 if (*q)
3431 p = frag_more (1);
3432 md_number_to_chars (p, (valueT) *q, 1);
3436 /* Now the opcode; be careful about word order here! */
3437 if (fits_in_unsigned_byte (i.tm.base_opcode))
3439 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
3441 else
3443 p = frag_more (2);
3445 /* Put out high byte first: can't use md_number_to_chars! */
3446 *p++ = (i.tm.base_opcode >> 8) & 0xff;
3447 *p = i.tm.base_opcode & 0xff;
3450 /* Now the modrm byte and sib byte (if present). */
3451 if (i.tm.opcode_modifier & Modrm)
3453 p = frag_more (1);
3454 md_number_to_chars (p,
3455 (valueT) (i.rm.regmem << 0
3456 | i.rm.reg << 3
3457 | i.rm.mode << 6),
3459 /* If i.rm.regmem == ESP (4)
3460 && i.rm.mode != (Register mode)
3461 && not 16 bit
3462 ==> need second modrm byte. */
3463 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
3464 && i.rm.mode != 3
3465 && !(i.base_reg && (i.base_reg->reg_type & Reg16) != 0))
3467 p = frag_more (1);
3468 md_number_to_chars (p,
3469 (valueT) (i.sib.base << 0
3470 | i.sib.index << 3
3471 | i.sib.scale << 6),
3476 if (i.disp_operands)
3477 output_disp (insn_start_frag, insn_start_off);
3479 if (i.imm_operands)
3480 output_imm (insn_start_frag, insn_start_off);
3483 #ifdef DEBUG386
3484 if (flag_debug)
3486 pi (line, &i);
3488 #endif /* DEBUG386 */
3491 static void
3492 output_disp (insn_start_frag, insn_start_off)
3493 fragS *insn_start_frag;
3494 offsetT insn_start_off;
3496 char *p;
3497 unsigned int n;
3499 for (n = 0; n < i.operands; n++)
3501 if (i.types[n] & Disp)
3503 if (i.op[n].disps->X_op == O_constant)
3505 int size;
3506 offsetT val;
3508 size = 4;
3509 if (i.types[n] & (Disp8 | Disp16 | Disp64))
3511 size = 2;
3512 if (i.types[n] & Disp8)
3513 size = 1;
3514 if (i.types[n] & Disp64)
3515 size = 8;
3517 val = offset_in_range (i.op[n].disps->X_add_number,
3518 size);
3519 p = frag_more (size);
3520 md_number_to_chars (p, val, size);
3522 else
3524 enum bfd_reloc_code_real reloc_type;
3525 int size = 4;
3526 int sign = 0;
3527 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
3529 /* The PC relative address is computed relative
3530 to the instruction boundary, so in case immediate
3531 fields follows, we need to adjust the value. */
3532 if (pcrel && i.imm_operands)
3534 int imm_size = 4;
3535 unsigned int n1;
3537 for (n1 = 0; n1 < i.operands; n1++)
3538 if (i.types[n1] & Imm)
3540 if (i.types[n1] & (Imm8 | Imm8S | Imm16 | Imm64))
3542 imm_size = 2;
3543 if (i.types[n1] & (Imm8 | Imm8S))
3544 imm_size = 1;
3545 if (i.types[n1] & Imm64)
3546 imm_size = 8;
3548 break;
3550 /* We should find the immediate. */
3551 if (n1 == i.operands)
3552 abort ();
3553 i.op[n].disps->X_add_number -= imm_size;
3556 if (i.types[n] & Disp32S)
3557 sign = 1;
3559 if (i.types[n] & (Disp16 | Disp64))
3561 size = 2;
3562 if (i.types[n] & Disp64)
3563 size = 8;
3566 p = frag_more (size);
3567 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
3568 if (GOT_symbol
3569 && GOT_symbol == i.op[n].disps->X_add_symbol
3570 && (((reloc_type == BFD_RELOC_32
3571 || reloc_type == BFD_RELOC_X86_64_32S)
3572 && (i.op[n].disps->X_op == O_symbol
3573 || (i.op[n].disps->X_op == O_add
3574 && ((symbol_get_value_expression
3575 (i.op[n].disps->X_op_symbol)->X_op)
3576 == O_subtract))))
3577 || reloc_type == BFD_RELOC_32_PCREL))
3579 offsetT add;
3581 if (insn_start_frag == frag_now)
3582 add = (p - frag_now->fr_literal) - insn_start_off;
3583 else
3585 fragS *fr;
3587 add = insn_start_frag->fr_fix - insn_start_off;
3588 for (fr = insn_start_frag->fr_next;
3589 fr && fr != frag_now; fr = fr->fr_next)
3590 add += fr->fr_fix;
3591 add += p - frag_now->fr_literal;
3594 if (flag_code != CODE_64BIT)
3595 reloc_type = BFD_RELOC_386_GOTPC;
3596 else
3597 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3598 i.op[n].disps->X_add_number += add;
3600 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3601 i.op[n].disps, pcrel, reloc_type);
3607 static void
3608 output_imm (insn_start_frag, insn_start_off)
3609 fragS *insn_start_frag;
3610 offsetT insn_start_off;
3612 char *p;
3613 unsigned int n;
3615 for (n = 0; n < i.operands; n++)
3617 if (i.types[n] & Imm)
3619 if (i.op[n].imms->X_op == O_constant)
3621 int size;
3622 offsetT val;
3624 size = 4;
3625 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3627 size = 2;
3628 if (i.types[n] & (Imm8 | Imm8S))
3629 size = 1;
3630 else if (i.types[n] & Imm64)
3631 size = 8;
3633 val = offset_in_range (i.op[n].imms->X_add_number,
3634 size);
3635 p = frag_more (size);
3636 md_number_to_chars (p, val, size);
3638 else
3640 /* Not absolute_section.
3641 Need a 32-bit fixup (don't support 8bit
3642 non-absolute imms). Try to support other
3643 sizes ... */
3644 enum bfd_reloc_code_real reloc_type;
3645 int size = 4;
3646 int sign = 0;
3648 if ((i.types[n] & (Imm32S))
3649 && (i.suffix == QWORD_MNEM_SUFFIX
3650 || (!i.suffix && (i.tm.opcode_modifier & No_lSuf))))
3651 sign = 1;
3652 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3654 size = 2;
3655 if (i.types[n] & (Imm8 | Imm8S))
3656 size = 1;
3657 if (i.types[n] & Imm64)
3658 size = 8;
3661 p = frag_more (size);
3662 reloc_type = reloc (size, 0, sign, i.reloc[n]);
3664 /* This is tough to explain. We end up with this one if we
3665 * have operands that look like
3666 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
3667 * obtain the absolute address of the GOT, and it is strongly
3668 * preferable from a performance point of view to avoid using
3669 * a runtime relocation for this. The actual sequence of
3670 * instructions often look something like:
3672 * call .L66
3673 * .L66:
3674 * popl %ebx
3675 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
3677 * The call and pop essentially return the absolute address
3678 * of the label .L66 and store it in %ebx. The linker itself
3679 * will ultimately change the first operand of the addl so
3680 * that %ebx points to the GOT, but to keep things simple, the
3681 * .o file must have this operand set so that it generates not
3682 * the absolute address of .L66, but the absolute address of
3683 * itself. This allows the linker itself simply treat a GOTPC
3684 * relocation as asking for a pcrel offset to the GOT to be
3685 * added in, and the addend of the relocation is stored in the
3686 * operand field for the instruction itself.
3688 * Our job here is to fix the operand so that it would add
3689 * the correct offset so that %ebx would point to itself. The
3690 * thing that is tricky is that .-.L66 will point to the
3691 * beginning of the instruction, so we need to further modify
3692 * the operand so that it will point to itself. There are
3693 * other cases where you have something like:
3695 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
3697 * and here no correction would be required. Internally in
3698 * the assembler we treat operands of this form as not being
3699 * pcrel since the '.' is explicitly mentioned, and I wonder
3700 * whether it would simplify matters to do it this way. Who
3701 * knows. In earlier versions of the PIC patches, the
3702 * pcrel_adjust field was used to store the correction, but
3703 * since the expression is not pcrel, I felt it would be
3704 * confusing to do it this way. */
3706 if ((reloc_type == BFD_RELOC_32
3707 || reloc_type == BFD_RELOC_X86_64_32S)
3708 && GOT_symbol
3709 && GOT_symbol == i.op[n].imms->X_add_symbol
3710 && (i.op[n].imms->X_op == O_symbol
3711 || (i.op[n].imms->X_op == O_add
3712 && ((symbol_get_value_expression
3713 (i.op[n].imms->X_op_symbol)->X_op)
3714 == O_subtract))))
3716 offsetT add;
3718 if (insn_start_frag == frag_now)
3719 add = (p - frag_now->fr_literal) - insn_start_off;
3720 else
3722 fragS *fr;
3724 add = insn_start_frag->fr_fix - insn_start_off;
3725 for (fr = insn_start_frag->fr_next;
3726 fr && fr != frag_now; fr = fr->fr_next)
3727 add += fr->fr_fix;
3728 add += p - frag_now->fr_literal;
3731 if (flag_code != CODE_64BIT)
3732 reloc_type = BFD_RELOC_386_GOTPC;
3733 else
3734 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3735 i.op[n].imms->X_add_number += add;
3737 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3738 i.op[n].imms, 0, reloc_type);
3744 #if (!defined (OBJ_ELF) && !defined (OBJ_MAYBE_ELF)) || defined (LEX_AT)
3745 # define lex_got(reloc, adjust, types) NULL
3746 #else
3747 /* Parse operands of the form
3748 <symbol>@GOTOFF+<nnn>
3749 and similar .plt or .got references.
3751 If we find one, set up the correct relocation in RELOC and copy the
3752 input string, minus the `@GOTOFF' into a malloc'd buffer for
3753 parsing by the calling routine. Return this buffer, and if ADJUST
3754 is non-null set it to the length of the string we removed from the
3755 input line. Otherwise return NULL. */
3756 static char *
3757 lex_got (enum bfd_reloc_code_real *reloc,
3758 int *adjust,
3759 unsigned int *types)
3761 static const char * const mode_name[NUM_FLAG_CODE] = { "32", "16", "64" };
3762 static const struct {
3763 const char *str;
3764 const enum bfd_reloc_code_real rel[NUM_FLAG_CODE];
3765 const unsigned int types64;
3766 } gotrel[] = {
3767 { "PLT", { BFD_RELOC_386_PLT32, 0, BFD_RELOC_X86_64_PLT32 }, Imm32|Imm32S|Disp32 },
3768 { "GOTOFF", { BFD_RELOC_386_GOTOFF, 0, BFD_RELOC_X86_64_GOTOFF64 }, Imm64|Disp64 },
3769 { "GOTPCREL", { 0, 0, BFD_RELOC_X86_64_GOTPCREL }, Imm32|Imm32S|Disp32 },
3770 { "TLSGD", { BFD_RELOC_386_TLS_GD, 0, BFD_RELOC_X86_64_TLSGD }, Imm32|Imm32S|Disp32 },
3771 { "TLSLDM", { BFD_RELOC_386_TLS_LDM, 0, 0 }, 0 },
3772 { "TLSLD", { 0, 0, BFD_RELOC_X86_64_TLSLD }, Imm32|Imm32S|Disp32 },
3773 { "GOTTPOFF", { BFD_RELOC_386_TLS_IE_32, 0, BFD_RELOC_X86_64_GOTTPOFF }, Imm32|Imm32S|Disp32 },
3774 { "TPOFF", { BFD_RELOC_386_TLS_LE_32, 0, BFD_RELOC_X86_64_TPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3775 { "NTPOFF", { BFD_RELOC_386_TLS_LE, 0, 0 }, 0 },
3776 { "DTPOFF", { BFD_RELOC_386_TLS_LDO_32, 0, BFD_RELOC_X86_64_DTPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3777 { "GOTNTPOFF",{ BFD_RELOC_386_TLS_GOTIE, 0, 0 }, 0 },
3778 { "INDNTPOFF",{ BFD_RELOC_386_TLS_IE, 0, 0 }, 0 },
3779 { "GOT", { BFD_RELOC_386_GOT32, 0, BFD_RELOC_X86_64_GOT32 }, Imm32|Imm32S|Disp32 }
3781 char *cp;
3782 unsigned int j;
3784 if (!IS_ELF)
3785 return NULL;
3787 for (cp = input_line_pointer; *cp != '@'; cp++)
3788 if (is_end_of_line[(unsigned char) *cp])
3789 return NULL;
3791 for (j = 0; j < sizeof (gotrel) / sizeof (gotrel[0]); j++)
3793 int len;
3795 len = strlen (gotrel[j].str);
3796 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
3798 if (gotrel[j].rel[(unsigned int) flag_code] != 0)
3800 int first, second;
3801 char *tmpbuf, *past_reloc;
3803 *reloc = gotrel[j].rel[(unsigned int) flag_code];
3804 if (adjust)
3805 *adjust = len;
3807 if (types)
3809 if (flag_code != CODE_64BIT)
3810 *types = Imm32|Disp32;
3811 else
3812 *types = gotrel[j].types64;
3815 if (GOT_symbol == NULL)
3816 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
3818 /* Replace the relocation token with ' ', so that
3819 errors like foo@GOTOFF1 will be detected. */
3821 /* The length of the first part of our input line. */
3822 first = cp - input_line_pointer;
3824 /* The second part goes from after the reloc token until
3825 (and including) an end_of_line char. Don't use strlen
3826 here as the end_of_line char may not be a NUL. */
3827 past_reloc = cp + 1 + len;
3828 for (cp = past_reloc; !is_end_of_line[(unsigned char) *cp++]; )
3830 second = cp - past_reloc;
3832 /* Allocate and copy string. The trailing NUL shouldn't
3833 be necessary, but be safe. */
3834 tmpbuf = xmalloc (first + second + 2);
3835 memcpy (tmpbuf, input_line_pointer, first);
3836 tmpbuf[first] = ' ';
3837 memcpy (tmpbuf + first + 1, past_reloc, second);
3838 tmpbuf[first + second + 1] = '\0';
3839 return tmpbuf;
3842 as_bad (_("@%s reloc is not supported in %s bit mode"),
3843 gotrel[j].str, mode_name[(unsigned int) flag_code]);
3844 return NULL;
3848 /* Might be a symbol version string. Don't as_bad here. */
3849 return NULL;
3852 /* x86_cons_fix_new is called via the expression parsing code when a
3853 reloc is needed. We use this hook to get the correct .got reloc. */
3854 static enum bfd_reloc_code_real got_reloc = NO_RELOC;
3856 void
3857 x86_cons_fix_new (frag, off, len, exp)
3858 fragS *frag;
3859 unsigned int off;
3860 unsigned int len;
3861 expressionS *exp;
3863 enum bfd_reloc_code_real r = reloc (len, 0, -1, got_reloc);
3864 got_reloc = NO_RELOC;
3865 fix_new_exp (frag, off, len, exp, 0, r);
3868 void
3869 x86_cons (exp, size)
3870 expressionS *exp;
3871 int size;
3873 if (size == 4 || (flag_code == CODE_64BIT && size == 8))
3875 /* Handle @GOTOFF and the like in an expression. */
3876 char *save;
3877 char *gotfree_input_line;
3878 int adjust;
3880 save = input_line_pointer;
3881 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
3882 if (gotfree_input_line)
3883 input_line_pointer = gotfree_input_line;
3885 expression (exp);
3887 if (gotfree_input_line)
3889 /* expression () has merrily parsed up to the end of line,
3890 or a comma - in the wrong buffer. Transfer how far
3891 input_line_pointer has moved to the right buffer. */
3892 input_line_pointer = (save
3893 + (input_line_pointer - gotfree_input_line)
3894 + adjust);
3895 free (gotfree_input_line);
3898 else
3899 expression (exp);
3901 #endif
3903 #ifdef TE_PE
3905 void
3906 x86_pe_cons_fix_new (frag, off, len, exp)
3907 fragS *frag;
3908 unsigned int off;
3909 unsigned int len;
3910 expressionS *exp;
3912 enum bfd_reloc_code_real r = reloc (len, 0, -1, NO_RELOC);
3914 if (exp->X_op == O_secrel)
3916 exp->X_op = O_symbol;
3917 r = BFD_RELOC_32_SECREL;
3920 fix_new_exp (frag, off, len, exp, 0, r);
3923 static void
3924 pe_directive_secrel (dummy)
3925 int dummy ATTRIBUTE_UNUSED;
3927 expressionS exp;
3931 expression (&exp);
3932 if (exp.X_op == O_symbol)
3933 exp.X_op = O_secrel;
3935 emit_expr (&exp, 4);
3937 while (*input_line_pointer++ == ',');
3939 input_line_pointer--;
3940 demand_empty_rest_of_line ();
3943 #endif
3945 static int i386_immediate PARAMS ((char *));
3947 static int
3948 i386_immediate (imm_start)
3949 char *imm_start;
3951 char *save_input_line_pointer;
3952 char *gotfree_input_line;
3953 segT exp_seg = 0;
3954 expressionS *exp;
3955 unsigned int types = ~0U;
3957 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
3959 as_bad (_("only 1 or 2 immediate operands are allowed"));
3960 return 0;
3963 exp = &im_expressions[i.imm_operands++];
3964 i.op[this_operand].imms = exp;
3966 if (is_space_char (*imm_start))
3967 ++imm_start;
3969 save_input_line_pointer = input_line_pointer;
3970 input_line_pointer = imm_start;
3972 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
3973 if (gotfree_input_line)
3974 input_line_pointer = gotfree_input_line;
3976 exp_seg = expression (exp);
3978 SKIP_WHITESPACE ();
3979 if (*input_line_pointer)
3980 as_bad (_("junk `%s' after expression"), input_line_pointer);
3982 input_line_pointer = save_input_line_pointer;
3983 if (gotfree_input_line)
3984 free (gotfree_input_line);
3986 if (exp->X_op == O_absent || exp->X_op == O_big)
3988 /* Missing or bad expr becomes absolute 0. */
3989 as_bad (_("missing or invalid immediate expression `%s' taken as 0"),
3990 imm_start);
3991 exp->X_op = O_constant;
3992 exp->X_add_number = 0;
3993 exp->X_add_symbol = (symbolS *) 0;
3994 exp->X_op_symbol = (symbolS *) 0;
3996 else if (exp->X_op == O_constant)
3998 /* Size it properly later. */
3999 i.types[this_operand] |= Imm64;
4000 /* If BFD64, sign extend val. */
4001 if (!use_rela_relocations)
4002 if ((exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
4003 exp->X_add_number = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
4005 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4006 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
4007 && exp_seg != absolute_section
4008 && exp_seg != text_section
4009 && exp_seg != data_section
4010 && exp_seg != bss_section
4011 && exp_seg != undefined_section
4012 && !bfd_is_com_section (exp_seg))
4014 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4015 return 0;
4017 #endif
4018 else
4020 /* This is an address. The size of the address will be
4021 determined later, depending on destination register,
4022 suffix, or the default for the section. */
4023 i.types[this_operand] |= Imm8 | Imm16 | Imm32 | Imm32S | Imm64;
4024 i.types[this_operand] &= types;
4027 return 1;
4030 static char *i386_scale PARAMS ((char *));
4032 static char *
4033 i386_scale (scale)
4034 char *scale;
4036 offsetT val;
4037 char *save = input_line_pointer;
4039 input_line_pointer = scale;
4040 val = get_absolute_expression ();
4042 switch (val)
4044 case 1:
4045 i.log2_scale_factor = 0;
4046 break;
4047 case 2:
4048 i.log2_scale_factor = 1;
4049 break;
4050 case 4:
4051 i.log2_scale_factor = 2;
4052 break;
4053 case 8:
4054 i.log2_scale_factor = 3;
4055 break;
4056 default:
4058 char sep = *input_line_pointer;
4060 *input_line_pointer = '\0';
4061 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
4062 scale);
4063 *input_line_pointer = sep;
4064 input_line_pointer = save;
4065 return NULL;
4068 if (i.log2_scale_factor != 0 && i.index_reg == 0)
4070 as_warn (_("scale factor of %d without an index register"),
4071 1 << i.log2_scale_factor);
4072 #if SCALE1_WHEN_NO_INDEX
4073 i.log2_scale_factor = 0;
4074 #endif
4076 scale = input_line_pointer;
4077 input_line_pointer = save;
4078 return scale;
4081 static int i386_displacement PARAMS ((char *, char *));
4083 static int
4084 i386_displacement (disp_start, disp_end)
4085 char *disp_start;
4086 char *disp_end;
4088 expressionS *exp;
4089 segT exp_seg = 0;
4090 char *save_input_line_pointer;
4091 char *gotfree_input_line;
4092 int bigdisp = Disp32;
4093 unsigned int types = Disp;
4095 if (flag_code == CODE_64BIT)
4097 if (i.prefix[ADDR_PREFIX] == 0)
4098 bigdisp = Disp64 | Disp32S | Disp32;
4100 else if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
4101 bigdisp = Disp16;
4102 i.types[this_operand] |= bigdisp;
4104 exp = &disp_expressions[i.disp_operands];
4105 i.op[this_operand].disps = exp;
4106 i.disp_operands++;
4107 save_input_line_pointer = input_line_pointer;
4108 input_line_pointer = disp_start;
4109 END_STRING_AND_SAVE (disp_end);
4111 #ifndef GCC_ASM_O_HACK
4112 #define GCC_ASM_O_HACK 0
4113 #endif
4114 #if GCC_ASM_O_HACK
4115 END_STRING_AND_SAVE (disp_end + 1);
4116 if ((i.types[this_operand] & BaseIndex) != 0
4117 && displacement_string_end[-1] == '+')
4119 /* This hack is to avoid a warning when using the "o"
4120 constraint within gcc asm statements.
4121 For instance:
4123 #define _set_tssldt_desc(n,addr,limit,type) \
4124 __asm__ __volatile__ ( \
4125 "movw %w2,%0\n\t" \
4126 "movw %w1,2+%0\n\t" \
4127 "rorl $16,%1\n\t" \
4128 "movb %b1,4+%0\n\t" \
4129 "movb %4,5+%0\n\t" \
4130 "movb $0,6+%0\n\t" \
4131 "movb %h1,7+%0\n\t" \
4132 "rorl $16,%1" \
4133 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
4135 This works great except that the output assembler ends
4136 up looking a bit weird if it turns out that there is
4137 no offset. You end up producing code that looks like:
4139 #APP
4140 movw $235,(%eax)
4141 movw %dx,2+(%eax)
4142 rorl $16,%edx
4143 movb %dl,4+(%eax)
4144 movb $137,5+(%eax)
4145 movb $0,6+(%eax)
4146 movb %dh,7+(%eax)
4147 rorl $16,%edx
4148 #NO_APP
4150 So here we provide the missing zero. */
4152 *displacement_string_end = '0';
4154 #endif
4155 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4156 if (gotfree_input_line)
4157 input_line_pointer = gotfree_input_line;
4159 exp_seg = expression (exp);
4161 SKIP_WHITESPACE ();
4162 if (*input_line_pointer)
4163 as_bad (_("junk `%s' after expression"), input_line_pointer);
4164 #if GCC_ASM_O_HACK
4165 RESTORE_END_STRING (disp_end + 1);
4166 #endif
4167 RESTORE_END_STRING (disp_end);
4168 input_line_pointer = save_input_line_pointer;
4169 if (gotfree_input_line)
4170 free (gotfree_input_line);
4172 /* We do this to make sure that the section symbol is in
4173 the symbol table. We will ultimately change the relocation
4174 to be relative to the beginning of the section. */
4175 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
4176 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4177 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4179 if (exp->X_op != O_symbol)
4181 as_bad (_("bad expression used with @%s"),
4182 (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4183 ? "GOTPCREL"
4184 : "GOTOFF"));
4185 return 0;
4188 if (S_IS_LOCAL (exp->X_add_symbol)
4189 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section)
4190 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
4191 exp->X_op = O_subtract;
4192 exp->X_op_symbol = GOT_symbol;
4193 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
4194 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
4195 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4196 i.reloc[this_operand] = BFD_RELOC_64;
4197 else
4198 i.reloc[this_operand] = BFD_RELOC_32;
4201 if (exp->X_op == O_absent || exp->X_op == O_big)
4203 /* Missing or bad expr becomes absolute 0. */
4204 as_bad (_("missing or invalid displacement expression `%s' taken as 0"),
4205 disp_start);
4206 exp->X_op = O_constant;
4207 exp->X_add_number = 0;
4208 exp->X_add_symbol = (symbolS *) 0;
4209 exp->X_op_symbol = (symbolS *) 0;
4212 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4213 if (exp->X_op != O_constant
4214 && OUTPUT_FLAVOR == bfd_target_aout_flavour
4215 && exp_seg != absolute_section
4216 && exp_seg != text_section
4217 && exp_seg != data_section
4218 && exp_seg != bss_section
4219 && exp_seg != undefined_section
4220 && !bfd_is_com_section (exp_seg))
4222 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4223 return 0;
4225 #endif
4227 if (!(i.types[this_operand] & ~Disp))
4228 i.types[this_operand] &= types;
4230 return 1;
4233 static int i386_index_check PARAMS ((const char *));
4235 /* Make sure the memory operand we've been dealt is valid.
4236 Return 1 on success, 0 on a failure. */
4238 static int
4239 i386_index_check (operand_string)
4240 const char *operand_string;
4242 int ok;
4243 #if INFER_ADDR_PREFIX
4244 int fudged = 0;
4246 tryprefix:
4247 #endif
4248 ok = 1;
4249 if ((current_templates->start->cpu_flags & CpuSVME)
4250 && current_templates->end[-1].operand_types[0] == AnyMem)
4252 /* Memory operands of SVME insns are special in that they only allow
4253 rAX as their memory address and ignore any segment override. */
4254 unsigned RegXX;
4256 /* SKINIT is even more restrictive: it always requires EAX. */
4257 if (strcmp (current_templates->start->name, "skinit") == 0)
4258 RegXX = Reg32;
4259 else if (flag_code == CODE_64BIT)
4260 RegXX = i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32;
4261 else
4262 RegXX = (flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0)
4263 ? Reg16
4264 : Reg32;
4265 if (!i.base_reg
4266 || !(i.base_reg->reg_type & Acc)
4267 || !(i.base_reg->reg_type & RegXX)
4268 || i.index_reg
4269 || (i.types[0] & Disp))
4270 ok = 0;
4272 else if (flag_code == CODE_64BIT)
4274 unsigned RegXX = (i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32);
4276 if ((i.base_reg
4277 && ((i.base_reg->reg_type & RegXX) == 0)
4278 && (i.base_reg->reg_type != BaseIndex
4279 || i.index_reg))
4280 || (i.index_reg
4281 && ((i.index_reg->reg_type & (RegXX | BaseIndex))
4282 != (RegXX | BaseIndex))))
4283 ok = 0;
4285 else
4287 if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
4289 /* 16bit checks. */
4290 if ((i.base_reg
4291 && ((i.base_reg->reg_type & (Reg16 | BaseIndex | RegRex))
4292 != (Reg16 | BaseIndex)))
4293 || (i.index_reg
4294 && (((i.index_reg->reg_type & (Reg16 | BaseIndex))
4295 != (Reg16 | BaseIndex))
4296 || !(i.base_reg
4297 && i.base_reg->reg_num < 6
4298 && i.index_reg->reg_num >= 6
4299 && i.log2_scale_factor == 0))))
4300 ok = 0;
4302 else
4304 /* 32bit checks. */
4305 if ((i.base_reg
4306 && (i.base_reg->reg_type & (Reg32 | RegRex)) != Reg32)
4307 || (i.index_reg
4308 && ((i.index_reg->reg_type & (Reg32 | BaseIndex | RegRex))
4309 != (Reg32 | BaseIndex))))
4310 ok = 0;
4313 if (!ok)
4315 #if INFER_ADDR_PREFIX
4316 if (i.prefix[ADDR_PREFIX] == 0)
4318 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
4319 i.prefixes += 1;
4320 /* Change the size of any displacement too. At most one of
4321 Disp16 or Disp32 is set.
4322 FIXME. There doesn't seem to be any real need for separate
4323 Disp16 and Disp32 flags. The same goes for Imm16 and Imm32.
4324 Removing them would probably clean up the code quite a lot. */
4325 if (flag_code != CODE_64BIT && (i.types[this_operand] & (Disp16 | Disp32)))
4326 i.types[this_operand] ^= (Disp16 | Disp32);
4327 fudged = 1;
4328 goto tryprefix;
4330 if (fudged)
4331 as_bad (_("`%s' is not a valid base/index expression"),
4332 operand_string);
4333 else
4334 #endif
4335 as_bad (_("`%s' is not a valid %s bit base/index expression"),
4336 operand_string,
4337 flag_code_names[flag_code]);
4339 return ok;
4342 /* Parse OPERAND_STRING into the i386_insn structure I. Returns non-zero
4343 on error. */
4345 static int
4346 i386_operand (operand_string)
4347 char *operand_string;
4349 const reg_entry *r;
4350 char *end_op;
4351 char *op_string = operand_string;
4353 if (is_space_char (*op_string))
4354 ++op_string;
4356 /* We check for an absolute prefix (differentiating,
4357 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
4358 if (*op_string == ABSOLUTE_PREFIX)
4360 ++op_string;
4361 if (is_space_char (*op_string))
4362 ++op_string;
4363 i.types[this_operand] |= JumpAbsolute;
4366 /* Check if operand is a register. */
4367 if ((*op_string == REGISTER_PREFIX || allow_naked_reg)
4368 && (r = parse_register (op_string, &end_op)) != NULL)
4370 /* Check for a segment override by searching for ':' after a
4371 segment register. */
4372 op_string = end_op;
4373 if (is_space_char (*op_string))
4374 ++op_string;
4375 if (*op_string == ':' && (r->reg_type & (SReg2 | SReg3)))
4377 switch (r->reg_num)
4379 case 0:
4380 i.seg[i.mem_operands] = &es;
4381 break;
4382 case 1:
4383 i.seg[i.mem_operands] = &cs;
4384 break;
4385 case 2:
4386 i.seg[i.mem_operands] = &ss;
4387 break;
4388 case 3:
4389 i.seg[i.mem_operands] = &ds;
4390 break;
4391 case 4:
4392 i.seg[i.mem_operands] = &fs;
4393 break;
4394 case 5:
4395 i.seg[i.mem_operands] = &gs;
4396 break;
4399 /* Skip the ':' and whitespace. */
4400 ++op_string;
4401 if (is_space_char (*op_string))
4402 ++op_string;
4404 if (!is_digit_char (*op_string)
4405 && !is_identifier_char (*op_string)
4406 && *op_string != '('
4407 && *op_string != ABSOLUTE_PREFIX)
4409 as_bad (_("bad memory operand `%s'"), op_string);
4410 return 0;
4412 /* Handle case of %es:*foo. */
4413 if (*op_string == ABSOLUTE_PREFIX)
4415 ++op_string;
4416 if (is_space_char (*op_string))
4417 ++op_string;
4418 i.types[this_operand] |= JumpAbsolute;
4420 goto do_memory_reference;
4422 if (*op_string)
4424 as_bad (_("junk `%s' after register"), op_string);
4425 return 0;
4427 i.types[this_operand] |= r->reg_type & ~BaseIndex;
4428 i.op[this_operand].regs = r;
4429 i.reg_operands++;
4431 else if (*op_string == REGISTER_PREFIX)
4433 as_bad (_("bad register name `%s'"), op_string);
4434 return 0;
4436 else if (*op_string == IMMEDIATE_PREFIX)
4438 ++op_string;
4439 if (i.types[this_operand] & JumpAbsolute)
4441 as_bad (_("immediate operand illegal with absolute jump"));
4442 return 0;
4444 if (!i386_immediate (op_string))
4445 return 0;
4447 else if (is_digit_char (*op_string)
4448 || is_identifier_char (*op_string)
4449 || *op_string == '(')
4451 /* This is a memory reference of some sort. */
4452 char *base_string;
4454 /* Start and end of displacement string expression (if found). */
4455 char *displacement_string_start;
4456 char *displacement_string_end;
4458 do_memory_reference:
4459 if ((i.mem_operands == 1
4460 && (current_templates->start->opcode_modifier & IsString) == 0)
4461 || i.mem_operands == 2)
4463 as_bad (_("too many memory references for `%s'"),
4464 current_templates->start->name);
4465 return 0;
4468 /* Check for base index form. We detect the base index form by
4469 looking for an ')' at the end of the operand, searching
4470 for the '(' matching it, and finding a REGISTER_PREFIX or ','
4471 after the '('. */
4472 base_string = op_string + strlen (op_string);
4474 --base_string;
4475 if (is_space_char (*base_string))
4476 --base_string;
4478 /* If we only have a displacement, set-up for it to be parsed later. */
4479 displacement_string_start = op_string;
4480 displacement_string_end = base_string + 1;
4482 if (*base_string == ')')
4484 char *temp_string;
4485 unsigned int parens_balanced = 1;
4486 /* We've already checked that the number of left & right ()'s are
4487 equal, so this loop will not be infinite. */
4490 base_string--;
4491 if (*base_string == ')')
4492 parens_balanced++;
4493 if (*base_string == '(')
4494 parens_balanced--;
4496 while (parens_balanced);
4498 temp_string = base_string;
4500 /* Skip past '(' and whitespace. */
4501 ++base_string;
4502 if (is_space_char (*base_string))
4503 ++base_string;
4505 if (*base_string == ','
4506 || ((*base_string == REGISTER_PREFIX || allow_naked_reg)
4507 && (i.base_reg = parse_register (base_string, &end_op)) != NULL))
4509 displacement_string_end = temp_string;
4511 i.types[this_operand] |= BaseIndex;
4513 if (i.base_reg)
4515 base_string = end_op;
4516 if (is_space_char (*base_string))
4517 ++base_string;
4520 /* There may be an index reg or scale factor here. */
4521 if (*base_string == ',')
4523 ++base_string;
4524 if (is_space_char (*base_string))
4525 ++base_string;
4527 if ((*base_string == REGISTER_PREFIX || allow_naked_reg)
4528 && (i.index_reg = parse_register (base_string, &end_op)) != NULL)
4530 base_string = end_op;
4531 if (is_space_char (*base_string))
4532 ++base_string;
4533 if (*base_string == ',')
4535 ++base_string;
4536 if (is_space_char (*base_string))
4537 ++base_string;
4539 else if (*base_string != ')')
4541 as_bad (_("expecting `,' or `)' after index register in `%s'"),
4542 operand_string);
4543 return 0;
4546 else if (*base_string == REGISTER_PREFIX)
4548 as_bad (_("bad register name `%s'"), base_string);
4549 return 0;
4552 /* Check for scale factor. */
4553 if (*base_string != ')')
4555 char *end_scale = i386_scale (base_string);
4557 if (!end_scale)
4558 return 0;
4560 base_string = end_scale;
4561 if (is_space_char (*base_string))
4562 ++base_string;
4563 if (*base_string != ')')
4565 as_bad (_("expecting `)' after scale factor in `%s'"),
4566 operand_string);
4567 return 0;
4570 else if (!i.index_reg)
4572 as_bad (_("expecting index register or scale factor after `,'; got '%c'"),
4573 *base_string);
4574 return 0;
4577 else if (*base_string != ')')
4579 as_bad (_("expecting `,' or `)' after base register in `%s'"),
4580 operand_string);
4581 return 0;
4584 else if (*base_string == REGISTER_PREFIX)
4586 as_bad (_("bad register name `%s'"), base_string);
4587 return 0;
4591 /* If there's an expression beginning the operand, parse it,
4592 assuming displacement_string_start and
4593 displacement_string_end are meaningful. */
4594 if (displacement_string_start != displacement_string_end)
4596 if (!i386_displacement (displacement_string_start,
4597 displacement_string_end))
4598 return 0;
4601 /* Special case for (%dx) while doing input/output op. */
4602 if (i.base_reg
4603 && i.base_reg->reg_type == (Reg16 | InOutPortReg)
4604 && i.index_reg == 0
4605 && i.log2_scale_factor == 0
4606 && i.seg[i.mem_operands] == 0
4607 && (i.types[this_operand] & Disp) == 0)
4609 i.types[this_operand] = InOutPortReg;
4610 return 1;
4613 if (i386_index_check (operand_string) == 0)
4614 return 0;
4615 i.mem_operands++;
4617 else
4619 /* It's not a memory operand; argh! */
4620 as_bad (_("invalid char %s beginning operand %d `%s'"),
4621 output_invalid (*op_string),
4622 this_operand + 1,
4623 op_string);
4624 return 0;
4626 return 1; /* Normal return. */
4629 /* md_estimate_size_before_relax()
4631 Called just before relax() for rs_machine_dependent frags. The x86
4632 assembler uses these frags to handle variable size jump
4633 instructions.
4635 Any symbol that is now undefined will not become defined.
4636 Return the correct fr_subtype in the frag.
4637 Return the initial "guess for variable size of frag" to caller.
4638 The guess is actually the growth beyond the fixed part. Whatever
4639 we do to grow the fixed or variable part contributes to our
4640 returned value. */
4643 md_estimate_size_before_relax (fragP, segment)
4644 fragS *fragP;
4645 segT segment;
4647 /* We've already got fragP->fr_subtype right; all we have to do is
4648 check for un-relaxable symbols. On an ELF system, we can't relax
4649 an externally visible symbol, because it may be overridden by a
4650 shared library. */
4651 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
4652 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4653 || (IS_ELF
4654 && (S_IS_EXTERNAL (fragP->fr_symbol)
4655 || S_IS_WEAK (fragP->fr_symbol)))
4656 #endif
4659 /* Symbol is undefined in this segment, or we need to keep a
4660 reloc so that weak symbols can be overridden. */
4661 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
4662 enum bfd_reloc_code_real reloc_type;
4663 unsigned char *opcode;
4664 int old_fr_fix;
4666 if (fragP->fr_var != NO_RELOC)
4667 reloc_type = fragP->fr_var;
4668 else if (size == 2)
4669 reloc_type = BFD_RELOC_16_PCREL;
4670 else
4671 reloc_type = BFD_RELOC_32_PCREL;
4673 old_fr_fix = fragP->fr_fix;
4674 opcode = (unsigned char *) fragP->fr_opcode;
4676 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
4678 case UNCOND_JUMP:
4679 /* Make jmp (0xeb) a (d)word displacement jump. */
4680 opcode[0] = 0xe9;
4681 fragP->fr_fix += size;
4682 fix_new (fragP, old_fr_fix, size,
4683 fragP->fr_symbol,
4684 fragP->fr_offset, 1,
4685 reloc_type);
4686 break;
4688 case COND_JUMP86:
4689 if (size == 2
4690 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
4692 /* Negate the condition, and branch past an
4693 unconditional jump. */
4694 opcode[0] ^= 1;
4695 opcode[1] = 3;
4696 /* Insert an unconditional jump. */
4697 opcode[2] = 0xe9;
4698 /* We added two extra opcode bytes, and have a two byte
4699 offset. */
4700 fragP->fr_fix += 2 + 2;
4701 fix_new (fragP, old_fr_fix + 2, 2,
4702 fragP->fr_symbol,
4703 fragP->fr_offset, 1,
4704 reloc_type);
4705 break;
4707 /* Fall through. */
4709 case COND_JUMP:
4710 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
4712 fixS *fixP;
4714 fragP->fr_fix += 1;
4715 fixP = fix_new (fragP, old_fr_fix, 1,
4716 fragP->fr_symbol,
4717 fragP->fr_offset, 1,
4718 BFD_RELOC_8_PCREL);
4719 fixP->fx_signed = 1;
4720 break;
4723 /* This changes the byte-displacement jump 0x7N
4724 to the (d)word-displacement jump 0x0f,0x8N. */
4725 opcode[1] = opcode[0] + 0x10;
4726 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4727 /* We've added an opcode byte. */
4728 fragP->fr_fix += 1 + size;
4729 fix_new (fragP, old_fr_fix + 1, size,
4730 fragP->fr_symbol,
4731 fragP->fr_offset, 1,
4732 reloc_type);
4733 break;
4735 default:
4736 BAD_CASE (fragP->fr_subtype);
4737 break;
4739 frag_wane (fragP);
4740 return fragP->fr_fix - old_fr_fix;
4743 /* Guess size depending on current relax state. Initially the relax
4744 state will correspond to a short jump and we return 1, because
4745 the variable part of the frag (the branch offset) is one byte
4746 long. However, we can relax a section more than once and in that
4747 case we must either set fr_subtype back to the unrelaxed state,
4748 or return the value for the appropriate branch. */
4749 return md_relax_table[fragP->fr_subtype].rlx_length;
4752 /* Called after relax() is finished.
4754 In: Address of frag.
4755 fr_type == rs_machine_dependent.
4756 fr_subtype is what the address relaxed to.
4758 Out: Any fixSs and constants are set up.
4759 Caller will turn frag into a ".space 0". */
4761 void
4762 md_convert_frag (abfd, sec, fragP)
4763 bfd *abfd ATTRIBUTE_UNUSED;
4764 segT sec ATTRIBUTE_UNUSED;
4765 fragS *fragP;
4767 unsigned char *opcode;
4768 unsigned char *where_to_put_displacement = NULL;
4769 offsetT target_address;
4770 offsetT opcode_address;
4771 unsigned int extension = 0;
4772 offsetT displacement_from_opcode_start;
4774 opcode = (unsigned char *) fragP->fr_opcode;
4776 /* Address we want to reach in file space. */
4777 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
4779 /* Address opcode resides at in file space. */
4780 opcode_address = fragP->fr_address + fragP->fr_fix;
4782 /* Displacement from opcode start to fill into instruction. */
4783 displacement_from_opcode_start = target_address - opcode_address;
4785 if ((fragP->fr_subtype & BIG) == 0)
4787 /* Don't have to change opcode. */
4788 extension = 1; /* 1 opcode + 1 displacement */
4789 where_to_put_displacement = &opcode[1];
4791 else
4793 if (no_cond_jump_promotion
4794 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4795 as_warn_where (fragP->fr_file, fragP->fr_line, _("long jump required"));
4797 switch (fragP->fr_subtype)
4799 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
4800 extension = 4; /* 1 opcode + 4 displacement */
4801 opcode[0] = 0xe9;
4802 where_to_put_displacement = &opcode[1];
4803 break;
4805 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
4806 extension = 2; /* 1 opcode + 2 displacement */
4807 opcode[0] = 0xe9;
4808 where_to_put_displacement = &opcode[1];
4809 break;
4811 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
4812 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
4813 extension = 5; /* 2 opcode + 4 displacement */
4814 opcode[1] = opcode[0] + 0x10;
4815 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4816 where_to_put_displacement = &opcode[2];
4817 break;
4819 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
4820 extension = 3; /* 2 opcode + 2 displacement */
4821 opcode[1] = opcode[0] + 0x10;
4822 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4823 where_to_put_displacement = &opcode[2];
4824 break;
4826 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
4827 extension = 4;
4828 opcode[0] ^= 1;
4829 opcode[1] = 3;
4830 opcode[2] = 0xe9;
4831 where_to_put_displacement = &opcode[3];
4832 break;
4834 default:
4835 BAD_CASE (fragP->fr_subtype);
4836 break;
4840 /* Now put displacement after opcode. */
4841 md_number_to_chars ((char *) where_to_put_displacement,
4842 (valueT) (displacement_from_opcode_start - extension),
4843 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
4844 fragP->fr_fix += extension;
4847 /* Size of byte displacement jmp. */
4848 int md_short_jump_size = 2;
4850 /* Size of dword displacement jmp. */
4851 int md_long_jump_size = 5;
4853 /* Size of relocation record. */
4854 const int md_reloc_size = 8;
4856 void
4857 md_create_short_jump (ptr, from_addr, to_addr, frag, to_symbol)
4858 char *ptr;
4859 addressT from_addr, to_addr;
4860 fragS *frag ATTRIBUTE_UNUSED;
4861 symbolS *to_symbol ATTRIBUTE_UNUSED;
4863 offsetT offset;
4865 offset = to_addr - (from_addr + 2);
4866 /* Opcode for byte-disp jump. */
4867 md_number_to_chars (ptr, (valueT) 0xeb, 1);
4868 md_number_to_chars (ptr + 1, (valueT) offset, 1);
4871 void
4872 md_create_long_jump (ptr, from_addr, to_addr, frag, to_symbol)
4873 char *ptr;
4874 addressT from_addr, to_addr;
4875 fragS *frag ATTRIBUTE_UNUSED;
4876 symbolS *to_symbol ATTRIBUTE_UNUSED;
4878 offsetT offset;
4880 offset = to_addr - (from_addr + 5);
4881 md_number_to_chars (ptr, (valueT) 0xe9, 1);
4882 md_number_to_chars (ptr + 1, (valueT) offset, 4);
4885 /* Apply a fixup (fixS) to segment data, once it has been determined
4886 by our caller that we have all the info we need to fix it up.
4888 On the 386, immediates, displacements, and data pointers are all in
4889 the same (little-endian) format, so we don't need to care about which
4890 we are handling. */
4892 void
4893 md_apply_fix (fixP, valP, seg)
4894 /* The fix we're to put in. */
4895 fixS *fixP;
4896 /* Pointer to the value of the bits. */
4897 valueT *valP;
4898 /* Segment fix is from. */
4899 segT seg ATTRIBUTE_UNUSED;
4901 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
4902 valueT value = *valP;
4904 #if !defined (TE_Mach)
4905 if (fixP->fx_pcrel)
4907 switch (fixP->fx_r_type)
4909 default:
4910 break;
4912 case BFD_RELOC_64:
4913 fixP->fx_r_type = BFD_RELOC_64_PCREL;
4914 break;
4915 case BFD_RELOC_32:
4916 case BFD_RELOC_X86_64_32S:
4917 fixP->fx_r_type = BFD_RELOC_32_PCREL;
4918 break;
4919 case BFD_RELOC_16:
4920 fixP->fx_r_type = BFD_RELOC_16_PCREL;
4921 break;
4922 case BFD_RELOC_8:
4923 fixP->fx_r_type = BFD_RELOC_8_PCREL;
4924 break;
4928 if (fixP->fx_addsy != NULL
4929 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
4930 || fixP->fx_r_type == BFD_RELOC_64_PCREL
4931 || fixP->fx_r_type == BFD_RELOC_16_PCREL
4932 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
4933 && !use_rela_relocations)
4935 /* This is a hack. There should be a better way to handle this.
4936 This covers for the fact that bfd_install_relocation will
4937 subtract the current location (for partial_inplace, PC relative
4938 relocations); see more below. */
4939 #ifndef OBJ_AOUT
4940 if (IS_ELF
4941 #ifdef TE_PE
4942 || OUTPUT_FLAVOR == bfd_target_coff_flavour
4943 #endif
4945 value += fixP->fx_where + fixP->fx_frag->fr_address;
4946 #endif
4947 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4948 if (IS_ELF)
4950 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
4952 if ((sym_seg == seg
4953 || (symbol_section_p (fixP->fx_addsy)
4954 && sym_seg != absolute_section))
4955 && !generic_force_reloc (fixP))
4957 /* Yes, we add the values in twice. This is because
4958 bfd_install_relocation subtracts them out again. I think
4959 bfd_install_relocation is broken, but I don't dare change
4960 it. FIXME. */
4961 value += fixP->fx_where + fixP->fx_frag->fr_address;
4964 #endif
4965 #if defined (OBJ_COFF) && defined (TE_PE)
4966 /* For some reason, the PE format does not store a
4967 section address offset for a PC relative symbol. */
4968 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
4969 #if defined(BFD_ASSEMBLER) || defined(S_IS_WEAK)
4970 || S_IS_WEAK (fixP->fx_addsy)
4971 #endif
4973 value += md_pcrel_from (fixP);
4974 #endif
4977 /* Fix a few things - the dynamic linker expects certain values here,
4978 and we must not disappoint it. */
4979 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4980 if (IS_ELF && fixP->fx_addsy)
4981 switch (fixP->fx_r_type)
4983 case BFD_RELOC_386_PLT32:
4984 case BFD_RELOC_X86_64_PLT32:
4985 /* Make the jump instruction point to the address of the operand. At
4986 runtime we merely add the offset to the actual PLT entry. */
4987 value = -4;
4988 break;
4990 case BFD_RELOC_386_TLS_GD:
4991 case BFD_RELOC_386_TLS_LDM:
4992 case BFD_RELOC_386_TLS_IE_32:
4993 case BFD_RELOC_386_TLS_IE:
4994 case BFD_RELOC_386_TLS_GOTIE:
4995 case BFD_RELOC_X86_64_TLSGD:
4996 case BFD_RELOC_X86_64_TLSLD:
4997 case BFD_RELOC_X86_64_GOTTPOFF:
4998 value = 0; /* Fully resolved at runtime. No addend. */
4999 /* Fallthrough */
5000 case BFD_RELOC_386_TLS_LE:
5001 case BFD_RELOC_386_TLS_LDO_32:
5002 case BFD_RELOC_386_TLS_LE_32:
5003 case BFD_RELOC_X86_64_DTPOFF32:
5004 case BFD_RELOC_X86_64_DTPOFF64:
5005 case BFD_RELOC_X86_64_TPOFF32:
5006 case BFD_RELOC_X86_64_TPOFF64:
5007 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5008 break;
5010 case BFD_RELOC_386_GOT32:
5011 case BFD_RELOC_X86_64_GOT32:
5012 value = 0; /* Fully resolved at runtime. No addend. */
5013 break;
5015 case BFD_RELOC_VTABLE_INHERIT:
5016 case BFD_RELOC_VTABLE_ENTRY:
5017 fixP->fx_done = 0;
5018 return;
5020 default:
5021 break;
5023 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
5024 *valP = value;
5025 #endif /* !defined (TE_Mach) */
5027 /* Are we finished with this relocation now? */
5028 if (fixP->fx_addsy == NULL)
5029 fixP->fx_done = 1;
5030 else if (use_rela_relocations)
5032 fixP->fx_no_overflow = 1;
5033 /* Remember value for tc_gen_reloc. */
5034 fixP->fx_addnumber = value;
5035 value = 0;
5038 md_number_to_chars (p, value, fixP->fx_size);
5041 #define MAX_LITTLENUMS 6
5043 /* Turn the string pointed to by litP into a floating point constant
5044 of type TYPE, and emit the appropriate bytes. The number of
5045 LITTLENUMS emitted is stored in *SIZEP. An error message is
5046 returned, or NULL on OK. */
5048 char *
5049 md_atof (type, litP, sizeP)
5050 int type;
5051 char *litP;
5052 int *sizeP;
5054 int prec;
5055 LITTLENUM_TYPE words[MAX_LITTLENUMS];
5056 LITTLENUM_TYPE *wordP;
5057 char *t;
5059 switch (type)
5061 case 'f':
5062 case 'F':
5063 prec = 2;
5064 break;
5066 case 'd':
5067 case 'D':
5068 prec = 4;
5069 break;
5071 case 'x':
5072 case 'X':
5073 prec = 5;
5074 break;
5076 default:
5077 *sizeP = 0;
5078 return _("Bad call to md_atof ()");
5080 t = atof_ieee (input_line_pointer, type, words);
5081 if (t)
5082 input_line_pointer = t;
5084 *sizeP = prec * sizeof (LITTLENUM_TYPE);
5085 /* This loops outputs the LITTLENUMs in REVERSE order; in accord with
5086 the bigendian 386. */
5087 for (wordP = words + prec - 1; prec--;)
5089 md_number_to_chars (litP, (valueT) (*wordP--), sizeof (LITTLENUM_TYPE));
5090 litP += sizeof (LITTLENUM_TYPE);
5092 return 0;
5095 static char output_invalid_buf[8];
5097 static char *
5098 output_invalid (c)
5099 int c;
5101 if (ISPRINT (c))
5102 sprintf (output_invalid_buf, "'%c'", c);
5103 else
5104 sprintf (output_invalid_buf, "(0x%x)", (unsigned) c);
5105 return output_invalid_buf;
5108 /* REG_STRING starts *before* REGISTER_PREFIX. */
5110 static const reg_entry *
5111 parse_register (reg_string, end_op)
5112 char *reg_string;
5113 char **end_op;
5115 char *s = reg_string;
5116 char *p;
5117 char reg_name_given[MAX_REG_NAME_SIZE + 1];
5118 const reg_entry *r;
5120 /* Skip possible REGISTER_PREFIX and possible whitespace. */
5121 if (*s == REGISTER_PREFIX)
5122 ++s;
5124 if (is_space_char (*s))
5125 ++s;
5127 p = reg_name_given;
5128 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
5130 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
5131 return (const reg_entry *) NULL;
5132 s++;
5135 /* For naked regs, make sure that we are not dealing with an identifier.
5136 This prevents confusing an identifier like `eax_var' with register
5137 `eax'. */
5138 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
5139 return (const reg_entry *) NULL;
5141 *end_op = s;
5143 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
5145 /* Handle floating point regs, allowing spaces in the (i) part. */
5146 if (r == i386_regtab /* %st is first entry of table */)
5148 if (is_space_char (*s))
5149 ++s;
5150 if (*s == '(')
5152 ++s;
5153 if (is_space_char (*s))
5154 ++s;
5155 if (*s >= '0' && *s <= '7')
5157 r = &i386_float_regtab[*s - '0'];
5158 ++s;
5159 if (is_space_char (*s))
5160 ++s;
5161 if (*s == ')')
5163 *end_op = s + 1;
5164 return r;
5167 /* We have "%st(" then garbage. */
5168 return (const reg_entry *) NULL;
5172 if (r != NULL
5173 && ((r->reg_flags & (RegRex64 | RegRex)) | (r->reg_type & Reg64)) != 0
5174 && (r->reg_type != Control || !(cpu_arch_flags & CpuSledgehammer))
5175 && flag_code != CODE_64BIT)
5176 return (const reg_entry *) NULL;
5178 return r;
5181 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5182 const char *md_shortopts = "kVQ:sqn";
5183 #else
5184 const char *md_shortopts = "qn";
5185 #endif
5187 struct option md_longopts[] = {
5188 #define OPTION_32 (OPTION_MD_BASE + 0)
5189 {"32", no_argument, NULL, OPTION_32},
5190 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5191 #define OPTION_64 (OPTION_MD_BASE + 1)
5192 {"64", no_argument, NULL, OPTION_64},
5193 #endif
5194 {NULL, no_argument, NULL, 0}
5196 size_t md_longopts_size = sizeof (md_longopts);
5199 md_parse_option (c, arg)
5200 int c;
5201 char *arg ATTRIBUTE_UNUSED;
5203 switch (c)
5205 case 'n':
5206 optimize_align_code = 0;
5207 break;
5209 case 'q':
5210 quiet_warnings = 1;
5211 break;
5213 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5214 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
5215 should be emitted or not. FIXME: Not implemented. */
5216 case 'Q':
5217 break;
5219 /* -V: SVR4 argument to print version ID. */
5220 case 'V':
5221 print_version_id ();
5222 break;
5224 /* -k: Ignore for FreeBSD compatibility. */
5225 case 'k':
5226 break;
5228 case 's':
5229 /* -s: On i386 Solaris, this tells the native assembler to use
5230 .stab instead of .stab.excl. We always use .stab anyhow. */
5231 break;
5233 case OPTION_64:
5235 const char **list, **l;
5237 list = bfd_target_list ();
5238 for (l = list; *l != NULL; l++)
5239 if (strcmp (*l, "elf64-x86-64") == 0)
5241 default_arch = "x86_64";
5242 break;
5244 if (*l == NULL)
5245 as_fatal (_("No compiled in support for x86_64"));
5246 free (list);
5248 break;
5249 #endif
5251 case OPTION_32:
5252 default_arch = "i386";
5253 break;
5255 default:
5256 return 0;
5258 return 1;
5261 void
5262 md_show_usage (stream)
5263 FILE *stream;
5265 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5266 fprintf (stream, _("\
5267 -Q ignored\n\
5268 -V print assembler version number\n\
5269 -k ignored\n\
5270 -n Do not optimize code alignment\n\
5271 -q quieten some warnings\n\
5272 -s ignored\n"));
5273 #else
5274 fprintf (stream, _("\
5275 -n Do not optimize code alignment\n\
5276 -q quieten some warnings\n"));
5277 #endif
5280 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
5281 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5283 /* Pick the target format to use. */
5285 const char *
5286 i386_target_format ()
5288 if (!strcmp (default_arch, "x86_64"))
5289 set_code_flag (CODE_64BIT);
5290 else if (!strcmp (default_arch, "i386"))
5291 set_code_flag (CODE_32BIT);
5292 else
5293 as_fatal (_("Unknown architecture"));
5294 switch (OUTPUT_FLAVOR)
5296 #ifdef OBJ_MAYBE_AOUT
5297 case bfd_target_aout_flavour:
5298 return AOUT_TARGET_FORMAT;
5299 #endif
5300 #ifdef OBJ_MAYBE_COFF
5301 case bfd_target_coff_flavour:
5302 return "coff-i386";
5303 #endif
5304 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
5305 case bfd_target_elf_flavour:
5307 if (flag_code == CODE_64BIT)
5308 use_rela_relocations = 1;
5309 return flag_code == CODE_64BIT ? "elf64-x86-64" : ELF_TARGET_FORMAT;
5311 #endif
5312 default:
5313 abort ();
5314 return NULL;
5318 #endif /* OBJ_MAYBE_ more than one */
5320 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5321 void i386_elf_emit_arch_note ()
5323 if (IS_ELF && cpu_arch_name != NULL)
5325 char *p;
5326 asection *seg = now_seg;
5327 subsegT subseg = now_subseg;
5328 Elf_Internal_Note i_note;
5329 Elf_External_Note e_note;
5330 asection *note_secp;
5331 int len;
5333 /* Create the .note section. */
5334 note_secp = subseg_new (".note", 0);
5335 bfd_set_section_flags (stdoutput,
5336 note_secp,
5337 SEC_HAS_CONTENTS | SEC_READONLY);
5339 /* Process the arch string. */
5340 len = strlen (cpu_arch_name);
5342 i_note.namesz = len + 1;
5343 i_note.descsz = 0;
5344 i_note.type = NT_ARCH;
5345 p = frag_more (sizeof (e_note.namesz));
5346 md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
5347 p = frag_more (sizeof (e_note.descsz));
5348 md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
5349 p = frag_more (sizeof (e_note.type));
5350 md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
5351 p = frag_more (len + 1);
5352 strcpy (p, cpu_arch_name);
5354 frag_align (2, 0, 0);
5356 subseg_set (seg, subseg);
5359 #endif
5361 symbolS *
5362 md_undefined_symbol (name)
5363 char *name;
5365 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
5366 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
5367 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
5368 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
5370 if (!GOT_symbol)
5372 if (symbol_find (name))
5373 as_bad (_("GOT already in symbol table"));
5374 GOT_symbol = symbol_new (name, undefined_section,
5375 (valueT) 0, &zero_address_frag);
5377 return GOT_symbol;
5379 return 0;
5382 /* Round up a section size to the appropriate boundary. */
5384 valueT
5385 md_section_align (segment, size)
5386 segT segment ATTRIBUTE_UNUSED;
5387 valueT size;
5389 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
5390 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
5392 /* For a.out, force the section size to be aligned. If we don't do
5393 this, BFD will align it for us, but it will not write out the
5394 final bytes of the section. This may be a bug in BFD, but it is
5395 easier to fix it here since that is how the other a.out targets
5396 work. */
5397 int align;
5399 align = bfd_get_section_alignment (stdoutput, segment);
5400 size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
5402 #endif
5404 return size;
5407 /* On the i386, PC-relative offsets are relative to the start of the
5408 next instruction. That is, the address of the offset, plus its
5409 size, since the offset is always the last part of the insn. */
5411 long
5412 md_pcrel_from (fixP)
5413 fixS *fixP;
5415 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
5418 #ifndef I386COFF
5420 static void
5421 s_bss (ignore)
5422 int ignore ATTRIBUTE_UNUSED;
5424 int temp;
5426 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5427 if (IS_ELF)
5428 obj_elf_section_change_hook ();
5429 #endif
5430 temp = get_absolute_expression ();
5431 subseg_set (bss_section, (subsegT) temp);
5432 demand_empty_rest_of_line ();
5435 #endif
5437 void
5438 i386_validate_fix (fixp)
5439 fixS *fixp;
5441 if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
5443 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
5445 if (flag_code != CODE_64BIT)
5446 abort ();
5447 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
5449 else
5451 if (flag_code != CODE_64BIT)
5452 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
5453 else
5454 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
5456 fixp->fx_subsy = 0;
5460 arelent *
5461 tc_gen_reloc (section, fixp)
5462 asection *section ATTRIBUTE_UNUSED;
5463 fixS *fixp;
5465 arelent *rel;
5466 bfd_reloc_code_real_type code;
5468 switch (fixp->fx_r_type)
5470 case BFD_RELOC_X86_64_PLT32:
5471 case BFD_RELOC_X86_64_GOT32:
5472 case BFD_RELOC_X86_64_GOTPCREL:
5473 case BFD_RELOC_386_PLT32:
5474 case BFD_RELOC_386_GOT32:
5475 case BFD_RELOC_386_GOTOFF:
5476 case BFD_RELOC_386_GOTPC:
5477 case BFD_RELOC_386_TLS_GD:
5478 case BFD_RELOC_386_TLS_LDM:
5479 case BFD_RELOC_386_TLS_LDO_32:
5480 case BFD_RELOC_386_TLS_IE_32:
5481 case BFD_RELOC_386_TLS_IE:
5482 case BFD_RELOC_386_TLS_GOTIE:
5483 case BFD_RELOC_386_TLS_LE_32:
5484 case BFD_RELOC_386_TLS_LE:
5485 case BFD_RELOC_X86_64_TLSGD:
5486 case BFD_RELOC_X86_64_TLSLD:
5487 case BFD_RELOC_X86_64_DTPOFF32:
5488 case BFD_RELOC_X86_64_DTPOFF64:
5489 case BFD_RELOC_X86_64_GOTTPOFF:
5490 case BFD_RELOC_X86_64_TPOFF32:
5491 case BFD_RELOC_X86_64_TPOFF64:
5492 case BFD_RELOC_X86_64_GOTOFF64:
5493 case BFD_RELOC_X86_64_GOTPC32:
5494 case BFD_RELOC_RVA:
5495 case BFD_RELOC_VTABLE_ENTRY:
5496 case BFD_RELOC_VTABLE_INHERIT:
5497 #ifdef TE_PE
5498 case BFD_RELOC_32_SECREL:
5499 #endif
5500 code = fixp->fx_r_type;
5501 break;
5502 case BFD_RELOC_X86_64_32S:
5503 if (!fixp->fx_pcrel)
5505 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
5506 code = fixp->fx_r_type;
5507 break;
5509 default:
5510 if (fixp->fx_pcrel)
5512 switch (fixp->fx_size)
5514 default:
5515 as_bad_where (fixp->fx_file, fixp->fx_line,
5516 _("can not do %d byte pc-relative relocation"),
5517 fixp->fx_size);
5518 code = BFD_RELOC_32_PCREL;
5519 break;
5520 case 1: code = BFD_RELOC_8_PCREL; break;
5521 case 2: code = BFD_RELOC_16_PCREL; break;
5522 case 4: code = BFD_RELOC_32_PCREL; break;
5523 #ifdef BFD64
5524 case 8: code = BFD_RELOC_64_PCREL; break;
5525 #endif
5528 else
5530 switch (fixp->fx_size)
5532 default:
5533 as_bad_where (fixp->fx_file, fixp->fx_line,
5534 _("can not do %d byte relocation"),
5535 fixp->fx_size);
5536 code = BFD_RELOC_32;
5537 break;
5538 case 1: code = BFD_RELOC_8; break;
5539 case 2: code = BFD_RELOC_16; break;
5540 case 4: code = BFD_RELOC_32; break;
5541 #ifdef BFD64
5542 case 8: code = BFD_RELOC_64; break;
5543 #endif
5546 break;
5549 if ((code == BFD_RELOC_32 || code == BFD_RELOC_32_PCREL)
5550 && GOT_symbol
5551 && fixp->fx_addsy == GOT_symbol)
5553 if (flag_code != CODE_64BIT)
5554 code = BFD_RELOC_386_GOTPC;
5555 else
5556 code = BFD_RELOC_X86_64_GOTPC32;
5559 rel = (arelent *) xmalloc (sizeof (arelent));
5560 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
5561 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
5563 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
5565 if (!use_rela_relocations)
5567 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
5568 vtable entry to be used in the relocation's section offset. */
5569 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
5570 rel->address = fixp->fx_offset;
5572 rel->addend = 0;
5574 /* Use the rela in 64bit mode. */
5575 else
5577 if (!fixp->fx_pcrel)
5578 rel->addend = fixp->fx_offset;
5579 else
5580 switch (code)
5582 case BFD_RELOC_X86_64_PLT32:
5583 case BFD_RELOC_X86_64_GOT32:
5584 case BFD_RELOC_X86_64_GOTPCREL:
5585 case BFD_RELOC_X86_64_TLSGD:
5586 case BFD_RELOC_X86_64_TLSLD:
5587 case BFD_RELOC_X86_64_GOTTPOFF:
5588 rel->addend = fixp->fx_offset - fixp->fx_size;
5589 break;
5590 default:
5591 rel->addend = (section->vma
5592 - fixp->fx_size
5593 + fixp->fx_addnumber
5594 + md_pcrel_from (fixp));
5595 break;
5599 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
5600 if (rel->howto == NULL)
5602 as_bad_where (fixp->fx_file, fixp->fx_line,
5603 _("cannot represent relocation type %s"),
5604 bfd_get_reloc_code_name (code));
5605 /* Set howto to a garbage value so that we can keep going. */
5606 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
5607 assert (rel->howto != NULL);
5610 return rel;
5614 /* Parse operands using Intel syntax. This implements a recursive descent
5615 parser based on the BNF grammar published in Appendix B of the MASM 6.1
5616 Programmer's Guide.
5618 FIXME: We do not recognize the full operand grammar defined in the MASM
5619 documentation. In particular, all the structure/union and
5620 high-level macro operands are missing.
5622 Uppercase words are terminals, lower case words are non-terminals.
5623 Objects surrounded by double brackets '[[' ']]' are optional. Vertical
5624 bars '|' denote choices. Most grammar productions are implemented in
5625 functions called 'intel_<production>'.
5627 Initial production is 'expr'.
5629 addOp + | -
5631 alpha [a-zA-Z]
5633 binOp & | AND | \| | OR | ^ | XOR
5635 byteRegister AL | AH | BL | BH | CL | CH | DL | DH
5637 constant digits [[ radixOverride ]]
5639 dataType BYTE | WORD | DWORD | FWORD | QWORD | TBYTE | OWORD | XMMWORD
5641 digits decdigit
5642 | digits decdigit
5643 | digits hexdigit
5645 decdigit [0-9]
5647 e04 e04 addOp e05
5648 | e05
5650 e05 e05 binOp e06
5651 | e06
5653 e06 e06 mulOp e09
5654 | e09
5656 e09 OFFSET e10
5657 | SHORT e10
5658 | + e10
5659 | - e10
5660 | ~ e10
5661 | NOT e10
5662 | e09 PTR e10
5663 | e09 : e10
5664 | e10
5666 e10 e10 [ expr ]
5667 | e11
5669 e11 ( expr )
5670 | [ expr ]
5671 | constant
5672 | dataType
5673 | id
5675 | register
5677 => expr expr cmpOp e04
5678 | e04
5680 gpRegister AX | EAX | BX | EBX | CX | ECX | DX | EDX
5681 | BP | EBP | SP | ESP | DI | EDI | SI | ESI
5683 hexdigit a | b | c | d | e | f
5684 | A | B | C | D | E | F
5686 id alpha
5687 | id alpha
5688 | id decdigit
5690 mulOp * | / | % | MOD | << | SHL | >> | SHR
5692 quote " | '
5694 register specialRegister
5695 | gpRegister
5696 | byteRegister
5698 segmentRegister CS | DS | ES | FS | GS | SS
5700 specialRegister CR0 | CR2 | CR3 | CR4
5701 | DR0 | DR1 | DR2 | DR3 | DR6 | DR7
5702 | TR3 | TR4 | TR5 | TR6 | TR7
5704 We simplify the grammar in obvious places (e.g., register parsing is
5705 done by calling parse_register) and eliminate immediate left recursion
5706 to implement a recursive-descent parser.
5708 expr e04 expr'
5710 expr' cmpOp e04 expr'
5711 | Empty
5713 e04 e05 e04'
5715 e04' addOp e05 e04'
5716 | Empty
5718 e05 e06 e05'
5720 e05' binOp e06 e05'
5721 | Empty
5723 e06 e09 e06'
5725 e06' mulOp e09 e06'
5726 | Empty
5728 e09 OFFSET e10 e09'
5729 | SHORT e10'
5730 | + e10'
5731 | - e10'
5732 | ~ e10'
5733 | NOT e10'
5734 | e10 e09'
5736 e09' PTR e10 e09'
5737 | : e10 e09'
5738 | Empty
5740 e10 e11 e10'
5742 e10' [ expr ] e10'
5743 | Empty
5745 e11 ( expr )
5746 | [ expr ]
5747 | BYTE
5748 | WORD
5749 | DWORD
5750 | FWORD
5751 | QWORD
5752 | TBYTE
5753 | OWORD
5754 | XMMWORD
5757 | register
5758 | id
5759 | constant */
5761 /* Parsing structure for the intel syntax parser. Used to implement the
5762 semantic actions for the operand grammar. */
5763 struct intel_parser_s
5765 char *op_string; /* The string being parsed. */
5766 int got_a_float; /* Whether the operand is a float. */
5767 int op_modifier; /* Operand modifier. */
5768 int is_mem; /* 1 if operand is memory reference. */
5769 int in_offset; /* >=1 if parsing operand of offset. */
5770 int in_bracket; /* >=1 if parsing operand in brackets. */
5771 const reg_entry *reg; /* Last register reference found. */
5772 char *disp; /* Displacement string being built. */
5773 char *next_operand; /* Resume point when splitting operands. */
5776 static struct intel_parser_s intel_parser;
5778 /* Token structure for parsing intel syntax. */
5779 struct intel_token
5781 int code; /* Token code. */
5782 const reg_entry *reg; /* Register entry for register tokens. */
5783 char *str; /* String representation. */
5786 static struct intel_token cur_token, prev_token;
5788 /* Token codes for the intel parser. Since T_SHORT is already used
5789 by COFF, undefine it first to prevent a warning. */
5790 #define T_NIL -1
5791 #define T_CONST 1
5792 #define T_REG 2
5793 #define T_BYTE 3
5794 #define T_WORD 4
5795 #define T_DWORD 5
5796 #define T_FWORD 6
5797 #define T_QWORD 7
5798 #define T_TBYTE 8
5799 #define T_XMMWORD 9
5800 #undef T_SHORT
5801 #define T_SHORT 10
5802 #define T_OFFSET 11
5803 #define T_PTR 12
5804 #define T_ID 13
5805 #define T_SHL 14
5806 #define T_SHR 15
5808 /* Prototypes for intel parser functions. */
5809 static int intel_match_token PARAMS ((int code));
5810 static void intel_get_token PARAMS ((void));
5811 static void intel_putback_token PARAMS ((void));
5812 static int intel_expr PARAMS ((void));
5813 static int intel_e04 PARAMS ((void));
5814 static int intel_e05 PARAMS ((void));
5815 static int intel_e06 PARAMS ((void));
5816 static int intel_e09 PARAMS ((void));
5817 static int intel_bracket_expr PARAMS ((void));
5818 static int intel_e10 PARAMS ((void));
5819 static int intel_e11 PARAMS ((void));
5821 static int
5822 i386_intel_operand (operand_string, got_a_float)
5823 char *operand_string;
5824 int got_a_float;
5826 int ret;
5827 char *p;
5829 p = intel_parser.op_string = xstrdup (operand_string);
5830 intel_parser.disp = (char *) xmalloc (strlen (operand_string) + 1);
5832 for (;;)
5834 /* Initialize token holders. */
5835 cur_token.code = prev_token.code = T_NIL;
5836 cur_token.reg = prev_token.reg = NULL;
5837 cur_token.str = prev_token.str = NULL;
5839 /* Initialize parser structure. */
5840 intel_parser.got_a_float = got_a_float;
5841 intel_parser.op_modifier = 0;
5842 intel_parser.is_mem = 0;
5843 intel_parser.in_offset = 0;
5844 intel_parser.in_bracket = 0;
5845 intel_parser.reg = NULL;
5846 intel_parser.disp[0] = '\0';
5847 intel_parser.next_operand = NULL;
5849 /* Read the first token and start the parser. */
5850 intel_get_token ();
5851 ret = intel_expr ();
5853 if (!ret)
5854 break;
5856 if (cur_token.code != T_NIL)
5858 as_bad (_("invalid operand for '%s' ('%s' unexpected)"),
5859 current_templates->start->name, cur_token.str);
5860 ret = 0;
5862 /* If we found a memory reference, hand it over to i386_displacement
5863 to fill in the rest of the operand fields. */
5864 else if (intel_parser.is_mem)
5866 if ((i.mem_operands == 1
5867 && (current_templates->start->opcode_modifier & IsString) == 0)
5868 || i.mem_operands == 2)
5870 as_bad (_("too many memory references for '%s'"),
5871 current_templates->start->name);
5872 ret = 0;
5874 else
5876 char *s = intel_parser.disp;
5877 i.mem_operands++;
5879 if (!quiet_warnings && intel_parser.is_mem < 0)
5880 /* See the comments in intel_bracket_expr. */
5881 as_warn (_("Treating `%s' as memory reference"), operand_string);
5883 /* Add the displacement expression. */
5884 if (*s != '\0')
5885 ret = i386_displacement (s, s + strlen (s));
5886 if (ret)
5888 /* Swap base and index in 16-bit memory operands like
5889 [si+bx]. Since i386_index_check is also used in AT&T
5890 mode we have to do that here. */
5891 if (i.base_reg
5892 && i.index_reg
5893 && (i.base_reg->reg_type & Reg16)
5894 && (i.index_reg->reg_type & Reg16)
5895 && i.base_reg->reg_num >= 6
5896 && i.index_reg->reg_num < 6)
5898 const reg_entry *base = i.index_reg;
5900 i.index_reg = i.base_reg;
5901 i.base_reg = base;
5903 ret = i386_index_check (operand_string);
5908 /* Constant and OFFSET expressions are handled by i386_immediate. */
5909 else if ((intel_parser.op_modifier & (1 << T_OFFSET))
5910 || intel_parser.reg == NULL)
5911 ret = i386_immediate (intel_parser.disp);
5913 if (intel_parser.next_operand && this_operand >= MAX_OPERANDS - 1)
5914 ret = 0;
5915 if (!ret || !intel_parser.next_operand)
5916 break;
5917 intel_parser.op_string = intel_parser.next_operand;
5918 this_operand = i.operands++;
5921 free (p);
5922 free (intel_parser.disp);
5924 return ret;
5927 #define NUM_ADDRESS_REGS (!!i.base_reg + !!i.index_reg)
5929 /* expr e04 expr'
5931 expr' cmpOp e04 expr'
5932 | Empty */
5933 static int
5934 intel_expr ()
5936 /* XXX Implement the comparison operators. */
5937 return intel_e04 ();
5940 /* e04 e05 e04'
5942 e04' addOp e05 e04'
5943 | Empty */
5944 static int
5945 intel_e04 ()
5947 int nregs = -1;
5949 for (;;)
5951 if (!intel_e05())
5952 return 0;
5954 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
5955 i.base_reg = i386_regtab + REGNAM_AL; /* al is invalid as base */
5957 if (cur_token.code == '+')
5958 nregs = -1;
5959 else if (cur_token.code == '-')
5960 nregs = NUM_ADDRESS_REGS;
5961 else
5962 return 1;
5964 strcat (intel_parser.disp, cur_token.str);
5965 intel_match_token (cur_token.code);
5969 /* e05 e06 e05'
5971 e05' binOp e06 e05'
5972 | Empty */
5973 static int
5974 intel_e05 ()
5976 int nregs = ~NUM_ADDRESS_REGS;
5978 for (;;)
5980 if (!intel_e06())
5981 return 0;
5983 if (cur_token.code == '&' || cur_token.code == '|' || cur_token.code == '^')
5985 char str[2];
5987 str[0] = cur_token.code;
5988 str[1] = 0;
5989 strcat (intel_parser.disp, str);
5991 else
5992 break;
5994 intel_match_token (cur_token.code);
5996 if (nregs < 0)
5997 nregs = ~nregs;
5999 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6000 i.base_reg = i386_regtab + REGNAM_AL + 1; /* cl is invalid as base */
6001 return 1;
6004 /* e06 e09 e06'
6006 e06' mulOp e09 e06'
6007 | Empty */
6008 static int
6009 intel_e06 ()
6011 int nregs = ~NUM_ADDRESS_REGS;
6013 for (;;)
6015 if (!intel_e09())
6016 return 0;
6018 if (cur_token.code == '*' || cur_token.code == '/' || cur_token.code == '%')
6020 char str[2];
6022 str[0] = cur_token.code;
6023 str[1] = 0;
6024 strcat (intel_parser.disp, str);
6026 else if (cur_token.code == T_SHL)
6027 strcat (intel_parser.disp, "<<");
6028 else if (cur_token.code == T_SHR)
6029 strcat (intel_parser.disp, ">>");
6030 else
6031 break;
6033 intel_match_token (cur_token.code);
6035 if (nregs < 0)
6036 nregs = ~nregs;
6038 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6039 i.base_reg = i386_regtab + REGNAM_AL + 2; /* dl is invalid as base */
6040 return 1;
6043 /* e09 OFFSET e09
6044 | SHORT e09
6045 | + e09
6046 | - e09
6047 | ~ e09
6048 | NOT e09
6049 | e10 e09'
6051 e09' PTR e10 e09'
6052 | : e10 e09'
6053 | Empty */
6054 static int
6055 intel_e09 ()
6057 int nregs = ~NUM_ADDRESS_REGS;
6058 int in_offset = 0;
6060 for (;;)
6062 /* Don't consume constants here. */
6063 if (cur_token.code == '+' || cur_token.code == '-')
6065 /* Need to look one token ahead - if the next token
6066 is a constant, the current token is its sign. */
6067 int next_code;
6069 intel_match_token (cur_token.code);
6070 next_code = cur_token.code;
6071 intel_putback_token ();
6072 if (next_code == T_CONST)
6073 break;
6076 /* e09 OFFSET e09 */
6077 if (cur_token.code == T_OFFSET)
6079 if (!in_offset++)
6080 ++intel_parser.in_offset;
6083 /* e09 SHORT e09 */
6084 else if (cur_token.code == T_SHORT)
6085 intel_parser.op_modifier |= 1 << T_SHORT;
6087 /* e09 + e09 */
6088 else if (cur_token.code == '+')
6089 strcat (intel_parser.disp, "+");
6091 /* e09 - e09
6092 | ~ e09
6093 | NOT e09 */
6094 else if (cur_token.code == '-' || cur_token.code == '~')
6096 char str[2];
6098 if (nregs < 0)
6099 nregs = ~nregs;
6100 str[0] = cur_token.code;
6101 str[1] = 0;
6102 strcat (intel_parser.disp, str);
6105 /* e09 e10 e09' */
6106 else
6107 break;
6109 intel_match_token (cur_token.code);
6112 for (;;)
6114 if (!intel_e10 ())
6115 return 0;
6117 /* e09' PTR e10 e09' */
6118 if (cur_token.code == T_PTR)
6120 char suffix;
6122 if (prev_token.code == T_BYTE)
6123 suffix = BYTE_MNEM_SUFFIX;
6125 else if (prev_token.code == T_WORD)
6127 if (current_templates->start->name[0] == 'l'
6128 && current_templates->start->name[2] == 's'
6129 && current_templates->start->name[3] == 0)
6130 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6131 else if (intel_parser.got_a_float == 2) /* "fi..." */
6132 suffix = SHORT_MNEM_SUFFIX;
6133 else
6134 suffix = WORD_MNEM_SUFFIX;
6137 else if (prev_token.code == T_DWORD)
6139 if (current_templates->start->name[0] == 'l'
6140 && current_templates->start->name[2] == 's'
6141 && current_templates->start->name[3] == 0)
6142 suffix = WORD_MNEM_SUFFIX;
6143 else if (flag_code == CODE_16BIT
6144 && (current_templates->start->opcode_modifier
6145 & (Jump|JumpDword|JumpInterSegment)))
6146 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6147 else if (intel_parser.got_a_float == 1) /* "f..." */
6148 suffix = SHORT_MNEM_SUFFIX;
6149 else
6150 suffix = LONG_MNEM_SUFFIX;
6153 else if (prev_token.code == T_FWORD)
6155 if (current_templates->start->name[0] == 'l'
6156 && current_templates->start->name[2] == 's'
6157 && current_templates->start->name[3] == 0)
6158 suffix = LONG_MNEM_SUFFIX;
6159 else if (!intel_parser.got_a_float)
6161 if (flag_code == CODE_16BIT)
6162 add_prefix (DATA_PREFIX_OPCODE);
6163 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6165 else
6166 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6169 else if (prev_token.code == T_QWORD)
6171 if (intel_parser.got_a_float == 1) /* "f..." */
6172 suffix = LONG_MNEM_SUFFIX;
6173 else
6174 suffix = QWORD_MNEM_SUFFIX;
6177 else if (prev_token.code == T_TBYTE)
6179 if (intel_parser.got_a_float == 1)
6180 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6181 else
6182 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6185 else if (prev_token.code == T_XMMWORD)
6187 /* XXX ignored for now, but accepted since gcc uses it */
6188 suffix = 0;
6191 else
6193 as_bad (_("Unknown operand modifier `%s'"), prev_token.str);
6194 return 0;
6197 if (current_templates->start->base_opcode == 0x8d /* lea */)
6199 else if (!i.suffix)
6200 i.suffix = suffix;
6201 else if (i.suffix != suffix)
6203 as_bad (_("Conflicting operand modifiers"));
6204 return 0;
6209 /* e09' : e10 e09' */
6210 else if (cur_token.code == ':')
6212 if (prev_token.code != T_REG)
6214 /* While {call,jmp} SSSS:OOOO is MASM syntax only when SSSS is a
6215 segment/group identifier (which we don't have), using comma
6216 as the operand separator there is even less consistent, since
6217 there all branches only have a single operand. */
6218 if (this_operand != 0
6219 || intel_parser.in_offset
6220 || intel_parser.in_bracket
6221 || (!(current_templates->start->opcode_modifier
6222 & (Jump|JumpDword|JumpInterSegment))
6223 && !(current_templates->start->operand_types[0]
6224 & JumpAbsolute)))
6225 return intel_match_token (T_NIL);
6226 /* Remember the start of the 2nd operand and terminate 1st
6227 operand here.
6228 XXX This isn't right, yet (when SSSS:OOOO is right operand of
6229 another expression), but it gets at least the simplest case
6230 (a plain number or symbol on the left side) right. */
6231 intel_parser.next_operand = intel_parser.op_string;
6232 *--intel_parser.op_string = '\0';
6233 return intel_match_token (':');
6237 /* e09' Empty */
6238 else
6239 break;
6241 intel_match_token (cur_token.code);
6245 if (in_offset)
6247 --intel_parser.in_offset;
6248 if (nregs < 0)
6249 nregs = ~nregs;
6250 if (NUM_ADDRESS_REGS > nregs)
6252 as_bad (_("Invalid operand to `OFFSET'"));
6253 return 0;
6255 intel_parser.op_modifier |= 1 << T_OFFSET;
6258 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6259 i.base_reg = i386_regtab + REGNAM_AL + 3; /* bl is invalid as base */
6260 return 1;
6263 static int
6264 intel_bracket_expr ()
6266 int was_offset = intel_parser.op_modifier & (1 << T_OFFSET);
6267 const char *start = intel_parser.op_string;
6268 int len;
6270 if (i.op[this_operand].regs)
6271 return intel_match_token (T_NIL);
6273 intel_match_token ('[');
6275 /* Mark as a memory operand only if it's not already known to be an
6276 offset expression. If it's an offset expression, we need to keep
6277 the brace in. */
6278 if (!intel_parser.in_offset)
6280 ++intel_parser.in_bracket;
6281 /* Unfortunately gas always diverged from MASM in a respect that can't
6282 be easily fixed without risking to break code sequences likely to be
6283 encountered (the testsuite even check for this): MASM doesn't consider
6284 an expression inside brackets unconditionally as a memory reference.
6285 When that is e.g. a constant, an offset expression, or the sum of the
6286 two, this is still taken as a constant load. gas, however, always
6287 treated these as memory references. As a compromise, we'll try to make
6288 offset expressions inside brackets work the MASM way (since that's
6289 less likely to be found in real world code), but make constants alone
6290 continue to work the traditional gas way. In either case, issue a
6291 warning. */
6292 intel_parser.op_modifier &= ~was_offset;
6294 else
6295 strcat (intel_parser.disp, "[");
6297 /* Add a '+' to the displacement string if necessary. */
6298 if (*intel_parser.disp != '\0'
6299 && *(intel_parser.disp + strlen (intel_parser.disp) - 1) != '+')
6300 strcat (intel_parser.disp, "+");
6302 if (intel_expr ()
6303 && (len = intel_parser.op_string - start - 1,
6304 intel_match_token (']')))
6306 /* Preserve brackets when the operand is an offset expression. */
6307 if (intel_parser.in_offset)
6308 strcat (intel_parser.disp, "]");
6309 else
6311 --intel_parser.in_bracket;
6312 if (i.base_reg || i.index_reg)
6313 intel_parser.is_mem = 1;
6314 if (!intel_parser.is_mem)
6316 if (!(intel_parser.op_modifier & (1 << T_OFFSET)))
6317 /* Defer the warning until all of the operand was parsed. */
6318 intel_parser.is_mem = -1;
6319 else if (!quiet_warnings)
6320 as_warn (_("`[%.*s]' taken to mean just `%.*s'"), len, start, len, start);
6323 intel_parser.op_modifier |= was_offset;
6325 return 1;
6327 return 0;
6330 /* e10 e11 e10'
6332 e10' [ expr ] e10'
6333 | Empty */
6334 static int
6335 intel_e10 ()
6337 if (!intel_e11 ())
6338 return 0;
6340 while (cur_token.code == '[')
6342 if (!intel_bracket_expr ())
6343 return 0;
6346 return 1;
6349 /* e11 ( expr )
6350 | [ expr ]
6351 | BYTE
6352 | WORD
6353 | DWORD
6354 | FWORD
6355 | QWORD
6356 | TBYTE
6357 | OWORD
6358 | XMMWORD
6361 | register
6362 | id
6363 | constant */
6364 static int
6365 intel_e11 ()
6367 switch (cur_token.code)
6369 /* e11 ( expr ) */
6370 case '(':
6371 intel_match_token ('(');
6372 strcat (intel_parser.disp, "(");
6374 if (intel_expr () && intel_match_token (')'))
6376 strcat (intel_parser.disp, ")");
6377 return 1;
6379 return 0;
6381 /* e11 [ expr ] */
6382 case '[':
6383 /* Operands for jump/call inside brackets denote absolute addresses.
6384 XXX This shouldn't be needed anymore (or if it should rather live
6385 in intel_bracket_expr). */
6386 if (current_templates->start->opcode_modifier
6387 & (Jump|JumpDword|JumpByte|JumpInterSegment))
6388 i.types[this_operand] |= JumpAbsolute;
6390 return intel_bracket_expr ();
6392 /* e11 $
6393 | . */
6394 case '.':
6395 strcat (intel_parser.disp, cur_token.str);
6396 intel_match_token (cur_token.code);
6398 /* Mark as a memory operand only if it's not already known to be an
6399 offset expression. */
6400 if (!intel_parser.in_offset)
6401 intel_parser.is_mem = 1;
6403 return 1;
6405 /* e11 register */
6406 case T_REG:
6408 const reg_entry *reg = intel_parser.reg = cur_token.reg;
6410 intel_match_token (T_REG);
6412 /* Check for segment change. */
6413 if (cur_token.code == ':')
6415 if (!(reg->reg_type & (SReg2 | SReg3)))
6417 as_bad (_("`%s' is not a valid segment register"), reg->reg_name);
6418 return 0;
6420 else if (i.seg[i.mem_operands])
6421 as_warn (_("Extra segment override ignored"));
6422 else
6424 if (!intel_parser.in_offset)
6425 intel_parser.is_mem = 1;
6426 switch (reg->reg_num)
6428 case 0:
6429 i.seg[i.mem_operands] = &es;
6430 break;
6431 case 1:
6432 i.seg[i.mem_operands] = &cs;
6433 break;
6434 case 2:
6435 i.seg[i.mem_operands] = &ss;
6436 break;
6437 case 3:
6438 i.seg[i.mem_operands] = &ds;
6439 break;
6440 case 4:
6441 i.seg[i.mem_operands] = &fs;
6442 break;
6443 case 5:
6444 i.seg[i.mem_operands] = &gs;
6445 break;
6450 /* Not a segment register. Check for register scaling. */
6451 else if (cur_token.code == '*')
6453 if (!intel_parser.in_bracket)
6455 as_bad (_("Register scaling only allowed in memory operands"));
6456 return 0;
6459 if (reg->reg_type & Reg16) /* Disallow things like [si*1]. */
6460 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6461 else if (i.index_reg)
6462 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6464 /* What follows must be a valid scale. */
6465 intel_match_token ('*');
6466 i.index_reg = reg;
6467 i.types[this_operand] |= BaseIndex;
6469 /* Set the scale after setting the register (otherwise,
6470 i386_scale will complain) */
6471 if (cur_token.code == '+' || cur_token.code == '-')
6473 char *str, sign = cur_token.code;
6474 intel_match_token (cur_token.code);
6475 if (cur_token.code != T_CONST)
6477 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6478 cur_token.str);
6479 return 0;
6481 str = (char *) xmalloc (strlen (cur_token.str) + 2);
6482 strcpy (str + 1, cur_token.str);
6483 *str = sign;
6484 if (!i386_scale (str))
6485 return 0;
6486 free (str);
6488 else if (!i386_scale (cur_token.str))
6489 return 0;
6490 intel_match_token (cur_token.code);
6493 /* No scaling. If this is a memory operand, the register is either a
6494 base register (first occurrence) or an index register (second
6495 occurrence). */
6496 else if (intel_parser.in_bracket && !(reg->reg_type & (SReg2 | SReg3)))
6499 if (!i.base_reg)
6500 i.base_reg = reg;
6501 else if (!i.index_reg)
6502 i.index_reg = reg;
6503 else
6505 as_bad (_("Too many register references in memory operand"));
6506 return 0;
6509 i.types[this_operand] |= BaseIndex;
6512 /* Offset modifier. Add the register to the displacement string to be
6513 parsed as an immediate expression after we're done. */
6514 else if (intel_parser.in_offset)
6516 as_warn (_("Using register names in OFFSET expressions is deprecated"));
6517 strcat (intel_parser.disp, reg->reg_name);
6520 /* It's neither base nor index nor offset. */
6521 else if (!intel_parser.is_mem)
6523 i.types[this_operand] |= reg->reg_type & ~BaseIndex;
6524 i.op[this_operand].regs = reg;
6525 i.reg_operands++;
6527 else
6529 as_bad (_("Invalid use of register"));
6530 return 0;
6533 /* Since registers are not part of the displacement string (except
6534 when we're parsing offset operands), we may need to remove any
6535 preceding '+' from the displacement string. */
6536 if (*intel_parser.disp != '\0'
6537 && !intel_parser.in_offset)
6539 char *s = intel_parser.disp;
6540 s += strlen (s) - 1;
6541 if (*s == '+')
6542 *s = '\0';
6545 return 1;
6548 /* e11 BYTE
6549 | WORD
6550 | DWORD
6551 | FWORD
6552 | QWORD
6553 | TBYTE
6554 | OWORD
6555 | XMMWORD */
6556 case T_BYTE:
6557 case T_WORD:
6558 case T_DWORD:
6559 case T_FWORD:
6560 case T_QWORD:
6561 case T_TBYTE:
6562 case T_XMMWORD:
6563 intel_match_token (cur_token.code);
6565 if (cur_token.code == T_PTR)
6566 return 1;
6568 /* It must have been an identifier. */
6569 intel_putback_token ();
6570 cur_token.code = T_ID;
6571 /* FALLTHRU */
6573 /* e11 id
6574 | constant */
6575 case T_ID:
6576 if (!intel_parser.in_offset && intel_parser.is_mem <= 0)
6578 symbolS *symbolP;
6580 /* The identifier represents a memory reference only if it's not
6581 preceded by an offset modifier and if it's not an equate. */
6582 symbolP = symbol_find(cur_token.str);
6583 if (!symbolP || S_GET_SEGMENT(symbolP) != absolute_section)
6584 intel_parser.is_mem = 1;
6586 /* FALLTHRU */
6588 case T_CONST:
6589 case '-':
6590 case '+':
6592 char *save_str, sign = 0;
6594 /* Allow constants that start with `+' or `-'. */
6595 if (cur_token.code == '-' || cur_token.code == '+')
6597 sign = cur_token.code;
6598 intel_match_token (cur_token.code);
6599 if (cur_token.code != T_CONST)
6601 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6602 cur_token.str);
6603 return 0;
6607 save_str = (char *) xmalloc (strlen (cur_token.str) + 2);
6608 strcpy (save_str + !!sign, cur_token.str);
6609 if (sign)
6610 *save_str = sign;
6612 /* Get the next token to check for register scaling. */
6613 intel_match_token (cur_token.code);
6615 /* Check if this constant is a scaling factor for an index register. */
6616 if (cur_token.code == '*')
6618 if (intel_match_token ('*') && cur_token.code == T_REG)
6620 const reg_entry *reg = cur_token.reg;
6622 if (!intel_parser.in_bracket)
6624 as_bad (_("Register scaling only allowed in memory operands"));
6625 return 0;
6628 if (reg->reg_type & Reg16) /* Disallow things like [1*si]. */
6629 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6630 else if (i.index_reg)
6631 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6633 /* The constant is followed by `* reg', so it must be
6634 a valid scale. */
6635 i.index_reg = reg;
6636 i.types[this_operand] |= BaseIndex;
6638 /* Set the scale after setting the register (otherwise,
6639 i386_scale will complain) */
6640 if (!i386_scale (save_str))
6641 return 0;
6642 intel_match_token (T_REG);
6644 /* Since registers are not part of the displacement
6645 string, we may need to remove any preceding '+' from
6646 the displacement string. */
6647 if (*intel_parser.disp != '\0')
6649 char *s = intel_parser.disp;
6650 s += strlen (s) - 1;
6651 if (*s == '+')
6652 *s = '\0';
6655 free (save_str);
6657 return 1;
6660 /* The constant was not used for register scaling. Since we have
6661 already consumed the token following `*' we now need to put it
6662 back in the stream. */
6663 intel_putback_token ();
6666 /* Add the constant to the displacement string. */
6667 strcat (intel_parser.disp, save_str);
6668 free (save_str);
6670 return 1;
6674 as_bad (_("Unrecognized token '%s'"), cur_token.str);
6675 return 0;
6678 /* Match the given token against cur_token. If they match, read the next
6679 token from the operand string. */
6680 static int
6681 intel_match_token (code)
6682 int code;
6684 if (cur_token.code == code)
6686 intel_get_token ();
6687 return 1;
6689 else
6691 as_bad (_("Unexpected token `%s'"), cur_token.str);
6692 return 0;
6696 /* Read a new token from intel_parser.op_string and store it in cur_token. */
6697 static void
6698 intel_get_token ()
6700 char *end_op;
6701 const reg_entry *reg;
6702 struct intel_token new_token;
6704 new_token.code = T_NIL;
6705 new_token.reg = NULL;
6706 new_token.str = NULL;
6708 /* Free the memory allocated to the previous token and move
6709 cur_token to prev_token. */
6710 if (prev_token.str)
6711 free (prev_token.str);
6713 prev_token = cur_token;
6715 /* Skip whitespace. */
6716 while (is_space_char (*intel_parser.op_string))
6717 intel_parser.op_string++;
6719 /* Return an empty token if we find nothing else on the line. */
6720 if (*intel_parser.op_string == '\0')
6722 cur_token = new_token;
6723 return;
6726 /* The new token cannot be larger than the remainder of the operand
6727 string. */
6728 new_token.str = (char *) xmalloc (strlen (intel_parser.op_string) + 1);
6729 new_token.str[0] = '\0';
6731 if (strchr ("0123456789", *intel_parser.op_string))
6733 char *p = new_token.str;
6734 char *q = intel_parser.op_string;
6735 new_token.code = T_CONST;
6737 /* Allow any kind of identifier char to encompass floating point and
6738 hexadecimal numbers. */
6739 while (is_identifier_char (*q))
6740 *p++ = *q++;
6741 *p = '\0';
6743 /* Recognize special symbol names [0-9][bf]. */
6744 if (strlen (intel_parser.op_string) == 2
6745 && (intel_parser.op_string[1] == 'b'
6746 || intel_parser.op_string[1] == 'f'))
6747 new_token.code = T_ID;
6750 else if ((*intel_parser.op_string == REGISTER_PREFIX || allow_naked_reg)
6751 && ((reg = parse_register (intel_parser.op_string, &end_op)) != NULL))
6753 new_token.code = T_REG;
6754 new_token.reg = reg;
6756 if (*intel_parser.op_string == REGISTER_PREFIX)
6758 new_token.str[0] = REGISTER_PREFIX;
6759 new_token.str[1] = '\0';
6762 strcat (new_token.str, reg->reg_name);
6765 else if (is_identifier_char (*intel_parser.op_string))
6767 char *p = new_token.str;
6768 char *q = intel_parser.op_string;
6770 /* A '.' or '$' followed by an identifier char is an identifier.
6771 Otherwise, it's operator '.' followed by an expression. */
6772 if ((*q == '.' || *q == '$') && !is_identifier_char (*(q + 1)))
6774 new_token.code = '.';
6775 new_token.str[0] = '.';
6776 new_token.str[1] = '\0';
6778 else
6780 while (is_identifier_char (*q) || *q == '@')
6781 *p++ = *q++;
6782 *p = '\0';
6784 if (strcasecmp (new_token.str, "NOT") == 0)
6785 new_token.code = '~';
6787 else if (strcasecmp (new_token.str, "MOD") == 0)
6788 new_token.code = '%';
6790 else if (strcasecmp (new_token.str, "AND") == 0)
6791 new_token.code = '&';
6793 else if (strcasecmp (new_token.str, "OR") == 0)
6794 new_token.code = '|';
6796 else if (strcasecmp (new_token.str, "XOR") == 0)
6797 new_token.code = '^';
6799 else if (strcasecmp (new_token.str, "SHL") == 0)
6800 new_token.code = T_SHL;
6802 else if (strcasecmp (new_token.str, "SHR") == 0)
6803 new_token.code = T_SHR;
6805 else if (strcasecmp (new_token.str, "BYTE") == 0)
6806 new_token.code = T_BYTE;
6808 else if (strcasecmp (new_token.str, "WORD") == 0)
6809 new_token.code = T_WORD;
6811 else if (strcasecmp (new_token.str, "DWORD") == 0)
6812 new_token.code = T_DWORD;
6814 else if (strcasecmp (new_token.str, "FWORD") == 0)
6815 new_token.code = T_FWORD;
6817 else if (strcasecmp (new_token.str, "QWORD") == 0)
6818 new_token.code = T_QWORD;
6820 else if (strcasecmp (new_token.str, "TBYTE") == 0
6821 /* XXX remove (gcc still uses it) */
6822 || strcasecmp (new_token.str, "XWORD") == 0)
6823 new_token.code = T_TBYTE;
6825 else if (strcasecmp (new_token.str, "XMMWORD") == 0
6826 || strcasecmp (new_token.str, "OWORD") == 0)
6827 new_token.code = T_XMMWORD;
6829 else if (strcasecmp (new_token.str, "PTR") == 0)
6830 new_token.code = T_PTR;
6832 else if (strcasecmp (new_token.str, "SHORT") == 0)
6833 new_token.code = T_SHORT;
6835 else if (strcasecmp (new_token.str, "OFFSET") == 0)
6837 new_token.code = T_OFFSET;
6839 /* ??? This is not mentioned in the MASM grammar but gcc
6840 makes use of it with -mintel-syntax. OFFSET may be
6841 followed by FLAT: */
6842 if (strncasecmp (q, " FLAT:", 6) == 0)
6843 strcat (new_token.str, " FLAT:");
6846 /* ??? This is not mentioned in the MASM grammar. */
6847 else if (strcasecmp (new_token.str, "FLAT") == 0)
6849 new_token.code = T_OFFSET;
6850 if (*q == ':')
6851 strcat (new_token.str, ":");
6852 else
6853 as_bad (_("`:' expected"));
6856 else
6857 new_token.code = T_ID;
6861 else if (strchr ("+-/*%|&^:[]()~", *intel_parser.op_string))
6863 new_token.code = *intel_parser.op_string;
6864 new_token.str[0] = *intel_parser.op_string;
6865 new_token.str[1] = '\0';
6868 else if (strchr ("<>", *intel_parser.op_string)
6869 && *intel_parser.op_string == *(intel_parser.op_string + 1))
6871 new_token.code = *intel_parser.op_string == '<' ? T_SHL : T_SHR;
6872 new_token.str[0] = *intel_parser.op_string;
6873 new_token.str[1] = *intel_parser.op_string;
6874 new_token.str[2] = '\0';
6877 else
6878 as_bad (_("Unrecognized token `%s'"), intel_parser.op_string);
6880 intel_parser.op_string += strlen (new_token.str);
6881 cur_token = new_token;
6884 /* Put cur_token back into the token stream and make cur_token point to
6885 prev_token. */
6886 static void
6887 intel_putback_token ()
6889 if (cur_token.code != T_NIL)
6891 intel_parser.op_string -= strlen (cur_token.str);
6892 free (cur_token.str);
6894 cur_token = prev_token;
6896 /* Forget prev_token. */
6897 prev_token.code = T_NIL;
6898 prev_token.reg = NULL;
6899 prev_token.str = NULL;
6903 tc_x86_regname_to_dw2regnum (const char *regname)
6905 unsigned int regnum;
6906 unsigned int regnames_count;
6907 static const char *const regnames_32[] =
6909 "eax", "ecx", "edx", "ebx",
6910 "esp", "ebp", "esi", "edi",
6911 "eip", "eflags", NULL,
6912 "st0", "st1", "st2", "st3",
6913 "st4", "st5", "st6", "st7",
6914 NULL, NULL,
6915 "xmm0", "xmm1", "xmm2", "xmm3",
6916 "xmm4", "xmm5", "xmm6", "xmm7",
6917 "mm0", "mm1", "mm2", "mm3",
6918 "mm4", "mm5", "mm6", "mm7"
6920 static const char *const regnames_64[] =
6922 "rax", "rdx", "rcx", "rbx",
6923 "rsi", "rdi", "rbp", "rsp",
6924 "r8", "r9", "r10", "r11",
6925 "r12", "r13", "r14", "r15",
6926 "rip",
6927 "xmm0", "xmm1", "xmm2", "xmm3",
6928 "xmm4", "xmm5", "xmm6", "xmm7",
6929 "xmm8", "xmm9", "xmm10", "xmm11",
6930 "xmm12", "xmm13", "xmm14", "xmm15",
6931 "st0", "st1", "st2", "st3",
6932 "st4", "st5", "st6", "st7",
6933 "mm0", "mm1", "mm2", "mm3",
6934 "mm4", "mm5", "mm6", "mm7"
6936 const char *const *regnames;
6938 if (flag_code == CODE_64BIT)
6940 regnames = regnames_64;
6941 regnames_count = ARRAY_SIZE (regnames_64);
6943 else
6945 regnames = regnames_32;
6946 regnames_count = ARRAY_SIZE (regnames_32);
6949 for (regnum = 0; regnum < regnames_count; regnum++)
6950 if (regnames[regnum] != NULL
6951 && strcmp (regname, regnames[regnum]) == 0)
6952 return regnum;
6954 return -1;
6957 void
6958 tc_x86_frame_initial_instructions (void)
6960 static unsigned int sp_regno;
6962 if (!sp_regno)
6963 sp_regno = tc_x86_regname_to_dw2regnum (flag_code == CODE_64BIT
6964 ? "rsp" : "esp");
6966 cfi_add_CFA_def_cfa (sp_regno, -x86_cie_data_alignment);
6967 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
6971 i386_elf_section_type (const char *str, size_t len)
6973 if (flag_code == CODE_64BIT
6974 && len == sizeof ("unwind") - 1
6975 && strncmp (str, "unwind", 6) == 0)
6976 return SHT_X86_64_UNWIND;
6978 return -1;
6981 #ifdef TE_PE
6982 void
6983 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
6985 expressionS expr;
6987 expr.X_op = O_secrel;
6988 expr.X_add_symbol = symbol;
6989 expr.X_add_number = 0;
6990 emit_expr (&expr, size);
6992 #endif