2006-02-14 Paolo Bonzini <bonzini@gnu.org>
[binutils.git] / gas / config / tc-i386.c
blob337149ee76d27565c2eef2ed024d9d478c14b3ed
1 /* i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005, 2006
4 Free Software Foundation, Inc.
6 This file is part of GAS, the GNU Assembler.
8 GAS is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
13 GAS is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GAS; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 /* Intel 80386 machine specific gas.
24 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
25 x86_64 support by Jan Hubicka (jh@suse.cz)
26 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
27 Bugs & suggestions are completely welcome. This is free software.
28 Please help us make it better. */
30 #include "as.h"
31 #include "safe-ctype.h"
32 #include "subsegs.h"
33 #include "dwarf2dbg.h"
34 #include "dw2gencfi.h"
35 #include "opcode/i386.h"
36 #include "elf/x86-64.h"
38 #ifndef REGISTER_WARNINGS
39 #define REGISTER_WARNINGS 1
40 #endif
42 #ifndef INFER_ADDR_PREFIX
43 #define INFER_ADDR_PREFIX 1
44 #endif
46 #ifndef SCALE1_WHEN_NO_INDEX
47 /* Specifying a scale factor besides 1 when there is no index is
48 futile. eg. `mov (%ebx,2),%al' does exactly the same as
49 `mov (%ebx),%al'. To slavishly follow what the programmer
50 specified, set SCALE1_WHEN_NO_INDEX to 0. */
51 #define SCALE1_WHEN_NO_INDEX 1
52 #endif
54 #ifndef DEFAULT_ARCH
55 #define DEFAULT_ARCH "i386"
56 #endif
58 #ifndef INLINE
59 #if __GNUC__ >= 2
60 #define INLINE __inline__
61 #else
62 #define INLINE
63 #endif
64 #endif
66 static INLINE unsigned int mode_from_disp_size PARAMS ((unsigned int));
67 static INLINE int fits_in_signed_byte PARAMS ((offsetT));
68 static INLINE int fits_in_unsigned_byte PARAMS ((offsetT));
69 static INLINE int fits_in_unsigned_word PARAMS ((offsetT));
70 static INLINE int fits_in_signed_word PARAMS ((offsetT));
71 static INLINE int fits_in_unsigned_long PARAMS ((offsetT));
72 static INLINE int fits_in_signed_long PARAMS ((offsetT));
73 static int smallest_imm_type PARAMS ((offsetT));
74 static offsetT offset_in_range PARAMS ((offsetT, int));
75 static int add_prefix PARAMS ((unsigned int));
76 static void set_code_flag PARAMS ((int));
77 static void set_16bit_gcc_code_flag PARAMS ((int));
78 static void set_intel_syntax PARAMS ((int));
79 static void set_cpu_arch PARAMS ((int));
80 #ifdef TE_PE
81 static void pe_directive_secrel PARAMS ((int));
82 #endif
83 static void signed_cons PARAMS ((int));
84 static char *output_invalid PARAMS ((int c));
85 static int i386_operand PARAMS ((char *operand_string));
86 static int i386_intel_operand PARAMS ((char *operand_string, int got_a_float));
87 static const reg_entry *parse_register PARAMS ((char *reg_string,
88 char **end_op));
89 static char *parse_insn PARAMS ((char *, char *));
90 static char *parse_operands PARAMS ((char *, const char *));
91 static void swap_operands PARAMS ((void));
92 static void optimize_imm PARAMS ((void));
93 static void optimize_disp PARAMS ((void));
94 static int match_template PARAMS ((void));
95 static int check_string PARAMS ((void));
96 static int process_suffix PARAMS ((void));
97 static int check_byte_reg PARAMS ((void));
98 static int check_long_reg PARAMS ((void));
99 static int check_qword_reg PARAMS ((void));
100 static int check_word_reg PARAMS ((void));
101 static int finalize_imm PARAMS ((void));
102 static int process_operands PARAMS ((void));
103 static const seg_entry *build_modrm_byte PARAMS ((void));
104 static void output_insn PARAMS ((void));
105 static void output_branch PARAMS ((void));
106 static void output_jump PARAMS ((void));
107 static void output_interseg_jump PARAMS ((void));
108 static void output_imm PARAMS ((fragS *insn_start_frag,
109 offsetT insn_start_off));
110 static void output_disp PARAMS ((fragS *insn_start_frag,
111 offsetT insn_start_off));
112 #ifndef I386COFF
113 static void s_bss PARAMS ((int));
114 #endif
115 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
116 static void handle_large_common (int small ATTRIBUTE_UNUSED);
117 #endif
119 static const char *default_arch = DEFAULT_ARCH;
121 /* 'md_assemble ()' gathers together information and puts it into a
122 i386_insn. */
124 union i386_op
126 expressionS *disps;
127 expressionS *imms;
128 const reg_entry *regs;
131 struct _i386_insn
133 /* TM holds the template for the insn were currently assembling. */
134 template tm;
136 /* SUFFIX holds the instruction mnemonic suffix if given.
137 (e.g. 'l' for 'movl') */
138 char suffix;
140 /* OPERANDS gives the number of given operands. */
141 unsigned int operands;
143 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
144 of given register, displacement, memory operands and immediate
145 operands. */
146 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
148 /* TYPES [i] is the type (see above #defines) which tells us how to
149 use OP[i] for the corresponding operand. */
150 unsigned int types[MAX_OPERANDS];
152 /* Displacement expression, immediate expression, or register for each
153 operand. */
154 union i386_op op[MAX_OPERANDS];
156 /* Flags for operands. */
157 unsigned int flags[MAX_OPERANDS];
158 #define Operand_PCrel 1
160 /* Relocation type for operand */
161 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
163 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
164 the base index byte below. */
165 const reg_entry *base_reg;
166 const reg_entry *index_reg;
167 unsigned int log2_scale_factor;
169 /* SEG gives the seg_entries of this insn. They are zero unless
170 explicit segment overrides are given. */
171 const seg_entry *seg[2];
173 /* PREFIX holds all the given prefix opcodes (usually null).
174 PREFIXES is the number of prefix opcodes. */
175 unsigned int prefixes;
176 unsigned char prefix[MAX_PREFIXES];
178 /* RM and SIB are the modrm byte and the sib byte where the
179 addressing modes of this insn are encoded. */
181 modrm_byte rm;
182 rex_byte rex;
183 sib_byte sib;
186 typedef struct _i386_insn i386_insn;
188 /* List of chars besides those in app.c:symbol_chars that can start an
189 operand. Used to prevent the scrubber eating vital white-space. */
190 const char extra_symbol_chars[] = "*%-(["
191 #ifdef LEX_AT
193 #endif
194 #ifdef LEX_QM
196 #endif
199 #if (defined (TE_I386AIX) \
200 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
201 && !defined (TE_GNU) \
202 && !defined (TE_LINUX) \
203 && !defined (TE_NETWARE) \
204 && !defined (TE_FreeBSD) \
205 && !defined (TE_NetBSD)))
206 /* This array holds the chars that always start a comment. If the
207 pre-processor is disabled, these aren't very useful. The option
208 --divide will remove '/' from this list. */
209 const char *i386_comment_chars = "#/";
210 #define SVR4_COMMENT_CHARS 1
211 #define PREFIX_SEPARATOR '\\'
213 #else
214 const char *i386_comment_chars = "#";
215 #define PREFIX_SEPARATOR '/'
216 #endif
218 /* This array holds the chars that only start a comment at the beginning of
219 a line. If the line seems to have the form '# 123 filename'
220 .line and .file directives will appear in the pre-processed output.
221 Note that input_file.c hand checks for '#' at the beginning of the
222 first line of the input file. This is because the compiler outputs
223 #NO_APP at the beginning of its output.
224 Also note that comments started like this one will always work if
225 '/' isn't otherwise defined. */
226 const char line_comment_chars[] = "#/";
228 const char line_separator_chars[] = ";";
230 /* Chars that can be used to separate mant from exp in floating point
231 nums. */
232 const char EXP_CHARS[] = "eE";
234 /* Chars that mean this number is a floating point constant
235 As in 0f12.456
236 or 0d1.2345e12. */
237 const char FLT_CHARS[] = "fFdDxX";
239 /* Tables for lexical analysis. */
240 static char mnemonic_chars[256];
241 static char register_chars[256];
242 static char operand_chars[256];
243 static char identifier_chars[256];
244 static char digit_chars[256];
246 /* Lexical macros. */
247 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
248 #define is_operand_char(x) (operand_chars[(unsigned char) x])
249 #define is_register_char(x) (register_chars[(unsigned char) x])
250 #define is_space_char(x) ((x) == ' ')
251 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
252 #define is_digit_char(x) (digit_chars[(unsigned char) x])
254 /* All non-digit non-letter characters that may occur in an operand. */
255 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
257 /* md_assemble() always leaves the strings it's passed unaltered. To
258 effect this we maintain a stack of saved characters that we've smashed
259 with '\0's (indicating end of strings for various sub-fields of the
260 assembler instruction). */
261 static char save_stack[32];
262 static char *save_stack_p;
263 #define END_STRING_AND_SAVE(s) \
264 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
265 #define RESTORE_END_STRING(s) \
266 do { *(s) = *--save_stack_p; } while (0)
268 /* The instruction we're assembling. */
269 static i386_insn i;
271 /* Possible templates for current insn. */
272 static const templates *current_templates;
274 /* Per instruction expressionS buffers: 2 displacements & 2 immediate max. */
275 static expressionS disp_expressions[2], im_expressions[2];
277 /* Current operand we are working on. */
278 static int this_operand;
280 /* We support four different modes. FLAG_CODE variable is used to distinguish
281 these. */
283 enum flag_code {
284 CODE_32BIT,
285 CODE_16BIT,
286 CODE_64BIT };
287 #define NUM_FLAG_CODE ((int) CODE_64BIT + 1)
289 static enum flag_code flag_code;
290 static unsigned int object_64bit;
291 static int use_rela_relocations = 0;
293 /* The names used to print error messages. */
294 static const char *flag_code_names[] =
296 "32",
297 "16",
298 "64"
301 /* 1 for intel syntax,
302 0 if att syntax. */
303 static int intel_syntax = 0;
305 /* 1 if register prefix % not required. */
306 static int allow_naked_reg = 0;
308 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
309 leave, push, and pop instructions so that gcc has the same stack
310 frame as in 32 bit mode. */
311 static char stackop_size = '\0';
313 /* Non-zero to optimize code alignment. */
314 int optimize_align_code = 1;
316 /* Non-zero to quieten some warnings. */
317 static int quiet_warnings = 0;
319 /* CPU name. */
320 static const char *cpu_arch_name = NULL;
321 static const char *cpu_sub_arch_name = NULL;
323 /* CPU feature flags. */
324 static unsigned int cpu_arch_flags = CpuUnknownFlags | CpuNo64;
326 /* If set, conditional jumps are not automatically promoted to handle
327 larger than a byte offset. */
328 static unsigned int no_cond_jump_promotion = 0;
330 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
331 static symbolS *GOT_symbol;
333 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
334 unsigned int x86_dwarf2_return_column;
336 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
337 int x86_cie_data_alignment;
339 /* Interface to relax_segment.
340 There are 3 major relax states for 386 jump insns because the
341 different types of jumps add different sizes to frags when we're
342 figuring out what sort of jump to choose to reach a given label. */
344 /* Types. */
345 #define UNCOND_JUMP 0
346 #define COND_JUMP 1
347 #define COND_JUMP86 2
349 /* Sizes. */
350 #define CODE16 1
351 #define SMALL 0
352 #define SMALL16 (SMALL | CODE16)
353 #define BIG 2
354 #define BIG16 (BIG | CODE16)
356 #ifndef INLINE
357 #ifdef __GNUC__
358 #define INLINE __inline__
359 #else
360 #define INLINE
361 #endif
362 #endif
364 #define ENCODE_RELAX_STATE(type, size) \
365 ((relax_substateT) (((type) << 2) | (size)))
366 #define TYPE_FROM_RELAX_STATE(s) \
367 ((s) >> 2)
368 #define DISP_SIZE_FROM_RELAX_STATE(s) \
369 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
371 /* This table is used by relax_frag to promote short jumps to long
372 ones where necessary. SMALL (short) jumps may be promoted to BIG
373 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
374 don't allow a short jump in a 32 bit code segment to be promoted to
375 a 16 bit offset jump because it's slower (requires data size
376 prefix), and doesn't work, unless the destination is in the bottom
377 64k of the code segment (The top 16 bits of eip are zeroed). */
379 const relax_typeS md_relax_table[] =
381 /* The fields are:
382 1) most positive reach of this state,
383 2) most negative reach of this state,
384 3) how many bytes this mode will have in the variable part of the frag
385 4) which index into the table to try if we can't fit into this one. */
387 /* UNCOND_JUMP states. */
388 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
389 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
390 /* dword jmp adds 4 bytes to frag:
391 0 extra opcode bytes, 4 displacement bytes. */
392 {0, 0, 4, 0},
393 /* word jmp adds 2 byte2 to frag:
394 0 extra opcode bytes, 2 displacement bytes. */
395 {0, 0, 2, 0},
397 /* COND_JUMP states. */
398 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
399 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
400 /* dword conditionals adds 5 bytes to frag:
401 1 extra opcode byte, 4 displacement bytes. */
402 {0, 0, 5, 0},
403 /* word conditionals add 3 bytes to frag:
404 1 extra opcode byte, 2 displacement bytes. */
405 {0, 0, 3, 0},
407 /* COND_JUMP86 states. */
408 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
409 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
410 /* dword conditionals adds 5 bytes to frag:
411 1 extra opcode byte, 4 displacement bytes. */
412 {0, 0, 5, 0},
413 /* word conditionals add 4 bytes to frag:
414 1 displacement byte and a 3 byte long branch insn. */
415 {0, 0, 4, 0}
418 static const arch_entry cpu_arch[] = {
419 {"i8086", Cpu086 },
420 {"i186", Cpu086|Cpu186 },
421 {"i286", Cpu086|Cpu186|Cpu286 },
422 {"i386", Cpu086|Cpu186|Cpu286|Cpu386 },
423 {"i486", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486 },
424 {"i586", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
425 {"i686", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
426 {"pentium", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
427 {"pentiumpro",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
428 {"pentiumii", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX },
429 {"pentiumiii",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX|CpuMMX2|CpuSSE },
430 {"pentium4", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
431 {"prescott", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuPNI },
432 {"k6", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX },
433 {"k6_2", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX|Cpu3dnow },
434 {"athlon", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
435 {"sledgehammer",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
436 {"opteron", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
437 {".mmx", CpuMMX },
438 {".sse", CpuMMX|CpuMMX2|CpuSSE },
439 {".sse2", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
440 {".sse3", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuSSE3 },
441 {".3dnow", CpuMMX|Cpu3dnow },
442 {".3dnowa", CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
443 {".padlock", CpuPadLock },
444 {".pacifica", CpuSVME },
445 {".svme", CpuSVME },
446 {NULL, 0 }
449 const pseudo_typeS md_pseudo_table[] =
451 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
452 {"align", s_align_bytes, 0},
453 #else
454 {"align", s_align_ptwo, 0},
455 #endif
456 {"arch", set_cpu_arch, 0},
457 #ifndef I386COFF
458 {"bss", s_bss, 0},
459 #endif
460 {"ffloat", float_cons, 'f'},
461 {"dfloat", float_cons, 'd'},
462 {"tfloat", float_cons, 'x'},
463 {"value", cons, 2},
464 {"slong", signed_cons, 4},
465 {"noopt", s_ignore, 0},
466 {"optim", s_ignore, 0},
467 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
468 {"code16", set_code_flag, CODE_16BIT},
469 {"code32", set_code_flag, CODE_32BIT},
470 {"code64", set_code_flag, CODE_64BIT},
471 {"intel_syntax", set_intel_syntax, 1},
472 {"att_syntax", set_intel_syntax, 0},
473 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
474 {"largecomm", handle_large_common, 0},
475 #else
476 {"file", (void (*) PARAMS ((int))) dwarf2_directive_file, 0},
477 {"loc", dwarf2_directive_loc, 0},
478 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
479 #endif
480 #ifdef TE_PE
481 {"secrel32", pe_directive_secrel, 0},
482 #endif
483 {0, 0, 0}
486 /* For interface with expression (). */
487 extern char *input_line_pointer;
489 /* Hash table for instruction mnemonic lookup. */
490 static struct hash_control *op_hash;
492 /* Hash table for register lookup. */
493 static struct hash_control *reg_hash;
495 void
496 i386_align_code (fragP, count)
497 fragS *fragP;
498 int count;
500 /* Various efficient no-op patterns for aligning code labels.
501 Note: Don't try to assemble the instructions in the comments.
502 0L and 0w are not legal. */
503 static const char f32_1[] =
504 {0x90}; /* nop */
505 static const char f32_2[] =
506 {0x89,0xf6}; /* movl %esi,%esi */
507 static const char f32_3[] =
508 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
509 static const char f32_4[] =
510 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
511 static const char f32_5[] =
512 {0x90, /* nop */
513 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
514 static const char f32_6[] =
515 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
516 static const char f32_7[] =
517 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
518 static const char f32_8[] =
519 {0x90, /* nop */
520 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
521 static const char f32_9[] =
522 {0x89,0xf6, /* movl %esi,%esi */
523 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
524 static const char f32_10[] =
525 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
526 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
527 static const char f32_11[] =
528 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
529 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
530 static const char f32_12[] =
531 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
532 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
533 static const char f32_13[] =
534 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
535 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
536 static const char f32_14[] =
537 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
538 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
539 static const char f32_15[] =
540 {0xeb,0x0d,0x90,0x90,0x90,0x90,0x90, /* jmp .+15; lotsa nops */
541 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
542 static const char f16_3[] =
543 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
544 static const char f16_4[] =
545 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
546 static const char f16_5[] =
547 {0x90, /* nop */
548 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
549 static const char f16_6[] =
550 {0x89,0xf6, /* mov %si,%si */
551 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
552 static const char f16_7[] =
553 {0x8d,0x74,0x00, /* lea 0(%si),%si */
554 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
555 static const char f16_8[] =
556 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
557 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
558 static const char *const f32_patt[] = {
559 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
560 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14, f32_15
562 static const char *const f16_patt[] = {
563 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8,
564 f32_15, f32_15, f32_15, f32_15, f32_15, f32_15, f32_15
567 if (count <= 0 || count > 15)
568 return;
570 /* The recommended way to pad 64bit code is to use NOPs preceded by
571 maximally four 0x66 prefixes. Balance the size of nops. */
572 if (flag_code == CODE_64BIT)
574 int i;
575 int nnops = (count + 3) / 4;
576 int len = count / nnops;
577 int remains = count - nnops * len;
578 int pos = 0;
580 for (i = 0; i < remains; i++)
582 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len);
583 fragP->fr_literal[fragP->fr_fix + pos + len] = 0x90;
584 pos += len + 1;
586 for (; i < nnops; i++)
588 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len - 1);
589 fragP->fr_literal[fragP->fr_fix + pos + len - 1] = 0x90;
590 pos += len;
593 else
594 if (flag_code == CODE_16BIT)
596 memcpy (fragP->fr_literal + fragP->fr_fix,
597 f16_patt[count - 1], count);
598 if (count > 8)
599 /* Adjust jump offset. */
600 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
602 else
603 memcpy (fragP->fr_literal + fragP->fr_fix,
604 f32_patt[count - 1], count);
605 fragP->fr_var = count;
608 static INLINE unsigned int
609 mode_from_disp_size (t)
610 unsigned int t;
612 return (t & Disp8) ? 1 : (t & (Disp16 | Disp32 | Disp32S)) ? 2 : 0;
615 static INLINE int
616 fits_in_signed_byte (num)
617 offsetT num;
619 return (num >= -128) && (num <= 127);
622 static INLINE int
623 fits_in_unsigned_byte (num)
624 offsetT num;
626 return (num & 0xff) == num;
629 static INLINE int
630 fits_in_unsigned_word (num)
631 offsetT num;
633 return (num & 0xffff) == num;
636 static INLINE int
637 fits_in_signed_word (num)
638 offsetT num;
640 return (-32768 <= num) && (num <= 32767);
642 static INLINE int
643 fits_in_signed_long (num)
644 offsetT num ATTRIBUTE_UNUSED;
646 #ifndef BFD64
647 return 1;
648 #else
649 return (!(((offsetT) -1 << 31) & num)
650 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
651 #endif
652 } /* fits_in_signed_long() */
653 static INLINE int
654 fits_in_unsigned_long (num)
655 offsetT num ATTRIBUTE_UNUSED;
657 #ifndef BFD64
658 return 1;
659 #else
660 return (num & (((offsetT) 2 << 31) - 1)) == num;
661 #endif
662 } /* fits_in_unsigned_long() */
664 static int
665 smallest_imm_type (num)
666 offsetT num;
668 if (cpu_arch_flags != (Cpu086 | Cpu186 | Cpu286 | Cpu386 | Cpu486 | CpuNo64))
670 /* This code is disabled on the 486 because all the Imm1 forms
671 in the opcode table are slower on the i486. They're the
672 versions with the implicitly specified single-position
673 displacement, which has another syntax if you really want to
674 use that form. */
675 if (num == 1)
676 return Imm1 | Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64;
678 return (fits_in_signed_byte (num)
679 ? (Imm8S | Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
680 : fits_in_unsigned_byte (num)
681 ? (Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
682 : (fits_in_signed_word (num) || fits_in_unsigned_word (num))
683 ? (Imm16 | Imm32 | Imm32S | Imm64)
684 : fits_in_signed_long (num)
685 ? (Imm32 | Imm32S | Imm64)
686 : fits_in_unsigned_long (num)
687 ? (Imm32 | Imm64)
688 : Imm64);
691 static offsetT
692 offset_in_range (val, size)
693 offsetT val;
694 int size;
696 addressT mask;
698 switch (size)
700 case 1: mask = ((addressT) 1 << 8) - 1; break;
701 case 2: mask = ((addressT) 1 << 16) - 1; break;
702 case 4: mask = ((addressT) 2 << 31) - 1; break;
703 #ifdef BFD64
704 case 8: mask = ((addressT) 2 << 63) - 1; break;
705 #endif
706 default: abort ();
709 /* If BFD64, sign extend val. */
710 if (!use_rela_relocations)
711 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
712 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
714 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
716 char buf1[40], buf2[40];
718 sprint_value (buf1, val);
719 sprint_value (buf2, val & mask);
720 as_warn (_("%s shortened to %s"), buf1, buf2);
722 return val & mask;
725 /* Returns 0 if attempting to add a prefix where one from the same
726 class already exists, 1 if non rep/repne added, 2 if rep/repne
727 added. */
728 static int
729 add_prefix (prefix)
730 unsigned int prefix;
732 int ret = 1;
733 unsigned int q;
735 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
736 && flag_code == CODE_64BIT)
738 if ((i.prefix[REX_PREFIX] & prefix & REX_MODE64)
739 || ((i.prefix[REX_PREFIX] & (REX_EXTX | REX_EXTY | REX_EXTZ))
740 && (prefix & (REX_EXTX | REX_EXTY | REX_EXTZ))))
741 ret = 0;
742 q = REX_PREFIX;
744 else
746 switch (prefix)
748 default:
749 abort ();
751 case CS_PREFIX_OPCODE:
752 case DS_PREFIX_OPCODE:
753 case ES_PREFIX_OPCODE:
754 case FS_PREFIX_OPCODE:
755 case GS_PREFIX_OPCODE:
756 case SS_PREFIX_OPCODE:
757 q = SEG_PREFIX;
758 break;
760 case REPNE_PREFIX_OPCODE:
761 case REPE_PREFIX_OPCODE:
762 ret = 2;
763 /* fall thru */
764 case LOCK_PREFIX_OPCODE:
765 q = LOCKREP_PREFIX;
766 break;
768 case FWAIT_OPCODE:
769 q = WAIT_PREFIX;
770 break;
772 case ADDR_PREFIX_OPCODE:
773 q = ADDR_PREFIX;
774 break;
776 case DATA_PREFIX_OPCODE:
777 q = DATA_PREFIX;
778 break;
780 if (i.prefix[q] != 0)
781 ret = 0;
784 if (ret)
786 if (!i.prefix[q])
787 ++i.prefixes;
788 i.prefix[q] |= prefix;
790 else
791 as_bad (_("same type of prefix used twice"));
793 return ret;
796 static void
797 set_code_flag (value)
798 int value;
800 flag_code = value;
801 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
802 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
803 if (value == CODE_64BIT && !(cpu_arch_flags & CpuSledgehammer))
805 as_bad (_("64bit mode not supported on this CPU."));
807 if (value == CODE_32BIT && !(cpu_arch_flags & Cpu386))
809 as_bad (_("32bit mode not supported on this CPU."));
811 stackop_size = '\0';
814 static void
815 set_16bit_gcc_code_flag (new_code_flag)
816 int new_code_flag;
818 flag_code = new_code_flag;
819 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
820 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
821 stackop_size = LONG_MNEM_SUFFIX;
824 static void
825 set_intel_syntax (syntax_flag)
826 int syntax_flag;
828 /* Find out if register prefixing is specified. */
829 int ask_naked_reg = 0;
831 SKIP_WHITESPACE ();
832 if (!is_end_of_line[(unsigned char) *input_line_pointer])
834 char *string = input_line_pointer;
835 int e = get_symbol_end ();
837 if (strcmp (string, "prefix") == 0)
838 ask_naked_reg = 1;
839 else if (strcmp (string, "noprefix") == 0)
840 ask_naked_reg = -1;
841 else
842 as_bad (_("bad argument to syntax directive."));
843 *input_line_pointer = e;
845 demand_empty_rest_of_line ();
847 intel_syntax = syntax_flag;
849 if (ask_naked_reg == 0)
850 allow_naked_reg = (intel_syntax
851 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
852 else
853 allow_naked_reg = (ask_naked_reg < 0);
855 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
856 identifier_chars['$'] = intel_syntax ? '$' : 0;
859 static void
860 set_cpu_arch (dummy)
861 int dummy ATTRIBUTE_UNUSED;
863 SKIP_WHITESPACE ();
865 if (!is_end_of_line[(unsigned char) *input_line_pointer])
867 char *string = input_line_pointer;
868 int e = get_symbol_end ();
869 int i;
871 for (i = 0; cpu_arch[i].name; i++)
873 if (strcmp (string, cpu_arch[i].name) == 0)
875 if (*string != '.')
877 cpu_arch_name = cpu_arch[i].name;
878 cpu_sub_arch_name = NULL;
879 cpu_arch_flags = (cpu_arch[i].flags
880 | (flag_code == CODE_64BIT ? Cpu64 : CpuNo64));
881 break;
883 if ((cpu_arch_flags | cpu_arch[i].flags) != cpu_arch_flags)
885 cpu_sub_arch_name = cpu_arch[i].name;
886 cpu_arch_flags |= cpu_arch[i].flags;
888 *input_line_pointer = e;
889 demand_empty_rest_of_line ();
890 return;
893 if (!cpu_arch[i].name)
894 as_bad (_("no such architecture: `%s'"), string);
896 *input_line_pointer = e;
898 else
899 as_bad (_("missing cpu architecture"));
901 no_cond_jump_promotion = 0;
902 if (*input_line_pointer == ','
903 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
905 char *string = ++input_line_pointer;
906 int e = get_symbol_end ();
908 if (strcmp (string, "nojumps") == 0)
909 no_cond_jump_promotion = 1;
910 else if (strcmp (string, "jumps") == 0)
912 else
913 as_bad (_("no such architecture modifier: `%s'"), string);
915 *input_line_pointer = e;
918 demand_empty_rest_of_line ();
921 unsigned long
922 i386_mach ()
924 if (!strcmp (default_arch, "x86_64"))
925 return bfd_mach_x86_64;
926 else if (!strcmp (default_arch, "i386"))
927 return bfd_mach_i386_i386;
928 else
929 as_fatal (_("Unknown architecture"));
932 void
933 md_begin ()
935 const char *hash_err;
937 /* Initialize op_hash hash table. */
938 op_hash = hash_new ();
941 const template *optab;
942 templates *core_optab;
944 /* Setup for loop. */
945 optab = i386_optab;
946 core_optab = (templates *) xmalloc (sizeof (templates));
947 core_optab->start = optab;
949 while (1)
951 ++optab;
952 if (optab->name == NULL
953 || strcmp (optab->name, (optab - 1)->name) != 0)
955 /* different name --> ship out current template list;
956 add to hash table; & begin anew. */
957 core_optab->end = optab;
958 hash_err = hash_insert (op_hash,
959 (optab - 1)->name,
960 (PTR) core_optab);
961 if (hash_err)
963 as_fatal (_("Internal Error: Can't hash %s: %s"),
964 (optab - 1)->name,
965 hash_err);
967 if (optab->name == NULL)
968 break;
969 core_optab = (templates *) xmalloc (sizeof (templates));
970 core_optab->start = optab;
975 /* Initialize reg_hash hash table. */
976 reg_hash = hash_new ();
978 const reg_entry *regtab;
980 for (regtab = i386_regtab;
981 regtab < i386_regtab + sizeof (i386_regtab) / sizeof (i386_regtab[0]);
982 regtab++)
984 hash_err = hash_insert (reg_hash, regtab->reg_name, (PTR) regtab);
985 if (hash_err)
986 as_fatal (_("Internal Error: Can't hash %s: %s"),
987 regtab->reg_name,
988 hash_err);
992 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
994 int c;
995 char *p;
997 for (c = 0; c < 256; c++)
999 if (ISDIGIT (c))
1001 digit_chars[c] = c;
1002 mnemonic_chars[c] = c;
1003 register_chars[c] = c;
1004 operand_chars[c] = c;
1006 else if (ISLOWER (c))
1008 mnemonic_chars[c] = c;
1009 register_chars[c] = c;
1010 operand_chars[c] = c;
1012 else if (ISUPPER (c))
1014 mnemonic_chars[c] = TOLOWER (c);
1015 register_chars[c] = mnemonic_chars[c];
1016 operand_chars[c] = c;
1019 if (ISALPHA (c) || ISDIGIT (c))
1020 identifier_chars[c] = c;
1021 else if (c >= 128)
1023 identifier_chars[c] = c;
1024 operand_chars[c] = c;
1028 #ifdef LEX_AT
1029 identifier_chars['@'] = '@';
1030 #endif
1031 #ifdef LEX_QM
1032 identifier_chars['?'] = '?';
1033 operand_chars['?'] = '?';
1034 #endif
1035 digit_chars['-'] = '-';
1036 mnemonic_chars['-'] = '-';
1037 identifier_chars['_'] = '_';
1038 identifier_chars['.'] = '.';
1040 for (p = operand_special_chars; *p != '\0'; p++)
1041 operand_chars[(unsigned char) *p] = *p;
1044 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1045 if (IS_ELF)
1047 record_alignment (text_section, 2);
1048 record_alignment (data_section, 2);
1049 record_alignment (bss_section, 2);
1051 #endif
1053 if (flag_code == CODE_64BIT)
1055 x86_dwarf2_return_column = 16;
1056 x86_cie_data_alignment = -8;
1058 else
1060 x86_dwarf2_return_column = 8;
1061 x86_cie_data_alignment = -4;
1065 void
1066 i386_print_statistics (file)
1067 FILE *file;
1069 hash_print_statistics (file, "i386 opcode", op_hash);
1070 hash_print_statistics (file, "i386 register", reg_hash);
1073 #ifdef DEBUG386
1075 /* Debugging routines for md_assemble. */
1076 static void pi PARAMS ((char *, i386_insn *));
1077 static void pte PARAMS ((template *));
1078 static void pt PARAMS ((unsigned int));
1079 static void pe PARAMS ((expressionS *));
1080 static void ps PARAMS ((symbolS *));
1082 static void
1083 pi (line, x)
1084 char *line;
1085 i386_insn *x;
1087 unsigned int i;
1089 fprintf (stdout, "%s: template ", line);
1090 pte (&x->tm);
1091 fprintf (stdout, " address: base %s index %s scale %x\n",
1092 x->base_reg ? x->base_reg->reg_name : "none",
1093 x->index_reg ? x->index_reg->reg_name : "none",
1094 x->log2_scale_factor);
1095 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
1096 x->rm.mode, x->rm.reg, x->rm.regmem);
1097 fprintf (stdout, " sib: base %x index %x scale %x\n",
1098 x->sib.base, x->sib.index, x->sib.scale);
1099 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
1100 (x->rex & REX_MODE64) != 0,
1101 (x->rex & REX_EXTX) != 0,
1102 (x->rex & REX_EXTY) != 0,
1103 (x->rex & REX_EXTZ) != 0);
1104 for (i = 0; i < x->operands; i++)
1106 fprintf (stdout, " #%d: ", i + 1);
1107 pt (x->types[i]);
1108 fprintf (stdout, "\n");
1109 if (x->types[i]
1110 & (Reg | SReg2 | SReg3 | Control | Debug | Test | RegMMX | RegXMM))
1111 fprintf (stdout, "%s\n", x->op[i].regs->reg_name);
1112 if (x->types[i] & Imm)
1113 pe (x->op[i].imms);
1114 if (x->types[i] & Disp)
1115 pe (x->op[i].disps);
1119 static void
1120 pte (t)
1121 template *t;
1123 unsigned int i;
1124 fprintf (stdout, " %d operands ", t->operands);
1125 fprintf (stdout, "opcode %x ", t->base_opcode);
1126 if (t->extension_opcode != None)
1127 fprintf (stdout, "ext %x ", t->extension_opcode);
1128 if (t->opcode_modifier & D)
1129 fprintf (stdout, "D");
1130 if (t->opcode_modifier & W)
1131 fprintf (stdout, "W");
1132 fprintf (stdout, "\n");
1133 for (i = 0; i < t->operands; i++)
1135 fprintf (stdout, " #%d type ", i + 1);
1136 pt (t->operand_types[i]);
1137 fprintf (stdout, "\n");
1141 static void
1142 pe (e)
1143 expressionS *e;
1145 fprintf (stdout, " operation %d\n", e->X_op);
1146 fprintf (stdout, " add_number %ld (%lx)\n",
1147 (long) e->X_add_number, (long) e->X_add_number);
1148 if (e->X_add_symbol)
1150 fprintf (stdout, " add_symbol ");
1151 ps (e->X_add_symbol);
1152 fprintf (stdout, "\n");
1154 if (e->X_op_symbol)
1156 fprintf (stdout, " op_symbol ");
1157 ps (e->X_op_symbol);
1158 fprintf (stdout, "\n");
1162 static void
1163 ps (s)
1164 symbolS *s;
1166 fprintf (stdout, "%s type %s%s",
1167 S_GET_NAME (s),
1168 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
1169 segment_name (S_GET_SEGMENT (s)));
1172 struct type_name
1174 unsigned int mask;
1175 char *tname;
1178 static const type_names[] =
1180 { Reg8, "r8" },
1181 { Reg16, "r16" },
1182 { Reg32, "r32" },
1183 { Reg64, "r64" },
1184 { Imm8, "i8" },
1185 { Imm8S, "i8s" },
1186 { Imm16, "i16" },
1187 { Imm32, "i32" },
1188 { Imm32S, "i32s" },
1189 { Imm64, "i64" },
1190 { Imm1, "i1" },
1191 { BaseIndex, "BaseIndex" },
1192 { Disp8, "d8" },
1193 { Disp16, "d16" },
1194 { Disp32, "d32" },
1195 { Disp32S, "d32s" },
1196 { Disp64, "d64" },
1197 { InOutPortReg, "InOutPortReg" },
1198 { ShiftCount, "ShiftCount" },
1199 { Control, "control reg" },
1200 { Test, "test reg" },
1201 { Debug, "debug reg" },
1202 { FloatReg, "FReg" },
1203 { FloatAcc, "FAcc" },
1204 { SReg2, "SReg2" },
1205 { SReg3, "SReg3" },
1206 { Acc, "Acc" },
1207 { JumpAbsolute, "Jump Absolute" },
1208 { RegMMX, "rMMX" },
1209 { RegXMM, "rXMM" },
1210 { EsSeg, "es" },
1211 { 0, "" }
1214 static void
1215 pt (t)
1216 unsigned int t;
1218 const struct type_name *ty;
1220 for (ty = type_names; ty->mask; ty++)
1221 if (t & ty->mask)
1222 fprintf (stdout, "%s, ", ty->tname);
1223 fflush (stdout);
1226 #endif /* DEBUG386 */
1228 static bfd_reloc_code_real_type
1229 reloc (unsigned int size,
1230 int pcrel,
1231 int sign,
1232 bfd_reloc_code_real_type other)
1234 if (other != NO_RELOC)
1236 reloc_howto_type *reloc;
1238 if (size == 8)
1239 switch (other)
1241 case BFD_RELOC_X86_64_TPOFF32:
1242 other = BFD_RELOC_X86_64_TPOFF64;
1243 break;
1244 case BFD_RELOC_X86_64_DTPOFF32:
1245 other = BFD_RELOC_X86_64_DTPOFF64;
1246 break;
1247 default:
1248 break;
1251 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
1252 if (size == 4 && flag_code != CODE_64BIT)
1253 sign = -1;
1255 reloc = bfd_reloc_type_lookup (stdoutput, other);
1256 if (!reloc)
1257 as_bad (_("unknown relocation (%u)"), other);
1258 else if (size != bfd_get_reloc_size (reloc))
1259 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
1260 bfd_get_reloc_size (reloc),
1261 size);
1262 else if (pcrel && !reloc->pc_relative)
1263 as_bad (_("non-pc-relative relocation for pc-relative field"));
1264 else if ((reloc->complain_on_overflow == complain_overflow_signed
1265 && !sign)
1266 || (reloc->complain_on_overflow == complain_overflow_unsigned
1267 && sign > 0))
1268 as_bad (_("relocated field and relocation type differ in signedness"));
1269 else
1270 return other;
1271 return NO_RELOC;
1274 if (pcrel)
1276 if (!sign)
1277 as_bad (_("there are no unsigned pc-relative relocations"));
1278 switch (size)
1280 case 1: return BFD_RELOC_8_PCREL;
1281 case 2: return BFD_RELOC_16_PCREL;
1282 case 4: return BFD_RELOC_32_PCREL;
1283 case 8: return BFD_RELOC_64_PCREL;
1285 as_bad (_("cannot do %u byte pc-relative relocation"), size);
1287 else
1289 if (sign > 0)
1290 switch (size)
1292 case 4: return BFD_RELOC_X86_64_32S;
1294 else
1295 switch (size)
1297 case 1: return BFD_RELOC_8;
1298 case 2: return BFD_RELOC_16;
1299 case 4: return BFD_RELOC_32;
1300 case 8: return BFD_RELOC_64;
1302 as_bad (_("cannot do %s %u byte relocation"),
1303 sign > 0 ? "signed" : "unsigned", size);
1306 abort ();
1307 return BFD_RELOC_NONE;
1310 /* Here we decide which fixups can be adjusted to make them relative to
1311 the beginning of the section instead of the symbol. Basically we need
1312 to make sure that the dynamic relocations are done correctly, so in
1313 some cases we force the original symbol to be used. */
1316 tc_i386_fix_adjustable (fixP)
1317 fixS *fixP ATTRIBUTE_UNUSED;
1319 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1320 if (!IS_ELF)
1321 return 1;
1323 /* Don't adjust pc-relative references to merge sections in 64-bit
1324 mode. */
1325 if (use_rela_relocations
1326 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
1327 && fixP->fx_pcrel)
1328 return 0;
1330 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
1331 and changed later by validate_fix. */
1332 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
1333 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
1334 return 0;
1336 /* adjust_reloc_syms doesn't know about the GOT. */
1337 if (fixP->fx_r_type == BFD_RELOC_386_GOTOFF
1338 || fixP->fx_r_type == BFD_RELOC_386_PLT32
1339 || fixP->fx_r_type == BFD_RELOC_386_GOT32
1340 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
1341 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
1342 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
1343 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
1344 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
1345 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
1346 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
1347 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
1348 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
1349 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
1350 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
1351 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
1352 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
1353 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
1354 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
1355 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
1356 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
1357 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
1358 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
1359 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
1360 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
1361 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
1362 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
1363 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
1364 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
1365 return 0;
1366 #endif
1367 return 1;
1370 static int intel_float_operand PARAMS ((const char *mnemonic));
1372 static int
1373 intel_float_operand (mnemonic)
1374 const char *mnemonic;
1376 /* Note that the value returned is meaningful only for opcodes with (memory)
1377 operands, hence the code here is free to improperly handle opcodes that
1378 have no operands (for better performance and smaller code). */
1380 if (mnemonic[0] != 'f')
1381 return 0; /* non-math */
1383 switch (mnemonic[1])
1385 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
1386 the fs segment override prefix not currently handled because no
1387 call path can make opcodes without operands get here */
1388 case 'i':
1389 return 2 /* integer op */;
1390 case 'l':
1391 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
1392 return 3; /* fldcw/fldenv */
1393 break;
1394 case 'n':
1395 if (mnemonic[2] != 'o' /* fnop */)
1396 return 3; /* non-waiting control op */
1397 break;
1398 case 'r':
1399 if (mnemonic[2] == 's')
1400 return 3; /* frstor/frstpm */
1401 break;
1402 case 's':
1403 if (mnemonic[2] == 'a')
1404 return 3; /* fsave */
1405 if (mnemonic[2] == 't')
1407 switch (mnemonic[3])
1409 case 'c': /* fstcw */
1410 case 'd': /* fstdw */
1411 case 'e': /* fstenv */
1412 case 's': /* fsts[gw] */
1413 return 3;
1416 break;
1417 case 'x':
1418 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
1419 return 0; /* fxsave/fxrstor are not really math ops */
1420 break;
1423 return 1;
1426 /* This is the guts of the machine-dependent assembler. LINE points to a
1427 machine dependent instruction. This function is supposed to emit
1428 the frags/bytes it assembles to. */
1430 void
1431 md_assemble (line)
1432 char *line;
1434 int j;
1435 char mnemonic[MAX_MNEM_SIZE];
1437 /* Initialize globals. */
1438 memset (&i, '\0', sizeof (i));
1439 for (j = 0; j < MAX_OPERANDS; j++)
1440 i.reloc[j] = NO_RELOC;
1441 memset (disp_expressions, '\0', sizeof (disp_expressions));
1442 memset (im_expressions, '\0', sizeof (im_expressions));
1443 save_stack_p = save_stack;
1445 /* First parse an instruction mnemonic & call i386_operand for the operands.
1446 We assume that the scrubber has arranged it so that line[0] is the valid
1447 start of a (possibly prefixed) mnemonic. */
1449 line = parse_insn (line, mnemonic);
1450 if (line == NULL)
1451 return;
1453 line = parse_operands (line, mnemonic);
1454 if (line == NULL)
1455 return;
1457 /* Now we've parsed the mnemonic into a set of templates, and have the
1458 operands at hand. */
1460 /* All intel opcodes have reversed operands except for "bound" and
1461 "enter". We also don't reverse intersegment "jmp" and "call"
1462 instructions with 2 immediate operands so that the immediate segment
1463 precedes the offset, as it does when in AT&T mode. "enter" and the
1464 intersegment "jmp" and "call" instructions are the only ones that
1465 have two immediate operands. */
1466 if (intel_syntax && i.operands > 1
1467 && (strcmp (mnemonic, "bound") != 0)
1468 && (strcmp (mnemonic, "invlpga") != 0)
1469 && !((i.types[0] & Imm) && (i.types[1] & Imm)))
1470 swap_operands ();
1472 if (i.imm_operands)
1473 optimize_imm ();
1475 /* Don't optimize displacement for movabs since it only takes 64bit
1476 displacement. */
1477 if (i.disp_operands
1478 && (flag_code != CODE_64BIT
1479 || strcmp (mnemonic, "movabs") != 0))
1480 optimize_disp ();
1482 /* Next, we find a template that matches the given insn,
1483 making sure the overlap of the given operands types is consistent
1484 with the template operand types. */
1486 if (!match_template ())
1487 return;
1489 if (intel_syntax)
1491 /* Undo SYSV386_COMPAT brokenness when in Intel mode. See i386.h */
1492 if (SYSV386_COMPAT
1493 && (i.tm.base_opcode & 0xfffffde0) == 0xdce0)
1494 i.tm.base_opcode ^= FloatR;
1496 /* Zap movzx and movsx suffix. The suffix may have been set from
1497 "word ptr" or "byte ptr" on the source operand, but we'll use
1498 the suffix later to choose the destination register. */
1499 if ((i.tm.base_opcode & ~9) == 0x0fb6)
1501 if (i.reg_operands < 2
1502 && !i.suffix
1503 && (~i.tm.opcode_modifier
1504 & (No_bSuf
1505 | No_wSuf
1506 | No_lSuf
1507 | No_sSuf
1508 | No_xSuf
1509 | No_qSuf)))
1510 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
1512 i.suffix = 0;
1516 if (i.tm.opcode_modifier & FWait)
1517 if (!add_prefix (FWAIT_OPCODE))
1518 return;
1520 /* Check string instruction segment overrides. */
1521 if ((i.tm.opcode_modifier & IsString) != 0 && i.mem_operands != 0)
1523 if (!check_string ())
1524 return;
1527 if (!process_suffix ())
1528 return;
1530 /* Make still unresolved immediate matches conform to size of immediate
1531 given in i.suffix. */
1532 if (!finalize_imm ())
1533 return;
1535 if (i.types[0] & Imm1)
1536 i.imm_operands = 0; /* kludge for shift insns. */
1537 if (i.types[0] & ImplicitRegister)
1538 i.reg_operands--;
1539 if (i.types[1] & ImplicitRegister)
1540 i.reg_operands--;
1541 if (i.types[2] & ImplicitRegister)
1542 i.reg_operands--;
1544 if (i.tm.opcode_modifier & ImmExt)
1546 expressionS *exp;
1548 if ((i.tm.cpu_flags & CpuPNI) && i.operands > 0)
1550 /* These Intel Prescott New Instructions have the fixed
1551 operands with an opcode suffix which is coded in the same
1552 place as an 8-bit immediate field would be. Here we check
1553 those operands and remove them afterwards. */
1554 unsigned int x;
1556 for (x = 0; x < i.operands; x++)
1557 if (i.op[x].regs->reg_num != x)
1558 as_bad (_("can't use register '%%%s' as operand %d in '%s'."),
1559 i.op[x].regs->reg_name, x + 1, i.tm.name);
1560 i.operands = 0;
1563 /* These AMD 3DNow! and Intel Katmai New Instructions have an
1564 opcode suffix which is coded in the same place as an 8-bit
1565 immediate field would be. Here we fake an 8-bit immediate
1566 operand from the opcode suffix stored in tm.extension_opcode. */
1568 assert (i.imm_operands == 0 && i.operands <= 2 && 2 < MAX_OPERANDS);
1570 exp = &im_expressions[i.imm_operands++];
1571 i.op[i.operands].imms = exp;
1572 i.types[i.operands++] = Imm8;
1573 exp->X_op = O_constant;
1574 exp->X_add_number = i.tm.extension_opcode;
1575 i.tm.extension_opcode = None;
1578 /* For insns with operands there are more diddles to do to the opcode. */
1579 if (i.operands)
1581 if (!process_operands ())
1582 return;
1584 else if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
1586 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
1587 as_warn (_("translating to `%sp'"), i.tm.name);
1590 /* Handle conversion of 'int $3' --> special int3 insn. */
1591 if (i.tm.base_opcode == INT_OPCODE && i.op[0].imms->X_add_number == 3)
1593 i.tm.base_opcode = INT3_OPCODE;
1594 i.imm_operands = 0;
1597 if ((i.tm.opcode_modifier & (Jump | JumpByte | JumpDword))
1598 && i.op[0].disps->X_op == O_constant)
1600 /* Convert "jmp constant" (and "call constant") to a jump (call) to
1601 the absolute address given by the constant. Since ix86 jumps and
1602 calls are pc relative, we need to generate a reloc. */
1603 i.op[0].disps->X_add_symbol = &abs_symbol;
1604 i.op[0].disps->X_op = O_symbol;
1607 if ((i.tm.opcode_modifier & Rex64) != 0)
1608 i.rex |= REX_MODE64;
1610 /* For 8 bit registers we need an empty rex prefix. Also if the
1611 instruction already has a prefix, we need to convert old
1612 registers to new ones. */
1614 if (((i.types[0] & Reg8) != 0
1615 && (i.op[0].regs->reg_flags & RegRex64) != 0)
1616 || ((i.types[1] & Reg8) != 0
1617 && (i.op[1].regs->reg_flags & RegRex64) != 0)
1618 || (((i.types[0] & Reg8) != 0 || (i.types[1] & Reg8) != 0)
1619 && i.rex != 0))
1621 int x;
1623 i.rex |= REX_OPCODE;
1624 for (x = 0; x < 2; x++)
1626 /* Look for 8 bit operand that uses old registers. */
1627 if ((i.types[x] & Reg8) != 0
1628 && (i.op[x].regs->reg_flags & RegRex64) == 0)
1630 /* In case it is "hi" register, give up. */
1631 if (i.op[x].regs->reg_num > 3)
1632 as_bad (_("can't encode register '%%%s' in an instruction requiring REX prefix."),
1633 i.op[x].regs->reg_name);
1635 /* Otherwise it is equivalent to the extended register.
1636 Since the encoding doesn't change this is merely
1637 cosmetic cleanup for debug output. */
1639 i.op[x].regs = i.op[x].regs + 8;
1644 if (i.rex != 0)
1645 add_prefix (REX_OPCODE | i.rex);
1647 /* We are ready to output the insn. */
1648 output_insn ();
1651 static char *
1652 parse_insn (line, mnemonic)
1653 char *line;
1654 char *mnemonic;
1656 char *l = line;
1657 char *token_start = l;
1658 char *mnem_p;
1659 int supported;
1660 const template *t;
1662 /* Non-zero if we found a prefix only acceptable with string insns. */
1663 const char *expecting_string_instruction = NULL;
1665 while (1)
1667 mnem_p = mnemonic;
1668 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
1670 mnem_p++;
1671 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
1673 as_bad (_("no such instruction: `%s'"), token_start);
1674 return NULL;
1676 l++;
1678 if (!is_space_char (*l)
1679 && *l != END_OF_INSN
1680 && (intel_syntax
1681 || (*l != PREFIX_SEPARATOR
1682 && *l != ',')))
1684 as_bad (_("invalid character %s in mnemonic"),
1685 output_invalid (*l));
1686 return NULL;
1688 if (token_start == l)
1690 if (!intel_syntax && *l == PREFIX_SEPARATOR)
1691 as_bad (_("expecting prefix; got nothing"));
1692 else
1693 as_bad (_("expecting mnemonic; got nothing"));
1694 return NULL;
1697 /* Look up instruction (or prefix) via hash table. */
1698 current_templates = hash_find (op_hash, mnemonic);
1700 if (*l != END_OF_INSN
1701 && (!is_space_char (*l) || l[1] != END_OF_INSN)
1702 && current_templates
1703 && (current_templates->start->opcode_modifier & IsPrefix))
1705 if (current_templates->start->cpu_flags
1706 & (flag_code != CODE_64BIT ? Cpu64 : CpuNo64))
1708 as_bad ((flag_code != CODE_64BIT
1709 ? _("`%s' is only supported in 64-bit mode")
1710 : _("`%s' is not supported in 64-bit mode")),
1711 current_templates->start->name);
1712 return NULL;
1714 /* If we are in 16-bit mode, do not allow addr16 or data16.
1715 Similarly, in 32-bit mode, do not allow addr32 or data32. */
1716 if ((current_templates->start->opcode_modifier & (Size16 | Size32))
1717 && flag_code != CODE_64BIT
1718 && (((current_templates->start->opcode_modifier & Size32) != 0)
1719 ^ (flag_code == CODE_16BIT)))
1721 as_bad (_("redundant %s prefix"),
1722 current_templates->start->name);
1723 return NULL;
1725 /* Add prefix, checking for repeated prefixes. */
1726 switch (add_prefix (current_templates->start->base_opcode))
1728 case 0:
1729 return NULL;
1730 case 2:
1731 expecting_string_instruction = current_templates->start->name;
1732 break;
1734 /* Skip past PREFIX_SEPARATOR and reset token_start. */
1735 token_start = ++l;
1737 else
1738 break;
1741 if (!current_templates)
1743 /* See if we can get a match by trimming off a suffix. */
1744 switch (mnem_p[-1])
1746 case WORD_MNEM_SUFFIX:
1747 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
1748 i.suffix = SHORT_MNEM_SUFFIX;
1749 else
1750 case BYTE_MNEM_SUFFIX:
1751 case QWORD_MNEM_SUFFIX:
1752 i.suffix = mnem_p[-1];
1753 mnem_p[-1] = '\0';
1754 current_templates = hash_find (op_hash, mnemonic);
1755 break;
1756 case SHORT_MNEM_SUFFIX:
1757 case LONG_MNEM_SUFFIX:
1758 if (!intel_syntax)
1760 i.suffix = mnem_p[-1];
1761 mnem_p[-1] = '\0';
1762 current_templates = hash_find (op_hash, mnemonic);
1764 break;
1766 /* Intel Syntax. */
1767 case 'd':
1768 if (intel_syntax)
1770 if (intel_float_operand (mnemonic) == 1)
1771 i.suffix = SHORT_MNEM_SUFFIX;
1772 else
1773 i.suffix = LONG_MNEM_SUFFIX;
1774 mnem_p[-1] = '\0';
1775 current_templates = hash_find (op_hash, mnemonic);
1777 break;
1779 if (!current_templates)
1781 as_bad (_("no such instruction: `%s'"), token_start);
1782 return NULL;
1786 if (current_templates->start->opcode_modifier & (Jump | JumpByte))
1788 /* Check for a branch hint. We allow ",pt" and ",pn" for
1789 predict taken and predict not taken respectively.
1790 I'm not sure that branch hints actually do anything on loop
1791 and jcxz insns (JumpByte) for current Pentium4 chips. They
1792 may work in the future and it doesn't hurt to accept them
1793 now. */
1794 if (l[0] == ',' && l[1] == 'p')
1796 if (l[2] == 't')
1798 if (!add_prefix (DS_PREFIX_OPCODE))
1799 return NULL;
1800 l += 3;
1802 else if (l[2] == 'n')
1804 if (!add_prefix (CS_PREFIX_OPCODE))
1805 return NULL;
1806 l += 3;
1810 /* Any other comma loses. */
1811 if (*l == ',')
1813 as_bad (_("invalid character %s in mnemonic"),
1814 output_invalid (*l));
1815 return NULL;
1818 /* Check if instruction is supported on specified architecture. */
1819 supported = 0;
1820 for (t = current_templates->start; t < current_templates->end; ++t)
1822 if (!((t->cpu_flags & ~(Cpu64 | CpuNo64))
1823 & ~(cpu_arch_flags & ~(Cpu64 | CpuNo64))))
1824 supported |= 1;
1825 if (!(t->cpu_flags & (flag_code == CODE_64BIT ? CpuNo64 : Cpu64)))
1826 supported |= 2;
1828 if (!(supported & 2))
1830 as_bad (flag_code == CODE_64BIT
1831 ? _("`%s' is not supported in 64-bit mode")
1832 : _("`%s' is only supported in 64-bit mode"),
1833 current_templates->start->name);
1834 return NULL;
1836 if (!(supported & 1))
1838 as_warn (_("`%s' is not supported on `%s%s'"),
1839 current_templates->start->name,
1840 cpu_arch_name,
1841 cpu_sub_arch_name ? cpu_sub_arch_name : "");
1843 else if ((Cpu386 & ~cpu_arch_flags) && (flag_code != CODE_16BIT))
1845 as_warn (_("use .code16 to ensure correct addressing mode"));
1848 /* Check for rep/repne without a string instruction. */
1849 if (expecting_string_instruction)
1851 static templates override;
1853 for (t = current_templates->start; t < current_templates->end; ++t)
1854 if (t->opcode_modifier & IsString)
1855 break;
1856 if (t >= current_templates->end)
1858 as_bad (_("expecting string instruction after `%s'"),
1859 expecting_string_instruction);
1860 return NULL;
1862 for (override.start = t; t < current_templates->end; ++t)
1863 if (!(t->opcode_modifier & IsString))
1864 break;
1865 override.end = t;
1866 current_templates = &override;
1869 return l;
1872 static char *
1873 parse_operands (l, mnemonic)
1874 char *l;
1875 const char *mnemonic;
1877 char *token_start;
1879 /* 1 if operand is pending after ','. */
1880 unsigned int expecting_operand = 0;
1882 /* Non-zero if operand parens not balanced. */
1883 unsigned int paren_not_balanced;
1885 while (*l != END_OF_INSN)
1887 /* Skip optional white space before operand. */
1888 if (is_space_char (*l))
1889 ++l;
1890 if (!is_operand_char (*l) && *l != END_OF_INSN)
1892 as_bad (_("invalid character %s before operand %d"),
1893 output_invalid (*l),
1894 i.operands + 1);
1895 return NULL;
1897 token_start = l; /* after white space */
1898 paren_not_balanced = 0;
1899 while (paren_not_balanced || *l != ',')
1901 if (*l == END_OF_INSN)
1903 if (paren_not_balanced)
1905 if (!intel_syntax)
1906 as_bad (_("unbalanced parenthesis in operand %d."),
1907 i.operands + 1);
1908 else
1909 as_bad (_("unbalanced brackets in operand %d."),
1910 i.operands + 1);
1911 return NULL;
1913 else
1914 break; /* we are done */
1916 else if (!is_operand_char (*l) && !is_space_char (*l))
1918 as_bad (_("invalid character %s in operand %d"),
1919 output_invalid (*l),
1920 i.operands + 1);
1921 return NULL;
1923 if (!intel_syntax)
1925 if (*l == '(')
1926 ++paren_not_balanced;
1927 if (*l == ')')
1928 --paren_not_balanced;
1930 else
1932 if (*l == '[')
1933 ++paren_not_balanced;
1934 if (*l == ']')
1935 --paren_not_balanced;
1937 l++;
1939 if (l != token_start)
1940 { /* Yes, we've read in another operand. */
1941 unsigned int operand_ok;
1942 this_operand = i.operands++;
1943 if (i.operands > MAX_OPERANDS)
1945 as_bad (_("spurious operands; (%d operands/instruction max)"),
1946 MAX_OPERANDS);
1947 return NULL;
1949 /* Now parse operand adding info to 'i' as we go along. */
1950 END_STRING_AND_SAVE (l);
1952 if (intel_syntax)
1953 operand_ok =
1954 i386_intel_operand (token_start,
1955 intel_float_operand (mnemonic));
1956 else
1957 operand_ok = i386_operand (token_start);
1959 RESTORE_END_STRING (l);
1960 if (!operand_ok)
1961 return NULL;
1963 else
1965 if (expecting_operand)
1967 expecting_operand_after_comma:
1968 as_bad (_("expecting operand after ','; got nothing"));
1969 return NULL;
1971 if (*l == ',')
1973 as_bad (_("expecting operand before ','; got nothing"));
1974 return NULL;
1978 /* Now *l must be either ',' or END_OF_INSN. */
1979 if (*l == ',')
1981 if (*++l == END_OF_INSN)
1983 /* Just skip it, if it's \n complain. */
1984 goto expecting_operand_after_comma;
1986 expecting_operand = 1;
1989 return l;
1992 static void
1993 swap_operands ()
1995 union i386_op temp_op;
1996 unsigned int temp_type;
1997 enum bfd_reloc_code_real temp_reloc;
1998 int xchg1 = 0;
1999 int xchg2 = 0;
2001 if (i.operands == 2)
2003 xchg1 = 0;
2004 xchg2 = 1;
2006 else if (i.operands == 3)
2008 xchg1 = 0;
2009 xchg2 = 2;
2011 temp_type = i.types[xchg2];
2012 i.types[xchg2] = i.types[xchg1];
2013 i.types[xchg1] = temp_type;
2014 temp_op = i.op[xchg2];
2015 i.op[xchg2] = i.op[xchg1];
2016 i.op[xchg1] = temp_op;
2017 temp_reloc = i.reloc[xchg2];
2018 i.reloc[xchg2] = i.reloc[xchg1];
2019 i.reloc[xchg1] = temp_reloc;
2021 if (i.mem_operands == 2)
2023 const seg_entry *temp_seg;
2024 temp_seg = i.seg[0];
2025 i.seg[0] = i.seg[1];
2026 i.seg[1] = temp_seg;
2030 /* Try to ensure constant immediates are represented in the smallest
2031 opcode possible. */
2032 static void
2033 optimize_imm ()
2035 char guess_suffix = 0;
2036 int op;
2038 if (i.suffix)
2039 guess_suffix = i.suffix;
2040 else if (i.reg_operands)
2042 /* Figure out a suffix from the last register operand specified.
2043 We can't do this properly yet, ie. excluding InOutPortReg,
2044 but the following works for instructions with immediates.
2045 In any case, we can't set i.suffix yet. */
2046 for (op = i.operands; --op >= 0;)
2047 if (i.types[op] & Reg)
2049 if (i.types[op] & Reg8)
2050 guess_suffix = BYTE_MNEM_SUFFIX;
2051 else if (i.types[op] & Reg16)
2052 guess_suffix = WORD_MNEM_SUFFIX;
2053 else if (i.types[op] & Reg32)
2054 guess_suffix = LONG_MNEM_SUFFIX;
2055 else if (i.types[op] & Reg64)
2056 guess_suffix = QWORD_MNEM_SUFFIX;
2057 break;
2060 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
2061 guess_suffix = WORD_MNEM_SUFFIX;
2063 for (op = i.operands; --op >= 0;)
2064 if (i.types[op] & Imm)
2066 switch (i.op[op].imms->X_op)
2068 case O_constant:
2069 /* If a suffix is given, this operand may be shortened. */
2070 switch (guess_suffix)
2072 case LONG_MNEM_SUFFIX:
2073 i.types[op] |= Imm32 | Imm64;
2074 break;
2075 case WORD_MNEM_SUFFIX:
2076 i.types[op] |= Imm16 | Imm32S | Imm32 | Imm64;
2077 break;
2078 case BYTE_MNEM_SUFFIX:
2079 i.types[op] |= Imm16 | Imm8 | Imm8S | Imm32S | Imm32 | Imm64;
2080 break;
2083 /* If this operand is at most 16 bits, convert it
2084 to a signed 16 bit number before trying to see
2085 whether it will fit in an even smaller size.
2086 This allows a 16-bit operand such as $0xffe0 to
2087 be recognised as within Imm8S range. */
2088 if ((i.types[op] & Imm16)
2089 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
2091 i.op[op].imms->X_add_number =
2092 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
2094 if ((i.types[op] & Imm32)
2095 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
2096 == 0))
2098 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
2099 ^ ((offsetT) 1 << 31))
2100 - ((offsetT) 1 << 31));
2102 i.types[op] |= smallest_imm_type (i.op[op].imms->X_add_number);
2104 /* We must avoid matching of Imm32 templates when 64bit
2105 only immediate is available. */
2106 if (guess_suffix == QWORD_MNEM_SUFFIX)
2107 i.types[op] &= ~Imm32;
2108 break;
2110 case O_absent:
2111 case O_register:
2112 abort ();
2114 /* Symbols and expressions. */
2115 default:
2116 /* Convert symbolic operand to proper sizes for matching, but don't
2117 prevent matching a set of insns that only supports sizes other
2118 than those matching the insn suffix. */
2120 unsigned int mask, allowed = 0;
2121 const template *t;
2123 for (t = current_templates->start; t < current_templates->end; ++t)
2124 allowed |= t->operand_types[op];
2125 switch (guess_suffix)
2127 case QWORD_MNEM_SUFFIX:
2128 mask = Imm64 | Imm32S;
2129 break;
2130 case LONG_MNEM_SUFFIX:
2131 mask = Imm32;
2132 break;
2133 case WORD_MNEM_SUFFIX:
2134 mask = Imm16;
2135 break;
2136 case BYTE_MNEM_SUFFIX:
2137 mask = Imm8;
2138 break;
2139 default:
2140 mask = 0;
2141 break;
2143 if (mask & allowed)
2144 i.types[op] &= mask;
2146 break;
2151 /* Try to use the smallest displacement type too. */
2152 static void
2153 optimize_disp ()
2155 int op;
2157 for (op = i.operands; --op >= 0;)
2158 if (i.types[op] & Disp)
2160 if (i.op[op].disps->X_op == O_constant)
2162 offsetT disp = i.op[op].disps->X_add_number;
2164 if ((i.types[op] & Disp16)
2165 && (disp & ~(offsetT) 0xffff) == 0)
2167 /* If this operand is at most 16 bits, convert
2168 to a signed 16 bit number and don't use 64bit
2169 displacement. */
2170 disp = (((disp & 0xffff) ^ 0x8000) - 0x8000);
2171 i.types[op] &= ~Disp64;
2173 if ((i.types[op] & Disp32)
2174 && (disp & ~(((offsetT) 2 << 31) - 1)) == 0)
2176 /* If this operand is at most 32 bits, convert
2177 to a signed 32 bit number and don't use 64bit
2178 displacement. */
2179 disp &= (((offsetT) 2 << 31) - 1);
2180 disp = (disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
2181 i.types[op] &= ~Disp64;
2183 if (!disp && (i.types[op] & BaseIndex))
2185 i.types[op] &= ~Disp;
2186 i.op[op].disps = 0;
2187 i.disp_operands--;
2189 else if (flag_code == CODE_64BIT)
2191 if (fits_in_signed_long (disp))
2193 i.types[op] &= ~Disp64;
2194 i.types[op] |= Disp32S;
2196 if (fits_in_unsigned_long (disp))
2197 i.types[op] |= Disp32;
2199 if ((i.types[op] & (Disp32 | Disp32S | Disp16))
2200 && fits_in_signed_byte (disp))
2201 i.types[op] |= Disp8;
2203 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
2204 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
2206 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
2207 i.op[op].disps, 0, i.reloc[op]);
2208 i.types[op] &= ~Disp;
2210 else
2211 /* We only support 64bit displacement on constants. */
2212 i.types[op] &= ~Disp64;
2216 static int
2217 match_template ()
2219 /* Points to template once we've found it. */
2220 const template *t;
2221 unsigned int overlap0, overlap1, overlap2;
2222 unsigned int found_reverse_match;
2223 int suffix_check;
2225 #define MATCH(overlap, given, template) \
2226 ((overlap & ~JumpAbsolute) \
2227 && (((given) & (BaseIndex | JumpAbsolute)) \
2228 == ((overlap) & (BaseIndex | JumpAbsolute))))
2230 /* If given types r0 and r1 are registers they must be of the same type
2231 unless the expected operand type register overlap is null.
2232 Note that Acc in a template matches every size of reg. */
2233 #define CONSISTENT_REGISTER_MATCH(m0, g0, t0, m1, g1, t1) \
2234 (((g0) & Reg) == 0 || ((g1) & Reg) == 0 \
2235 || ((g0) & Reg) == ((g1) & Reg) \
2236 || ((((m0) & Acc) ? Reg : (t0)) & (((m1) & Acc) ? Reg : (t1)) & Reg) == 0 )
2238 overlap0 = 0;
2239 overlap1 = 0;
2240 overlap2 = 0;
2241 found_reverse_match = 0;
2242 suffix_check = (i.suffix == BYTE_MNEM_SUFFIX
2243 ? No_bSuf
2244 : (i.suffix == WORD_MNEM_SUFFIX
2245 ? No_wSuf
2246 : (i.suffix == SHORT_MNEM_SUFFIX
2247 ? No_sSuf
2248 : (i.suffix == LONG_MNEM_SUFFIX
2249 ? No_lSuf
2250 : (i.suffix == QWORD_MNEM_SUFFIX
2251 ? No_qSuf
2252 : (i.suffix == LONG_DOUBLE_MNEM_SUFFIX
2253 ? No_xSuf : 0))))));
2255 t = current_templates->start;
2256 if (i.suffix == QWORD_MNEM_SUFFIX
2257 && flag_code != CODE_64BIT
2258 && (intel_syntax
2259 ? !(t->opcode_modifier & IgnoreSize)
2260 && !intel_float_operand (t->name)
2261 : intel_float_operand (t->name) != 2)
2262 && (!(t->operand_types[0] & (RegMMX | RegXMM))
2263 || !(t->operand_types[t->operands > 1] & (RegMMX | RegXMM)))
2264 && (t->base_opcode != 0x0fc7
2265 || t->extension_opcode != 1 /* cmpxchg8b */))
2266 t = current_templates->end;
2267 for (; t < current_templates->end; t++)
2269 /* Must have right number of operands. */
2270 if (i.operands != t->operands)
2271 continue;
2273 /* Check the suffix, except for some instructions in intel mode. */
2274 if ((t->opcode_modifier & suffix_check)
2275 && !(intel_syntax
2276 && (t->opcode_modifier & IgnoreSize)))
2277 continue;
2279 /* Do not verify operands when there are none. */
2280 else if (!t->operands)
2282 if (t->cpu_flags & ~cpu_arch_flags)
2283 continue;
2284 /* We've found a match; break out of loop. */
2285 break;
2288 overlap0 = i.types[0] & t->operand_types[0];
2289 switch (t->operands)
2291 case 1:
2292 if (!MATCH (overlap0, i.types[0], t->operand_types[0]))
2293 continue;
2294 break;
2295 case 2:
2296 case 3:
2297 overlap1 = i.types[1] & t->operand_types[1];
2298 if (!MATCH (overlap0, i.types[0], t->operand_types[0])
2299 || !MATCH (overlap1, i.types[1], t->operand_types[1])
2300 /* monitor in SSE3 is a very special case. The first
2301 register and the second register may have differnet
2302 sizes. */
2303 || !((t->base_opcode == 0x0f01
2304 && t->extension_opcode == 0xc8)
2305 || CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2306 t->operand_types[0],
2307 overlap1, i.types[1],
2308 t->operand_types[1])))
2310 /* Check if other direction is valid ... */
2311 if ((t->opcode_modifier & (D | FloatD)) == 0)
2312 continue;
2314 /* Try reversing direction of operands. */
2315 overlap0 = i.types[0] & t->operand_types[1];
2316 overlap1 = i.types[1] & t->operand_types[0];
2317 if (!MATCH (overlap0, i.types[0], t->operand_types[1])
2318 || !MATCH (overlap1, i.types[1], t->operand_types[0])
2319 || !CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2320 t->operand_types[1],
2321 overlap1, i.types[1],
2322 t->operand_types[0]))
2324 /* Does not match either direction. */
2325 continue;
2327 /* found_reverse_match holds which of D or FloatDR
2328 we've found. */
2329 found_reverse_match = t->opcode_modifier & (D | FloatDR);
2331 /* Found a forward 2 operand match here. */
2332 else if (t->operands == 3)
2334 /* Here we make use of the fact that there are no
2335 reverse match 3 operand instructions, and all 3
2336 operand instructions only need to be checked for
2337 register consistency between operands 2 and 3. */
2338 overlap2 = i.types[2] & t->operand_types[2];
2339 if (!MATCH (overlap2, i.types[2], t->operand_types[2])
2340 || !CONSISTENT_REGISTER_MATCH (overlap1, i.types[1],
2341 t->operand_types[1],
2342 overlap2, i.types[2],
2343 t->operand_types[2]))
2345 continue;
2347 /* Found either forward/reverse 2 or 3 operand match here:
2348 slip through to break. */
2350 if (t->cpu_flags & ~cpu_arch_flags)
2352 found_reverse_match = 0;
2353 continue;
2355 /* We've found a match; break out of loop. */
2356 break;
2359 if (t == current_templates->end)
2361 /* We found no match. */
2362 as_bad (_("suffix or operands invalid for `%s'"),
2363 current_templates->start->name);
2364 return 0;
2367 if (!quiet_warnings)
2369 if (!intel_syntax
2370 && ((i.types[0] & JumpAbsolute)
2371 != (t->operand_types[0] & JumpAbsolute)))
2373 as_warn (_("indirect %s without `*'"), t->name);
2376 if ((t->opcode_modifier & (IsPrefix | IgnoreSize))
2377 == (IsPrefix | IgnoreSize))
2379 /* Warn them that a data or address size prefix doesn't
2380 affect assembly of the next line of code. */
2381 as_warn (_("stand-alone `%s' prefix"), t->name);
2385 /* Copy the template we found. */
2386 i.tm = *t;
2387 if (found_reverse_match)
2389 /* If we found a reverse match we must alter the opcode
2390 direction bit. found_reverse_match holds bits to change
2391 (different for int & float insns). */
2393 i.tm.base_opcode ^= found_reverse_match;
2395 i.tm.operand_types[0] = t->operand_types[1];
2396 i.tm.operand_types[1] = t->operand_types[0];
2399 return 1;
2402 static int
2403 check_string ()
2405 int mem_op = (i.types[0] & AnyMem) ? 0 : 1;
2406 if ((i.tm.operand_types[mem_op] & EsSeg) != 0)
2408 if (i.seg[0] != NULL && i.seg[0] != &es)
2410 as_bad (_("`%s' operand %d must use `%%es' segment"),
2411 i.tm.name,
2412 mem_op + 1);
2413 return 0;
2415 /* There's only ever one segment override allowed per instruction.
2416 This instruction possibly has a legal segment override on the
2417 second operand, so copy the segment to where non-string
2418 instructions store it, allowing common code. */
2419 i.seg[0] = i.seg[1];
2421 else if ((i.tm.operand_types[mem_op + 1] & EsSeg) != 0)
2423 if (i.seg[1] != NULL && i.seg[1] != &es)
2425 as_bad (_("`%s' operand %d must use `%%es' segment"),
2426 i.tm.name,
2427 mem_op + 2);
2428 return 0;
2431 return 1;
2434 static int
2435 process_suffix (void)
2437 /* If matched instruction specifies an explicit instruction mnemonic
2438 suffix, use it. */
2439 if (i.tm.opcode_modifier & (Size16 | Size32 | Size64))
2441 if (i.tm.opcode_modifier & Size16)
2442 i.suffix = WORD_MNEM_SUFFIX;
2443 else if (i.tm.opcode_modifier & Size64)
2444 i.suffix = QWORD_MNEM_SUFFIX;
2445 else
2446 i.suffix = LONG_MNEM_SUFFIX;
2448 else if (i.reg_operands)
2450 /* If there's no instruction mnemonic suffix we try to invent one
2451 based on register operands. */
2452 if (!i.suffix)
2454 /* We take i.suffix from the last register operand specified,
2455 Destination register type is more significant than source
2456 register type. */
2457 int op;
2459 for (op = i.operands; --op >= 0;)
2460 if ((i.types[op] & Reg)
2461 && !(i.tm.operand_types[op] & InOutPortReg))
2463 i.suffix = ((i.types[op] & Reg8) ? BYTE_MNEM_SUFFIX :
2464 (i.types[op] & Reg16) ? WORD_MNEM_SUFFIX :
2465 (i.types[op] & Reg64) ? QWORD_MNEM_SUFFIX :
2466 LONG_MNEM_SUFFIX);
2467 break;
2470 else if (i.suffix == BYTE_MNEM_SUFFIX)
2472 if (!check_byte_reg ())
2473 return 0;
2475 else if (i.suffix == LONG_MNEM_SUFFIX)
2477 if (!check_long_reg ())
2478 return 0;
2480 else if (i.suffix == QWORD_MNEM_SUFFIX)
2482 if (!check_qword_reg ())
2483 return 0;
2485 else if (i.suffix == WORD_MNEM_SUFFIX)
2487 if (!check_word_reg ())
2488 return 0;
2490 else if (intel_syntax && (i.tm.opcode_modifier & IgnoreSize))
2491 /* Do nothing if the instruction is going to ignore the prefix. */
2493 else
2494 abort ();
2496 else if ((i.tm.opcode_modifier & DefaultSize)
2497 && !i.suffix
2498 /* exclude fldenv/frstor/fsave/fstenv */
2499 && (i.tm.opcode_modifier & No_sSuf))
2501 i.suffix = stackop_size;
2503 else if (intel_syntax
2504 && !i.suffix
2505 && ((i.tm.operand_types[0] & JumpAbsolute)
2506 || (i.tm.opcode_modifier & (JumpByte|JumpInterSegment))
2507 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
2508 && i.tm.extension_opcode <= 3)))
2510 switch (flag_code)
2512 case CODE_64BIT:
2513 if (!(i.tm.opcode_modifier & No_qSuf))
2515 i.suffix = QWORD_MNEM_SUFFIX;
2516 break;
2518 case CODE_32BIT:
2519 if (!(i.tm.opcode_modifier & No_lSuf))
2520 i.suffix = LONG_MNEM_SUFFIX;
2521 break;
2522 case CODE_16BIT:
2523 if (!(i.tm.opcode_modifier & No_wSuf))
2524 i.suffix = WORD_MNEM_SUFFIX;
2525 break;
2529 if (!i.suffix)
2531 if (!intel_syntax)
2533 if (i.tm.opcode_modifier & W)
2535 as_bad (_("no instruction mnemonic suffix given and no register operands; can't size instruction"));
2536 return 0;
2539 else
2541 unsigned int suffixes = ~i.tm.opcode_modifier
2542 & (No_bSuf
2543 | No_wSuf
2544 | No_lSuf
2545 | No_sSuf
2546 | No_xSuf
2547 | No_qSuf);
2549 if ((i.tm.opcode_modifier & W)
2550 || ((suffixes & (suffixes - 1))
2551 && !(i.tm.opcode_modifier & (DefaultSize | IgnoreSize))))
2553 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
2554 return 0;
2559 /* Change the opcode based on the operand size given by i.suffix;
2560 We don't need to change things for byte insns. */
2562 if (i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
2564 /* It's not a byte, select word/dword operation. */
2565 if (i.tm.opcode_modifier & W)
2567 if (i.tm.opcode_modifier & ShortForm)
2568 i.tm.base_opcode |= 8;
2569 else
2570 i.tm.base_opcode |= 1;
2573 /* Now select between word & dword operations via the operand
2574 size prefix, except for instructions that will ignore this
2575 prefix anyway. */
2576 if (i.tm.base_opcode == 0x0f01 && i.tm.extension_opcode == 0xc8)
2578 /* monitor in SSE3 is a very special case. The default size
2579 of AX is the size of mode. The address size override
2580 prefix will change the size of AX. */
2581 if (i.op->regs[0].reg_type &
2582 (flag_code == CODE_32BIT ? Reg16 : Reg32))
2583 if (!add_prefix (ADDR_PREFIX_OPCODE))
2584 return 0;
2586 else if (i.suffix != QWORD_MNEM_SUFFIX
2587 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
2588 && !(i.tm.opcode_modifier & (IgnoreSize | FloatMF))
2589 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
2590 || (flag_code == CODE_64BIT
2591 && (i.tm.opcode_modifier & JumpByte))))
2593 unsigned int prefix = DATA_PREFIX_OPCODE;
2595 if (i.tm.opcode_modifier & JumpByte) /* jcxz, loop */
2596 prefix = ADDR_PREFIX_OPCODE;
2598 if (!add_prefix (prefix))
2599 return 0;
2602 /* Set mode64 for an operand. */
2603 if (i.suffix == QWORD_MNEM_SUFFIX
2604 && flag_code == CODE_64BIT
2605 && (i.tm.opcode_modifier & NoRex64) == 0)
2606 i.rex |= REX_MODE64;
2608 /* Size floating point instruction. */
2609 if (i.suffix == LONG_MNEM_SUFFIX)
2610 if (i.tm.opcode_modifier & FloatMF)
2611 i.tm.base_opcode ^= 4;
2614 return 1;
2617 static int
2618 check_byte_reg (void)
2620 int op;
2622 for (op = i.operands; --op >= 0;)
2624 /* If this is an eight bit register, it's OK. If it's the 16 or
2625 32 bit version of an eight bit register, we will just use the
2626 low portion, and that's OK too. */
2627 if (i.types[op] & Reg8)
2628 continue;
2630 /* movzx and movsx should not generate this warning. */
2631 if (intel_syntax
2632 && (i.tm.base_opcode == 0xfb7
2633 || i.tm.base_opcode == 0xfb6
2634 || i.tm.base_opcode == 0x63
2635 || i.tm.base_opcode == 0xfbe
2636 || i.tm.base_opcode == 0xfbf))
2637 continue;
2639 if ((i.types[op] & WordReg) && i.op[op].regs->reg_num < 4)
2641 /* Prohibit these changes in the 64bit mode, since the
2642 lowering is more complicated. */
2643 if (flag_code == CODE_64BIT
2644 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2646 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2647 i.op[op].regs->reg_name,
2648 i.suffix);
2649 return 0;
2651 #if REGISTER_WARNINGS
2652 if (!quiet_warnings
2653 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2654 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2655 (i.op[op].regs + (i.types[op] & Reg16
2656 ? REGNAM_AL - REGNAM_AX
2657 : REGNAM_AL - REGNAM_EAX))->reg_name,
2658 i.op[op].regs->reg_name,
2659 i.suffix);
2660 #endif
2661 continue;
2663 /* Any other register is bad. */
2664 if (i.types[op] & (Reg | RegMMX | RegXMM
2665 | SReg2 | SReg3
2666 | Control | Debug | Test
2667 | FloatReg | FloatAcc))
2669 as_bad (_("`%%%s' not allowed with `%s%c'"),
2670 i.op[op].regs->reg_name,
2671 i.tm.name,
2672 i.suffix);
2673 return 0;
2676 return 1;
2679 static int
2680 check_long_reg ()
2682 int op;
2684 for (op = i.operands; --op >= 0;)
2685 /* Reject eight bit registers, except where the template requires
2686 them. (eg. movzb) */
2687 if ((i.types[op] & Reg8) != 0
2688 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2690 as_bad (_("`%%%s' not allowed with `%s%c'"),
2691 i.op[op].regs->reg_name,
2692 i.tm.name,
2693 i.suffix);
2694 return 0;
2696 /* Warn if the e prefix on a general reg is missing. */
2697 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2698 && (i.types[op] & Reg16) != 0
2699 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2701 /* Prohibit these changes in the 64bit mode, since the
2702 lowering is more complicated. */
2703 if (flag_code == CODE_64BIT)
2705 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2706 i.op[op].regs->reg_name,
2707 i.suffix);
2708 return 0;
2710 #if REGISTER_WARNINGS
2711 else
2712 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2713 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
2714 i.op[op].regs->reg_name,
2715 i.suffix);
2716 #endif
2718 /* Warn if the r prefix on a general reg is missing. */
2719 else if ((i.types[op] & Reg64) != 0
2720 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2722 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2723 i.op[op].regs->reg_name,
2724 i.suffix);
2725 return 0;
2727 return 1;
2730 static int
2731 check_qword_reg ()
2733 int op;
2735 for (op = i.operands; --op >= 0; )
2736 /* Reject eight bit registers, except where the template requires
2737 them. (eg. movzb) */
2738 if ((i.types[op] & Reg8) != 0
2739 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2741 as_bad (_("`%%%s' not allowed with `%s%c'"),
2742 i.op[op].regs->reg_name,
2743 i.tm.name,
2744 i.suffix);
2745 return 0;
2747 /* Warn if the e prefix on a general reg is missing. */
2748 else if (((i.types[op] & Reg16) != 0
2749 || (i.types[op] & Reg32) != 0)
2750 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2752 /* Prohibit these changes in the 64bit mode, since the
2753 lowering is more complicated. */
2754 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2755 i.op[op].regs->reg_name,
2756 i.suffix);
2757 return 0;
2759 return 1;
2762 static int
2763 check_word_reg ()
2765 int op;
2766 for (op = i.operands; --op >= 0;)
2767 /* Reject eight bit registers, except where the template requires
2768 them. (eg. movzb) */
2769 if ((i.types[op] & Reg8) != 0
2770 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2772 as_bad (_("`%%%s' not allowed with `%s%c'"),
2773 i.op[op].regs->reg_name,
2774 i.tm.name,
2775 i.suffix);
2776 return 0;
2778 /* Warn if the e prefix on a general reg is present. */
2779 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2780 && (i.types[op] & Reg32) != 0
2781 && (i.tm.operand_types[op] & (Reg16 | Acc)) != 0)
2783 /* Prohibit these changes in the 64bit mode, since the
2784 lowering is more complicated. */
2785 if (flag_code == CODE_64BIT)
2787 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2788 i.op[op].regs->reg_name,
2789 i.suffix);
2790 return 0;
2792 else
2793 #if REGISTER_WARNINGS
2794 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2795 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
2796 i.op[op].regs->reg_name,
2797 i.suffix);
2798 #endif
2800 return 1;
2803 static int
2804 finalize_imm ()
2806 unsigned int overlap0, overlap1, overlap2;
2808 overlap0 = i.types[0] & i.tm.operand_types[0];
2809 if ((overlap0 & (Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64))
2810 && overlap0 != Imm8 && overlap0 != Imm8S
2811 && overlap0 != Imm16 && overlap0 != Imm32S
2812 && overlap0 != Imm32 && overlap0 != Imm64)
2814 if (i.suffix)
2816 overlap0 &= (i.suffix == BYTE_MNEM_SUFFIX
2817 ? Imm8 | Imm8S
2818 : (i.suffix == WORD_MNEM_SUFFIX
2819 ? Imm16
2820 : (i.suffix == QWORD_MNEM_SUFFIX
2821 ? Imm64 | Imm32S
2822 : Imm32)));
2824 else if (overlap0 == (Imm16 | Imm32S | Imm32)
2825 || overlap0 == (Imm16 | Imm32)
2826 || overlap0 == (Imm16 | Imm32S))
2828 overlap0 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2829 ? Imm16 : Imm32S);
2831 if (overlap0 != Imm8 && overlap0 != Imm8S
2832 && overlap0 != Imm16 && overlap0 != Imm32S
2833 && overlap0 != Imm32 && overlap0 != Imm64)
2835 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size"));
2836 return 0;
2839 i.types[0] = overlap0;
2841 overlap1 = i.types[1] & i.tm.operand_types[1];
2842 if ((overlap1 & (Imm8 | Imm8S | Imm16 | Imm32S | Imm32 | Imm64))
2843 && overlap1 != Imm8 && overlap1 != Imm8S
2844 && overlap1 != Imm16 && overlap1 != Imm32S
2845 && overlap1 != Imm32 && overlap1 != Imm64)
2847 if (i.suffix)
2849 overlap1 &= (i.suffix == BYTE_MNEM_SUFFIX
2850 ? Imm8 | Imm8S
2851 : (i.suffix == WORD_MNEM_SUFFIX
2852 ? Imm16
2853 : (i.suffix == QWORD_MNEM_SUFFIX
2854 ? Imm64 | Imm32S
2855 : Imm32)));
2857 else if (overlap1 == (Imm16 | Imm32 | Imm32S)
2858 || overlap1 == (Imm16 | Imm32)
2859 || overlap1 == (Imm16 | Imm32S))
2861 overlap1 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2862 ? Imm16 : Imm32S);
2864 if (overlap1 != Imm8 && overlap1 != Imm8S
2865 && overlap1 != Imm16 && overlap1 != Imm32S
2866 && overlap1 != Imm32 && overlap1 != Imm64)
2868 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size %x %c"),overlap1, i.suffix);
2869 return 0;
2872 i.types[1] = overlap1;
2874 overlap2 = i.types[2] & i.tm.operand_types[2];
2875 assert ((overlap2 & Imm) == 0);
2876 i.types[2] = overlap2;
2878 return 1;
2881 static int
2882 process_operands ()
2884 /* Default segment register this instruction will use for memory
2885 accesses. 0 means unknown. This is only for optimizing out
2886 unnecessary segment overrides. */
2887 const seg_entry *default_seg = 0;
2889 /* The imul $imm, %reg instruction is converted into
2890 imul $imm, %reg, %reg, and the clr %reg instruction
2891 is converted into xor %reg, %reg. */
2892 if (i.tm.opcode_modifier & regKludge)
2894 unsigned int first_reg_op = (i.types[0] & Reg) ? 0 : 1;
2895 /* Pretend we saw the extra register operand. */
2896 assert (i.op[first_reg_op + 1].regs == 0);
2897 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
2898 i.types[first_reg_op + 1] = i.types[first_reg_op];
2899 i.reg_operands = 2;
2902 if (i.tm.opcode_modifier & ShortForm)
2904 /* The register or float register operand is in operand 0 or 1. */
2905 unsigned int op = (i.types[0] & (Reg | FloatReg)) ? 0 : 1;
2906 /* Register goes in low 3 bits of opcode. */
2907 i.tm.base_opcode |= i.op[op].regs->reg_num;
2908 if ((i.op[op].regs->reg_flags & RegRex) != 0)
2909 i.rex |= REX_EXTZ;
2910 if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
2912 /* Warn about some common errors, but press on regardless.
2913 The first case can be generated by gcc (<= 2.8.1). */
2914 if (i.operands == 2)
2916 /* Reversed arguments on faddp, fsubp, etc. */
2917 as_warn (_("translating to `%s %%%s,%%%s'"), i.tm.name,
2918 i.op[1].regs->reg_name,
2919 i.op[0].regs->reg_name);
2921 else
2923 /* Extraneous `l' suffix on fp insn. */
2924 as_warn (_("translating to `%s %%%s'"), i.tm.name,
2925 i.op[0].regs->reg_name);
2929 else if (i.tm.opcode_modifier & Modrm)
2931 /* The opcode is completed (modulo i.tm.extension_opcode which
2932 must be put into the modrm byte). Now, we make the modrm and
2933 index base bytes based on all the info we've collected. */
2935 default_seg = build_modrm_byte ();
2937 else if (i.tm.opcode_modifier & (Seg2ShortForm | Seg3ShortForm))
2939 if (i.tm.base_opcode == POP_SEG_SHORT
2940 && i.op[0].regs->reg_num == 1)
2942 as_bad (_("you can't `pop %%cs'"));
2943 return 0;
2945 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
2946 if ((i.op[0].regs->reg_flags & RegRex) != 0)
2947 i.rex |= REX_EXTZ;
2949 else if ((i.tm.base_opcode & ~(D | W)) == MOV_AX_DISP32)
2951 default_seg = &ds;
2953 else if ((i.tm.opcode_modifier & IsString) != 0)
2955 /* For the string instructions that allow a segment override
2956 on one of their operands, the default segment is ds. */
2957 default_seg = &ds;
2960 if ((i.tm.base_opcode == 0x8d /* lea */
2961 || (i.tm.cpu_flags & CpuSVME))
2962 && i.seg[0] && !quiet_warnings)
2963 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
2965 /* If a segment was explicitly specified, and the specified segment
2966 is not the default, use an opcode prefix to select it. If we
2967 never figured out what the default segment is, then default_seg
2968 will be zero at this point, and the specified segment prefix will
2969 always be used. */
2970 if ((i.seg[0]) && (i.seg[0] != default_seg))
2972 if (!add_prefix (i.seg[0]->seg_prefix))
2973 return 0;
2975 return 1;
2978 static const seg_entry *
2979 build_modrm_byte ()
2981 const seg_entry *default_seg = 0;
2983 /* i.reg_operands MUST be the number of real register operands;
2984 implicit registers do not count. */
2985 if (i.reg_operands == 2)
2987 unsigned int source, dest;
2988 source = ((i.types[0]
2989 & (Reg | RegMMX | RegXMM
2990 | SReg2 | SReg3
2991 | Control | Debug | Test))
2992 ? 0 : 1);
2993 dest = source + 1;
2995 i.rm.mode = 3;
2996 /* One of the register operands will be encoded in the i.tm.reg
2997 field, the other in the combined i.tm.mode and i.tm.regmem
2998 fields. If no form of this instruction supports a memory
2999 destination operand, then we assume the source operand may
3000 sometimes be a memory operand and so we need to store the
3001 destination in the i.rm.reg field. */
3002 if ((i.tm.operand_types[dest] & AnyMem) == 0)
3004 i.rm.reg = i.op[dest].regs->reg_num;
3005 i.rm.regmem = i.op[source].regs->reg_num;
3006 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3007 i.rex |= REX_EXTX;
3008 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3009 i.rex |= REX_EXTZ;
3011 else
3013 i.rm.reg = i.op[source].regs->reg_num;
3014 i.rm.regmem = i.op[dest].regs->reg_num;
3015 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3016 i.rex |= REX_EXTZ;
3017 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3018 i.rex |= REX_EXTX;
3020 if (flag_code != CODE_64BIT && (i.rex & (REX_EXTX | REX_EXTZ)))
3022 if (!((i.types[0] | i.types[1]) & Control))
3023 abort ();
3024 i.rex &= ~(REX_EXTX | REX_EXTZ);
3025 add_prefix (LOCK_PREFIX_OPCODE);
3028 else
3029 { /* If it's not 2 reg operands... */
3030 if (i.mem_operands)
3032 unsigned int fake_zero_displacement = 0;
3033 unsigned int op = ((i.types[0] & AnyMem)
3035 : (i.types[1] & AnyMem) ? 1 : 2);
3037 default_seg = &ds;
3039 if (i.base_reg == 0)
3041 i.rm.mode = 0;
3042 if (!i.disp_operands)
3043 fake_zero_displacement = 1;
3044 if (i.index_reg == 0)
3046 /* Operand is just <disp> */
3047 if (flag_code == CODE_64BIT)
3049 /* 64bit mode overwrites the 32bit absolute
3050 addressing by RIP relative addressing and
3051 absolute addressing is encoded by one of the
3052 redundant SIB forms. */
3053 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3054 i.sib.base = NO_BASE_REGISTER;
3055 i.sib.index = NO_INDEX_REGISTER;
3056 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0) ? Disp32S : Disp32);
3058 else if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
3060 i.rm.regmem = NO_BASE_REGISTER_16;
3061 i.types[op] = Disp16;
3063 else
3065 i.rm.regmem = NO_BASE_REGISTER;
3066 i.types[op] = Disp32;
3069 else /* !i.base_reg && i.index_reg */
3071 i.sib.index = i.index_reg->reg_num;
3072 i.sib.base = NO_BASE_REGISTER;
3073 i.sib.scale = i.log2_scale_factor;
3074 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3075 i.types[op] &= ~Disp;
3076 if (flag_code != CODE_64BIT)
3077 i.types[op] |= Disp32; /* Must be 32 bit */
3078 else
3079 i.types[op] |= Disp32S;
3080 if ((i.index_reg->reg_flags & RegRex) != 0)
3081 i.rex |= REX_EXTY;
3084 /* RIP addressing for 64bit mode. */
3085 else if (i.base_reg->reg_type == BaseIndex)
3087 i.rm.regmem = NO_BASE_REGISTER;
3088 i.types[op] &= ~ Disp;
3089 i.types[op] |= Disp32S;
3090 i.flags[op] = Operand_PCrel;
3091 if (! i.disp_operands)
3092 fake_zero_displacement = 1;
3094 else if (i.base_reg->reg_type & Reg16)
3096 switch (i.base_reg->reg_num)
3098 case 3: /* (%bx) */
3099 if (i.index_reg == 0)
3100 i.rm.regmem = 7;
3101 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
3102 i.rm.regmem = i.index_reg->reg_num - 6;
3103 break;
3104 case 5: /* (%bp) */
3105 default_seg = &ss;
3106 if (i.index_reg == 0)
3108 i.rm.regmem = 6;
3109 if ((i.types[op] & Disp) == 0)
3111 /* fake (%bp) into 0(%bp) */
3112 i.types[op] |= Disp8;
3113 fake_zero_displacement = 1;
3116 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
3117 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
3118 break;
3119 default: /* (%si) -> 4 or (%di) -> 5 */
3120 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
3122 i.rm.mode = mode_from_disp_size (i.types[op]);
3124 else /* i.base_reg and 32/64 bit mode */
3126 if (flag_code == CODE_64BIT
3127 && (i.types[op] & Disp))
3128 i.types[op] = (i.types[op] & Disp8) | (i.prefix[ADDR_PREFIX] == 0 ? Disp32S : Disp32);
3130 i.rm.regmem = i.base_reg->reg_num;
3131 if ((i.base_reg->reg_flags & RegRex) != 0)
3132 i.rex |= REX_EXTZ;
3133 i.sib.base = i.base_reg->reg_num;
3134 /* x86-64 ignores REX prefix bit here to avoid decoder
3135 complications. */
3136 if ((i.base_reg->reg_num & 7) == EBP_REG_NUM)
3138 default_seg = &ss;
3139 if (i.disp_operands == 0)
3141 fake_zero_displacement = 1;
3142 i.types[op] |= Disp8;
3145 else if (i.base_reg->reg_num == ESP_REG_NUM)
3147 default_seg = &ss;
3149 i.sib.scale = i.log2_scale_factor;
3150 if (i.index_reg == 0)
3152 /* <disp>(%esp) becomes two byte modrm with no index
3153 register. We've already stored the code for esp
3154 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
3155 Any base register besides %esp will not use the
3156 extra modrm byte. */
3157 i.sib.index = NO_INDEX_REGISTER;
3158 #if !SCALE1_WHEN_NO_INDEX
3159 /* Another case where we force the second modrm byte. */
3160 if (i.log2_scale_factor)
3161 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3162 #endif
3164 else
3166 i.sib.index = i.index_reg->reg_num;
3167 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3168 if ((i.index_reg->reg_flags & RegRex) != 0)
3169 i.rex |= REX_EXTY;
3172 if (i.disp_operands
3173 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
3174 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
3175 i.rm.mode = 0;
3176 else
3177 i.rm.mode = mode_from_disp_size (i.types[op]);
3180 if (fake_zero_displacement)
3182 /* Fakes a zero displacement assuming that i.types[op]
3183 holds the correct displacement size. */
3184 expressionS *exp;
3186 assert (i.op[op].disps == 0);
3187 exp = &disp_expressions[i.disp_operands++];
3188 i.op[op].disps = exp;
3189 exp->X_op = O_constant;
3190 exp->X_add_number = 0;
3191 exp->X_add_symbol = (symbolS *) 0;
3192 exp->X_op_symbol = (symbolS *) 0;
3196 /* Fill in i.rm.reg or i.rm.regmem field with register operand
3197 (if any) based on i.tm.extension_opcode. Again, we must be
3198 careful to make sure that segment/control/debug/test/MMX
3199 registers are coded into the i.rm.reg field. */
3200 if (i.reg_operands)
3202 unsigned int op =
3203 ((i.types[0]
3204 & (Reg | RegMMX | RegXMM
3205 | SReg2 | SReg3
3206 | Control | Debug | Test))
3208 : ((i.types[1]
3209 & (Reg | RegMMX | RegXMM
3210 | SReg2 | SReg3
3211 | Control | Debug | Test))
3213 : 2));
3214 /* If there is an extension opcode to put here, the register
3215 number must be put into the regmem field. */
3216 if (i.tm.extension_opcode != None)
3218 i.rm.regmem = i.op[op].regs->reg_num;
3219 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3220 i.rex |= REX_EXTZ;
3222 else
3224 i.rm.reg = i.op[op].regs->reg_num;
3225 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3226 i.rex |= REX_EXTX;
3229 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
3230 must set it to 3 to indicate this is a register operand
3231 in the regmem field. */
3232 if (!i.mem_operands)
3233 i.rm.mode = 3;
3236 /* Fill in i.rm.reg field with extension opcode (if any). */
3237 if (i.tm.extension_opcode != None)
3238 i.rm.reg = i.tm.extension_opcode;
3240 return default_seg;
3243 static void
3244 output_branch ()
3246 char *p;
3247 int code16;
3248 int prefix;
3249 relax_substateT subtype;
3250 symbolS *sym;
3251 offsetT off;
3253 code16 = 0;
3254 if (flag_code == CODE_16BIT)
3255 code16 = CODE16;
3257 prefix = 0;
3258 if (i.prefix[DATA_PREFIX] != 0)
3260 prefix = 1;
3261 i.prefixes -= 1;
3262 code16 ^= CODE16;
3264 /* Pentium4 branch hints. */
3265 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3266 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3268 prefix++;
3269 i.prefixes--;
3271 if (i.prefix[REX_PREFIX] != 0)
3273 prefix++;
3274 i.prefixes--;
3277 if (i.prefixes != 0 && !intel_syntax)
3278 as_warn (_("skipping prefixes on this instruction"));
3280 /* It's always a symbol; End frag & setup for relax.
3281 Make sure there is enough room in this frag for the largest
3282 instruction we may generate in md_convert_frag. This is 2
3283 bytes for the opcode and room for the prefix and largest
3284 displacement. */
3285 frag_grow (prefix + 2 + 4);
3286 /* Prefix and 1 opcode byte go in fr_fix. */
3287 p = frag_more (prefix + 1);
3288 if (i.prefix[DATA_PREFIX] != 0)
3289 *p++ = DATA_PREFIX_OPCODE;
3290 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
3291 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
3292 *p++ = i.prefix[SEG_PREFIX];
3293 if (i.prefix[REX_PREFIX] != 0)
3294 *p++ = i.prefix[REX_PREFIX];
3295 *p = i.tm.base_opcode;
3297 if ((unsigned char) *p == JUMP_PC_RELATIVE)
3298 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, SMALL);
3299 else if ((cpu_arch_flags & Cpu386) != 0)
3300 subtype = ENCODE_RELAX_STATE (COND_JUMP, SMALL);
3301 else
3302 subtype = ENCODE_RELAX_STATE (COND_JUMP86, SMALL);
3303 subtype |= code16;
3305 sym = i.op[0].disps->X_add_symbol;
3306 off = i.op[0].disps->X_add_number;
3308 if (i.op[0].disps->X_op != O_constant
3309 && i.op[0].disps->X_op != O_symbol)
3311 /* Handle complex expressions. */
3312 sym = make_expr_symbol (i.op[0].disps);
3313 off = 0;
3316 /* 1 possible extra opcode + 4 byte displacement go in var part.
3317 Pass reloc in fr_var. */
3318 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
3321 static void
3322 output_jump ()
3324 char *p;
3325 int size;
3326 fixS *fixP;
3328 if (i.tm.opcode_modifier & JumpByte)
3330 /* This is a loop or jecxz type instruction. */
3331 size = 1;
3332 if (i.prefix[ADDR_PREFIX] != 0)
3334 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
3335 i.prefixes -= 1;
3337 /* Pentium4 branch hints. */
3338 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3339 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3341 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
3342 i.prefixes--;
3345 else
3347 int code16;
3349 code16 = 0;
3350 if (flag_code == CODE_16BIT)
3351 code16 = CODE16;
3353 if (i.prefix[DATA_PREFIX] != 0)
3355 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
3356 i.prefixes -= 1;
3357 code16 ^= CODE16;
3360 size = 4;
3361 if (code16)
3362 size = 2;
3365 if (i.prefix[REX_PREFIX] != 0)
3367 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
3368 i.prefixes -= 1;
3371 if (i.prefixes != 0 && !intel_syntax)
3372 as_warn (_("skipping prefixes on this instruction"));
3374 p = frag_more (1 + size);
3375 *p++ = i.tm.base_opcode;
3377 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3378 i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
3380 /* All jumps handled here are signed, but don't use a signed limit
3381 check for 32 and 16 bit jumps as we want to allow wrap around at
3382 4G and 64k respectively. */
3383 if (size == 1)
3384 fixP->fx_signed = 1;
3387 static void
3388 output_interseg_jump ()
3390 char *p;
3391 int size;
3392 int prefix;
3393 int code16;
3395 code16 = 0;
3396 if (flag_code == CODE_16BIT)
3397 code16 = CODE16;
3399 prefix = 0;
3400 if (i.prefix[DATA_PREFIX] != 0)
3402 prefix = 1;
3403 i.prefixes -= 1;
3404 code16 ^= CODE16;
3406 if (i.prefix[REX_PREFIX] != 0)
3408 prefix++;
3409 i.prefixes -= 1;
3412 size = 4;
3413 if (code16)
3414 size = 2;
3416 if (i.prefixes != 0 && !intel_syntax)
3417 as_warn (_("skipping prefixes on this instruction"));
3419 /* 1 opcode; 2 segment; offset */
3420 p = frag_more (prefix + 1 + 2 + size);
3422 if (i.prefix[DATA_PREFIX] != 0)
3423 *p++ = DATA_PREFIX_OPCODE;
3425 if (i.prefix[REX_PREFIX] != 0)
3426 *p++ = i.prefix[REX_PREFIX];
3428 *p++ = i.tm.base_opcode;
3429 if (i.op[1].imms->X_op == O_constant)
3431 offsetT n = i.op[1].imms->X_add_number;
3433 if (size == 2
3434 && !fits_in_unsigned_word (n)
3435 && !fits_in_signed_word (n))
3437 as_bad (_("16-bit jump out of range"));
3438 return;
3440 md_number_to_chars (p, n, size);
3442 else
3443 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3444 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
3445 if (i.op[0].imms->X_op != O_constant)
3446 as_bad (_("can't handle non absolute segment in `%s'"),
3447 i.tm.name);
3448 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
3451 static void
3452 output_insn ()
3454 fragS *insn_start_frag;
3455 offsetT insn_start_off;
3457 /* Tie dwarf2 debug info to the address at the start of the insn.
3458 We can't do this after the insn has been output as the current
3459 frag may have been closed off. eg. by frag_var. */
3460 dwarf2_emit_insn (0);
3462 insn_start_frag = frag_now;
3463 insn_start_off = frag_now_fix ();
3465 /* Output jumps. */
3466 if (i.tm.opcode_modifier & Jump)
3467 output_branch ();
3468 else if (i.tm.opcode_modifier & (JumpByte | JumpDword))
3469 output_jump ();
3470 else if (i.tm.opcode_modifier & JumpInterSegment)
3471 output_interseg_jump ();
3472 else
3474 /* Output normal instructions here. */
3475 char *p;
3476 unsigned char *q;
3478 /* All opcodes on i386 have either 1 or 2 bytes. We may use one
3479 more higher byte to specify a prefix the instruction
3480 requires. */
3481 if ((i.tm.base_opcode & 0xff0000) != 0)
3483 if ((i.tm.cpu_flags & CpuPadLock) != 0)
3485 unsigned int prefix;
3486 prefix = (i.tm.base_opcode >> 16) & 0xff;
3488 if (prefix != REPE_PREFIX_OPCODE
3489 || i.prefix[LOCKREP_PREFIX] != REPE_PREFIX_OPCODE)
3490 add_prefix (prefix);
3492 else
3493 add_prefix ((i.tm.base_opcode >> 16) & 0xff);
3496 /* The prefix bytes. */
3497 for (q = i.prefix;
3498 q < i.prefix + sizeof (i.prefix) / sizeof (i.prefix[0]);
3499 q++)
3501 if (*q)
3503 p = frag_more (1);
3504 md_number_to_chars (p, (valueT) *q, 1);
3508 /* Now the opcode; be careful about word order here! */
3509 if (fits_in_unsigned_byte (i.tm.base_opcode))
3511 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
3513 else
3515 p = frag_more (2);
3517 /* Put out high byte first: can't use md_number_to_chars! */
3518 *p++ = (i.tm.base_opcode >> 8) & 0xff;
3519 *p = i.tm.base_opcode & 0xff;
3522 /* Now the modrm byte and sib byte (if present). */
3523 if (i.tm.opcode_modifier & Modrm)
3525 p = frag_more (1);
3526 md_number_to_chars (p,
3527 (valueT) (i.rm.regmem << 0
3528 | i.rm.reg << 3
3529 | i.rm.mode << 6),
3531 /* If i.rm.regmem == ESP (4)
3532 && i.rm.mode != (Register mode)
3533 && not 16 bit
3534 ==> need second modrm byte. */
3535 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
3536 && i.rm.mode != 3
3537 && !(i.base_reg && (i.base_reg->reg_type & Reg16) != 0))
3539 p = frag_more (1);
3540 md_number_to_chars (p,
3541 (valueT) (i.sib.base << 0
3542 | i.sib.index << 3
3543 | i.sib.scale << 6),
3548 if (i.disp_operands)
3549 output_disp (insn_start_frag, insn_start_off);
3551 if (i.imm_operands)
3552 output_imm (insn_start_frag, insn_start_off);
3555 #ifdef DEBUG386
3556 if (flag_debug)
3558 pi (line, &i);
3560 #endif /* DEBUG386 */
3563 static void
3564 output_disp (insn_start_frag, insn_start_off)
3565 fragS *insn_start_frag;
3566 offsetT insn_start_off;
3568 char *p;
3569 unsigned int n;
3571 for (n = 0; n < i.operands; n++)
3573 if (i.types[n] & Disp)
3575 if (i.op[n].disps->X_op == O_constant)
3577 int size;
3578 offsetT val;
3580 size = 4;
3581 if (i.types[n] & (Disp8 | Disp16 | Disp64))
3583 size = 2;
3584 if (i.types[n] & Disp8)
3585 size = 1;
3586 if (i.types[n] & Disp64)
3587 size = 8;
3589 val = offset_in_range (i.op[n].disps->X_add_number,
3590 size);
3591 p = frag_more (size);
3592 md_number_to_chars (p, val, size);
3594 else
3596 enum bfd_reloc_code_real reloc_type;
3597 int size = 4;
3598 int sign = 0;
3599 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
3601 /* The PC relative address is computed relative
3602 to the instruction boundary, so in case immediate
3603 fields follows, we need to adjust the value. */
3604 if (pcrel && i.imm_operands)
3606 int imm_size = 4;
3607 unsigned int n1;
3609 for (n1 = 0; n1 < i.operands; n1++)
3610 if (i.types[n1] & Imm)
3612 if (i.types[n1] & (Imm8 | Imm8S | Imm16 | Imm64))
3614 imm_size = 2;
3615 if (i.types[n1] & (Imm8 | Imm8S))
3616 imm_size = 1;
3617 if (i.types[n1] & Imm64)
3618 imm_size = 8;
3620 break;
3622 /* We should find the immediate. */
3623 if (n1 == i.operands)
3624 abort ();
3625 i.op[n].disps->X_add_number -= imm_size;
3628 if (i.types[n] & Disp32S)
3629 sign = 1;
3631 if (i.types[n] & (Disp16 | Disp64))
3633 size = 2;
3634 if (i.types[n] & Disp64)
3635 size = 8;
3638 p = frag_more (size);
3639 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
3640 if (GOT_symbol
3641 && GOT_symbol == i.op[n].disps->X_add_symbol
3642 && (((reloc_type == BFD_RELOC_32
3643 || reloc_type == BFD_RELOC_X86_64_32S)
3644 && (i.op[n].disps->X_op == O_symbol
3645 || (i.op[n].disps->X_op == O_add
3646 && ((symbol_get_value_expression
3647 (i.op[n].disps->X_op_symbol)->X_op)
3648 == O_subtract))))
3649 || reloc_type == BFD_RELOC_32_PCREL))
3651 offsetT add;
3653 if (insn_start_frag == frag_now)
3654 add = (p - frag_now->fr_literal) - insn_start_off;
3655 else
3657 fragS *fr;
3659 add = insn_start_frag->fr_fix - insn_start_off;
3660 for (fr = insn_start_frag->fr_next;
3661 fr && fr != frag_now; fr = fr->fr_next)
3662 add += fr->fr_fix;
3663 add += p - frag_now->fr_literal;
3666 if (!object_64bit)
3667 reloc_type = BFD_RELOC_386_GOTPC;
3668 else
3669 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3670 i.op[n].disps->X_add_number += add;
3672 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3673 i.op[n].disps, pcrel, reloc_type);
3679 static void
3680 output_imm (insn_start_frag, insn_start_off)
3681 fragS *insn_start_frag;
3682 offsetT insn_start_off;
3684 char *p;
3685 unsigned int n;
3687 for (n = 0; n < i.operands; n++)
3689 if (i.types[n] & Imm)
3691 if (i.op[n].imms->X_op == O_constant)
3693 int size;
3694 offsetT val;
3696 size = 4;
3697 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3699 size = 2;
3700 if (i.types[n] & (Imm8 | Imm8S))
3701 size = 1;
3702 else if (i.types[n] & Imm64)
3703 size = 8;
3705 val = offset_in_range (i.op[n].imms->X_add_number,
3706 size);
3707 p = frag_more (size);
3708 md_number_to_chars (p, val, size);
3710 else
3712 /* Not absolute_section.
3713 Need a 32-bit fixup (don't support 8bit
3714 non-absolute imms). Try to support other
3715 sizes ... */
3716 enum bfd_reloc_code_real reloc_type;
3717 int size = 4;
3718 int sign = 0;
3720 if ((i.types[n] & (Imm32S))
3721 && (i.suffix == QWORD_MNEM_SUFFIX
3722 || (!i.suffix && (i.tm.opcode_modifier & No_lSuf))))
3723 sign = 1;
3724 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3726 size = 2;
3727 if (i.types[n] & (Imm8 | Imm8S))
3728 size = 1;
3729 if (i.types[n] & Imm64)
3730 size = 8;
3733 p = frag_more (size);
3734 reloc_type = reloc (size, 0, sign, i.reloc[n]);
3736 /* This is tough to explain. We end up with this one if we
3737 * have operands that look like
3738 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
3739 * obtain the absolute address of the GOT, and it is strongly
3740 * preferable from a performance point of view to avoid using
3741 * a runtime relocation for this. The actual sequence of
3742 * instructions often look something like:
3744 * call .L66
3745 * .L66:
3746 * popl %ebx
3747 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
3749 * The call and pop essentially return the absolute address
3750 * of the label .L66 and store it in %ebx. The linker itself
3751 * will ultimately change the first operand of the addl so
3752 * that %ebx points to the GOT, but to keep things simple, the
3753 * .o file must have this operand set so that it generates not
3754 * the absolute address of .L66, but the absolute address of
3755 * itself. This allows the linker itself simply treat a GOTPC
3756 * relocation as asking for a pcrel offset to the GOT to be
3757 * added in, and the addend of the relocation is stored in the
3758 * operand field for the instruction itself.
3760 * Our job here is to fix the operand so that it would add
3761 * the correct offset so that %ebx would point to itself. The
3762 * thing that is tricky is that .-.L66 will point to the
3763 * beginning of the instruction, so we need to further modify
3764 * the operand so that it will point to itself. There are
3765 * other cases where you have something like:
3767 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
3769 * and here no correction would be required. Internally in
3770 * the assembler we treat operands of this form as not being
3771 * pcrel since the '.' is explicitly mentioned, and I wonder
3772 * whether it would simplify matters to do it this way. Who
3773 * knows. In earlier versions of the PIC patches, the
3774 * pcrel_adjust field was used to store the correction, but
3775 * since the expression is not pcrel, I felt it would be
3776 * confusing to do it this way. */
3778 if ((reloc_type == BFD_RELOC_32
3779 || reloc_type == BFD_RELOC_X86_64_32S)
3780 && GOT_symbol
3781 && GOT_symbol == i.op[n].imms->X_add_symbol
3782 && (i.op[n].imms->X_op == O_symbol
3783 || (i.op[n].imms->X_op == O_add
3784 && ((symbol_get_value_expression
3785 (i.op[n].imms->X_op_symbol)->X_op)
3786 == O_subtract))))
3788 offsetT add;
3790 if (insn_start_frag == frag_now)
3791 add = (p - frag_now->fr_literal) - insn_start_off;
3792 else
3794 fragS *fr;
3796 add = insn_start_frag->fr_fix - insn_start_off;
3797 for (fr = insn_start_frag->fr_next;
3798 fr && fr != frag_now; fr = fr->fr_next)
3799 add += fr->fr_fix;
3800 add += p - frag_now->fr_literal;
3803 if (!object_64bit)
3804 reloc_type = BFD_RELOC_386_GOTPC;
3805 else
3806 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3807 i.op[n].imms->X_add_number += add;
3809 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3810 i.op[n].imms, 0, reloc_type);
3816 /* x86_cons_fix_new is called via the expression parsing code when a
3817 reloc is needed. We use this hook to get the correct .got reloc. */
3818 static enum bfd_reloc_code_real got_reloc = NO_RELOC;
3819 static int cons_sign = -1;
3821 void
3822 x86_cons_fix_new (fragS *frag,
3823 unsigned int off,
3824 unsigned int len,
3825 expressionS *exp)
3827 enum bfd_reloc_code_real r = reloc (len, 0, cons_sign, got_reloc);
3829 got_reloc = NO_RELOC;
3831 #ifdef TE_PE
3832 if (exp->X_op == O_secrel)
3834 exp->X_op = O_symbol;
3835 r = BFD_RELOC_32_SECREL;
3837 #endif
3839 fix_new_exp (frag, off, len, exp, 0, r);
3842 #if (!defined (OBJ_ELF) && !defined (OBJ_MAYBE_ELF)) || defined (LEX_AT)
3843 # define lex_got(reloc, adjust, types) NULL
3844 #else
3845 /* Parse operands of the form
3846 <symbol>@GOTOFF+<nnn>
3847 and similar .plt or .got references.
3849 If we find one, set up the correct relocation in RELOC and copy the
3850 input string, minus the `@GOTOFF' into a malloc'd buffer for
3851 parsing by the calling routine. Return this buffer, and if ADJUST
3852 is non-null set it to the length of the string we removed from the
3853 input line. Otherwise return NULL. */
3854 static char *
3855 lex_got (enum bfd_reloc_code_real *reloc,
3856 int *adjust,
3857 unsigned int *types)
3859 static const struct {
3860 const char *str;
3861 const enum bfd_reloc_code_real rel[2];
3862 const unsigned int types64;
3863 } gotrel[] = {
3864 { "PLT", { BFD_RELOC_386_PLT32, BFD_RELOC_X86_64_PLT32 }, Imm32|Imm32S|Disp32 },
3865 { "GOTOFF", { BFD_RELOC_386_GOTOFF, BFD_RELOC_X86_64_GOTOFF64 }, Imm64|Disp64 },
3866 { "GOTPCREL", { 0, BFD_RELOC_X86_64_GOTPCREL }, Imm32|Imm32S|Disp32 },
3867 { "TLSGD", { BFD_RELOC_386_TLS_GD, BFD_RELOC_X86_64_TLSGD }, Imm32|Imm32S|Disp32 },
3868 { "TLSLDM", { BFD_RELOC_386_TLS_LDM, 0 }, 0 },
3869 { "TLSLD", { 0, BFD_RELOC_X86_64_TLSLD }, Imm32|Imm32S|Disp32 },
3870 { "GOTTPOFF", { BFD_RELOC_386_TLS_IE_32, BFD_RELOC_X86_64_GOTTPOFF }, Imm32|Imm32S|Disp32 },
3871 { "TPOFF", { BFD_RELOC_386_TLS_LE_32, BFD_RELOC_X86_64_TPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3872 { "NTPOFF", { BFD_RELOC_386_TLS_LE, 0 }, 0 },
3873 { "DTPOFF", { BFD_RELOC_386_TLS_LDO_32, BFD_RELOC_X86_64_DTPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3874 { "GOTNTPOFF",{ BFD_RELOC_386_TLS_GOTIE, 0 }, 0 },
3875 { "INDNTPOFF",{ BFD_RELOC_386_TLS_IE, 0 }, 0 },
3876 { "GOT", { BFD_RELOC_386_GOT32, BFD_RELOC_X86_64_GOT32 }, Imm32|Imm32S|Disp32 },
3877 { "TLSDESC", { BFD_RELOC_386_TLS_GOTDESC, BFD_RELOC_X86_64_GOTPC32_TLSDESC }, Imm32|Imm32S|Disp32 },
3878 { "TLSCALL", { BFD_RELOC_386_TLS_DESC_CALL, BFD_RELOC_X86_64_TLSDESC_CALL }, Imm32|Imm32S|Disp32 }
3880 char *cp;
3881 unsigned int j;
3883 if (!IS_ELF)
3884 return NULL;
3886 for (cp = input_line_pointer; *cp != '@'; cp++)
3887 if (is_end_of_line[(unsigned char) *cp])
3888 return NULL;
3890 for (j = 0; j < sizeof (gotrel) / sizeof (gotrel[0]); j++)
3892 int len;
3894 len = strlen (gotrel[j].str);
3895 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
3897 if (gotrel[j].rel[object_64bit] != 0)
3899 int first, second;
3900 char *tmpbuf, *past_reloc;
3902 *reloc = gotrel[j].rel[object_64bit];
3903 if (adjust)
3904 *adjust = len;
3906 if (types)
3908 if (flag_code != CODE_64BIT)
3909 *types = Imm32|Disp32;
3910 else
3911 *types = gotrel[j].types64;
3914 if (GOT_symbol == NULL)
3915 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
3917 /* Replace the relocation token with ' ', so that
3918 errors like foo@GOTOFF1 will be detected. */
3920 /* The length of the first part of our input line. */
3921 first = cp - input_line_pointer;
3923 /* The second part goes from after the reloc token until
3924 (and including) an end_of_line char. Don't use strlen
3925 here as the end_of_line char may not be a NUL. */
3926 past_reloc = cp + 1 + len;
3927 for (cp = past_reloc; !is_end_of_line[(unsigned char) *cp++]; )
3929 second = cp - past_reloc;
3931 /* Allocate and copy string. The trailing NUL shouldn't
3932 be necessary, but be safe. */
3933 tmpbuf = xmalloc (first + second + 2);
3934 memcpy (tmpbuf, input_line_pointer, first);
3935 tmpbuf[first] = ' ';
3936 memcpy (tmpbuf + first + 1, past_reloc, second);
3937 tmpbuf[first + second + 1] = '\0';
3938 return tmpbuf;
3941 as_bad (_("@%s reloc is not supported with %d-bit output format"),
3942 gotrel[j].str, 1 << (5 + object_64bit));
3943 return NULL;
3947 /* Might be a symbol version string. Don't as_bad here. */
3948 return NULL;
3951 void
3952 x86_cons (exp, size)
3953 expressionS *exp;
3954 int size;
3956 if (size == 4 || (object_64bit && size == 8))
3958 /* Handle @GOTOFF and the like in an expression. */
3959 char *save;
3960 char *gotfree_input_line;
3961 int adjust;
3963 save = input_line_pointer;
3964 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
3965 if (gotfree_input_line)
3966 input_line_pointer = gotfree_input_line;
3968 expression (exp);
3970 if (gotfree_input_line)
3972 /* expression () has merrily parsed up to the end of line,
3973 or a comma - in the wrong buffer. Transfer how far
3974 input_line_pointer has moved to the right buffer. */
3975 input_line_pointer = (save
3976 + (input_line_pointer - gotfree_input_line)
3977 + adjust);
3978 free (gotfree_input_line);
3981 else
3982 expression (exp);
3984 #endif
3986 static void signed_cons (int size)
3988 if (flag_code == CODE_64BIT)
3989 cons_sign = 1;
3990 cons (size);
3991 cons_sign = -1;
3994 #ifdef TE_PE
3995 static void
3996 pe_directive_secrel (dummy)
3997 int dummy ATTRIBUTE_UNUSED;
3999 expressionS exp;
4003 expression (&exp);
4004 if (exp.X_op == O_symbol)
4005 exp.X_op = O_secrel;
4007 emit_expr (&exp, 4);
4009 while (*input_line_pointer++ == ',');
4011 input_line_pointer--;
4012 demand_empty_rest_of_line ();
4014 #endif
4016 static int i386_immediate PARAMS ((char *));
4018 static int
4019 i386_immediate (imm_start)
4020 char *imm_start;
4022 char *save_input_line_pointer;
4023 char *gotfree_input_line;
4024 segT exp_seg = 0;
4025 expressionS *exp;
4026 unsigned int types = ~0U;
4028 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
4030 as_bad (_("only 1 or 2 immediate operands are allowed"));
4031 return 0;
4034 exp = &im_expressions[i.imm_operands++];
4035 i.op[this_operand].imms = exp;
4037 if (is_space_char (*imm_start))
4038 ++imm_start;
4040 save_input_line_pointer = input_line_pointer;
4041 input_line_pointer = imm_start;
4043 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4044 if (gotfree_input_line)
4045 input_line_pointer = gotfree_input_line;
4047 exp_seg = expression (exp);
4049 SKIP_WHITESPACE ();
4050 if (*input_line_pointer)
4051 as_bad (_("junk `%s' after expression"), input_line_pointer);
4053 input_line_pointer = save_input_line_pointer;
4054 if (gotfree_input_line)
4055 free (gotfree_input_line);
4057 if (exp->X_op == O_absent || exp->X_op == O_big)
4059 /* Missing or bad expr becomes absolute 0. */
4060 as_bad (_("missing or invalid immediate expression `%s' taken as 0"),
4061 imm_start);
4062 exp->X_op = O_constant;
4063 exp->X_add_number = 0;
4064 exp->X_add_symbol = (symbolS *) 0;
4065 exp->X_op_symbol = (symbolS *) 0;
4067 else if (exp->X_op == O_constant)
4069 /* Size it properly later. */
4070 i.types[this_operand] |= Imm64;
4071 /* If BFD64, sign extend val. */
4072 if (!use_rela_relocations)
4073 if ((exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
4074 exp->X_add_number = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
4076 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4077 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
4078 && exp_seg != absolute_section
4079 && exp_seg != text_section
4080 && exp_seg != data_section
4081 && exp_seg != bss_section
4082 && exp_seg != undefined_section
4083 && !bfd_is_com_section (exp_seg))
4085 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4086 return 0;
4088 #endif
4089 else
4091 /* This is an address. The size of the address will be
4092 determined later, depending on destination register,
4093 suffix, or the default for the section. */
4094 i.types[this_operand] |= Imm8 | Imm16 | Imm32 | Imm32S | Imm64;
4095 i.types[this_operand] &= types;
4098 return 1;
4101 static char *i386_scale PARAMS ((char *));
4103 static char *
4104 i386_scale (scale)
4105 char *scale;
4107 offsetT val;
4108 char *save = input_line_pointer;
4110 input_line_pointer = scale;
4111 val = get_absolute_expression ();
4113 switch (val)
4115 case 1:
4116 i.log2_scale_factor = 0;
4117 break;
4118 case 2:
4119 i.log2_scale_factor = 1;
4120 break;
4121 case 4:
4122 i.log2_scale_factor = 2;
4123 break;
4124 case 8:
4125 i.log2_scale_factor = 3;
4126 break;
4127 default:
4129 char sep = *input_line_pointer;
4131 *input_line_pointer = '\0';
4132 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
4133 scale);
4134 *input_line_pointer = sep;
4135 input_line_pointer = save;
4136 return NULL;
4139 if (i.log2_scale_factor != 0 && i.index_reg == 0)
4141 as_warn (_("scale factor of %d without an index register"),
4142 1 << i.log2_scale_factor);
4143 #if SCALE1_WHEN_NO_INDEX
4144 i.log2_scale_factor = 0;
4145 #endif
4147 scale = input_line_pointer;
4148 input_line_pointer = save;
4149 return scale;
4152 static int i386_displacement PARAMS ((char *, char *));
4154 static int
4155 i386_displacement (disp_start, disp_end)
4156 char *disp_start;
4157 char *disp_end;
4159 expressionS *exp;
4160 segT exp_seg = 0;
4161 char *save_input_line_pointer;
4162 char *gotfree_input_line;
4163 int bigdisp, override;
4164 unsigned int types = Disp;
4166 if ((i.types[this_operand] & JumpAbsolute)
4167 || !(current_templates->start->opcode_modifier & (Jump | JumpDword)))
4169 bigdisp = Disp32;
4170 override = (i.prefix[ADDR_PREFIX] != 0);
4172 else
4174 /* For PC-relative branches, the width of the displacement
4175 is dependent upon data size, not address size. */
4176 bigdisp = 0;
4177 override = (i.prefix[DATA_PREFIX] != 0);
4179 if (flag_code == CODE_64BIT)
4181 if (!bigdisp)
4182 bigdisp = (override || i.suffix == WORD_MNEM_SUFFIX)
4183 ? Disp16
4184 : Disp32S | Disp32;
4185 else if (!override)
4186 bigdisp = Disp64 | Disp32S | Disp32;
4188 else
4190 if (!bigdisp)
4192 if (!override)
4193 override = (i.suffix == (flag_code != CODE_16BIT
4194 ? WORD_MNEM_SUFFIX
4195 : LONG_MNEM_SUFFIX));
4196 bigdisp = Disp32;
4198 if ((flag_code == CODE_16BIT) ^ override)
4199 bigdisp = Disp16;
4201 i.types[this_operand] |= bigdisp;
4203 exp = &disp_expressions[i.disp_operands];
4204 i.op[this_operand].disps = exp;
4205 i.disp_operands++;
4206 save_input_line_pointer = input_line_pointer;
4207 input_line_pointer = disp_start;
4208 END_STRING_AND_SAVE (disp_end);
4210 #ifndef GCC_ASM_O_HACK
4211 #define GCC_ASM_O_HACK 0
4212 #endif
4213 #if GCC_ASM_O_HACK
4214 END_STRING_AND_SAVE (disp_end + 1);
4215 if ((i.types[this_operand] & BaseIndex) != 0
4216 && displacement_string_end[-1] == '+')
4218 /* This hack is to avoid a warning when using the "o"
4219 constraint within gcc asm statements.
4220 For instance:
4222 #define _set_tssldt_desc(n,addr,limit,type) \
4223 __asm__ __volatile__ ( \
4224 "movw %w2,%0\n\t" \
4225 "movw %w1,2+%0\n\t" \
4226 "rorl $16,%1\n\t" \
4227 "movb %b1,4+%0\n\t" \
4228 "movb %4,5+%0\n\t" \
4229 "movb $0,6+%0\n\t" \
4230 "movb %h1,7+%0\n\t" \
4231 "rorl $16,%1" \
4232 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
4234 This works great except that the output assembler ends
4235 up looking a bit weird if it turns out that there is
4236 no offset. You end up producing code that looks like:
4238 #APP
4239 movw $235,(%eax)
4240 movw %dx,2+(%eax)
4241 rorl $16,%edx
4242 movb %dl,4+(%eax)
4243 movb $137,5+(%eax)
4244 movb $0,6+(%eax)
4245 movb %dh,7+(%eax)
4246 rorl $16,%edx
4247 #NO_APP
4249 So here we provide the missing zero. */
4251 *displacement_string_end = '0';
4253 #endif
4254 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4255 if (gotfree_input_line)
4256 input_line_pointer = gotfree_input_line;
4258 exp_seg = expression (exp);
4260 SKIP_WHITESPACE ();
4261 if (*input_line_pointer)
4262 as_bad (_("junk `%s' after expression"), input_line_pointer);
4263 #if GCC_ASM_O_HACK
4264 RESTORE_END_STRING (disp_end + 1);
4265 #endif
4266 RESTORE_END_STRING (disp_end);
4267 input_line_pointer = save_input_line_pointer;
4268 if (gotfree_input_line)
4269 free (gotfree_input_line);
4271 /* We do this to make sure that the section symbol is in
4272 the symbol table. We will ultimately change the relocation
4273 to be relative to the beginning of the section. */
4274 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
4275 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4276 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4278 if (exp->X_op != O_symbol)
4280 as_bad (_("bad expression used with @%s"),
4281 (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4282 ? "GOTPCREL"
4283 : "GOTOFF"));
4284 return 0;
4287 if (S_IS_LOCAL (exp->X_add_symbol)
4288 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section)
4289 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
4290 exp->X_op = O_subtract;
4291 exp->X_op_symbol = GOT_symbol;
4292 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
4293 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
4294 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4295 i.reloc[this_operand] = BFD_RELOC_64;
4296 else
4297 i.reloc[this_operand] = BFD_RELOC_32;
4300 if (exp->X_op == O_absent || exp->X_op == O_big)
4302 /* Missing or bad expr becomes absolute 0. */
4303 as_bad (_("missing or invalid displacement expression `%s' taken as 0"),
4304 disp_start);
4305 exp->X_op = O_constant;
4306 exp->X_add_number = 0;
4307 exp->X_add_symbol = (symbolS *) 0;
4308 exp->X_op_symbol = (symbolS *) 0;
4311 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4312 if (exp->X_op != O_constant
4313 && OUTPUT_FLAVOR == bfd_target_aout_flavour
4314 && exp_seg != absolute_section
4315 && exp_seg != text_section
4316 && exp_seg != data_section
4317 && exp_seg != bss_section
4318 && exp_seg != undefined_section
4319 && !bfd_is_com_section (exp_seg))
4321 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4322 return 0;
4324 #endif
4326 if (!(i.types[this_operand] & ~Disp))
4327 i.types[this_operand] &= types;
4329 return 1;
4332 static int i386_index_check PARAMS ((const char *));
4334 /* Make sure the memory operand we've been dealt is valid.
4335 Return 1 on success, 0 on a failure. */
4337 static int
4338 i386_index_check (operand_string)
4339 const char *operand_string;
4341 int ok;
4342 #if INFER_ADDR_PREFIX
4343 int fudged = 0;
4345 tryprefix:
4346 #endif
4347 ok = 1;
4348 if ((current_templates->start->cpu_flags & CpuSVME)
4349 && current_templates->end[-1].operand_types[0] == AnyMem)
4351 /* Memory operands of SVME insns are special in that they only allow
4352 rAX as their memory address and ignore any segment override. */
4353 unsigned RegXX;
4355 /* SKINIT is even more restrictive: it always requires EAX. */
4356 if (strcmp (current_templates->start->name, "skinit") == 0)
4357 RegXX = Reg32;
4358 else if (flag_code == CODE_64BIT)
4359 RegXX = i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32;
4360 else
4361 RegXX = (flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0)
4362 ? Reg16
4363 : Reg32;
4364 if (!i.base_reg
4365 || !(i.base_reg->reg_type & Acc)
4366 || !(i.base_reg->reg_type & RegXX)
4367 || i.index_reg
4368 || (i.types[0] & Disp))
4369 ok = 0;
4371 else if (flag_code == CODE_64BIT)
4373 unsigned RegXX = (i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32);
4375 if ((i.base_reg
4376 && ((i.base_reg->reg_type & RegXX) == 0)
4377 && (i.base_reg->reg_type != BaseIndex
4378 || i.index_reg))
4379 || (i.index_reg
4380 && ((i.index_reg->reg_type & (RegXX | BaseIndex))
4381 != (RegXX | BaseIndex))))
4382 ok = 0;
4384 else
4386 if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
4388 /* 16bit checks. */
4389 if ((i.base_reg
4390 && ((i.base_reg->reg_type & (Reg16 | BaseIndex | RegRex))
4391 != (Reg16 | BaseIndex)))
4392 || (i.index_reg
4393 && (((i.index_reg->reg_type & (Reg16 | BaseIndex))
4394 != (Reg16 | BaseIndex))
4395 || !(i.base_reg
4396 && i.base_reg->reg_num < 6
4397 && i.index_reg->reg_num >= 6
4398 && i.log2_scale_factor == 0))))
4399 ok = 0;
4401 else
4403 /* 32bit checks. */
4404 if ((i.base_reg
4405 && (i.base_reg->reg_type & (Reg32 | RegRex)) != Reg32)
4406 || (i.index_reg
4407 && ((i.index_reg->reg_type & (Reg32 | BaseIndex | RegRex))
4408 != (Reg32 | BaseIndex))))
4409 ok = 0;
4412 if (!ok)
4414 #if INFER_ADDR_PREFIX
4415 if (i.prefix[ADDR_PREFIX] == 0)
4417 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
4418 i.prefixes += 1;
4419 /* Change the size of any displacement too. At most one of
4420 Disp16 or Disp32 is set.
4421 FIXME. There doesn't seem to be any real need for separate
4422 Disp16 and Disp32 flags. The same goes for Imm16 and Imm32.
4423 Removing them would probably clean up the code quite a lot. */
4424 if (flag_code != CODE_64BIT && (i.types[this_operand] & (Disp16 | Disp32)))
4425 i.types[this_operand] ^= (Disp16 | Disp32);
4426 fudged = 1;
4427 goto tryprefix;
4429 if (fudged)
4430 as_bad (_("`%s' is not a valid base/index expression"),
4431 operand_string);
4432 else
4433 #endif
4434 as_bad (_("`%s' is not a valid %s bit base/index expression"),
4435 operand_string,
4436 flag_code_names[flag_code]);
4438 return ok;
4441 /* Parse OPERAND_STRING into the i386_insn structure I. Returns non-zero
4442 on error. */
4444 static int
4445 i386_operand (operand_string)
4446 char *operand_string;
4448 const reg_entry *r;
4449 char *end_op;
4450 char *op_string = operand_string;
4452 if (is_space_char (*op_string))
4453 ++op_string;
4455 /* We check for an absolute prefix (differentiating,
4456 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
4457 if (*op_string == ABSOLUTE_PREFIX)
4459 ++op_string;
4460 if (is_space_char (*op_string))
4461 ++op_string;
4462 i.types[this_operand] |= JumpAbsolute;
4465 /* Check if operand is a register. */
4466 if ((r = parse_register (op_string, &end_op)) != NULL)
4468 /* Check for a segment override by searching for ':' after a
4469 segment register. */
4470 op_string = end_op;
4471 if (is_space_char (*op_string))
4472 ++op_string;
4473 if (*op_string == ':' && (r->reg_type & (SReg2 | SReg3)))
4475 switch (r->reg_num)
4477 case 0:
4478 i.seg[i.mem_operands] = &es;
4479 break;
4480 case 1:
4481 i.seg[i.mem_operands] = &cs;
4482 break;
4483 case 2:
4484 i.seg[i.mem_operands] = &ss;
4485 break;
4486 case 3:
4487 i.seg[i.mem_operands] = &ds;
4488 break;
4489 case 4:
4490 i.seg[i.mem_operands] = &fs;
4491 break;
4492 case 5:
4493 i.seg[i.mem_operands] = &gs;
4494 break;
4497 /* Skip the ':' and whitespace. */
4498 ++op_string;
4499 if (is_space_char (*op_string))
4500 ++op_string;
4502 if (!is_digit_char (*op_string)
4503 && !is_identifier_char (*op_string)
4504 && *op_string != '('
4505 && *op_string != ABSOLUTE_PREFIX)
4507 as_bad (_("bad memory operand `%s'"), op_string);
4508 return 0;
4510 /* Handle case of %es:*foo. */
4511 if (*op_string == ABSOLUTE_PREFIX)
4513 ++op_string;
4514 if (is_space_char (*op_string))
4515 ++op_string;
4516 i.types[this_operand] |= JumpAbsolute;
4518 goto do_memory_reference;
4520 if (*op_string)
4522 as_bad (_("junk `%s' after register"), op_string);
4523 return 0;
4525 i.types[this_operand] |= r->reg_type & ~BaseIndex;
4526 i.op[this_operand].regs = r;
4527 i.reg_operands++;
4529 else if (*op_string == REGISTER_PREFIX)
4531 as_bad (_("bad register name `%s'"), op_string);
4532 return 0;
4534 else if (*op_string == IMMEDIATE_PREFIX)
4536 ++op_string;
4537 if (i.types[this_operand] & JumpAbsolute)
4539 as_bad (_("immediate operand illegal with absolute jump"));
4540 return 0;
4542 if (!i386_immediate (op_string))
4543 return 0;
4545 else if (is_digit_char (*op_string)
4546 || is_identifier_char (*op_string)
4547 || *op_string == '(')
4549 /* This is a memory reference of some sort. */
4550 char *base_string;
4552 /* Start and end of displacement string expression (if found). */
4553 char *displacement_string_start;
4554 char *displacement_string_end;
4556 do_memory_reference:
4557 if ((i.mem_operands == 1
4558 && (current_templates->start->opcode_modifier & IsString) == 0)
4559 || i.mem_operands == 2)
4561 as_bad (_("too many memory references for `%s'"),
4562 current_templates->start->name);
4563 return 0;
4566 /* Check for base index form. We detect the base index form by
4567 looking for an ')' at the end of the operand, searching
4568 for the '(' matching it, and finding a REGISTER_PREFIX or ','
4569 after the '('. */
4570 base_string = op_string + strlen (op_string);
4572 --base_string;
4573 if (is_space_char (*base_string))
4574 --base_string;
4576 /* If we only have a displacement, set-up for it to be parsed later. */
4577 displacement_string_start = op_string;
4578 displacement_string_end = base_string + 1;
4580 if (*base_string == ')')
4582 char *temp_string;
4583 unsigned int parens_balanced = 1;
4584 /* We've already checked that the number of left & right ()'s are
4585 equal, so this loop will not be infinite. */
4588 base_string--;
4589 if (*base_string == ')')
4590 parens_balanced++;
4591 if (*base_string == '(')
4592 parens_balanced--;
4594 while (parens_balanced);
4596 temp_string = base_string;
4598 /* Skip past '(' and whitespace. */
4599 ++base_string;
4600 if (is_space_char (*base_string))
4601 ++base_string;
4603 if (*base_string == ','
4604 || ((i.base_reg = parse_register (base_string, &end_op)) != NULL))
4606 displacement_string_end = temp_string;
4608 i.types[this_operand] |= BaseIndex;
4610 if (i.base_reg)
4612 base_string = end_op;
4613 if (is_space_char (*base_string))
4614 ++base_string;
4617 /* There may be an index reg or scale factor here. */
4618 if (*base_string == ',')
4620 ++base_string;
4621 if (is_space_char (*base_string))
4622 ++base_string;
4624 if ((i.index_reg = parse_register (base_string, &end_op)) != NULL)
4626 base_string = end_op;
4627 if (is_space_char (*base_string))
4628 ++base_string;
4629 if (*base_string == ',')
4631 ++base_string;
4632 if (is_space_char (*base_string))
4633 ++base_string;
4635 else if (*base_string != ')')
4637 as_bad (_("expecting `,' or `)' after index register in `%s'"),
4638 operand_string);
4639 return 0;
4642 else if (*base_string == REGISTER_PREFIX)
4644 as_bad (_("bad register name `%s'"), base_string);
4645 return 0;
4648 /* Check for scale factor. */
4649 if (*base_string != ')')
4651 char *end_scale = i386_scale (base_string);
4653 if (!end_scale)
4654 return 0;
4656 base_string = end_scale;
4657 if (is_space_char (*base_string))
4658 ++base_string;
4659 if (*base_string != ')')
4661 as_bad (_("expecting `)' after scale factor in `%s'"),
4662 operand_string);
4663 return 0;
4666 else if (!i.index_reg)
4668 as_bad (_("expecting index register or scale factor after `,'; got '%c'"),
4669 *base_string);
4670 return 0;
4673 else if (*base_string != ')')
4675 as_bad (_("expecting `,' or `)' after base register in `%s'"),
4676 operand_string);
4677 return 0;
4680 else if (*base_string == REGISTER_PREFIX)
4682 as_bad (_("bad register name `%s'"), base_string);
4683 return 0;
4687 /* If there's an expression beginning the operand, parse it,
4688 assuming displacement_string_start and
4689 displacement_string_end are meaningful. */
4690 if (displacement_string_start != displacement_string_end)
4692 if (!i386_displacement (displacement_string_start,
4693 displacement_string_end))
4694 return 0;
4697 /* Special case for (%dx) while doing input/output op. */
4698 if (i.base_reg
4699 && i.base_reg->reg_type == (Reg16 | InOutPortReg)
4700 && i.index_reg == 0
4701 && i.log2_scale_factor == 0
4702 && i.seg[i.mem_operands] == 0
4703 && (i.types[this_operand] & Disp) == 0)
4705 i.types[this_operand] = InOutPortReg;
4706 return 1;
4709 if (i386_index_check (operand_string) == 0)
4710 return 0;
4711 i.mem_operands++;
4713 else
4715 /* It's not a memory operand; argh! */
4716 as_bad (_("invalid char %s beginning operand %d `%s'"),
4717 output_invalid (*op_string),
4718 this_operand + 1,
4719 op_string);
4720 return 0;
4722 return 1; /* Normal return. */
4725 /* md_estimate_size_before_relax()
4727 Called just before relax() for rs_machine_dependent frags. The x86
4728 assembler uses these frags to handle variable size jump
4729 instructions.
4731 Any symbol that is now undefined will not become defined.
4732 Return the correct fr_subtype in the frag.
4733 Return the initial "guess for variable size of frag" to caller.
4734 The guess is actually the growth beyond the fixed part. Whatever
4735 we do to grow the fixed or variable part contributes to our
4736 returned value. */
4739 md_estimate_size_before_relax (fragP, segment)
4740 fragS *fragP;
4741 segT segment;
4743 /* We've already got fragP->fr_subtype right; all we have to do is
4744 check for un-relaxable symbols. On an ELF system, we can't relax
4745 an externally visible symbol, because it may be overridden by a
4746 shared library. */
4747 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
4748 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4749 || (IS_ELF
4750 && (S_IS_EXTERNAL (fragP->fr_symbol)
4751 || S_IS_WEAK (fragP->fr_symbol)))
4752 #endif
4755 /* Symbol is undefined in this segment, or we need to keep a
4756 reloc so that weak symbols can be overridden. */
4757 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
4758 enum bfd_reloc_code_real reloc_type;
4759 unsigned char *opcode;
4760 int old_fr_fix;
4762 if (fragP->fr_var != NO_RELOC)
4763 reloc_type = fragP->fr_var;
4764 else if (size == 2)
4765 reloc_type = BFD_RELOC_16_PCREL;
4766 else
4767 reloc_type = BFD_RELOC_32_PCREL;
4769 old_fr_fix = fragP->fr_fix;
4770 opcode = (unsigned char *) fragP->fr_opcode;
4772 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
4774 case UNCOND_JUMP:
4775 /* Make jmp (0xeb) a (d)word displacement jump. */
4776 opcode[0] = 0xe9;
4777 fragP->fr_fix += size;
4778 fix_new (fragP, old_fr_fix, size,
4779 fragP->fr_symbol,
4780 fragP->fr_offset, 1,
4781 reloc_type);
4782 break;
4784 case COND_JUMP86:
4785 if (size == 2
4786 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
4788 /* Negate the condition, and branch past an
4789 unconditional jump. */
4790 opcode[0] ^= 1;
4791 opcode[1] = 3;
4792 /* Insert an unconditional jump. */
4793 opcode[2] = 0xe9;
4794 /* We added two extra opcode bytes, and have a two byte
4795 offset. */
4796 fragP->fr_fix += 2 + 2;
4797 fix_new (fragP, old_fr_fix + 2, 2,
4798 fragP->fr_symbol,
4799 fragP->fr_offset, 1,
4800 reloc_type);
4801 break;
4803 /* Fall through. */
4805 case COND_JUMP:
4806 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
4808 fixS *fixP;
4810 fragP->fr_fix += 1;
4811 fixP = fix_new (fragP, old_fr_fix, 1,
4812 fragP->fr_symbol,
4813 fragP->fr_offset, 1,
4814 BFD_RELOC_8_PCREL);
4815 fixP->fx_signed = 1;
4816 break;
4819 /* This changes the byte-displacement jump 0x7N
4820 to the (d)word-displacement jump 0x0f,0x8N. */
4821 opcode[1] = opcode[0] + 0x10;
4822 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4823 /* We've added an opcode byte. */
4824 fragP->fr_fix += 1 + size;
4825 fix_new (fragP, old_fr_fix + 1, size,
4826 fragP->fr_symbol,
4827 fragP->fr_offset, 1,
4828 reloc_type);
4829 break;
4831 default:
4832 BAD_CASE (fragP->fr_subtype);
4833 break;
4835 frag_wane (fragP);
4836 return fragP->fr_fix - old_fr_fix;
4839 /* Guess size depending on current relax state. Initially the relax
4840 state will correspond to a short jump and we return 1, because
4841 the variable part of the frag (the branch offset) is one byte
4842 long. However, we can relax a section more than once and in that
4843 case we must either set fr_subtype back to the unrelaxed state,
4844 or return the value for the appropriate branch. */
4845 return md_relax_table[fragP->fr_subtype].rlx_length;
4848 /* Called after relax() is finished.
4850 In: Address of frag.
4851 fr_type == rs_machine_dependent.
4852 fr_subtype is what the address relaxed to.
4854 Out: Any fixSs and constants are set up.
4855 Caller will turn frag into a ".space 0". */
4857 void
4858 md_convert_frag (abfd, sec, fragP)
4859 bfd *abfd ATTRIBUTE_UNUSED;
4860 segT sec ATTRIBUTE_UNUSED;
4861 fragS *fragP;
4863 unsigned char *opcode;
4864 unsigned char *where_to_put_displacement = NULL;
4865 offsetT target_address;
4866 offsetT opcode_address;
4867 unsigned int extension = 0;
4868 offsetT displacement_from_opcode_start;
4870 opcode = (unsigned char *) fragP->fr_opcode;
4872 /* Address we want to reach in file space. */
4873 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
4875 /* Address opcode resides at in file space. */
4876 opcode_address = fragP->fr_address + fragP->fr_fix;
4878 /* Displacement from opcode start to fill into instruction. */
4879 displacement_from_opcode_start = target_address - opcode_address;
4881 if ((fragP->fr_subtype & BIG) == 0)
4883 /* Don't have to change opcode. */
4884 extension = 1; /* 1 opcode + 1 displacement */
4885 where_to_put_displacement = &opcode[1];
4887 else
4889 if (no_cond_jump_promotion
4890 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4891 as_warn_where (fragP->fr_file, fragP->fr_line, _("long jump required"));
4893 switch (fragP->fr_subtype)
4895 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
4896 extension = 4; /* 1 opcode + 4 displacement */
4897 opcode[0] = 0xe9;
4898 where_to_put_displacement = &opcode[1];
4899 break;
4901 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
4902 extension = 2; /* 1 opcode + 2 displacement */
4903 opcode[0] = 0xe9;
4904 where_to_put_displacement = &opcode[1];
4905 break;
4907 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
4908 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
4909 extension = 5; /* 2 opcode + 4 displacement */
4910 opcode[1] = opcode[0] + 0x10;
4911 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4912 where_to_put_displacement = &opcode[2];
4913 break;
4915 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
4916 extension = 3; /* 2 opcode + 2 displacement */
4917 opcode[1] = opcode[0] + 0x10;
4918 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4919 where_to_put_displacement = &opcode[2];
4920 break;
4922 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
4923 extension = 4;
4924 opcode[0] ^= 1;
4925 opcode[1] = 3;
4926 opcode[2] = 0xe9;
4927 where_to_put_displacement = &opcode[3];
4928 break;
4930 default:
4931 BAD_CASE (fragP->fr_subtype);
4932 break;
4936 /* Now put displacement after opcode. */
4937 md_number_to_chars ((char *) where_to_put_displacement,
4938 (valueT) (displacement_from_opcode_start - extension),
4939 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
4940 fragP->fr_fix += extension;
4943 /* Size of byte displacement jmp. */
4944 int md_short_jump_size = 2;
4946 /* Size of dword displacement jmp. */
4947 int md_long_jump_size = 5;
4949 void
4950 md_create_short_jump (ptr, from_addr, to_addr, frag, to_symbol)
4951 char *ptr;
4952 addressT from_addr, to_addr;
4953 fragS *frag ATTRIBUTE_UNUSED;
4954 symbolS *to_symbol ATTRIBUTE_UNUSED;
4956 offsetT offset;
4958 offset = to_addr - (from_addr + 2);
4959 /* Opcode for byte-disp jump. */
4960 md_number_to_chars (ptr, (valueT) 0xeb, 1);
4961 md_number_to_chars (ptr + 1, (valueT) offset, 1);
4964 void
4965 md_create_long_jump (ptr, from_addr, to_addr, frag, to_symbol)
4966 char *ptr;
4967 addressT from_addr, to_addr;
4968 fragS *frag ATTRIBUTE_UNUSED;
4969 symbolS *to_symbol ATTRIBUTE_UNUSED;
4971 offsetT offset;
4973 offset = to_addr - (from_addr + 5);
4974 md_number_to_chars (ptr, (valueT) 0xe9, 1);
4975 md_number_to_chars (ptr + 1, (valueT) offset, 4);
4978 /* Apply a fixup (fixS) to segment data, once it has been determined
4979 by our caller that we have all the info we need to fix it up.
4981 On the 386, immediates, displacements, and data pointers are all in
4982 the same (little-endian) format, so we don't need to care about which
4983 we are handling. */
4985 void
4986 md_apply_fix (fixP, valP, seg)
4987 /* The fix we're to put in. */
4988 fixS *fixP;
4989 /* Pointer to the value of the bits. */
4990 valueT *valP;
4991 /* Segment fix is from. */
4992 segT seg ATTRIBUTE_UNUSED;
4994 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
4995 valueT value = *valP;
4997 #if !defined (TE_Mach)
4998 if (fixP->fx_pcrel)
5000 switch (fixP->fx_r_type)
5002 default:
5003 break;
5005 case BFD_RELOC_64:
5006 fixP->fx_r_type = BFD_RELOC_64_PCREL;
5007 break;
5008 case BFD_RELOC_32:
5009 case BFD_RELOC_X86_64_32S:
5010 fixP->fx_r_type = BFD_RELOC_32_PCREL;
5011 break;
5012 case BFD_RELOC_16:
5013 fixP->fx_r_type = BFD_RELOC_16_PCREL;
5014 break;
5015 case BFD_RELOC_8:
5016 fixP->fx_r_type = BFD_RELOC_8_PCREL;
5017 break;
5021 if (fixP->fx_addsy != NULL
5022 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
5023 || fixP->fx_r_type == BFD_RELOC_64_PCREL
5024 || fixP->fx_r_type == BFD_RELOC_16_PCREL
5025 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
5026 && !use_rela_relocations)
5028 /* This is a hack. There should be a better way to handle this.
5029 This covers for the fact that bfd_install_relocation will
5030 subtract the current location (for partial_inplace, PC relative
5031 relocations); see more below. */
5032 #ifndef OBJ_AOUT
5033 if (IS_ELF
5034 #ifdef TE_PE
5035 || OUTPUT_FLAVOR == bfd_target_coff_flavour
5036 #endif
5038 value += fixP->fx_where + fixP->fx_frag->fr_address;
5039 #endif
5040 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5041 if (IS_ELF)
5043 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
5045 if ((sym_seg == seg
5046 || (symbol_section_p (fixP->fx_addsy)
5047 && sym_seg != absolute_section))
5048 && !generic_force_reloc (fixP))
5050 /* Yes, we add the values in twice. This is because
5051 bfd_install_relocation subtracts them out again. I think
5052 bfd_install_relocation is broken, but I don't dare change
5053 it. FIXME. */
5054 value += fixP->fx_where + fixP->fx_frag->fr_address;
5057 #endif
5058 #if defined (OBJ_COFF) && defined (TE_PE)
5059 /* For some reason, the PE format does not store a
5060 section address offset for a PC relative symbol. */
5061 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
5062 || S_IS_WEAK (fixP->fx_addsy))
5063 value += md_pcrel_from (fixP);
5064 #endif
5067 /* Fix a few things - the dynamic linker expects certain values here,
5068 and we must not disappoint it. */
5069 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5070 if (IS_ELF && fixP->fx_addsy)
5071 switch (fixP->fx_r_type)
5073 case BFD_RELOC_386_PLT32:
5074 case BFD_RELOC_X86_64_PLT32:
5075 /* Make the jump instruction point to the address of the operand. At
5076 runtime we merely add the offset to the actual PLT entry. */
5077 value = -4;
5078 break;
5080 case BFD_RELOC_386_TLS_GD:
5081 case BFD_RELOC_386_TLS_LDM:
5082 case BFD_RELOC_386_TLS_IE_32:
5083 case BFD_RELOC_386_TLS_IE:
5084 case BFD_RELOC_386_TLS_GOTIE:
5085 case BFD_RELOC_386_TLS_GOTDESC:
5086 case BFD_RELOC_X86_64_TLSGD:
5087 case BFD_RELOC_X86_64_TLSLD:
5088 case BFD_RELOC_X86_64_GOTTPOFF:
5089 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5090 value = 0; /* Fully resolved at runtime. No addend. */
5091 /* Fallthrough */
5092 case BFD_RELOC_386_TLS_LE:
5093 case BFD_RELOC_386_TLS_LDO_32:
5094 case BFD_RELOC_386_TLS_LE_32:
5095 case BFD_RELOC_X86_64_DTPOFF32:
5096 case BFD_RELOC_X86_64_DTPOFF64:
5097 case BFD_RELOC_X86_64_TPOFF32:
5098 case BFD_RELOC_X86_64_TPOFF64:
5099 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5100 break;
5102 case BFD_RELOC_386_TLS_DESC_CALL:
5103 case BFD_RELOC_X86_64_TLSDESC_CALL:
5104 value = 0; /* Fully resolved at runtime. No addend. */
5105 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5106 fixP->fx_done = 0;
5107 return;
5109 case BFD_RELOC_386_GOT32:
5110 case BFD_RELOC_X86_64_GOT32:
5111 value = 0; /* Fully resolved at runtime. No addend. */
5112 break;
5114 case BFD_RELOC_VTABLE_INHERIT:
5115 case BFD_RELOC_VTABLE_ENTRY:
5116 fixP->fx_done = 0;
5117 return;
5119 default:
5120 break;
5122 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
5123 *valP = value;
5124 #endif /* !defined (TE_Mach) */
5126 /* Are we finished with this relocation now? */
5127 if (fixP->fx_addsy == NULL)
5128 fixP->fx_done = 1;
5129 else if (use_rela_relocations)
5131 fixP->fx_no_overflow = 1;
5132 /* Remember value for tc_gen_reloc. */
5133 fixP->fx_addnumber = value;
5134 value = 0;
5137 md_number_to_chars (p, value, fixP->fx_size);
5140 #define MAX_LITTLENUMS 6
5142 /* Turn the string pointed to by litP into a floating point constant
5143 of type TYPE, and emit the appropriate bytes. The number of
5144 LITTLENUMS emitted is stored in *SIZEP. An error message is
5145 returned, or NULL on OK. */
5147 char *
5148 md_atof (type, litP, sizeP)
5149 int type;
5150 char *litP;
5151 int *sizeP;
5153 int prec;
5154 LITTLENUM_TYPE words[MAX_LITTLENUMS];
5155 LITTLENUM_TYPE *wordP;
5156 char *t;
5158 switch (type)
5160 case 'f':
5161 case 'F':
5162 prec = 2;
5163 break;
5165 case 'd':
5166 case 'D':
5167 prec = 4;
5168 break;
5170 case 'x':
5171 case 'X':
5172 prec = 5;
5173 break;
5175 default:
5176 *sizeP = 0;
5177 return _("Bad call to md_atof ()");
5179 t = atof_ieee (input_line_pointer, type, words);
5180 if (t)
5181 input_line_pointer = t;
5183 *sizeP = prec * sizeof (LITTLENUM_TYPE);
5184 /* This loops outputs the LITTLENUMs in REVERSE order; in accord with
5185 the bigendian 386. */
5186 for (wordP = words + prec - 1; prec--;)
5188 md_number_to_chars (litP, (valueT) (*wordP--), sizeof (LITTLENUM_TYPE));
5189 litP += sizeof (LITTLENUM_TYPE);
5191 return 0;
5194 static char output_invalid_buf[8];
5196 static char *
5197 output_invalid (c)
5198 int c;
5200 if (ISPRINT (c))
5201 sprintf (output_invalid_buf, "'%c'", c);
5202 else
5203 sprintf (output_invalid_buf, "(0x%x)", (unsigned) c);
5204 return output_invalid_buf;
5207 /* REG_STRING starts *before* REGISTER_PREFIX. */
5209 static const reg_entry *
5210 parse_real_register (char *reg_string, char **end_op)
5212 char *s = reg_string;
5213 char *p;
5214 char reg_name_given[MAX_REG_NAME_SIZE + 1];
5215 const reg_entry *r;
5217 /* Skip possible REGISTER_PREFIX and possible whitespace. */
5218 if (*s == REGISTER_PREFIX)
5219 ++s;
5221 if (is_space_char (*s))
5222 ++s;
5224 p = reg_name_given;
5225 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
5227 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
5228 return (const reg_entry *) NULL;
5229 s++;
5232 /* For naked regs, make sure that we are not dealing with an identifier.
5233 This prevents confusing an identifier like `eax_var' with register
5234 `eax'. */
5235 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
5236 return (const reg_entry *) NULL;
5238 *end_op = s;
5240 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
5242 /* Handle floating point regs, allowing spaces in the (i) part. */
5243 if (r == i386_regtab /* %st is first entry of table */)
5245 if (is_space_char (*s))
5246 ++s;
5247 if (*s == '(')
5249 ++s;
5250 if (is_space_char (*s))
5251 ++s;
5252 if (*s >= '0' && *s <= '7')
5254 r = &i386_float_regtab[*s - '0'];
5255 ++s;
5256 if (is_space_char (*s))
5257 ++s;
5258 if (*s == ')')
5260 *end_op = s + 1;
5261 return r;
5264 /* We have "%st(" then garbage. */
5265 return (const reg_entry *) NULL;
5269 if (r != NULL
5270 && ((r->reg_flags & (RegRex64 | RegRex)) | (r->reg_type & Reg64)) != 0
5271 && (r->reg_type != Control || !(cpu_arch_flags & CpuSledgehammer))
5272 && flag_code != CODE_64BIT)
5273 return (const reg_entry *) NULL;
5275 return r;
5278 /* REG_STRING starts *before* REGISTER_PREFIX. */
5280 static const reg_entry *
5281 parse_register (char *reg_string, char **end_op)
5283 const reg_entry *r;
5285 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
5286 r = parse_real_register (reg_string, end_op);
5287 else
5288 r = NULL;
5289 if (!r)
5291 char *save = input_line_pointer;
5292 char c;
5293 symbolS *symbolP;
5295 input_line_pointer = reg_string;
5296 c = get_symbol_end ();
5297 symbolP = symbol_find (reg_string);
5298 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
5300 const expressionS *e = symbol_get_value_expression (symbolP);
5302 know (e->X_op == O_register);
5303 know (e->X_add_number >= 0 && (valueT) e->X_add_number < ARRAY_SIZE (i386_regtab));
5304 r = i386_regtab + e->X_add_number;
5305 *end_op = input_line_pointer;
5307 *input_line_pointer = c;
5308 input_line_pointer = save;
5310 return r;
5314 i386_parse_name (char *name, expressionS *e, char *nextcharP)
5316 const reg_entry *r;
5317 char *end = input_line_pointer;
5319 *end = *nextcharP;
5320 r = parse_register (name, &input_line_pointer);
5321 if (r && end <= input_line_pointer)
5323 *nextcharP = *input_line_pointer;
5324 *input_line_pointer = 0;
5325 e->X_op = O_register;
5326 e->X_add_number = r - i386_regtab;
5327 return 1;
5329 input_line_pointer = end;
5330 *end = 0;
5331 return 0;
5334 void
5335 md_operand (expressionS *e)
5337 if (*input_line_pointer == REGISTER_PREFIX)
5339 char *end;
5340 const reg_entry *r = parse_real_register (input_line_pointer, &end);
5342 if (r)
5344 e->X_op = O_register;
5345 e->X_add_number = r - i386_regtab;
5346 input_line_pointer = end;
5352 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5353 const char *md_shortopts = "kVQ:sqn";
5354 #else
5355 const char *md_shortopts = "qn";
5356 #endif
5358 #define OPTION_32 (OPTION_MD_BASE + 0)
5359 #define OPTION_64 (OPTION_MD_BASE + 1)
5360 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
5362 struct option md_longopts[] = {
5363 {"32", no_argument, NULL, OPTION_32},
5364 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5365 {"64", no_argument, NULL, OPTION_64},
5366 #endif
5367 {"divide", no_argument, NULL, OPTION_DIVIDE},
5368 {NULL, no_argument, NULL, 0}
5370 size_t md_longopts_size = sizeof (md_longopts);
5373 md_parse_option (c, arg)
5374 int c;
5375 char *arg ATTRIBUTE_UNUSED;
5377 switch (c)
5379 case 'n':
5380 optimize_align_code = 0;
5381 break;
5383 case 'q':
5384 quiet_warnings = 1;
5385 break;
5387 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5388 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
5389 should be emitted or not. FIXME: Not implemented. */
5390 case 'Q':
5391 break;
5393 /* -V: SVR4 argument to print version ID. */
5394 case 'V':
5395 print_version_id ();
5396 break;
5398 /* -k: Ignore for FreeBSD compatibility. */
5399 case 'k':
5400 break;
5402 case 's':
5403 /* -s: On i386 Solaris, this tells the native assembler to use
5404 .stab instead of .stab.excl. We always use .stab anyhow. */
5405 break;
5407 case OPTION_64:
5409 const char **list, **l;
5411 list = bfd_target_list ();
5412 for (l = list; *l != NULL; l++)
5413 if (strcmp (*l, "elf64-x86-64") == 0)
5415 default_arch = "x86_64";
5416 break;
5418 if (*l == NULL)
5419 as_fatal (_("No compiled in support for x86_64"));
5420 free (list);
5422 break;
5423 #endif
5425 case OPTION_32:
5426 default_arch = "i386";
5427 break;
5429 case OPTION_DIVIDE:
5430 #ifdef SVR4_COMMENT_CHARS
5432 char *n, *t;
5433 const char *s;
5435 n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
5436 t = n;
5437 for (s = i386_comment_chars; *s != '\0'; s++)
5438 if (*s != '/')
5439 *t++ = *s;
5440 *t = '\0';
5441 i386_comment_chars = n;
5443 #endif
5444 break;
5446 default:
5447 return 0;
5449 return 1;
5452 void
5453 md_show_usage (stream)
5454 FILE *stream;
5456 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5457 fprintf (stream, _("\
5458 -Q ignored\n\
5459 -V print assembler version number\n\
5460 -k ignored\n"));
5461 #endif
5462 fprintf (stream, _("\
5463 -n Do not optimize code alignment\n\
5464 -q quieten some warnings\n"));
5465 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5466 fprintf (stream, _("\
5467 -s ignored\n"));
5468 #endif
5469 #ifdef SVR4_COMMENT_CHARS
5470 fprintf (stream, _("\
5471 --divide do not treat `/' as a comment character\n"));
5472 #else
5473 fprintf (stream, _("\
5474 --divide ignored\n"));
5475 #endif
5478 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
5479 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5481 /* Pick the target format to use. */
5483 const char *
5484 i386_target_format ()
5486 if (!strcmp (default_arch, "x86_64"))
5487 set_code_flag (CODE_64BIT);
5488 else if (!strcmp (default_arch, "i386"))
5489 set_code_flag (CODE_32BIT);
5490 else
5491 as_fatal (_("Unknown architecture"));
5492 switch (OUTPUT_FLAVOR)
5494 #ifdef OBJ_MAYBE_AOUT
5495 case bfd_target_aout_flavour:
5496 return AOUT_TARGET_FORMAT;
5497 #endif
5498 #ifdef OBJ_MAYBE_COFF
5499 case bfd_target_coff_flavour:
5500 return "coff-i386";
5501 #endif
5502 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
5503 case bfd_target_elf_flavour:
5505 if (flag_code == CODE_64BIT)
5507 object_64bit = 1;
5508 use_rela_relocations = 1;
5510 return flag_code == CODE_64BIT ? "elf64-x86-64" : ELF_TARGET_FORMAT;
5512 #endif
5513 default:
5514 abort ();
5515 return NULL;
5519 #endif /* OBJ_MAYBE_ more than one */
5521 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5522 void i386_elf_emit_arch_note ()
5524 if (IS_ELF && cpu_arch_name != NULL)
5526 char *p;
5527 asection *seg = now_seg;
5528 subsegT subseg = now_subseg;
5529 Elf_Internal_Note i_note;
5530 Elf_External_Note e_note;
5531 asection *note_secp;
5532 int len;
5534 /* Create the .note section. */
5535 note_secp = subseg_new (".note", 0);
5536 bfd_set_section_flags (stdoutput,
5537 note_secp,
5538 SEC_HAS_CONTENTS | SEC_READONLY);
5540 /* Process the arch string. */
5541 len = strlen (cpu_arch_name);
5543 i_note.namesz = len + 1;
5544 i_note.descsz = 0;
5545 i_note.type = NT_ARCH;
5546 p = frag_more (sizeof (e_note.namesz));
5547 md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
5548 p = frag_more (sizeof (e_note.descsz));
5549 md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
5550 p = frag_more (sizeof (e_note.type));
5551 md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
5552 p = frag_more (len + 1);
5553 strcpy (p, cpu_arch_name);
5555 frag_align (2, 0, 0);
5557 subseg_set (seg, subseg);
5560 #endif
5562 symbolS *
5563 md_undefined_symbol (name)
5564 char *name;
5566 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
5567 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
5568 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
5569 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
5571 if (!GOT_symbol)
5573 if (symbol_find (name))
5574 as_bad (_("GOT already in symbol table"));
5575 GOT_symbol = symbol_new (name, undefined_section,
5576 (valueT) 0, &zero_address_frag);
5578 return GOT_symbol;
5580 return 0;
5583 /* Round up a section size to the appropriate boundary. */
5585 valueT
5586 md_section_align (segment, size)
5587 segT segment ATTRIBUTE_UNUSED;
5588 valueT size;
5590 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
5591 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
5593 /* For a.out, force the section size to be aligned. If we don't do
5594 this, BFD will align it for us, but it will not write out the
5595 final bytes of the section. This may be a bug in BFD, but it is
5596 easier to fix it here since that is how the other a.out targets
5597 work. */
5598 int align;
5600 align = bfd_get_section_alignment (stdoutput, segment);
5601 size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
5603 #endif
5605 return size;
5608 /* On the i386, PC-relative offsets are relative to the start of the
5609 next instruction. That is, the address of the offset, plus its
5610 size, since the offset is always the last part of the insn. */
5612 long
5613 md_pcrel_from (fixP)
5614 fixS *fixP;
5616 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
5619 #ifndef I386COFF
5621 static void
5622 s_bss (ignore)
5623 int ignore ATTRIBUTE_UNUSED;
5625 int temp;
5627 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5628 if (IS_ELF)
5629 obj_elf_section_change_hook ();
5630 #endif
5631 temp = get_absolute_expression ();
5632 subseg_set (bss_section, (subsegT) temp);
5633 demand_empty_rest_of_line ();
5636 #endif
5638 void
5639 i386_validate_fix (fixp)
5640 fixS *fixp;
5642 if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
5644 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
5646 if (!object_64bit)
5647 abort ();
5648 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
5650 else
5652 if (!object_64bit)
5653 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
5654 else
5655 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
5657 fixp->fx_subsy = 0;
5661 arelent *
5662 tc_gen_reloc (section, fixp)
5663 asection *section ATTRIBUTE_UNUSED;
5664 fixS *fixp;
5666 arelent *rel;
5667 bfd_reloc_code_real_type code;
5669 switch (fixp->fx_r_type)
5671 case BFD_RELOC_X86_64_PLT32:
5672 case BFD_RELOC_X86_64_GOT32:
5673 case BFD_RELOC_X86_64_GOTPCREL:
5674 case BFD_RELOC_386_PLT32:
5675 case BFD_RELOC_386_GOT32:
5676 case BFD_RELOC_386_GOTOFF:
5677 case BFD_RELOC_386_GOTPC:
5678 case BFD_RELOC_386_TLS_GD:
5679 case BFD_RELOC_386_TLS_LDM:
5680 case BFD_RELOC_386_TLS_LDO_32:
5681 case BFD_RELOC_386_TLS_IE_32:
5682 case BFD_RELOC_386_TLS_IE:
5683 case BFD_RELOC_386_TLS_GOTIE:
5684 case BFD_RELOC_386_TLS_LE_32:
5685 case BFD_RELOC_386_TLS_LE:
5686 case BFD_RELOC_386_TLS_GOTDESC:
5687 case BFD_RELOC_386_TLS_DESC_CALL:
5688 case BFD_RELOC_X86_64_TLSGD:
5689 case BFD_RELOC_X86_64_TLSLD:
5690 case BFD_RELOC_X86_64_DTPOFF32:
5691 case BFD_RELOC_X86_64_DTPOFF64:
5692 case BFD_RELOC_X86_64_GOTTPOFF:
5693 case BFD_RELOC_X86_64_TPOFF32:
5694 case BFD_RELOC_X86_64_TPOFF64:
5695 case BFD_RELOC_X86_64_GOTOFF64:
5696 case BFD_RELOC_X86_64_GOTPC32:
5697 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5698 case BFD_RELOC_X86_64_TLSDESC_CALL:
5699 case BFD_RELOC_RVA:
5700 case BFD_RELOC_VTABLE_ENTRY:
5701 case BFD_RELOC_VTABLE_INHERIT:
5702 #ifdef TE_PE
5703 case BFD_RELOC_32_SECREL:
5704 #endif
5705 code = fixp->fx_r_type;
5706 break;
5707 case BFD_RELOC_X86_64_32S:
5708 if (!fixp->fx_pcrel)
5710 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
5711 code = fixp->fx_r_type;
5712 break;
5714 default:
5715 if (fixp->fx_pcrel)
5717 switch (fixp->fx_size)
5719 default:
5720 as_bad_where (fixp->fx_file, fixp->fx_line,
5721 _("can not do %d byte pc-relative relocation"),
5722 fixp->fx_size);
5723 code = BFD_RELOC_32_PCREL;
5724 break;
5725 case 1: code = BFD_RELOC_8_PCREL; break;
5726 case 2: code = BFD_RELOC_16_PCREL; break;
5727 case 4: code = BFD_RELOC_32_PCREL; break;
5728 #ifdef BFD64
5729 case 8: code = BFD_RELOC_64_PCREL; break;
5730 #endif
5733 else
5735 switch (fixp->fx_size)
5737 default:
5738 as_bad_where (fixp->fx_file, fixp->fx_line,
5739 _("can not do %d byte relocation"),
5740 fixp->fx_size);
5741 code = BFD_RELOC_32;
5742 break;
5743 case 1: code = BFD_RELOC_8; break;
5744 case 2: code = BFD_RELOC_16; break;
5745 case 4: code = BFD_RELOC_32; break;
5746 #ifdef BFD64
5747 case 8: code = BFD_RELOC_64; break;
5748 #endif
5751 break;
5754 if ((code == BFD_RELOC_32
5755 || code == BFD_RELOC_32_PCREL
5756 || code == BFD_RELOC_X86_64_32S)
5757 && GOT_symbol
5758 && fixp->fx_addsy == GOT_symbol)
5760 if (!object_64bit)
5761 code = BFD_RELOC_386_GOTPC;
5762 else
5763 code = BFD_RELOC_X86_64_GOTPC32;
5766 rel = (arelent *) xmalloc (sizeof (arelent));
5767 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
5768 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
5770 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
5772 if (!use_rela_relocations)
5774 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
5775 vtable entry to be used in the relocation's section offset. */
5776 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
5777 rel->address = fixp->fx_offset;
5779 rel->addend = 0;
5781 /* Use the rela in 64bit mode. */
5782 else
5784 if (!fixp->fx_pcrel)
5785 rel->addend = fixp->fx_offset;
5786 else
5787 switch (code)
5789 case BFD_RELOC_X86_64_PLT32:
5790 case BFD_RELOC_X86_64_GOT32:
5791 case BFD_RELOC_X86_64_GOTPCREL:
5792 case BFD_RELOC_X86_64_TLSGD:
5793 case BFD_RELOC_X86_64_TLSLD:
5794 case BFD_RELOC_X86_64_GOTTPOFF:
5795 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5796 case BFD_RELOC_X86_64_TLSDESC_CALL:
5797 rel->addend = fixp->fx_offset - fixp->fx_size;
5798 break;
5799 default:
5800 rel->addend = (section->vma
5801 - fixp->fx_size
5802 + fixp->fx_addnumber
5803 + md_pcrel_from (fixp));
5804 break;
5808 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
5809 if (rel->howto == NULL)
5811 as_bad_where (fixp->fx_file, fixp->fx_line,
5812 _("cannot represent relocation type %s"),
5813 bfd_get_reloc_code_name (code));
5814 /* Set howto to a garbage value so that we can keep going. */
5815 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
5816 assert (rel->howto != NULL);
5819 return rel;
5823 /* Parse operands using Intel syntax. This implements a recursive descent
5824 parser based on the BNF grammar published in Appendix B of the MASM 6.1
5825 Programmer's Guide.
5827 FIXME: We do not recognize the full operand grammar defined in the MASM
5828 documentation. In particular, all the structure/union and
5829 high-level macro operands are missing.
5831 Uppercase words are terminals, lower case words are non-terminals.
5832 Objects surrounded by double brackets '[[' ']]' are optional. Vertical
5833 bars '|' denote choices. Most grammar productions are implemented in
5834 functions called 'intel_<production>'.
5836 Initial production is 'expr'.
5838 addOp + | -
5840 alpha [a-zA-Z]
5842 binOp & | AND | \| | OR | ^ | XOR
5844 byteRegister AL | AH | BL | BH | CL | CH | DL | DH
5846 constant digits [[ radixOverride ]]
5848 dataType BYTE | WORD | DWORD | FWORD | QWORD | TBYTE | OWORD | XMMWORD
5850 digits decdigit
5851 | digits decdigit
5852 | digits hexdigit
5854 decdigit [0-9]
5856 e04 e04 addOp e05
5857 | e05
5859 e05 e05 binOp e06
5860 | e06
5862 e06 e06 mulOp e09
5863 | e09
5865 e09 OFFSET e10
5866 | SHORT e10
5867 | + e10
5868 | - e10
5869 | ~ e10
5870 | NOT e10
5871 | e09 PTR e10
5872 | e09 : e10
5873 | e10
5875 e10 e10 [ expr ]
5876 | e11
5878 e11 ( expr )
5879 | [ expr ]
5880 | constant
5881 | dataType
5882 | id
5884 | register
5886 => expr expr cmpOp e04
5887 | e04
5889 gpRegister AX | EAX | BX | EBX | CX | ECX | DX | EDX
5890 | BP | EBP | SP | ESP | DI | EDI | SI | ESI
5892 hexdigit a | b | c | d | e | f
5893 | A | B | C | D | E | F
5895 id alpha
5896 | id alpha
5897 | id decdigit
5899 mulOp * | / | % | MOD | << | SHL | >> | SHR
5901 quote " | '
5903 register specialRegister
5904 | gpRegister
5905 | byteRegister
5907 segmentRegister CS | DS | ES | FS | GS | SS
5909 specialRegister CR0 | CR2 | CR3 | CR4
5910 | DR0 | DR1 | DR2 | DR3 | DR6 | DR7
5911 | TR3 | TR4 | TR5 | TR6 | TR7
5913 We simplify the grammar in obvious places (e.g., register parsing is
5914 done by calling parse_register) and eliminate immediate left recursion
5915 to implement a recursive-descent parser.
5917 expr e04 expr'
5919 expr' cmpOp e04 expr'
5920 | Empty
5922 e04 e05 e04'
5924 e04' addOp e05 e04'
5925 | Empty
5927 e05 e06 e05'
5929 e05' binOp e06 e05'
5930 | Empty
5932 e06 e09 e06'
5934 e06' mulOp e09 e06'
5935 | Empty
5937 e09 OFFSET e10 e09'
5938 | SHORT e10'
5939 | + e10'
5940 | - e10'
5941 | ~ e10'
5942 | NOT e10'
5943 | e10 e09'
5945 e09' PTR e10 e09'
5946 | : e10 e09'
5947 | Empty
5949 e10 e11 e10'
5951 e10' [ expr ] e10'
5952 | Empty
5954 e11 ( expr )
5955 | [ expr ]
5956 | BYTE
5957 | WORD
5958 | DWORD
5959 | FWORD
5960 | QWORD
5961 | TBYTE
5962 | OWORD
5963 | XMMWORD
5966 | register
5967 | id
5968 | constant */
5970 /* Parsing structure for the intel syntax parser. Used to implement the
5971 semantic actions for the operand grammar. */
5972 struct intel_parser_s
5974 char *op_string; /* The string being parsed. */
5975 int got_a_float; /* Whether the operand is a float. */
5976 int op_modifier; /* Operand modifier. */
5977 int is_mem; /* 1 if operand is memory reference. */
5978 int in_offset; /* >=1 if parsing operand of offset. */
5979 int in_bracket; /* >=1 if parsing operand in brackets. */
5980 const reg_entry *reg; /* Last register reference found. */
5981 char *disp; /* Displacement string being built. */
5982 char *next_operand; /* Resume point when splitting operands. */
5985 static struct intel_parser_s intel_parser;
5987 /* Token structure for parsing intel syntax. */
5988 struct intel_token
5990 int code; /* Token code. */
5991 const reg_entry *reg; /* Register entry for register tokens. */
5992 char *str; /* String representation. */
5995 static struct intel_token cur_token, prev_token;
5997 /* Token codes for the intel parser. Since T_SHORT is already used
5998 by COFF, undefine it first to prevent a warning. */
5999 #define T_NIL -1
6000 #define T_CONST 1
6001 #define T_REG 2
6002 #define T_BYTE 3
6003 #define T_WORD 4
6004 #define T_DWORD 5
6005 #define T_FWORD 6
6006 #define T_QWORD 7
6007 #define T_TBYTE 8
6008 #define T_XMMWORD 9
6009 #undef T_SHORT
6010 #define T_SHORT 10
6011 #define T_OFFSET 11
6012 #define T_PTR 12
6013 #define T_ID 13
6014 #define T_SHL 14
6015 #define T_SHR 15
6017 /* Prototypes for intel parser functions. */
6018 static int intel_match_token PARAMS ((int code));
6019 static void intel_get_token PARAMS ((void));
6020 static void intel_putback_token PARAMS ((void));
6021 static int intel_expr PARAMS ((void));
6022 static int intel_e04 PARAMS ((void));
6023 static int intel_e05 PARAMS ((void));
6024 static int intel_e06 PARAMS ((void));
6025 static int intel_e09 PARAMS ((void));
6026 static int intel_bracket_expr PARAMS ((void));
6027 static int intel_e10 PARAMS ((void));
6028 static int intel_e11 PARAMS ((void));
6030 static int
6031 i386_intel_operand (operand_string, got_a_float)
6032 char *operand_string;
6033 int got_a_float;
6035 int ret;
6036 char *p;
6038 p = intel_parser.op_string = xstrdup (operand_string);
6039 intel_parser.disp = (char *) xmalloc (strlen (operand_string) + 1);
6041 for (;;)
6043 /* Initialize token holders. */
6044 cur_token.code = prev_token.code = T_NIL;
6045 cur_token.reg = prev_token.reg = NULL;
6046 cur_token.str = prev_token.str = NULL;
6048 /* Initialize parser structure. */
6049 intel_parser.got_a_float = got_a_float;
6050 intel_parser.op_modifier = 0;
6051 intel_parser.is_mem = 0;
6052 intel_parser.in_offset = 0;
6053 intel_parser.in_bracket = 0;
6054 intel_parser.reg = NULL;
6055 intel_parser.disp[0] = '\0';
6056 intel_parser.next_operand = NULL;
6058 /* Read the first token and start the parser. */
6059 intel_get_token ();
6060 ret = intel_expr ();
6062 if (!ret)
6063 break;
6065 if (cur_token.code != T_NIL)
6067 as_bad (_("invalid operand for '%s' ('%s' unexpected)"),
6068 current_templates->start->name, cur_token.str);
6069 ret = 0;
6071 /* If we found a memory reference, hand it over to i386_displacement
6072 to fill in the rest of the operand fields. */
6073 else if (intel_parser.is_mem)
6075 if ((i.mem_operands == 1
6076 && (current_templates->start->opcode_modifier & IsString) == 0)
6077 || i.mem_operands == 2)
6079 as_bad (_("too many memory references for '%s'"),
6080 current_templates->start->name);
6081 ret = 0;
6083 else
6085 char *s = intel_parser.disp;
6086 i.mem_operands++;
6088 if (!quiet_warnings && intel_parser.is_mem < 0)
6089 /* See the comments in intel_bracket_expr. */
6090 as_warn (_("Treating `%s' as memory reference"), operand_string);
6092 /* Add the displacement expression. */
6093 if (*s != '\0')
6094 ret = i386_displacement (s, s + strlen (s));
6095 if (ret)
6097 /* Swap base and index in 16-bit memory operands like
6098 [si+bx]. Since i386_index_check is also used in AT&T
6099 mode we have to do that here. */
6100 if (i.base_reg
6101 && i.index_reg
6102 && (i.base_reg->reg_type & Reg16)
6103 && (i.index_reg->reg_type & Reg16)
6104 && i.base_reg->reg_num >= 6
6105 && i.index_reg->reg_num < 6)
6107 const reg_entry *base = i.index_reg;
6109 i.index_reg = i.base_reg;
6110 i.base_reg = base;
6112 ret = i386_index_check (operand_string);
6117 /* Constant and OFFSET expressions are handled by i386_immediate. */
6118 else if ((intel_parser.op_modifier & (1 << T_OFFSET))
6119 || intel_parser.reg == NULL)
6120 ret = i386_immediate (intel_parser.disp);
6122 if (intel_parser.next_operand && this_operand >= MAX_OPERANDS - 1)
6123 ret = 0;
6124 if (!ret || !intel_parser.next_operand)
6125 break;
6126 intel_parser.op_string = intel_parser.next_operand;
6127 this_operand = i.operands++;
6130 free (p);
6131 free (intel_parser.disp);
6133 return ret;
6136 #define NUM_ADDRESS_REGS (!!i.base_reg + !!i.index_reg)
6138 /* expr e04 expr'
6140 expr' cmpOp e04 expr'
6141 | Empty */
6142 static int
6143 intel_expr ()
6145 /* XXX Implement the comparison operators. */
6146 return intel_e04 ();
6149 /* e04 e05 e04'
6151 e04' addOp e05 e04'
6152 | Empty */
6153 static int
6154 intel_e04 ()
6156 int nregs = -1;
6158 for (;;)
6160 if (!intel_e05())
6161 return 0;
6163 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6164 i.base_reg = i386_regtab + REGNAM_AL; /* al is invalid as base */
6166 if (cur_token.code == '+')
6167 nregs = -1;
6168 else if (cur_token.code == '-')
6169 nregs = NUM_ADDRESS_REGS;
6170 else
6171 return 1;
6173 strcat (intel_parser.disp, cur_token.str);
6174 intel_match_token (cur_token.code);
6178 /* e05 e06 e05'
6180 e05' binOp e06 e05'
6181 | Empty */
6182 static int
6183 intel_e05 ()
6185 int nregs = ~NUM_ADDRESS_REGS;
6187 for (;;)
6189 if (!intel_e06())
6190 return 0;
6192 if (cur_token.code == '&' || cur_token.code == '|' || cur_token.code == '^')
6194 char str[2];
6196 str[0] = cur_token.code;
6197 str[1] = 0;
6198 strcat (intel_parser.disp, str);
6200 else
6201 break;
6203 intel_match_token (cur_token.code);
6205 if (nregs < 0)
6206 nregs = ~nregs;
6208 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6209 i.base_reg = i386_regtab + REGNAM_AL + 1; /* cl is invalid as base */
6210 return 1;
6213 /* e06 e09 e06'
6215 e06' mulOp e09 e06'
6216 | Empty */
6217 static int
6218 intel_e06 ()
6220 int nregs = ~NUM_ADDRESS_REGS;
6222 for (;;)
6224 if (!intel_e09())
6225 return 0;
6227 if (cur_token.code == '*' || cur_token.code == '/' || cur_token.code == '%')
6229 char str[2];
6231 str[0] = cur_token.code;
6232 str[1] = 0;
6233 strcat (intel_parser.disp, str);
6235 else if (cur_token.code == T_SHL)
6236 strcat (intel_parser.disp, "<<");
6237 else if (cur_token.code == T_SHR)
6238 strcat (intel_parser.disp, ">>");
6239 else
6240 break;
6242 intel_match_token (cur_token.code);
6244 if (nregs < 0)
6245 nregs = ~nregs;
6247 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6248 i.base_reg = i386_regtab + REGNAM_AL + 2; /* dl is invalid as base */
6249 return 1;
6252 /* e09 OFFSET e09
6253 | SHORT e09
6254 | + e09
6255 | - e09
6256 | ~ e09
6257 | NOT e09
6258 | e10 e09'
6260 e09' PTR e10 e09'
6261 | : e10 e09'
6262 | Empty */
6263 static int
6264 intel_e09 ()
6266 int nregs = ~NUM_ADDRESS_REGS;
6267 int in_offset = 0;
6269 for (;;)
6271 /* Don't consume constants here. */
6272 if (cur_token.code == '+' || cur_token.code == '-')
6274 /* Need to look one token ahead - if the next token
6275 is a constant, the current token is its sign. */
6276 int next_code;
6278 intel_match_token (cur_token.code);
6279 next_code = cur_token.code;
6280 intel_putback_token ();
6281 if (next_code == T_CONST)
6282 break;
6285 /* e09 OFFSET e09 */
6286 if (cur_token.code == T_OFFSET)
6288 if (!in_offset++)
6289 ++intel_parser.in_offset;
6292 /* e09 SHORT e09 */
6293 else if (cur_token.code == T_SHORT)
6294 intel_parser.op_modifier |= 1 << T_SHORT;
6296 /* e09 + e09 */
6297 else if (cur_token.code == '+')
6298 strcat (intel_parser.disp, "+");
6300 /* e09 - e09
6301 | ~ e09
6302 | NOT e09 */
6303 else if (cur_token.code == '-' || cur_token.code == '~')
6305 char str[2];
6307 if (nregs < 0)
6308 nregs = ~nregs;
6309 str[0] = cur_token.code;
6310 str[1] = 0;
6311 strcat (intel_parser.disp, str);
6314 /* e09 e10 e09' */
6315 else
6316 break;
6318 intel_match_token (cur_token.code);
6321 for (;;)
6323 if (!intel_e10 ())
6324 return 0;
6326 /* e09' PTR e10 e09' */
6327 if (cur_token.code == T_PTR)
6329 char suffix;
6331 if (prev_token.code == T_BYTE)
6332 suffix = BYTE_MNEM_SUFFIX;
6334 else if (prev_token.code == T_WORD)
6336 if (current_templates->start->name[0] == 'l'
6337 && current_templates->start->name[2] == 's'
6338 && current_templates->start->name[3] == 0)
6339 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6340 else if (intel_parser.got_a_float == 2) /* "fi..." */
6341 suffix = SHORT_MNEM_SUFFIX;
6342 else
6343 suffix = WORD_MNEM_SUFFIX;
6346 else if (prev_token.code == T_DWORD)
6348 if (current_templates->start->name[0] == 'l'
6349 && current_templates->start->name[2] == 's'
6350 && current_templates->start->name[3] == 0)
6351 suffix = WORD_MNEM_SUFFIX;
6352 else if (flag_code == CODE_16BIT
6353 && (current_templates->start->opcode_modifier
6354 & (Jump | JumpDword)))
6355 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6356 else if (intel_parser.got_a_float == 1) /* "f..." */
6357 suffix = SHORT_MNEM_SUFFIX;
6358 else
6359 suffix = LONG_MNEM_SUFFIX;
6362 else if (prev_token.code == T_FWORD)
6364 if (current_templates->start->name[0] == 'l'
6365 && current_templates->start->name[2] == 's'
6366 && current_templates->start->name[3] == 0)
6367 suffix = LONG_MNEM_SUFFIX;
6368 else if (!intel_parser.got_a_float)
6370 if (flag_code == CODE_16BIT)
6371 add_prefix (DATA_PREFIX_OPCODE);
6372 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6374 else
6375 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6378 else if (prev_token.code == T_QWORD)
6380 if (intel_parser.got_a_float == 1) /* "f..." */
6381 suffix = LONG_MNEM_SUFFIX;
6382 else
6383 suffix = QWORD_MNEM_SUFFIX;
6386 else if (prev_token.code == T_TBYTE)
6388 if (intel_parser.got_a_float == 1)
6389 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6390 else
6391 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6394 else if (prev_token.code == T_XMMWORD)
6396 /* XXX ignored for now, but accepted since gcc uses it */
6397 suffix = 0;
6400 else
6402 as_bad (_("Unknown operand modifier `%s'"), prev_token.str);
6403 return 0;
6406 /* Operands for jump/call using 'ptr' notation denote absolute
6407 addresses. */
6408 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6409 i.types[this_operand] |= JumpAbsolute;
6411 if (current_templates->start->base_opcode == 0x8d /* lea */)
6413 else if (!i.suffix)
6414 i.suffix = suffix;
6415 else if (i.suffix != suffix)
6417 as_bad (_("Conflicting operand modifiers"));
6418 return 0;
6423 /* e09' : e10 e09' */
6424 else if (cur_token.code == ':')
6426 if (prev_token.code != T_REG)
6428 /* While {call,jmp} SSSS:OOOO is MASM syntax only when SSSS is a
6429 segment/group identifier (which we don't have), using comma
6430 as the operand separator there is even less consistent, since
6431 there all branches only have a single operand. */
6432 if (this_operand != 0
6433 || intel_parser.in_offset
6434 || intel_parser.in_bracket
6435 || (!(current_templates->start->opcode_modifier
6436 & (Jump|JumpDword|JumpInterSegment))
6437 && !(current_templates->start->operand_types[0]
6438 & JumpAbsolute)))
6439 return intel_match_token (T_NIL);
6440 /* Remember the start of the 2nd operand and terminate 1st
6441 operand here.
6442 XXX This isn't right, yet (when SSSS:OOOO is right operand of
6443 another expression), but it gets at least the simplest case
6444 (a plain number or symbol on the left side) right. */
6445 intel_parser.next_operand = intel_parser.op_string;
6446 *--intel_parser.op_string = '\0';
6447 return intel_match_token (':');
6451 /* e09' Empty */
6452 else
6453 break;
6455 intel_match_token (cur_token.code);
6459 if (in_offset)
6461 --intel_parser.in_offset;
6462 if (nregs < 0)
6463 nregs = ~nregs;
6464 if (NUM_ADDRESS_REGS > nregs)
6466 as_bad (_("Invalid operand to `OFFSET'"));
6467 return 0;
6469 intel_parser.op_modifier |= 1 << T_OFFSET;
6472 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6473 i.base_reg = i386_regtab + REGNAM_AL + 3; /* bl is invalid as base */
6474 return 1;
6477 static int
6478 intel_bracket_expr ()
6480 int was_offset = intel_parser.op_modifier & (1 << T_OFFSET);
6481 const char *start = intel_parser.op_string;
6482 int len;
6484 if (i.op[this_operand].regs)
6485 return intel_match_token (T_NIL);
6487 intel_match_token ('[');
6489 /* Mark as a memory operand only if it's not already known to be an
6490 offset expression. If it's an offset expression, we need to keep
6491 the brace in. */
6492 if (!intel_parser.in_offset)
6494 ++intel_parser.in_bracket;
6496 /* Operands for jump/call inside brackets denote absolute addresses. */
6497 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6498 i.types[this_operand] |= JumpAbsolute;
6500 /* Unfortunately gas always diverged from MASM in a respect that can't
6501 be easily fixed without risking to break code sequences likely to be
6502 encountered (the testsuite even check for this): MASM doesn't consider
6503 an expression inside brackets unconditionally as a memory reference.
6504 When that is e.g. a constant, an offset expression, or the sum of the
6505 two, this is still taken as a constant load. gas, however, always
6506 treated these as memory references. As a compromise, we'll try to make
6507 offset expressions inside brackets work the MASM way (since that's
6508 less likely to be found in real world code), but make constants alone
6509 continue to work the traditional gas way. In either case, issue a
6510 warning. */
6511 intel_parser.op_modifier &= ~was_offset;
6513 else
6514 strcat (intel_parser.disp, "[");
6516 /* Add a '+' to the displacement string if necessary. */
6517 if (*intel_parser.disp != '\0'
6518 && *(intel_parser.disp + strlen (intel_parser.disp) - 1) != '+')
6519 strcat (intel_parser.disp, "+");
6521 if (intel_expr ()
6522 && (len = intel_parser.op_string - start - 1,
6523 intel_match_token (']')))
6525 /* Preserve brackets when the operand is an offset expression. */
6526 if (intel_parser.in_offset)
6527 strcat (intel_parser.disp, "]");
6528 else
6530 --intel_parser.in_bracket;
6531 if (i.base_reg || i.index_reg)
6532 intel_parser.is_mem = 1;
6533 if (!intel_parser.is_mem)
6535 if (!(intel_parser.op_modifier & (1 << T_OFFSET)))
6536 /* Defer the warning until all of the operand was parsed. */
6537 intel_parser.is_mem = -1;
6538 else if (!quiet_warnings)
6539 as_warn (_("`[%.*s]' taken to mean just `%.*s'"), len, start, len, start);
6542 intel_parser.op_modifier |= was_offset;
6544 return 1;
6546 return 0;
6549 /* e10 e11 e10'
6551 e10' [ expr ] e10'
6552 | Empty */
6553 static int
6554 intel_e10 ()
6556 if (!intel_e11 ())
6557 return 0;
6559 while (cur_token.code == '[')
6561 if (!intel_bracket_expr ())
6562 return 0;
6565 return 1;
6568 /* e11 ( expr )
6569 | [ expr ]
6570 | BYTE
6571 | WORD
6572 | DWORD
6573 | FWORD
6574 | QWORD
6575 | TBYTE
6576 | OWORD
6577 | XMMWORD
6580 | register
6581 | id
6582 | constant */
6583 static int
6584 intel_e11 ()
6586 switch (cur_token.code)
6588 /* e11 ( expr ) */
6589 case '(':
6590 intel_match_token ('(');
6591 strcat (intel_parser.disp, "(");
6593 if (intel_expr () && intel_match_token (')'))
6595 strcat (intel_parser.disp, ")");
6596 return 1;
6598 return 0;
6600 /* e11 [ expr ] */
6601 case '[':
6602 return intel_bracket_expr ();
6604 /* e11 $
6605 | . */
6606 case '.':
6607 strcat (intel_parser.disp, cur_token.str);
6608 intel_match_token (cur_token.code);
6610 /* Mark as a memory operand only if it's not already known to be an
6611 offset expression. */
6612 if (!intel_parser.in_offset)
6613 intel_parser.is_mem = 1;
6615 return 1;
6617 /* e11 register */
6618 case T_REG:
6620 const reg_entry *reg = intel_parser.reg = cur_token.reg;
6622 intel_match_token (T_REG);
6624 /* Check for segment change. */
6625 if (cur_token.code == ':')
6627 if (!(reg->reg_type & (SReg2 | SReg3)))
6629 as_bad (_("`%s' is not a valid segment register"), reg->reg_name);
6630 return 0;
6632 else if (i.seg[i.mem_operands])
6633 as_warn (_("Extra segment override ignored"));
6634 else
6636 if (!intel_parser.in_offset)
6637 intel_parser.is_mem = 1;
6638 switch (reg->reg_num)
6640 case 0:
6641 i.seg[i.mem_operands] = &es;
6642 break;
6643 case 1:
6644 i.seg[i.mem_operands] = &cs;
6645 break;
6646 case 2:
6647 i.seg[i.mem_operands] = &ss;
6648 break;
6649 case 3:
6650 i.seg[i.mem_operands] = &ds;
6651 break;
6652 case 4:
6653 i.seg[i.mem_operands] = &fs;
6654 break;
6655 case 5:
6656 i.seg[i.mem_operands] = &gs;
6657 break;
6662 /* Not a segment register. Check for register scaling. */
6663 else if (cur_token.code == '*')
6665 if (!intel_parser.in_bracket)
6667 as_bad (_("Register scaling only allowed in memory operands"));
6668 return 0;
6671 if (reg->reg_type & Reg16) /* Disallow things like [si*1]. */
6672 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6673 else if (i.index_reg)
6674 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6676 /* What follows must be a valid scale. */
6677 intel_match_token ('*');
6678 i.index_reg = reg;
6679 i.types[this_operand] |= BaseIndex;
6681 /* Set the scale after setting the register (otherwise,
6682 i386_scale will complain) */
6683 if (cur_token.code == '+' || cur_token.code == '-')
6685 char *str, sign = cur_token.code;
6686 intel_match_token (cur_token.code);
6687 if (cur_token.code != T_CONST)
6689 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6690 cur_token.str);
6691 return 0;
6693 str = (char *) xmalloc (strlen (cur_token.str) + 2);
6694 strcpy (str + 1, cur_token.str);
6695 *str = sign;
6696 if (!i386_scale (str))
6697 return 0;
6698 free (str);
6700 else if (!i386_scale (cur_token.str))
6701 return 0;
6702 intel_match_token (cur_token.code);
6705 /* No scaling. If this is a memory operand, the register is either a
6706 base register (first occurrence) or an index register (second
6707 occurrence). */
6708 else if (intel_parser.in_bracket)
6711 if (!i.base_reg)
6712 i.base_reg = reg;
6713 else if (!i.index_reg)
6714 i.index_reg = reg;
6715 else
6717 as_bad (_("Too many register references in memory operand"));
6718 return 0;
6721 i.types[this_operand] |= BaseIndex;
6724 /* It's neither base nor index. */
6725 else if (!intel_parser.in_offset && !intel_parser.is_mem)
6727 i.types[this_operand] |= reg->reg_type & ~BaseIndex;
6728 i.op[this_operand].regs = reg;
6729 i.reg_operands++;
6731 else
6733 as_bad (_("Invalid use of register"));
6734 return 0;
6737 /* Since registers are not part of the displacement string (except
6738 when we're parsing offset operands), we may need to remove any
6739 preceding '+' from the displacement string. */
6740 if (*intel_parser.disp != '\0'
6741 && !intel_parser.in_offset)
6743 char *s = intel_parser.disp;
6744 s += strlen (s) - 1;
6745 if (*s == '+')
6746 *s = '\0';
6749 return 1;
6752 /* e11 BYTE
6753 | WORD
6754 | DWORD
6755 | FWORD
6756 | QWORD
6757 | TBYTE
6758 | OWORD
6759 | XMMWORD */
6760 case T_BYTE:
6761 case T_WORD:
6762 case T_DWORD:
6763 case T_FWORD:
6764 case T_QWORD:
6765 case T_TBYTE:
6766 case T_XMMWORD:
6767 intel_match_token (cur_token.code);
6769 if (cur_token.code == T_PTR)
6770 return 1;
6772 /* It must have been an identifier. */
6773 intel_putback_token ();
6774 cur_token.code = T_ID;
6775 /* FALLTHRU */
6777 /* e11 id
6778 | constant */
6779 case T_ID:
6780 if (!intel_parser.in_offset && intel_parser.is_mem <= 0)
6782 symbolS *symbolP;
6784 /* The identifier represents a memory reference only if it's not
6785 preceded by an offset modifier and if it's not an equate. */
6786 symbolP = symbol_find(cur_token.str);
6787 if (!symbolP || S_GET_SEGMENT(symbolP) != absolute_section)
6788 intel_parser.is_mem = 1;
6790 /* FALLTHRU */
6792 case T_CONST:
6793 case '-':
6794 case '+':
6796 char *save_str, sign = 0;
6798 /* Allow constants that start with `+' or `-'. */
6799 if (cur_token.code == '-' || cur_token.code == '+')
6801 sign = cur_token.code;
6802 intel_match_token (cur_token.code);
6803 if (cur_token.code != T_CONST)
6805 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6806 cur_token.str);
6807 return 0;
6811 save_str = (char *) xmalloc (strlen (cur_token.str) + 2);
6812 strcpy (save_str + !!sign, cur_token.str);
6813 if (sign)
6814 *save_str = sign;
6816 /* Get the next token to check for register scaling. */
6817 intel_match_token (cur_token.code);
6819 /* Check if this constant is a scaling factor for an index register. */
6820 if (cur_token.code == '*')
6822 if (intel_match_token ('*') && cur_token.code == T_REG)
6824 const reg_entry *reg = cur_token.reg;
6826 if (!intel_parser.in_bracket)
6828 as_bad (_("Register scaling only allowed in memory operands"));
6829 return 0;
6832 if (reg->reg_type & Reg16) /* Disallow things like [1*si]. */
6833 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6834 else if (i.index_reg)
6835 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6837 /* The constant is followed by `* reg', so it must be
6838 a valid scale. */
6839 i.index_reg = reg;
6840 i.types[this_operand] |= BaseIndex;
6842 /* Set the scale after setting the register (otherwise,
6843 i386_scale will complain) */
6844 if (!i386_scale (save_str))
6845 return 0;
6846 intel_match_token (T_REG);
6848 /* Since registers are not part of the displacement
6849 string, we may need to remove any preceding '+' from
6850 the displacement string. */
6851 if (*intel_parser.disp != '\0')
6853 char *s = intel_parser.disp;
6854 s += strlen (s) - 1;
6855 if (*s == '+')
6856 *s = '\0';
6859 free (save_str);
6861 return 1;
6864 /* The constant was not used for register scaling. Since we have
6865 already consumed the token following `*' we now need to put it
6866 back in the stream. */
6867 intel_putback_token ();
6870 /* Add the constant to the displacement string. */
6871 strcat (intel_parser.disp, save_str);
6872 free (save_str);
6874 return 1;
6878 as_bad (_("Unrecognized token '%s'"), cur_token.str);
6879 return 0;
6882 /* Match the given token against cur_token. If they match, read the next
6883 token from the operand string. */
6884 static int
6885 intel_match_token (code)
6886 int code;
6888 if (cur_token.code == code)
6890 intel_get_token ();
6891 return 1;
6893 else
6895 as_bad (_("Unexpected token `%s'"), cur_token.str);
6896 return 0;
6900 /* Read a new token from intel_parser.op_string and store it in cur_token. */
6901 static void
6902 intel_get_token ()
6904 char *end_op;
6905 const reg_entry *reg;
6906 struct intel_token new_token;
6908 new_token.code = T_NIL;
6909 new_token.reg = NULL;
6910 new_token.str = NULL;
6912 /* Free the memory allocated to the previous token and move
6913 cur_token to prev_token. */
6914 if (prev_token.str)
6915 free (prev_token.str);
6917 prev_token = cur_token;
6919 /* Skip whitespace. */
6920 while (is_space_char (*intel_parser.op_string))
6921 intel_parser.op_string++;
6923 /* Return an empty token if we find nothing else on the line. */
6924 if (*intel_parser.op_string == '\0')
6926 cur_token = new_token;
6927 return;
6930 /* The new token cannot be larger than the remainder of the operand
6931 string. */
6932 new_token.str = (char *) xmalloc (strlen (intel_parser.op_string) + 1);
6933 new_token.str[0] = '\0';
6935 if (strchr ("0123456789", *intel_parser.op_string))
6937 char *p = new_token.str;
6938 char *q = intel_parser.op_string;
6939 new_token.code = T_CONST;
6941 /* Allow any kind of identifier char to encompass floating point and
6942 hexadecimal numbers. */
6943 while (is_identifier_char (*q))
6944 *p++ = *q++;
6945 *p = '\0';
6947 /* Recognize special symbol names [0-9][bf]. */
6948 if (strlen (intel_parser.op_string) == 2
6949 && (intel_parser.op_string[1] == 'b'
6950 || intel_parser.op_string[1] == 'f'))
6951 new_token.code = T_ID;
6954 else if ((reg = parse_register (intel_parser.op_string, &end_op)) != NULL)
6956 size_t len = end_op - intel_parser.op_string;
6958 new_token.code = T_REG;
6959 new_token.reg = reg;
6961 memcpy (new_token.str, intel_parser.op_string, len);
6962 new_token.str[len] = '\0';
6965 else if (is_identifier_char (*intel_parser.op_string))
6967 char *p = new_token.str;
6968 char *q = intel_parser.op_string;
6970 /* A '.' or '$' followed by an identifier char is an identifier.
6971 Otherwise, it's operator '.' followed by an expression. */
6972 if ((*q == '.' || *q == '$') && !is_identifier_char (*(q + 1)))
6974 new_token.code = '.';
6975 new_token.str[0] = '.';
6976 new_token.str[1] = '\0';
6978 else
6980 while (is_identifier_char (*q) || *q == '@')
6981 *p++ = *q++;
6982 *p = '\0';
6984 if (strcasecmp (new_token.str, "NOT") == 0)
6985 new_token.code = '~';
6987 else if (strcasecmp (new_token.str, "MOD") == 0)
6988 new_token.code = '%';
6990 else if (strcasecmp (new_token.str, "AND") == 0)
6991 new_token.code = '&';
6993 else if (strcasecmp (new_token.str, "OR") == 0)
6994 new_token.code = '|';
6996 else if (strcasecmp (new_token.str, "XOR") == 0)
6997 new_token.code = '^';
6999 else if (strcasecmp (new_token.str, "SHL") == 0)
7000 new_token.code = T_SHL;
7002 else if (strcasecmp (new_token.str, "SHR") == 0)
7003 new_token.code = T_SHR;
7005 else if (strcasecmp (new_token.str, "BYTE") == 0)
7006 new_token.code = T_BYTE;
7008 else if (strcasecmp (new_token.str, "WORD") == 0)
7009 new_token.code = T_WORD;
7011 else if (strcasecmp (new_token.str, "DWORD") == 0)
7012 new_token.code = T_DWORD;
7014 else if (strcasecmp (new_token.str, "FWORD") == 0)
7015 new_token.code = T_FWORD;
7017 else if (strcasecmp (new_token.str, "QWORD") == 0)
7018 new_token.code = T_QWORD;
7020 else if (strcasecmp (new_token.str, "TBYTE") == 0
7021 /* XXX remove (gcc still uses it) */
7022 || strcasecmp (new_token.str, "XWORD") == 0)
7023 new_token.code = T_TBYTE;
7025 else if (strcasecmp (new_token.str, "XMMWORD") == 0
7026 || strcasecmp (new_token.str, "OWORD") == 0)
7027 new_token.code = T_XMMWORD;
7029 else if (strcasecmp (new_token.str, "PTR") == 0)
7030 new_token.code = T_PTR;
7032 else if (strcasecmp (new_token.str, "SHORT") == 0)
7033 new_token.code = T_SHORT;
7035 else if (strcasecmp (new_token.str, "OFFSET") == 0)
7037 new_token.code = T_OFFSET;
7039 /* ??? This is not mentioned in the MASM grammar but gcc
7040 makes use of it with -mintel-syntax. OFFSET may be
7041 followed by FLAT: */
7042 if (strncasecmp (q, " FLAT:", 6) == 0)
7043 strcat (new_token.str, " FLAT:");
7046 /* ??? This is not mentioned in the MASM grammar. */
7047 else if (strcasecmp (new_token.str, "FLAT") == 0)
7049 new_token.code = T_OFFSET;
7050 if (*q == ':')
7051 strcat (new_token.str, ":");
7052 else
7053 as_bad (_("`:' expected"));
7056 else
7057 new_token.code = T_ID;
7061 else if (strchr ("+-/*%|&^:[]()~", *intel_parser.op_string))
7063 new_token.code = *intel_parser.op_string;
7064 new_token.str[0] = *intel_parser.op_string;
7065 new_token.str[1] = '\0';
7068 else if (strchr ("<>", *intel_parser.op_string)
7069 && *intel_parser.op_string == *(intel_parser.op_string + 1))
7071 new_token.code = *intel_parser.op_string == '<' ? T_SHL : T_SHR;
7072 new_token.str[0] = *intel_parser.op_string;
7073 new_token.str[1] = *intel_parser.op_string;
7074 new_token.str[2] = '\0';
7077 else
7078 as_bad (_("Unrecognized token `%s'"), intel_parser.op_string);
7080 intel_parser.op_string += strlen (new_token.str);
7081 cur_token = new_token;
7084 /* Put cur_token back into the token stream and make cur_token point to
7085 prev_token. */
7086 static void
7087 intel_putback_token ()
7089 if (cur_token.code != T_NIL)
7091 intel_parser.op_string -= strlen (cur_token.str);
7092 free (cur_token.str);
7094 cur_token = prev_token;
7096 /* Forget prev_token. */
7097 prev_token.code = T_NIL;
7098 prev_token.reg = NULL;
7099 prev_token.str = NULL;
7103 tc_x86_regname_to_dw2regnum (const char *regname)
7105 unsigned int regnum;
7106 unsigned int regnames_count;
7107 static const char *const regnames_32[] =
7109 "eax", "ecx", "edx", "ebx",
7110 "esp", "ebp", "esi", "edi",
7111 "eip", "eflags", NULL,
7112 "st0", "st1", "st2", "st3",
7113 "st4", "st5", "st6", "st7",
7114 NULL, NULL,
7115 "xmm0", "xmm1", "xmm2", "xmm3",
7116 "xmm4", "xmm5", "xmm6", "xmm7",
7117 "mm0", "mm1", "mm2", "mm3",
7118 "mm4", "mm5", "mm6", "mm7",
7119 "fcw", "fsw", "mxcsr",
7120 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7121 "tr", "ldtr"
7123 static const char *const regnames_64[] =
7125 "rax", "rdx", "rcx", "rbx",
7126 "rsi", "rdi", "rbp", "rsp",
7127 "r8", "r9", "r10", "r11",
7128 "r12", "r13", "r14", "r15",
7129 "rip",
7130 "xmm0", "xmm1", "xmm2", "xmm3",
7131 "xmm4", "xmm5", "xmm6", "xmm7",
7132 "xmm8", "xmm9", "xmm10", "xmm11",
7133 "xmm12", "xmm13", "xmm14", "xmm15",
7134 "st0", "st1", "st2", "st3",
7135 "st4", "st5", "st6", "st7",
7136 "mm0", "mm1", "mm2", "mm3",
7137 "mm4", "mm5", "mm6", "mm7",
7138 "rflags",
7139 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7140 "fs.base", "gs.base", NULL, NULL,
7141 "tr", "ldtr",
7142 "mxcsr", "fcw", "fsw"
7144 const char *const *regnames;
7146 if (flag_code == CODE_64BIT)
7148 regnames = regnames_64;
7149 regnames_count = ARRAY_SIZE (regnames_64);
7151 else
7153 regnames = regnames_32;
7154 regnames_count = ARRAY_SIZE (regnames_32);
7157 for (regnum = 0; regnum < regnames_count; regnum++)
7158 if (regnames[regnum] != NULL
7159 && strcmp (regname, regnames[regnum]) == 0)
7160 return regnum;
7162 return -1;
7165 void
7166 tc_x86_frame_initial_instructions (void)
7168 static unsigned int sp_regno;
7170 if (!sp_regno)
7171 sp_regno = tc_x86_regname_to_dw2regnum (flag_code == CODE_64BIT
7172 ? "rsp" : "esp");
7174 cfi_add_CFA_def_cfa (sp_regno, -x86_cie_data_alignment);
7175 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
7179 i386_elf_section_type (const char *str, size_t len)
7181 if (flag_code == CODE_64BIT
7182 && len == sizeof ("unwind") - 1
7183 && strncmp (str, "unwind", 6) == 0)
7184 return SHT_X86_64_UNWIND;
7186 return -1;
7189 #ifdef TE_PE
7190 void
7191 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
7193 expressionS expr;
7195 expr.X_op = O_secrel;
7196 expr.X_add_symbol = symbol;
7197 expr.X_add_number = 0;
7198 emit_expr (&expr, size);
7200 #endif
7202 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7203 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
7206 x86_64_section_letter (int letter, char **ptr_msg)
7208 if (flag_code == CODE_64BIT)
7210 if (letter == 'l')
7211 return SHF_X86_64_LARGE;
7213 *ptr_msg = _("Bad .section directive: want a,l,w,x,M,S,G,T in string");
7215 else
7216 *ptr_msg = _("Bad .section directive: want a,w,x,M,S,G,T in string");
7217 return -1;
7221 x86_64_section_word (char *str, size_t len)
7223 if (len == 5 && flag_code == CODE_64BIT && strncmp (str, "large", 5) == 0)
7224 return SHF_X86_64_LARGE;
7226 return -1;
7229 static void
7230 handle_large_common (int small ATTRIBUTE_UNUSED)
7232 if (flag_code != CODE_64BIT)
7234 s_comm_internal (0, elf_common_parse);
7235 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
7237 else
7239 static segT lbss_section;
7240 asection *saved_com_section_ptr = elf_com_section_ptr;
7241 asection *saved_bss_section = bss_section;
7243 if (lbss_section == NULL)
7245 flagword applicable;
7246 segT seg = now_seg;
7247 subsegT subseg = now_subseg;
7249 /* The .lbss section is for local .largecomm symbols. */
7250 lbss_section = subseg_new (".lbss", 0);
7251 applicable = bfd_applicable_section_flags (stdoutput);
7252 bfd_set_section_flags (stdoutput, lbss_section,
7253 applicable & SEC_ALLOC);
7254 seg_info (lbss_section)->bss = 1;
7256 subseg_set (seg, subseg);
7259 elf_com_section_ptr = &_bfd_elf_large_com_section;
7260 bss_section = lbss_section;
7262 s_comm_internal (0, elf_common_parse);
7264 elf_com_section_ptr = saved_com_section_ptr;
7265 bss_section = saved_bss_section;
7268 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */