1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010
4 Free Software Foundation, Inc.
6 This file is part of GAS, the GNU Assembler.
8 GAS is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3, or (at your option)
13 GAS is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GAS; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
23 /* Intel 80386 machine specific gas.
24 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
25 x86_64 support by Jan Hubicka (jh@suse.cz)
26 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
27 Bugs & suggestions are completely welcome. This is free software.
28 Please help us make it better. */
31 #include "safe-ctype.h"
33 #include "dwarf2dbg.h"
34 #include "dw2gencfi.h"
35 #include "elf/x86-64.h"
36 #include "opcodes/i386-init.h"
38 #ifndef REGISTER_WARNINGS
39 #define REGISTER_WARNINGS 1
42 #ifndef INFER_ADDR_PREFIX
43 #define INFER_ADDR_PREFIX 1
47 #define DEFAULT_ARCH "i386"
52 #define INLINE __inline__
58 /* Prefixes will be emitted in the order defined below.
59 WAIT_PREFIX must be the first prefix since FWAIT is really is an
60 instruction, and so must come before any prefixes.
61 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
62 REP_PREFIX, LOCK_PREFIX. */
69 #define REX_PREFIX 6 /* must come last. */
70 #define MAX_PREFIXES 7 /* max prefixes per opcode */
72 /* we define the syntax here (modulo base,index,scale syntax) */
73 #define REGISTER_PREFIX '%'
74 #define IMMEDIATE_PREFIX '$'
75 #define ABSOLUTE_PREFIX '*'
77 /* these are the instruction mnemonic suffixes in AT&T syntax or
78 memory operand size in Intel syntax. */
79 #define WORD_MNEM_SUFFIX 'w'
80 #define BYTE_MNEM_SUFFIX 'b'
81 #define SHORT_MNEM_SUFFIX 's'
82 #define LONG_MNEM_SUFFIX 'l'
83 #define QWORD_MNEM_SUFFIX 'q'
84 #define XMMWORD_MNEM_SUFFIX 'x'
85 #define YMMWORD_MNEM_SUFFIX 'y'
86 /* Intel Syntax. Use a non-ascii letter since since it never appears
88 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
90 #define END_OF_INSN '\0'
93 'templates' is for grouping together 'template' structures for opcodes
94 of the same name. This is only used for storing the insns in the grand
95 ole hash table of insns.
96 The templates themselves start at START and range up to (but not including)
101 const insn_template *start;
102 const insn_template *end;
106 /* 386 operand encoding bytes: see 386 book for details of this. */
109 unsigned int regmem; /* codes register or memory operand */
110 unsigned int reg; /* codes register operand (or extended opcode) */
111 unsigned int mode; /* how to interpret regmem & reg */
115 /* x86-64 extension prefix. */
116 typedef int rex_byte;
118 /* 386 opcode byte to code indirect addressing. */
127 /* x86 arch names, types and features */
130 const char *name; /* arch name */
131 unsigned int len; /* arch string length */
132 enum processor_type type; /* arch type */
133 i386_cpu_flags flags; /* cpu feature flags */
134 unsigned int skip; /* show_arch should skip this. */
135 unsigned int negated; /* turn off indicated flags. */
139 static void update_code_flag (int, int);
140 static void set_code_flag (int);
141 static void set_16bit_gcc_code_flag (int);
142 static void set_intel_syntax (int);
143 static void set_intel_mnemonic (int);
144 static void set_allow_index_reg (int);
145 static void set_sse_check (int);
146 static void set_cpu_arch (int);
148 static void pe_directive_secrel (int);
150 static void signed_cons (int);
151 static char *output_invalid (int c);
152 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
154 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
156 static int i386_att_operand (char *);
157 static int i386_intel_operand (char *, int);
158 static int i386_intel_simplify (expressionS *);
159 static int i386_intel_parse_name (const char *, expressionS *);
160 static const reg_entry *parse_register (char *, char **);
161 static char *parse_insn (char *, char *);
162 static char *parse_operands (char *, const char *);
163 static void swap_operands (void);
164 static void swap_2_operands (int, int);
165 static void optimize_imm (void);
166 static void optimize_disp (void);
167 static const insn_template *match_template (void);
168 static int check_string (void);
169 static int process_suffix (void);
170 static int check_byte_reg (void);
171 static int check_long_reg (void);
172 static int check_qword_reg (void);
173 static int check_word_reg (void);
174 static int finalize_imm (void);
175 static int process_operands (void);
176 static const seg_entry *build_modrm_byte (void);
177 static void output_insn (void);
178 static void output_imm (fragS *, offsetT);
179 static void output_disp (fragS *, offsetT);
181 static void s_bss (int);
183 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
184 static void handle_large_common (int small ATTRIBUTE_UNUSED);
187 static const char *default_arch = DEFAULT_ARCH;
192 /* VEX prefix is either 2 byte or 3 byte. */
193 unsigned char bytes[3];
195 /* Destination or source register specifier. */
196 const reg_entry *register_specifier;
199 /* 'md_assemble ()' gathers together information and puts it into a
206 const reg_entry *regs;
211 operand_size_mismatch,
212 operand_type_mismatch,
213 register_type_mismatch,
214 number_of_operands_mismatch,
215 invalid_instruction_suffix,
218 unsupported_with_intel_mnemonic,
225 /* TM holds the template for the insn were currently assembling. */
228 /* SUFFIX holds the instruction size suffix for byte, word, dword
229 or qword, if given. */
232 /* OPERANDS gives the number of given operands. */
233 unsigned int operands;
235 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
236 of given register, displacement, memory operands and immediate
238 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
240 /* TYPES [i] is the type (see above #defines) which tells us how to
241 use OP[i] for the corresponding operand. */
242 i386_operand_type types[MAX_OPERANDS];
244 /* Displacement expression, immediate expression, or register for each
246 union i386_op op[MAX_OPERANDS];
248 /* Flags for operands. */
249 unsigned int flags[MAX_OPERANDS];
250 #define Operand_PCrel 1
252 /* Relocation type for operand */
253 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
255 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
256 the base index byte below. */
257 const reg_entry *base_reg;
258 const reg_entry *index_reg;
259 unsigned int log2_scale_factor;
261 /* SEG gives the seg_entries of this insn. They are zero unless
262 explicit segment overrides are given. */
263 const seg_entry *seg[2];
265 /* PREFIX holds all the given prefix opcodes (usually null).
266 PREFIXES is the number of prefix opcodes. */
267 unsigned int prefixes;
268 unsigned char prefix[MAX_PREFIXES];
270 /* RM and SIB are the modrm byte and the sib byte where the
271 addressing modes of this insn are encoded. */
277 /* Swap operand in encoding. */
278 unsigned int swap_operand;
280 /* Force 32bit displacement in encoding. */
281 unsigned int disp32_encoding;
284 enum i386_error error;
287 typedef struct _i386_insn i386_insn;
289 /* List of chars besides those in app.c:symbol_chars that can start an
290 operand. Used to prevent the scrubber eating vital white-space. */
291 const char extra_symbol_chars[] = "*%-(["
300 #if (defined (TE_I386AIX) \
301 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
302 && !defined (TE_GNU) \
303 && !defined (TE_LINUX) \
304 && !defined (TE_NETWARE) \
305 && !defined (TE_FreeBSD) \
306 && !defined (TE_DragonFly) \
307 && !defined (TE_NetBSD)))
308 /* This array holds the chars that always start a comment. If the
309 pre-processor is disabled, these aren't very useful. The option
310 --divide will remove '/' from this list. */
311 const char *i386_comment_chars = "#/";
312 #define SVR4_COMMENT_CHARS 1
313 #define PREFIX_SEPARATOR '\\'
316 const char *i386_comment_chars = "#";
317 #define PREFIX_SEPARATOR '/'
320 /* This array holds the chars that only start a comment at the beginning of
321 a line. If the line seems to have the form '# 123 filename'
322 .line and .file directives will appear in the pre-processed output.
323 Note that input_file.c hand checks for '#' at the beginning of the
324 first line of the input file. This is because the compiler outputs
325 #NO_APP at the beginning of its output.
326 Also note that comments started like this one will always work if
327 '/' isn't otherwise defined. */
328 const char line_comment_chars[] = "#/";
330 const char line_separator_chars[] = ";";
332 /* Chars that can be used to separate mant from exp in floating point
334 const char EXP_CHARS[] = "eE";
336 /* Chars that mean this number is a floating point constant
339 const char FLT_CHARS[] = "fFdDxX";
341 /* Tables for lexical analysis. */
342 static char mnemonic_chars[256];
343 static char register_chars[256];
344 static char operand_chars[256];
345 static char identifier_chars[256];
346 static char digit_chars[256];
348 /* Lexical macros. */
349 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
350 #define is_operand_char(x) (operand_chars[(unsigned char) x])
351 #define is_register_char(x) (register_chars[(unsigned char) x])
352 #define is_space_char(x) ((x) == ' ')
353 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
354 #define is_digit_char(x) (digit_chars[(unsigned char) x])
356 /* All non-digit non-letter characters that may occur in an operand. */
357 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
359 /* md_assemble() always leaves the strings it's passed unaltered. To
360 effect this we maintain a stack of saved characters that we've smashed
361 with '\0's (indicating end of strings for various sub-fields of the
362 assembler instruction). */
363 static char save_stack[32];
364 static char *save_stack_p;
365 #define END_STRING_AND_SAVE(s) \
366 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
367 #define RESTORE_END_STRING(s) \
368 do { *(s) = *--save_stack_p; } while (0)
370 /* The instruction we're assembling. */
373 /* Possible templates for current insn. */
374 static const templates *current_templates;
376 /* Per instruction expressionS buffers: max displacements & immediates. */
377 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
378 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
380 /* Current operand we are working on. */
381 static int this_operand = -1;
383 /* We support four different modes. FLAG_CODE variable is used to distinguish
391 static enum flag_code flag_code;
392 static unsigned int object_64bit;
393 static unsigned int disallow_64bit_reloc;
394 static int use_rela_relocations = 0;
396 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
397 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
398 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
400 /* The ELF ABI to use. */
408 static enum x86_elf_abi x86_elf_abi = I386_ABI;
411 /* The names used to print error messages. */
412 static const char *flag_code_names[] =
419 /* 1 for intel syntax,
421 static int intel_syntax = 0;
423 /* 1 for intel mnemonic,
424 0 if att mnemonic. */
425 static int intel_mnemonic = !SYSV386_COMPAT;
427 /* 1 if support old (<= 2.8.1) versions of gcc. */
428 static int old_gcc = OLDGCC_COMPAT;
430 /* 1 if pseudo registers are permitted. */
431 static int allow_pseudo_reg = 0;
433 /* 1 if register prefix % not required. */
434 static int allow_naked_reg = 0;
436 /* 1 if pseudo index register, eiz/riz, is allowed . */
437 static int allow_index_reg = 0;
447 /* Register prefix used for error message. */
448 static const char *register_prefix = "%";
450 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
451 leave, push, and pop instructions so that gcc has the same stack
452 frame as in 32 bit mode. */
453 static char stackop_size = '\0';
455 /* Non-zero to optimize code alignment. */
456 int optimize_align_code = 1;
458 /* Non-zero to quieten some warnings. */
459 static int quiet_warnings = 0;
462 static const char *cpu_arch_name = NULL;
463 static char *cpu_sub_arch_name = NULL;
465 /* CPU feature flags. */
466 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
468 /* If we have selected a cpu we are generating instructions for. */
469 static int cpu_arch_tune_set = 0;
471 /* Cpu we are generating instructions for. */
472 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
474 /* CPU feature flags of cpu we are generating instructions for. */
475 static i386_cpu_flags cpu_arch_tune_flags;
477 /* CPU instruction set architecture used. */
478 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
480 /* CPU feature flags of instruction set architecture used. */
481 i386_cpu_flags cpu_arch_isa_flags;
483 /* If set, conditional jumps are not automatically promoted to handle
484 larger than a byte offset. */
485 static unsigned int no_cond_jump_promotion = 0;
487 /* Encode SSE instructions with VEX prefix. */
488 static unsigned int sse2avx;
490 /* Encode scalar AVX instructions with specific vector length. */
497 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
498 static symbolS *GOT_symbol;
500 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
501 unsigned int x86_dwarf2_return_column;
503 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
504 int x86_cie_data_alignment;
506 /* Interface to relax_segment.
507 There are 3 major relax states for 386 jump insns because the
508 different types of jumps add different sizes to frags when we're
509 figuring out what sort of jump to choose to reach a given label. */
512 #define UNCOND_JUMP 0
514 #define COND_JUMP86 2
519 #define SMALL16 (SMALL | CODE16)
521 #define BIG16 (BIG | CODE16)
525 #define INLINE __inline__
531 #define ENCODE_RELAX_STATE(type, size) \
532 ((relax_substateT) (((type) << 2) | (size)))
533 #define TYPE_FROM_RELAX_STATE(s) \
535 #define DISP_SIZE_FROM_RELAX_STATE(s) \
536 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
538 /* This table is used by relax_frag to promote short jumps to long
539 ones where necessary. SMALL (short) jumps may be promoted to BIG
540 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
541 don't allow a short jump in a 32 bit code segment to be promoted to
542 a 16 bit offset jump because it's slower (requires data size
543 prefix), and doesn't work, unless the destination is in the bottom
544 64k of the code segment (The top 16 bits of eip are zeroed). */
546 const relax_typeS md_relax_table[] =
549 1) most positive reach of this state,
550 2) most negative reach of this state,
551 3) how many bytes this mode will have in the variable part of the frag
552 4) which index into the table to try if we can't fit into this one. */
554 /* UNCOND_JUMP states. */
555 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
556 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
557 /* dword jmp adds 4 bytes to frag:
558 0 extra opcode bytes, 4 displacement bytes. */
560 /* word jmp adds 2 byte2 to frag:
561 0 extra opcode bytes, 2 displacement bytes. */
564 /* COND_JUMP states. */
565 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
566 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
567 /* dword conditionals adds 5 bytes to frag:
568 1 extra opcode byte, 4 displacement bytes. */
570 /* word conditionals add 3 bytes to frag:
571 1 extra opcode byte, 2 displacement bytes. */
574 /* COND_JUMP86 states. */
575 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
576 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
577 /* dword conditionals adds 5 bytes to frag:
578 1 extra opcode byte, 4 displacement bytes. */
580 /* word conditionals add 4 bytes to frag:
581 1 displacement byte and a 3 byte long branch insn. */
585 static const arch_entry cpu_arch[] =
587 /* Do not replace the first two entries - i386_target_format()
588 relies on them being there in this order. */
589 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
590 CPU_GENERIC32_FLAGS, 0, 0 },
591 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
592 CPU_GENERIC64_FLAGS, 0, 0 },
593 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
594 CPU_NONE_FLAGS, 0, 0 },
595 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
596 CPU_I186_FLAGS, 0, 0 },
597 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
598 CPU_I286_FLAGS, 0, 0 },
599 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
600 CPU_I386_FLAGS, 0, 0 },
601 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
602 CPU_I486_FLAGS, 0, 0 },
603 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
604 CPU_I586_FLAGS, 0, 0 },
605 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
606 CPU_I686_FLAGS, 0, 0 },
607 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
608 CPU_I586_FLAGS, 0, 0 },
609 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
610 CPU_PENTIUMPRO_FLAGS, 0, 0 },
611 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
612 CPU_P2_FLAGS, 0, 0 },
613 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
614 CPU_P3_FLAGS, 0, 0 },
615 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
616 CPU_P4_FLAGS, 0, 0 },
617 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
618 CPU_CORE_FLAGS, 0, 0 },
619 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
620 CPU_NOCONA_FLAGS, 0, 0 },
621 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
622 CPU_CORE_FLAGS, 1, 0 },
623 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
624 CPU_CORE_FLAGS, 0, 0 },
625 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
626 CPU_CORE2_FLAGS, 1, 0 },
627 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
628 CPU_CORE2_FLAGS, 0, 0 },
629 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
630 CPU_COREI7_FLAGS, 0, 0 },
631 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
632 CPU_L1OM_FLAGS, 0, 0 },
633 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
634 CPU_K6_FLAGS, 0, 0 },
635 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
636 CPU_K6_2_FLAGS, 0, 0 },
637 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
638 CPU_ATHLON_FLAGS, 0, 0 },
639 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
640 CPU_K8_FLAGS, 1, 0 },
641 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
642 CPU_K8_FLAGS, 0, 0 },
643 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
644 CPU_K8_FLAGS, 0, 0 },
645 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
646 CPU_AMDFAM10_FLAGS, 0, 0 },
647 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BDVER1,
648 CPU_BDVER1_FLAGS, 0, 0 },
649 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
650 CPU_8087_FLAGS, 0, 0 },
651 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
652 CPU_287_FLAGS, 0, 0 },
653 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
654 CPU_387_FLAGS, 0, 0 },
655 { STRING_COMMA_LEN (".no87"), PROCESSOR_UNKNOWN,
656 CPU_ANY87_FLAGS, 0, 1 },
657 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
658 CPU_MMX_FLAGS, 0, 0 },
659 { STRING_COMMA_LEN (".nommx"), PROCESSOR_UNKNOWN,
660 CPU_3DNOWA_FLAGS, 0, 1 },
661 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
662 CPU_SSE_FLAGS, 0, 0 },
663 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
664 CPU_SSE2_FLAGS, 0, 0 },
665 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
666 CPU_SSE3_FLAGS, 0, 0 },
667 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
668 CPU_SSSE3_FLAGS, 0, 0 },
669 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
670 CPU_SSE4_1_FLAGS, 0, 0 },
671 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
672 CPU_SSE4_2_FLAGS, 0, 0 },
673 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
674 CPU_SSE4_2_FLAGS, 0, 0 },
675 { STRING_COMMA_LEN (".nosse"), PROCESSOR_UNKNOWN,
676 CPU_ANY_SSE_FLAGS, 0, 1 },
677 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
678 CPU_AVX_FLAGS, 0, 0 },
679 { STRING_COMMA_LEN (".noavx"), PROCESSOR_UNKNOWN,
680 CPU_ANY_AVX_FLAGS, 0, 1 },
681 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
682 CPU_VMX_FLAGS, 0, 0 },
683 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
684 CPU_SMX_FLAGS, 0, 0 },
685 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
686 CPU_XSAVE_FLAGS, 0, 0 },
687 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
688 CPU_XSAVEOPT_FLAGS, 0, 0 },
689 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
690 CPU_AES_FLAGS, 0, 0 },
691 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
692 CPU_PCLMUL_FLAGS, 0, 0 },
693 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
694 CPU_PCLMUL_FLAGS, 1, 0 },
695 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
696 CPU_FSGSBASE_FLAGS, 0, 0 },
697 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
698 CPU_RDRND_FLAGS, 0, 0 },
699 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
700 CPU_F16C_FLAGS, 0, 0 },
701 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
702 CPU_FMA_FLAGS, 0, 0 },
703 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
704 CPU_FMA4_FLAGS, 0, 0 },
705 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
706 CPU_XOP_FLAGS, 0, 0 },
707 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
708 CPU_LWP_FLAGS, 0, 0 },
709 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
710 CPU_MOVBE_FLAGS, 0, 0 },
711 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
712 CPU_EPT_FLAGS, 0, 0 },
713 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
714 CPU_CLFLUSH_FLAGS, 0, 0 },
715 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
716 CPU_NOP_FLAGS, 0, 0 },
717 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
718 CPU_SYSCALL_FLAGS, 0, 0 },
719 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
720 CPU_RDTSCP_FLAGS, 0, 0 },
721 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
722 CPU_3DNOW_FLAGS, 0, 0 },
723 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
724 CPU_3DNOWA_FLAGS, 0, 0 },
725 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
726 CPU_PADLOCK_FLAGS, 0, 0 },
727 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
728 CPU_SVME_FLAGS, 1, 0 },
729 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
730 CPU_SVME_FLAGS, 0, 0 },
731 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
732 CPU_SSE4A_FLAGS, 0, 0 },
733 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
734 CPU_ABM_FLAGS, 0, 0 },
735 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
736 CPU_BMI_FLAGS, 0, 0 },
737 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
738 CPU_TBM_FLAGS, 0, 0 },
742 /* Like s_lcomm_internal in gas/read.c but the alignment string
743 is allowed to be optional. */
746 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
753 && *input_line_pointer == ',')
755 align = parse_align (needs_align - 1);
757 if (align == (addressT) -1)
772 bss_alloc (symbolP, size, align);
777 pe_lcomm (int needs_align)
779 s_comm_internal (needs_align * 2, pe_lcomm_internal);
783 const pseudo_typeS md_pseudo_table[] =
785 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
786 {"align", s_align_bytes, 0},
788 {"align", s_align_ptwo, 0},
790 {"arch", set_cpu_arch, 0},
794 {"lcomm", pe_lcomm, 1},
796 {"ffloat", float_cons, 'f'},
797 {"dfloat", float_cons, 'd'},
798 {"tfloat", float_cons, 'x'},
800 {"slong", signed_cons, 4},
801 {"noopt", s_ignore, 0},
802 {"optim", s_ignore, 0},
803 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
804 {"code16", set_code_flag, CODE_16BIT},
805 {"code32", set_code_flag, CODE_32BIT},
806 {"code64", set_code_flag, CODE_64BIT},
807 {"intel_syntax", set_intel_syntax, 1},
808 {"att_syntax", set_intel_syntax, 0},
809 {"intel_mnemonic", set_intel_mnemonic, 1},
810 {"att_mnemonic", set_intel_mnemonic, 0},
811 {"allow_index_reg", set_allow_index_reg, 1},
812 {"disallow_index_reg", set_allow_index_reg, 0},
813 {"sse_check", set_sse_check, 0},
814 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
815 {"largecomm", handle_large_common, 0},
817 {"file", (void (*) (int)) dwarf2_directive_file, 0},
818 {"loc", dwarf2_directive_loc, 0},
819 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
822 {"secrel32", pe_directive_secrel, 0},
827 /* For interface with expression (). */
828 extern char *input_line_pointer;
830 /* Hash table for instruction mnemonic lookup. */
831 static struct hash_control *op_hash;
833 /* Hash table for register lookup. */
834 static struct hash_control *reg_hash;
837 i386_align_code (fragS *fragP, int count)
839 /* Various efficient no-op patterns for aligning code labels.
840 Note: Don't try to assemble the instructions in the comments.
841 0L and 0w are not legal. */
842 static const char f32_1[] =
844 static const char f32_2[] =
845 {0x66,0x90}; /* xchg %ax,%ax */
846 static const char f32_3[] =
847 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
848 static const char f32_4[] =
849 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
850 static const char f32_5[] =
852 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
853 static const char f32_6[] =
854 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
855 static const char f32_7[] =
856 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
857 static const char f32_8[] =
859 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
860 static const char f32_9[] =
861 {0x89,0xf6, /* movl %esi,%esi */
862 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
863 static const char f32_10[] =
864 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
865 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
866 static const char f32_11[] =
867 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
868 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
869 static const char f32_12[] =
870 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
871 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
872 static const char f32_13[] =
873 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
874 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
875 static const char f32_14[] =
876 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
877 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
878 static const char f16_3[] =
879 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
880 static const char f16_4[] =
881 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
882 static const char f16_5[] =
884 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
885 static const char f16_6[] =
886 {0x89,0xf6, /* mov %si,%si */
887 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
888 static const char f16_7[] =
889 {0x8d,0x74,0x00, /* lea 0(%si),%si */
890 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
891 static const char f16_8[] =
892 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
893 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
894 static const char jump_31[] =
895 {0xeb,0x1d,0x90,0x90,0x90,0x90,0x90, /* jmp .+31; lotsa nops */
896 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
897 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
898 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
899 static const char *const f32_patt[] = {
900 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
901 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14
903 static const char *const f16_patt[] = {
904 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8
907 static const char alt_3[] =
909 /* nopl 0(%[re]ax) */
910 static const char alt_4[] =
911 {0x0f,0x1f,0x40,0x00};
912 /* nopl 0(%[re]ax,%[re]ax,1) */
913 static const char alt_5[] =
914 {0x0f,0x1f,0x44,0x00,0x00};
915 /* nopw 0(%[re]ax,%[re]ax,1) */
916 static const char alt_6[] =
917 {0x66,0x0f,0x1f,0x44,0x00,0x00};
918 /* nopl 0L(%[re]ax) */
919 static const char alt_7[] =
920 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
921 /* nopl 0L(%[re]ax,%[re]ax,1) */
922 static const char alt_8[] =
923 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
924 /* nopw 0L(%[re]ax,%[re]ax,1) */
925 static const char alt_9[] =
926 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
927 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
928 static const char alt_10[] =
929 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
931 nopw %cs:0L(%[re]ax,%[re]ax,1) */
932 static const char alt_long_11[] =
934 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
937 nopw %cs:0L(%[re]ax,%[re]ax,1) */
938 static const char alt_long_12[] =
941 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
945 nopw %cs:0L(%[re]ax,%[re]ax,1) */
946 static const char alt_long_13[] =
950 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
955 nopw %cs:0L(%[re]ax,%[re]ax,1) */
956 static const char alt_long_14[] =
961 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
967 nopw %cs:0L(%[re]ax,%[re]ax,1) */
968 static const char alt_long_15[] =
974 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
975 /* nopl 0(%[re]ax,%[re]ax,1)
976 nopw 0(%[re]ax,%[re]ax,1) */
977 static const char alt_short_11[] =
978 {0x0f,0x1f,0x44,0x00,0x00,
979 0x66,0x0f,0x1f,0x44,0x00,0x00};
980 /* nopw 0(%[re]ax,%[re]ax,1)
981 nopw 0(%[re]ax,%[re]ax,1) */
982 static const char alt_short_12[] =
983 {0x66,0x0f,0x1f,0x44,0x00,0x00,
984 0x66,0x0f,0x1f,0x44,0x00,0x00};
985 /* nopw 0(%[re]ax,%[re]ax,1)
987 static const char alt_short_13[] =
988 {0x66,0x0f,0x1f,0x44,0x00,0x00,
989 0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
992 static const char alt_short_14[] =
993 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
994 0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
996 nopl 0L(%[re]ax,%[re]ax,1) */
997 static const char alt_short_15[] =
998 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
999 0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1000 static const char *const alt_short_patt[] = {
1001 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1002 alt_9, alt_10, alt_short_11, alt_short_12, alt_short_13,
1003 alt_short_14, alt_short_15
1005 static const char *const alt_long_patt[] = {
1006 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1007 alt_9, alt_10, alt_long_11, alt_long_12, alt_long_13,
1008 alt_long_14, alt_long_15
1011 /* Only align for at least a positive non-zero boundary. */
1012 if (count <= 0 || count > MAX_MEM_FOR_RS_ALIGN_CODE)
1015 /* We need to decide which NOP sequence to use for 32bit and
1016 64bit. When -mtune= is used:
1018 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1019 PROCESSOR_GENERIC32, f32_patt will be used.
1020 2. For PROCESSOR_PENTIUMPRO, PROCESSOR_PENTIUM4, PROCESSOR_NOCONA,
1021 PROCESSOR_CORE, PROCESSOR_CORE2, PROCESSOR_COREI7, and
1022 PROCESSOR_GENERIC64, alt_long_patt will be used.
1023 3. For PROCESSOR_ATHLON, PROCESSOR_K6, PROCESSOR_K8 and
1024 PROCESSOR_AMDFAM10, and PROCESSOR_BDVER1, alt_short_patt
1027 When -mtune= isn't used, alt_long_patt will be used if
1028 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1031 When -march= or .arch is used, we can't use anything beyond
1032 cpu_arch_isa_flags. */
1034 if (flag_code == CODE_16BIT)
1038 memcpy (fragP->fr_literal + fragP->fr_fix,
1040 /* Adjust jump offset. */
1041 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1044 memcpy (fragP->fr_literal + fragP->fr_fix,
1045 f16_patt[count - 1], count);
1049 const char *const *patt = NULL;
1051 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1053 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1054 switch (cpu_arch_tune)
1056 case PROCESSOR_UNKNOWN:
1057 /* We use cpu_arch_isa_flags to check if we SHOULD
1058 optimize with nops. */
1059 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1060 patt = alt_long_patt;
1064 case PROCESSOR_PENTIUM4:
1065 case PROCESSOR_NOCONA:
1066 case PROCESSOR_CORE:
1067 case PROCESSOR_CORE2:
1068 case PROCESSOR_COREI7:
1069 case PROCESSOR_L1OM:
1070 case PROCESSOR_GENERIC64:
1071 patt = alt_long_patt;
1074 case PROCESSOR_ATHLON:
1076 case PROCESSOR_AMDFAM10:
1077 case PROCESSOR_BDVER1:
1078 patt = alt_short_patt;
1080 case PROCESSOR_I386:
1081 case PROCESSOR_I486:
1082 case PROCESSOR_PENTIUM:
1083 case PROCESSOR_PENTIUMPRO:
1084 case PROCESSOR_GENERIC32:
1091 switch (fragP->tc_frag_data.tune)
1093 case PROCESSOR_UNKNOWN:
1094 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1095 PROCESSOR_UNKNOWN. */
1099 case PROCESSOR_I386:
1100 case PROCESSOR_I486:
1101 case PROCESSOR_PENTIUM:
1103 case PROCESSOR_ATHLON:
1105 case PROCESSOR_AMDFAM10:
1106 case PROCESSOR_BDVER1:
1107 case PROCESSOR_GENERIC32:
1108 /* We use cpu_arch_isa_flags to check if we CAN optimize
1110 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1111 patt = alt_short_patt;
1115 case PROCESSOR_PENTIUMPRO:
1116 case PROCESSOR_PENTIUM4:
1117 case PROCESSOR_NOCONA:
1118 case PROCESSOR_CORE:
1119 case PROCESSOR_CORE2:
1120 case PROCESSOR_COREI7:
1121 case PROCESSOR_L1OM:
1122 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1123 patt = alt_long_patt;
1127 case PROCESSOR_GENERIC64:
1128 patt = alt_long_patt;
1133 if (patt == f32_patt)
1135 /* If the padding is less than 15 bytes, we use the normal
1136 ones. Otherwise, we use a jump instruction and adjust
1140 /* For 64bit, the limit is 3 bytes. */
1141 if (flag_code == CODE_64BIT
1142 && fragP->tc_frag_data.isa_flags.bitfield.cpulm)
1147 memcpy (fragP->fr_literal + fragP->fr_fix,
1148 patt[count - 1], count);
1151 memcpy (fragP->fr_literal + fragP->fr_fix,
1153 /* Adjust jump offset. */
1154 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1159 /* Maximum length of an instruction is 15 byte. If the
1160 padding is greater than 15 bytes and we don't use jump,
1161 we have to break it into smaller pieces. */
1162 int padding = count;
1163 while (padding > 15)
1166 memcpy (fragP->fr_literal + fragP->fr_fix + padding,
1171 memcpy (fragP->fr_literal + fragP->fr_fix,
1172 patt [padding - 1], padding);
1175 fragP->fr_var = count;
1179 operand_type_all_zero (const union i386_operand_type *x)
1181 switch (ARRAY_SIZE(x->array))
1190 return !x->array[0];
1197 operand_type_set (union i386_operand_type *x, unsigned int v)
1199 switch (ARRAY_SIZE(x->array))
1214 operand_type_equal (const union i386_operand_type *x,
1215 const union i386_operand_type *y)
1217 switch (ARRAY_SIZE(x->array))
1220 if (x->array[2] != y->array[2])
1223 if (x->array[1] != y->array[1])
1226 return x->array[0] == y->array[0];
1234 cpu_flags_all_zero (const union i386_cpu_flags *x)
1236 switch (ARRAY_SIZE(x->array))
1245 return !x->array[0];
1252 cpu_flags_set (union i386_cpu_flags *x, unsigned int v)
1254 switch (ARRAY_SIZE(x->array))
1269 cpu_flags_equal (const union i386_cpu_flags *x,
1270 const union i386_cpu_flags *y)
1272 switch (ARRAY_SIZE(x->array))
1275 if (x->array[2] != y->array[2])
1278 if (x->array[1] != y->array[1])
1281 return x->array[0] == y->array[0];
1289 cpu_flags_check_cpu64 (i386_cpu_flags f)
1291 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1292 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1295 static INLINE i386_cpu_flags
1296 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1298 switch (ARRAY_SIZE (x.array))
1301 x.array [2] &= y.array [2];
1303 x.array [1] &= y.array [1];
1305 x.array [0] &= y.array [0];
1313 static INLINE i386_cpu_flags
1314 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1316 switch (ARRAY_SIZE (x.array))
1319 x.array [2] |= y.array [2];
1321 x.array [1] |= y.array [1];
1323 x.array [0] |= y.array [0];
1331 static INLINE i386_cpu_flags
1332 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1334 switch (ARRAY_SIZE (x.array))
1337 x.array [2] &= ~y.array [2];
1339 x.array [1] &= ~y.array [1];
1341 x.array [0] &= ~y.array [0];
1349 #define CPU_FLAGS_ARCH_MATCH 0x1
1350 #define CPU_FLAGS_64BIT_MATCH 0x2
1351 #define CPU_FLAGS_AES_MATCH 0x4
1352 #define CPU_FLAGS_PCLMUL_MATCH 0x8
1353 #define CPU_FLAGS_AVX_MATCH 0x10
1355 #define CPU_FLAGS_32BIT_MATCH \
1356 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_AES_MATCH \
1357 | CPU_FLAGS_PCLMUL_MATCH | CPU_FLAGS_AVX_MATCH)
1358 #define CPU_FLAGS_PERFECT_MATCH \
1359 (CPU_FLAGS_32BIT_MATCH | CPU_FLAGS_64BIT_MATCH)
1361 /* Return CPU flags match bits. */
1364 cpu_flags_match (const insn_template *t)
1366 i386_cpu_flags x = t->cpu_flags;
1367 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1369 x.bitfield.cpu64 = 0;
1370 x.bitfield.cpuno64 = 0;
1372 if (cpu_flags_all_zero (&x))
1374 /* This instruction is available on all archs. */
1375 match |= CPU_FLAGS_32BIT_MATCH;
1379 /* This instruction is available only on some archs. */
1380 i386_cpu_flags cpu = cpu_arch_flags;
1382 cpu.bitfield.cpu64 = 0;
1383 cpu.bitfield.cpuno64 = 0;
1384 cpu = cpu_flags_and (x, cpu);
1385 if (!cpu_flags_all_zero (&cpu))
1387 if (x.bitfield.cpuavx)
1389 /* We only need to check AES/PCLMUL/SSE2AVX with AVX. */
1390 if (cpu.bitfield.cpuavx)
1392 /* Check SSE2AVX. */
1393 if (!t->opcode_modifier.sse2avx|| sse2avx)
1395 match |= (CPU_FLAGS_ARCH_MATCH
1396 | CPU_FLAGS_AVX_MATCH);
1398 if (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1399 match |= CPU_FLAGS_AES_MATCH;
1401 if (!x.bitfield.cpupclmul
1402 || cpu.bitfield.cpupclmul)
1403 match |= CPU_FLAGS_PCLMUL_MATCH;
1407 match |= CPU_FLAGS_ARCH_MATCH;
1410 match |= CPU_FLAGS_32BIT_MATCH;
1416 static INLINE i386_operand_type
1417 operand_type_and (i386_operand_type x, i386_operand_type y)
1419 switch (ARRAY_SIZE (x.array))
1422 x.array [2] &= y.array [2];
1424 x.array [1] &= y.array [1];
1426 x.array [0] &= y.array [0];
1434 static INLINE i386_operand_type
1435 operand_type_or (i386_operand_type x, i386_operand_type y)
1437 switch (ARRAY_SIZE (x.array))
1440 x.array [2] |= y.array [2];
1442 x.array [1] |= y.array [1];
1444 x.array [0] |= y.array [0];
1452 static INLINE i386_operand_type
1453 operand_type_xor (i386_operand_type x, i386_operand_type y)
1455 switch (ARRAY_SIZE (x.array))
1458 x.array [2] ^= y.array [2];
1460 x.array [1] ^= y.array [1];
1462 x.array [0] ^= y.array [0];
1470 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1471 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1472 static const i386_operand_type control = OPERAND_TYPE_CONTROL;
1473 static const i386_operand_type inoutportreg
1474 = OPERAND_TYPE_INOUTPORTREG;
1475 static const i386_operand_type reg16_inoutportreg
1476 = OPERAND_TYPE_REG16_INOUTPORTREG;
1477 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1478 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1479 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1480 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1481 static const i386_operand_type anydisp
1482 = OPERAND_TYPE_ANYDISP;
1483 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1484 static const i386_operand_type regymm = OPERAND_TYPE_REGYMM;
1485 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1486 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1487 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1488 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1489 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1490 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1491 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1492 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1493 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1494 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1505 operand_type_check (i386_operand_type t, enum operand_type c)
1510 return (t.bitfield.reg8
1513 || t.bitfield.reg64);
1516 return (t.bitfield.imm8
1520 || t.bitfield.imm32s
1521 || t.bitfield.imm64);
1524 return (t.bitfield.disp8
1525 || t.bitfield.disp16
1526 || t.bitfield.disp32
1527 || t.bitfield.disp32s
1528 || t.bitfield.disp64);
1531 return (t.bitfield.disp8
1532 || t.bitfield.disp16
1533 || t.bitfield.disp32
1534 || t.bitfield.disp32s
1535 || t.bitfield.disp64
1536 || t.bitfield.baseindex);
1545 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit on
1546 operand J for instruction template T. */
1549 match_reg_size (const insn_template *t, unsigned int j)
1551 return !((i.types[j].bitfield.byte
1552 && !t->operand_types[j].bitfield.byte)
1553 || (i.types[j].bitfield.word
1554 && !t->operand_types[j].bitfield.word)
1555 || (i.types[j].bitfield.dword
1556 && !t->operand_types[j].bitfield.dword)
1557 || (i.types[j].bitfield.qword
1558 && !t->operand_types[j].bitfield.qword));
1561 /* Return 1 if there is no conflict in any size on operand J for
1562 instruction template T. */
1565 match_mem_size (const insn_template *t, unsigned int j)
1567 return (match_reg_size (t, j)
1568 && !((i.types[j].bitfield.unspecified
1569 && !t->operand_types[j].bitfield.unspecified)
1570 || (i.types[j].bitfield.fword
1571 && !t->operand_types[j].bitfield.fword)
1572 || (i.types[j].bitfield.tbyte
1573 && !t->operand_types[j].bitfield.tbyte)
1574 || (i.types[j].bitfield.xmmword
1575 && !t->operand_types[j].bitfield.xmmword)
1576 || (i.types[j].bitfield.ymmword
1577 && !t->operand_types[j].bitfield.ymmword)));
1580 /* Return 1 if there is no size conflict on any operands for
1581 instruction template T. */
1584 operand_size_match (const insn_template *t)
1589 /* Don't check jump instructions. */
1590 if (t->opcode_modifier.jump
1591 || t->opcode_modifier.jumpbyte
1592 || t->opcode_modifier.jumpdword
1593 || t->opcode_modifier.jumpintersegment)
1596 /* Check memory and accumulator operand size. */
1597 for (j = 0; j < i.operands; j++)
1599 if (t->operand_types[j].bitfield.anysize)
1602 if (t->operand_types[j].bitfield.acc && !match_reg_size (t, j))
1608 if (i.types[j].bitfield.mem && !match_mem_size (t, j))
1617 else if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
1620 i.error = operand_size_mismatch;
1624 /* Check reverse. */
1625 gas_assert (i.operands == 2);
1628 for (j = 0; j < 2; j++)
1630 if (t->operand_types[j].bitfield.acc
1631 && !match_reg_size (t, j ? 0 : 1))
1634 if (i.types[j].bitfield.mem
1635 && !match_mem_size (t, j ? 0 : 1))
1643 operand_type_match (i386_operand_type overlap,
1644 i386_operand_type given)
1646 i386_operand_type temp = overlap;
1648 temp.bitfield.jumpabsolute = 0;
1649 temp.bitfield.unspecified = 0;
1650 temp.bitfield.byte = 0;
1651 temp.bitfield.word = 0;
1652 temp.bitfield.dword = 0;
1653 temp.bitfield.fword = 0;
1654 temp.bitfield.qword = 0;
1655 temp.bitfield.tbyte = 0;
1656 temp.bitfield.xmmword = 0;
1657 temp.bitfield.ymmword = 0;
1658 if (operand_type_all_zero (&temp))
1661 if (given.bitfield.baseindex == overlap.bitfield.baseindex
1662 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
1666 i.error = operand_type_mismatch;
1670 /* If given types g0 and g1 are registers they must be of the same type
1671 unless the expected operand type register overlap is null.
1672 Note that Acc in a template matches every size of reg. */
1675 operand_type_register_match (i386_operand_type m0,
1676 i386_operand_type g0,
1677 i386_operand_type t0,
1678 i386_operand_type m1,
1679 i386_operand_type g1,
1680 i386_operand_type t1)
1682 if (!operand_type_check (g0, reg))
1685 if (!operand_type_check (g1, reg))
1688 if (g0.bitfield.reg8 == g1.bitfield.reg8
1689 && g0.bitfield.reg16 == g1.bitfield.reg16
1690 && g0.bitfield.reg32 == g1.bitfield.reg32
1691 && g0.bitfield.reg64 == g1.bitfield.reg64)
1694 if (m0.bitfield.acc)
1696 t0.bitfield.reg8 = 1;
1697 t0.bitfield.reg16 = 1;
1698 t0.bitfield.reg32 = 1;
1699 t0.bitfield.reg64 = 1;
1702 if (m1.bitfield.acc)
1704 t1.bitfield.reg8 = 1;
1705 t1.bitfield.reg16 = 1;
1706 t1.bitfield.reg32 = 1;
1707 t1.bitfield.reg64 = 1;
1710 if (!(t0.bitfield.reg8 & t1.bitfield.reg8)
1711 && !(t0.bitfield.reg16 & t1.bitfield.reg16)
1712 && !(t0.bitfield.reg32 & t1.bitfield.reg32)
1713 && !(t0.bitfield.reg64 & t1.bitfield.reg64))
1716 i.error = register_type_mismatch;
1721 static INLINE unsigned int
1722 mode_from_disp_size (i386_operand_type t)
1724 if (t.bitfield.disp8)
1726 else if (t.bitfield.disp16
1727 || t.bitfield.disp32
1728 || t.bitfield.disp32s)
1735 fits_in_signed_byte (offsetT num)
1737 return (num >= -128) && (num <= 127);
1741 fits_in_unsigned_byte (offsetT num)
1743 return (num & 0xff) == num;
1747 fits_in_unsigned_word (offsetT num)
1749 return (num & 0xffff) == num;
1753 fits_in_signed_word (offsetT num)
1755 return (-32768 <= num) && (num <= 32767);
1759 fits_in_signed_long (offsetT num ATTRIBUTE_UNUSED)
1764 return (!(((offsetT) -1 << 31) & num)
1765 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
1767 } /* fits_in_signed_long() */
1770 fits_in_unsigned_long (offsetT num ATTRIBUTE_UNUSED)
1775 return (num & (((offsetT) 2 << 31) - 1)) == num;
1777 } /* fits_in_unsigned_long() */
1780 fits_in_imm4 (offsetT num)
1782 return (num & 0xf) == num;
1785 static i386_operand_type
1786 smallest_imm_type (offsetT num)
1788 i386_operand_type t;
1790 operand_type_set (&t, 0);
1791 t.bitfield.imm64 = 1;
1793 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
1795 /* This code is disabled on the 486 because all the Imm1 forms
1796 in the opcode table are slower on the i486. They're the
1797 versions with the implicitly specified single-position
1798 displacement, which has another syntax if you really want to
1800 t.bitfield.imm1 = 1;
1801 t.bitfield.imm8 = 1;
1802 t.bitfield.imm8s = 1;
1803 t.bitfield.imm16 = 1;
1804 t.bitfield.imm32 = 1;
1805 t.bitfield.imm32s = 1;
1807 else if (fits_in_signed_byte (num))
1809 t.bitfield.imm8 = 1;
1810 t.bitfield.imm8s = 1;
1811 t.bitfield.imm16 = 1;
1812 t.bitfield.imm32 = 1;
1813 t.bitfield.imm32s = 1;
1815 else if (fits_in_unsigned_byte (num))
1817 t.bitfield.imm8 = 1;
1818 t.bitfield.imm16 = 1;
1819 t.bitfield.imm32 = 1;
1820 t.bitfield.imm32s = 1;
1822 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
1824 t.bitfield.imm16 = 1;
1825 t.bitfield.imm32 = 1;
1826 t.bitfield.imm32s = 1;
1828 else if (fits_in_signed_long (num))
1830 t.bitfield.imm32 = 1;
1831 t.bitfield.imm32s = 1;
1833 else if (fits_in_unsigned_long (num))
1834 t.bitfield.imm32 = 1;
1840 offset_in_range (offsetT val, int size)
1846 case 1: mask = ((addressT) 1 << 8) - 1; break;
1847 case 2: mask = ((addressT) 1 << 16) - 1; break;
1848 case 4: mask = ((addressT) 2 << 31) - 1; break;
1850 case 8: mask = ((addressT) 2 << 63) - 1; break;
1856 /* If BFD64, sign extend val for 32bit address mode. */
1857 if (flag_code != CODE_64BIT
1858 || i.prefix[ADDR_PREFIX])
1859 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
1860 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
1863 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
1865 char buf1[40], buf2[40];
1867 sprint_value (buf1, val);
1868 sprint_value (buf2, val & mask);
1869 as_warn (_("%s shortened to %s"), buf1, buf2);
1883 a. PREFIX_EXIST if attempting to add a prefix where one from the
1884 same class already exists.
1885 b. PREFIX_LOCK if lock prefix is added.
1886 c. PREFIX_REP if rep/repne prefix is added.
1887 d. PREFIX_OTHER if other prefix is added.
1890 static enum PREFIX_GROUP
1891 add_prefix (unsigned int prefix)
1893 enum PREFIX_GROUP ret = PREFIX_OTHER;
1896 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
1897 && flag_code == CODE_64BIT)
1899 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
1900 || ((i.prefix[REX_PREFIX] & (REX_R | REX_X | REX_B))
1901 && (prefix & (REX_R | REX_X | REX_B))))
1912 case CS_PREFIX_OPCODE:
1913 case DS_PREFIX_OPCODE:
1914 case ES_PREFIX_OPCODE:
1915 case FS_PREFIX_OPCODE:
1916 case GS_PREFIX_OPCODE:
1917 case SS_PREFIX_OPCODE:
1921 case REPNE_PREFIX_OPCODE:
1922 case REPE_PREFIX_OPCODE:
1927 case LOCK_PREFIX_OPCODE:
1936 case ADDR_PREFIX_OPCODE:
1940 case DATA_PREFIX_OPCODE:
1944 if (i.prefix[q] != 0)
1952 i.prefix[q] |= prefix;
1955 as_bad (_("same type of prefix used twice"));
1961 update_code_flag (int value, int check)
1963 PRINTF_LIKE ((*as_error));
1965 flag_code = (enum flag_code) value;
1966 if (flag_code == CODE_64BIT)
1968 cpu_arch_flags.bitfield.cpu64 = 1;
1969 cpu_arch_flags.bitfield.cpuno64 = 0;
1973 cpu_arch_flags.bitfield.cpu64 = 0;
1974 cpu_arch_flags.bitfield.cpuno64 = 1;
1976 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
1979 as_error = as_fatal;
1982 (*as_error) (_("64bit mode not supported on `%s'."),
1983 cpu_arch_name ? cpu_arch_name : default_arch);
1985 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
1988 as_error = as_fatal;
1991 (*as_error) (_("32bit mode not supported on `%s'."),
1992 cpu_arch_name ? cpu_arch_name : default_arch);
1994 stackop_size = '\0';
1998 set_code_flag (int value)
2000 update_code_flag (value, 0);
2004 set_16bit_gcc_code_flag (int new_code_flag)
2006 flag_code = (enum flag_code) new_code_flag;
2007 if (flag_code != CODE_16BIT)
2009 cpu_arch_flags.bitfield.cpu64 = 0;
2010 cpu_arch_flags.bitfield.cpuno64 = 1;
2011 stackop_size = LONG_MNEM_SUFFIX;
2015 set_intel_syntax (int syntax_flag)
2017 /* Find out if register prefixing is specified. */
2018 int ask_naked_reg = 0;
2021 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2023 char *string = input_line_pointer;
2024 int e = get_symbol_end ();
2026 if (strcmp (string, "prefix") == 0)
2028 else if (strcmp (string, "noprefix") == 0)
2031 as_bad (_("bad argument to syntax directive."));
2032 *input_line_pointer = e;
2034 demand_empty_rest_of_line ();
2036 intel_syntax = syntax_flag;
2038 if (ask_naked_reg == 0)
2039 allow_naked_reg = (intel_syntax
2040 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2042 allow_naked_reg = (ask_naked_reg < 0);
2044 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2046 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2047 identifier_chars['$'] = intel_syntax ? '$' : 0;
2048 register_prefix = allow_naked_reg ? "" : "%";
2052 set_intel_mnemonic (int mnemonic_flag)
2054 intel_mnemonic = mnemonic_flag;
2058 set_allow_index_reg (int flag)
2060 allow_index_reg = flag;
2064 set_sse_check (int dummy ATTRIBUTE_UNUSED)
2068 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2070 char *string = input_line_pointer;
2071 int e = get_symbol_end ();
2073 if (strcmp (string, "none") == 0)
2074 sse_check = sse_check_none;
2075 else if (strcmp (string, "warning") == 0)
2076 sse_check = sse_check_warning;
2077 else if (strcmp (string, "error") == 0)
2078 sse_check = sse_check_error;
2080 as_bad (_("bad argument to sse_check directive."));
2081 *input_line_pointer = e;
2084 as_bad (_("missing argument for sse_check directive"));
2086 demand_empty_rest_of_line ();
2090 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2091 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2093 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2094 static const char *arch;
2096 /* Intel LIOM is only supported on ELF. */
2102 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2103 use default_arch. */
2104 arch = cpu_arch_name;
2106 arch = default_arch;
2109 /* If we are targeting Intel L1OM, we must enable it. */
2110 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2111 || new_flag.bitfield.cpul1om)
2114 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2119 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2123 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2125 char *string = input_line_pointer;
2126 int e = get_symbol_end ();
2128 i386_cpu_flags flags;
2130 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2132 if (strcmp (string, cpu_arch[j].name) == 0)
2134 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2138 cpu_arch_name = cpu_arch[j].name;
2139 cpu_sub_arch_name = NULL;
2140 cpu_arch_flags = cpu_arch[j].flags;
2141 if (flag_code == CODE_64BIT)
2143 cpu_arch_flags.bitfield.cpu64 = 1;
2144 cpu_arch_flags.bitfield.cpuno64 = 0;
2148 cpu_arch_flags.bitfield.cpu64 = 0;
2149 cpu_arch_flags.bitfield.cpuno64 = 1;
2151 cpu_arch_isa = cpu_arch[j].type;
2152 cpu_arch_isa_flags = cpu_arch[j].flags;
2153 if (!cpu_arch_tune_set)
2155 cpu_arch_tune = cpu_arch_isa;
2156 cpu_arch_tune_flags = cpu_arch_isa_flags;
2161 if (!cpu_arch[j].negated)
2162 flags = cpu_flags_or (cpu_arch_flags,
2165 flags = cpu_flags_and_not (cpu_arch_flags,
2167 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2169 if (cpu_sub_arch_name)
2171 char *name = cpu_sub_arch_name;
2172 cpu_sub_arch_name = concat (name,
2174 (const char *) NULL);
2178 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2179 cpu_arch_flags = flags;
2180 cpu_arch_isa_flags = flags;
2182 *input_line_pointer = e;
2183 demand_empty_rest_of_line ();
2187 if (j >= ARRAY_SIZE (cpu_arch))
2188 as_bad (_("no such architecture: `%s'"), string);
2190 *input_line_pointer = e;
2193 as_bad (_("missing cpu architecture"));
2195 no_cond_jump_promotion = 0;
2196 if (*input_line_pointer == ','
2197 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2199 char *string = ++input_line_pointer;
2200 int e = get_symbol_end ();
2202 if (strcmp (string, "nojumps") == 0)
2203 no_cond_jump_promotion = 1;
2204 else if (strcmp (string, "jumps") == 0)
2207 as_bad (_("no such architecture modifier: `%s'"), string);
2209 *input_line_pointer = e;
2212 demand_empty_rest_of_line ();
2215 enum bfd_architecture
2218 if (cpu_arch_isa == PROCESSOR_L1OM)
2220 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2221 || flag_code != CODE_64BIT)
2222 as_fatal (_("Intel L1OM is 64bit ELF only"));
2223 return bfd_arch_l1om;
2226 return bfd_arch_i386;
2232 if (!strncmp (default_arch, "x86_64", 6))
2234 if (cpu_arch_isa == PROCESSOR_L1OM)
2236 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2237 || default_arch[6] != '\0')
2238 as_fatal (_("Intel L1OM is 64bit ELF only"));
2239 return bfd_mach_l1om;
2241 else if (default_arch[6] == '\0')
2242 return bfd_mach_x86_64;
2244 return bfd_mach_x64_32;
2246 else if (!strcmp (default_arch, "i386"))
2247 return bfd_mach_i386_i386;
2249 as_fatal (_("Unknown architecture"));
2255 const char *hash_err;
2257 /* Initialize op_hash hash table. */
2258 op_hash = hash_new ();
2261 const insn_template *optab;
2262 templates *core_optab;
2264 /* Setup for loop. */
2266 core_optab = (templates *) xmalloc (sizeof (templates));
2267 core_optab->start = optab;
2272 if (optab->name == NULL
2273 || strcmp (optab->name, (optab - 1)->name) != 0)
2275 /* different name --> ship out current template list;
2276 add to hash table; & begin anew. */
2277 core_optab->end = optab;
2278 hash_err = hash_insert (op_hash,
2280 (void *) core_optab);
2283 as_fatal (_("Internal Error: Can't hash %s: %s"),
2287 if (optab->name == NULL)
2289 core_optab = (templates *) xmalloc (sizeof (templates));
2290 core_optab->start = optab;
2295 /* Initialize reg_hash hash table. */
2296 reg_hash = hash_new ();
2298 const reg_entry *regtab;
2299 unsigned int regtab_size = i386_regtab_size;
2301 for (regtab = i386_regtab; regtab_size--; regtab++)
2303 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2305 as_fatal (_("Internal Error: Can't hash %s: %s"),
2311 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2316 for (c = 0; c < 256; c++)
2321 mnemonic_chars[c] = c;
2322 register_chars[c] = c;
2323 operand_chars[c] = c;
2325 else if (ISLOWER (c))
2327 mnemonic_chars[c] = c;
2328 register_chars[c] = c;
2329 operand_chars[c] = c;
2331 else if (ISUPPER (c))
2333 mnemonic_chars[c] = TOLOWER (c);
2334 register_chars[c] = mnemonic_chars[c];
2335 operand_chars[c] = c;
2338 if (ISALPHA (c) || ISDIGIT (c))
2339 identifier_chars[c] = c;
2342 identifier_chars[c] = c;
2343 operand_chars[c] = c;
2348 identifier_chars['@'] = '@';
2351 identifier_chars['?'] = '?';
2352 operand_chars['?'] = '?';
2354 digit_chars['-'] = '-';
2355 mnemonic_chars['_'] = '_';
2356 mnemonic_chars['-'] = '-';
2357 mnemonic_chars['.'] = '.';
2358 identifier_chars['_'] = '_';
2359 identifier_chars['.'] = '.';
2361 for (p = operand_special_chars; *p != '\0'; p++)
2362 operand_chars[(unsigned char) *p] = *p;
2365 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2368 record_alignment (text_section, 2);
2369 record_alignment (data_section, 2);
2370 record_alignment (bss_section, 2);
2374 if (flag_code == CODE_64BIT)
2376 #if defined (OBJ_COFF) && defined (TE_PE)
2377 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2380 x86_dwarf2_return_column = 16;
2382 x86_cie_data_alignment = -8;
2386 x86_dwarf2_return_column = 8;
2387 x86_cie_data_alignment = -4;
2392 i386_print_statistics (FILE *file)
2394 hash_print_statistics (file, "i386 opcode", op_hash);
2395 hash_print_statistics (file, "i386 register", reg_hash);
2400 /* Debugging routines for md_assemble. */
2401 static void pte (insn_template *);
2402 static void pt (i386_operand_type);
2403 static void pe (expressionS *);
2404 static void ps (symbolS *);
2407 pi (char *line, i386_insn *x)
2411 fprintf (stdout, "%s: template ", line);
2413 fprintf (stdout, " address: base %s index %s scale %x\n",
2414 x->base_reg ? x->base_reg->reg_name : "none",
2415 x->index_reg ? x->index_reg->reg_name : "none",
2416 x->log2_scale_factor);
2417 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
2418 x->rm.mode, x->rm.reg, x->rm.regmem);
2419 fprintf (stdout, " sib: base %x index %x scale %x\n",
2420 x->sib.base, x->sib.index, x->sib.scale);
2421 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
2422 (x->rex & REX_W) != 0,
2423 (x->rex & REX_R) != 0,
2424 (x->rex & REX_X) != 0,
2425 (x->rex & REX_B) != 0);
2426 for (j = 0; j < x->operands; j++)
2428 fprintf (stdout, " #%d: ", j + 1);
2430 fprintf (stdout, "\n");
2431 if (x->types[j].bitfield.reg8
2432 || x->types[j].bitfield.reg16
2433 || x->types[j].bitfield.reg32
2434 || x->types[j].bitfield.reg64
2435 || x->types[j].bitfield.regmmx
2436 || x->types[j].bitfield.regxmm
2437 || x->types[j].bitfield.regymm
2438 || x->types[j].bitfield.sreg2
2439 || x->types[j].bitfield.sreg3
2440 || x->types[j].bitfield.control
2441 || x->types[j].bitfield.debug
2442 || x->types[j].bitfield.test)
2443 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2444 if (operand_type_check (x->types[j], imm))
2446 if (operand_type_check (x->types[j], disp))
2447 pe (x->op[j].disps);
2452 pte (insn_template *t)
2455 fprintf (stdout, " %d operands ", t->operands);
2456 fprintf (stdout, "opcode %x ", t->base_opcode);
2457 if (t->extension_opcode != None)
2458 fprintf (stdout, "ext %x ", t->extension_opcode);
2459 if (t->opcode_modifier.d)
2460 fprintf (stdout, "D");
2461 if (t->opcode_modifier.w)
2462 fprintf (stdout, "W");
2463 fprintf (stdout, "\n");
2464 for (j = 0; j < t->operands; j++)
2466 fprintf (stdout, " #%d type ", j + 1);
2467 pt (t->operand_types[j]);
2468 fprintf (stdout, "\n");
2475 fprintf (stdout, " operation %d\n", e->X_op);
2476 fprintf (stdout, " add_number %ld (%lx)\n",
2477 (long) e->X_add_number, (long) e->X_add_number);
2478 if (e->X_add_symbol)
2480 fprintf (stdout, " add_symbol ");
2481 ps (e->X_add_symbol);
2482 fprintf (stdout, "\n");
2486 fprintf (stdout, " op_symbol ");
2487 ps (e->X_op_symbol);
2488 fprintf (stdout, "\n");
2495 fprintf (stdout, "%s type %s%s",
2497 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
2498 segment_name (S_GET_SEGMENT (s)));
2501 static struct type_name
2503 i386_operand_type mask;
2506 const type_names[] =
2508 { OPERAND_TYPE_REG8, "r8" },
2509 { OPERAND_TYPE_REG16, "r16" },
2510 { OPERAND_TYPE_REG32, "r32" },
2511 { OPERAND_TYPE_REG64, "r64" },
2512 { OPERAND_TYPE_IMM8, "i8" },
2513 { OPERAND_TYPE_IMM8, "i8s" },
2514 { OPERAND_TYPE_IMM16, "i16" },
2515 { OPERAND_TYPE_IMM32, "i32" },
2516 { OPERAND_TYPE_IMM32S, "i32s" },
2517 { OPERAND_TYPE_IMM64, "i64" },
2518 { OPERAND_TYPE_IMM1, "i1" },
2519 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
2520 { OPERAND_TYPE_DISP8, "d8" },
2521 { OPERAND_TYPE_DISP16, "d16" },
2522 { OPERAND_TYPE_DISP32, "d32" },
2523 { OPERAND_TYPE_DISP32S, "d32s" },
2524 { OPERAND_TYPE_DISP64, "d64" },
2525 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
2526 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
2527 { OPERAND_TYPE_CONTROL, "control reg" },
2528 { OPERAND_TYPE_TEST, "test reg" },
2529 { OPERAND_TYPE_DEBUG, "debug reg" },
2530 { OPERAND_TYPE_FLOATREG, "FReg" },
2531 { OPERAND_TYPE_FLOATACC, "FAcc" },
2532 { OPERAND_TYPE_SREG2, "SReg2" },
2533 { OPERAND_TYPE_SREG3, "SReg3" },
2534 { OPERAND_TYPE_ACC, "Acc" },
2535 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
2536 { OPERAND_TYPE_REGMMX, "rMMX" },
2537 { OPERAND_TYPE_REGXMM, "rXMM" },
2538 { OPERAND_TYPE_REGYMM, "rYMM" },
2539 { OPERAND_TYPE_ESSEG, "es" },
2543 pt (i386_operand_type t)
2546 i386_operand_type a;
2548 for (j = 0; j < ARRAY_SIZE (type_names); j++)
2550 a = operand_type_and (t, type_names[j].mask);
2551 if (!operand_type_all_zero (&a))
2552 fprintf (stdout, "%s, ", type_names[j].name);
2557 #endif /* DEBUG386 */
2559 static bfd_reloc_code_real_type
2560 reloc (unsigned int size,
2563 bfd_reloc_code_real_type other)
2565 if (other != NO_RELOC)
2567 reloc_howto_type *rel;
2572 case BFD_RELOC_X86_64_GOT32:
2573 return BFD_RELOC_X86_64_GOT64;
2575 case BFD_RELOC_X86_64_PLTOFF64:
2576 return BFD_RELOC_X86_64_PLTOFF64;
2578 case BFD_RELOC_X86_64_GOTPC32:
2579 other = BFD_RELOC_X86_64_GOTPC64;
2581 case BFD_RELOC_X86_64_GOTPCREL:
2582 other = BFD_RELOC_X86_64_GOTPCREL64;
2584 case BFD_RELOC_X86_64_TPOFF32:
2585 other = BFD_RELOC_X86_64_TPOFF64;
2587 case BFD_RELOC_X86_64_DTPOFF32:
2588 other = BFD_RELOC_X86_64_DTPOFF64;
2594 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
2595 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
2598 rel = bfd_reloc_type_lookup (stdoutput, other);
2600 as_bad (_("unknown relocation (%u)"), other);
2601 else if (size != bfd_get_reloc_size (rel))
2602 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
2603 bfd_get_reloc_size (rel),
2605 else if (pcrel && !rel->pc_relative)
2606 as_bad (_("non-pc-relative relocation for pc-relative field"));
2607 else if ((rel->complain_on_overflow == complain_overflow_signed
2609 || (rel->complain_on_overflow == complain_overflow_unsigned
2611 as_bad (_("relocated field and relocation type differ in signedness"));
2620 as_bad (_("there are no unsigned pc-relative relocations"));
2623 case 1: return BFD_RELOC_8_PCREL;
2624 case 2: return BFD_RELOC_16_PCREL;
2625 case 4: return BFD_RELOC_32_PCREL;
2626 case 8: return BFD_RELOC_64_PCREL;
2628 as_bad (_("cannot do %u byte pc-relative relocation"), size);
2635 case 4: return BFD_RELOC_X86_64_32S;
2640 case 1: return BFD_RELOC_8;
2641 case 2: return BFD_RELOC_16;
2642 case 4: return BFD_RELOC_32;
2643 case 8: return BFD_RELOC_64;
2645 as_bad (_("cannot do %s %u byte relocation"),
2646 sign > 0 ? "signed" : "unsigned", size);
2652 /* Here we decide which fixups can be adjusted to make them relative to
2653 the beginning of the section instead of the symbol. Basically we need
2654 to make sure that the dynamic relocations are done correctly, so in
2655 some cases we force the original symbol to be used. */
2658 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
2660 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2664 /* Don't adjust pc-relative references to merge sections in 64-bit
2666 if (use_rela_relocations
2667 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
2671 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
2672 and changed later by validate_fix. */
2673 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
2674 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
2677 /* adjust_reloc_syms doesn't know about the GOT. */
2678 if (fixP->fx_r_type == BFD_RELOC_386_GOTOFF
2679 || fixP->fx_r_type == BFD_RELOC_386_PLT32
2680 || fixP->fx_r_type == BFD_RELOC_386_GOT32
2681 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
2682 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
2683 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
2684 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
2685 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
2686 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
2687 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
2688 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
2689 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
2690 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
2691 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
2692 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
2693 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
2694 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
2695 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
2696 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
2697 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
2698 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
2699 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
2700 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
2701 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
2702 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
2703 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
2704 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
2705 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
2712 intel_float_operand (const char *mnemonic)
2714 /* Note that the value returned is meaningful only for opcodes with (memory)
2715 operands, hence the code here is free to improperly handle opcodes that
2716 have no operands (for better performance and smaller code). */
2718 if (mnemonic[0] != 'f')
2719 return 0; /* non-math */
2721 switch (mnemonic[1])
2723 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
2724 the fs segment override prefix not currently handled because no
2725 call path can make opcodes without operands get here */
2727 return 2 /* integer op */;
2729 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
2730 return 3; /* fldcw/fldenv */
2733 if (mnemonic[2] != 'o' /* fnop */)
2734 return 3; /* non-waiting control op */
2737 if (mnemonic[2] == 's')
2738 return 3; /* frstor/frstpm */
2741 if (mnemonic[2] == 'a')
2742 return 3; /* fsave */
2743 if (mnemonic[2] == 't')
2745 switch (mnemonic[3])
2747 case 'c': /* fstcw */
2748 case 'd': /* fstdw */
2749 case 'e': /* fstenv */
2750 case 's': /* fsts[gw] */
2756 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
2757 return 0; /* fxsave/fxrstor are not really math ops */
2764 /* Build the VEX prefix. */
2767 build_vex_prefix (const insn_template *t)
2769 unsigned int register_specifier;
2770 unsigned int implied_prefix;
2771 unsigned int vector_length;
2773 /* Check register specifier. */
2774 if (i.vex.register_specifier)
2776 register_specifier = i.vex.register_specifier->reg_num;
2777 if ((i.vex.register_specifier->reg_flags & RegRex))
2778 register_specifier += 8;
2779 register_specifier = ~register_specifier & 0xf;
2782 register_specifier = 0xf;
2784 /* Use 2-byte VEX prefix by swappping destination and source
2787 && i.operands == i.reg_operands
2788 && i.tm.opcode_modifier.vexopcode == VEX0F
2789 && i.tm.opcode_modifier.s
2792 unsigned int xchg = i.operands - 1;
2793 union i386_op temp_op;
2794 i386_operand_type temp_type;
2796 temp_type = i.types[xchg];
2797 i.types[xchg] = i.types[0];
2798 i.types[0] = temp_type;
2799 temp_op = i.op[xchg];
2800 i.op[xchg] = i.op[0];
2803 gas_assert (i.rm.mode == 3);
2807 i.rm.regmem = i.rm.reg;
2810 /* Use the next insn. */
2814 if (i.tm.opcode_modifier.vex == VEXScalar)
2815 vector_length = avxscalar;
2817 vector_length = i.tm.opcode_modifier.vex == VEX256 ? 1 : 0;
2819 switch ((i.tm.base_opcode >> 8) & 0xff)
2824 case DATA_PREFIX_OPCODE:
2827 case REPE_PREFIX_OPCODE:
2830 case REPNE_PREFIX_OPCODE:
2837 /* Use 2-byte VEX prefix if possible. */
2838 if (i.tm.opcode_modifier.vexopcode == VEX0F
2839 && i.tm.opcode_modifier.vexw != VEXW1
2840 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
2842 /* 2-byte VEX prefix. */
2846 i.vex.bytes[0] = 0xc5;
2848 /* Check the REX.R bit. */
2849 r = (i.rex & REX_R) ? 0 : 1;
2850 i.vex.bytes[1] = (r << 7
2851 | register_specifier << 3
2852 | vector_length << 2
2857 /* 3-byte VEX prefix. */
2862 switch (i.tm.opcode_modifier.vexopcode)
2866 i.vex.bytes[0] = 0xc4;
2870 i.vex.bytes[0] = 0xc4;
2874 i.vex.bytes[0] = 0xc4;
2878 i.vex.bytes[0] = 0x8f;
2882 i.vex.bytes[0] = 0x8f;
2886 i.vex.bytes[0] = 0x8f;
2892 /* The high 3 bits of the second VEX byte are 1's compliment
2893 of RXB bits from REX. */
2894 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
2896 /* Check the REX.W bit. */
2897 w = (i.rex & REX_W) ? 1 : 0;
2898 if (i.tm.opcode_modifier.vexw)
2903 if (i.tm.opcode_modifier.vexw == VEXW1)
2907 i.vex.bytes[2] = (w << 7
2908 | register_specifier << 3
2909 | vector_length << 2
2915 process_immext (void)
2919 if (i.tm.cpu_flags.bitfield.cpusse3 && i.operands > 0)
2921 /* SSE3 Instructions have the fixed operands with an opcode
2922 suffix which is coded in the same place as an 8-bit immediate
2923 field would be. Here we check those operands and remove them
2927 for (x = 0; x < i.operands; x++)
2928 if (i.op[x].regs->reg_num != x)
2929 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
2930 register_prefix, i.op[x].regs->reg_name, x + 1,
2936 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
2937 which is coded in the same place as an 8-bit immediate field
2938 would be. Here we fake an 8-bit immediate operand from the
2939 opcode suffix stored in tm.extension_opcode.
2941 AVX instructions also use this encoding, for some of
2942 3 argument instructions. */
2944 gas_assert (i.imm_operands == 0
2946 || (i.tm.opcode_modifier.vex
2947 && i.operands <= 4)));
2949 exp = &im_expressions[i.imm_operands++];
2950 i.op[i.operands].imms = exp;
2951 i.types[i.operands] = imm8;
2953 exp->X_op = O_constant;
2954 exp->X_add_number = i.tm.extension_opcode;
2955 i.tm.extension_opcode = None;
2958 /* This is the guts of the machine-dependent assembler. LINE points to a
2959 machine dependent instruction. This function is supposed to emit
2960 the frags/bytes it assembles to. */
2963 md_assemble (char *line)
2966 char mnemonic[MAX_MNEM_SIZE];
2967 const insn_template *t;
2969 /* Initialize globals. */
2970 memset (&i, '\0', sizeof (i));
2971 for (j = 0; j < MAX_OPERANDS; j++)
2972 i.reloc[j] = NO_RELOC;
2973 memset (disp_expressions, '\0', sizeof (disp_expressions));
2974 memset (im_expressions, '\0', sizeof (im_expressions));
2975 save_stack_p = save_stack;
2977 /* First parse an instruction mnemonic & call i386_operand for the operands.
2978 We assume that the scrubber has arranged it so that line[0] is the valid
2979 start of a (possibly prefixed) mnemonic. */
2981 line = parse_insn (line, mnemonic);
2985 line = parse_operands (line, mnemonic);
2990 /* Now we've parsed the mnemonic into a set of templates, and have the
2991 operands at hand. */
2993 /* All intel opcodes have reversed operands except for "bound" and
2994 "enter". We also don't reverse intersegment "jmp" and "call"
2995 instructions with 2 immediate operands so that the immediate segment
2996 precedes the offset, as it does when in AT&T mode. */
2999 && (strcmp (mnemonic, "bound") != 0)
3000 && (strcmp (mnemonic, "invlpga") != 0)
3001 && !(operand_type_check (i.types[0], imm)
3002 && operand_type_check (i.types[1], imm)))
3005 /* The order of the immediates should be reversed
3006 for 2 immediates extrq and insertq instructions */
3007 if (i.imm_operands == 2
3008 && (strcmp (mnemonic, "extrq") == 0
3009 || strcmp (mnemonic, "insertq") == 0))
3010 swap_2_operands (0, 1);
3015 /* Don't optimize displacement for movabs since it only takes 64bit
3018 && !i.disp32_encoding
3019 && (flag_code != CODE_64BIT
3020 || strcmp (mnemonic, "movabs") != 0))
3023 /* Next, we find a template that matches the given insn,
3024 making sure the overlap of the given operands types is consistent
3025 with the template operand types. */
3027 if (!(t = match_template ()))
3030 if (sse_check != sse_check_none
3031 && !i.tm.opcode_modifier.noavx
3032 && (i.tm.cpu_flags.bitfield.cpusse
3033 || i.tm.cpu_flags.bitfield.cpusse2
3034 || i.tm.cpu_flags.bitfield.cpusse3
3035 || i.tm.cpu_flags.bitfield.cpussse3
3036 || i.tm.cpu_flags.bitfield.cpusse4_1
3037 || i.tm.cpu_flags.bitfield.cpusse4_2))
3039 (sse_check == sse_check_warning
3041 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
3044 /* Zap movzx and movsx suffix. The suffix has been set from
3045 "word ptr" or "byte ptr" on the source operand in Intel syntax
3046 or extracted from mnemonic in AT&T syntax. But we'll use
3047 the destination register to choose the suffix for encoding. */
3048 if ((i.tm.base_opcode & ~9) == 0x0fb6)
3050 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
3051 there is no suffix, the default will be byte extension. */
3052 if (i.reg_operands != 2
3055 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
3060 if (i.tm.opcode_modifier.fwait)
3061 if (!add_prefix (FWAIT_OPCODE))
3064 /* Check for lock without a lockable instruction. Destination operand
3065 must be memory unless it is xchg (0x86). */
3066 if (i.prefix[LOCK_PREFIX]
3067 && (!i.tm.opcode_modifier.islockable
3068 || i.mem_operands == 0
3069 || (i.tm.base_opcode != 0x86
3070 && !operand_type_check (i.types[i.operands - 1], anymem))))
3072 as_bad (_("expecting lockable instruction after `lock'"));
3076 /* Check string instruction segment overrides. */
3077 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
3079 if (!check_string ())
3081 i.disp_operands = 0;
3084 if (!process_suffix ())
3087 /* Update operand types. */
3088 for (j = 0; j < i.operands; j++)
3089 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3091 /* Make still unresolved immediate matches conform to size of immediate
3092 given in i.suffix. */
3093 if (!finalize_imm ())
3096 if (i.types[0].bitfield.imm1)
3097 i.imm_operands = 0; /* kludge for shift insns. */
3099 /* We only need to check those implicit registers for instructions
3100 with 3 operands or less. */
3101 if (i.operands <= 3)
3102 for (j = 0; j < i.operands; j++)
3103 if (i.types[j].bitfield.inoutportreg
3104 || i.types[j].bitfield.shiftcount
3105 || i.types[j].bitfield.acc
3106 || i.types[j].bitfield.floatacc)
3109 /* ImmExt should be processed after SSE2AVX. */
3110 if (!i.tm.opcode_modifier.sse2avx
3111 && i.tm.opcode_modifier.immext)
3114 /* For insns with operands there are more diddles to do to the opcode. */
3117 if (!process_operands ())
3120 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
3122 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
3123 as_warn (_("translating to `%sp'"), i.tm.name);
3126 if (i.tm.opcode_modifier.vex)
3127 build_vex_prefix (t);
3129 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
3130 instructions may define INT_OPCODE as well, so avoid this corner
3131 case for those instructions that use MODRM. */
3132 if (i.tm.base_opcode == INT_OPCODE
3133 && !i.tm.opcode_modifier.modrm
3134 && i.op[0].imms->X_add_number == 3)
3136 i.tm.base_opcode = INT3_OPCODE;
3140 if ((i.tm.opcode_modifier.jump
3141 || i.tm.opcode_modifier.jumpbyte
3142 || i.tm.opcode_modifier.jumpdword)
3143 && i.op[0].disps->X_op == O_constant)
3145 /* Convert "jmp constant" (and "call constant") to a jump (call) to
3146 the absolute address given by the constant. Since ix86 jumps and
3147 calls are pc relative, we need to generate a reloc. */
3148 i.op[0].disps->X_add_symbol = &abs_symbol;
3149 i.op[0].disps->X_op = O_symbol;
3152 if (i.tm.opcode_modifier.rex64)
3155 /* For 8 bit registers we need an empty rex prefix. Also if the
3156 instruction already has a prefix, we need to convert old
3157 registers to new ones. */
3159 if ((i.types[0].bitfield.reg8
3160 && (i.op[0].regs->reg_flags & RegRex64) != 0)
3161 || (i.types[1].bitfield.reg8
3162 && (i.op[1].regs->reg_flags & RegRex64) != 0)
3163 || ((i.types[0].bitfield.reg8
3164 || i.types[1].bitfield.reg8)
3169 i.rex |= REX_OPCODE;
3170 for (x = 0; x < 2; x++)
3172 /* Look for 8 bit operand that uses old registers. */
3173 if (i.types[x].bitfield.reg8
3174 && (i.op[x].regs->reg_flags & RegRex64) == 0)
3176 /* In case it is "hi" register, give up. */
3177 if (i.op[x].regs->reg_num > 3)
3178 as_bad (_("can't encode register '%s%s' in an "
3179 "instruction requiring REX prefix."),
3180 register_prefix, i.op[x].regs->reg_name);
3182 /* Otherwise it is equivalent to the extended register.
3183 Since the encoding doesn't change this is merely
3184 cosmetic cleanup for debug output. */
3186 i.op[x].regs = i.op[x].regs + 8;
3192 add_prefix (REX_OPCODE | i.rex);
3194 /* We are ready to output the insn. */
3199 parse_insn (char *line, char *mnemonic)
3202 char *token_start = l;
3205 const insn_template *t;
3208 /* Non-zero if we found a prefix only acceptable with string insns. */
3209 const char *expecting_string_instruction = NULL;
3214 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
3219 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
3221 as_bad (_("no such instruction: `%s'"), token_start);
3226 if (!is_space_char (*l)
3227 && *l != END_OF_INSN
3229 || (*l != PREFIX_SEPARATOR
3232 as_bad (_("invalid character %s in mnemonic"),
3233 output_invalid (*l));
3236 if (token_start == l)
3238 if (!intel_syntax && *l == PREFIX_SEPARATOR)
3239 as_bad (_("expecting prefix; got nothing"));
3241 as_bad (_("expecting mnemonic; got nothing"));
3245 /* Look up instruction (or prefix) via hash table. */
3246 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3248 if (*l != END_OF_INSN
3249 && (!is_space_char (*l) || l[1] != END_OF_INSN)
3250 && current_templates
3251 && current_templates->start->opcode_modifier.isprefix)
3253 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
3255 as_bad ((flag_code != CODE_64BIT
3256 ? _("`%s' is only supported in 64-bit mode")
3257 : _("`%s' is not supported in 64-bit mode")),
3258 current_templates->start->name);
3261 /* If we are in 16-bit mode, do not allow addr16 or data16.
3262 Similarly, in 32-bit mode, do not allow addr32 or data32. */
3263 if ((current_templates->start->opcode_modifier.size16
3264 || current_templates->start->opcode_modifier.size32)
3265 && flag_code != CODE_64BIT
3266 && (current_templates->start->opcode_modifier.size32
3267 ^ (flag_code == CODE_16BIT)))
3269 as_bad (_("redundant %s prefix"),
3270 current_templates->start->name);
3273 /* Add prefix, checking for repeated prefixes. */
3274 switch (add_prefix (current_templates->start->base_opcode))
3279 expecting_string_instruction = current_templates->start->name;
3284 /* Skip past PREFIX_SEPARATOR and reset token_start. */
3291 if (!current_templates)
3293 /* Check if we should swap operand or force 32bit displacement in
3295 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
3297 else if (mnem_p - 4 == dot_p
3301 i.disp32_encoding = 1;
3306 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3309 if (!current_templates)
3312 /* See if we can get a match by trimming off a suffix. */
3315 case WORD_MNEM_SUFFIX:
3316 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
3317 i.suffix = SHORT_MNEM_SUFFIX;
3319 case BYTE_MNEM_SUFFIX:
3320 case QWORD_MNEM_SUFFIX:
3321 i.suffix = mnem_p[-1];
3323 current_templates = (const templates *) hash_find (op_hash,
3326 case SHORT_MNEM_SUFFIX:
3327 case LONG_MNEM_SUFFIX:
3330 i.suffix = mnem_p[-1];
3332 current_templates = (const templates *) hash_find (op_hash,
3341 if (intel_float_operand (mnemonic) == 1)
3342 i.suffix = SHORT_MNEM_SUFFIX;
3344 i.suffix = LONG_MNEM_SUFFIX;
3346 current_templates = (const templates *) hash_find (op_hash,
3351 if (!current_templates)
3353 as_bad (_("no such instruction: `%s'"), token_start);
3358 if (current_templates->start->opcode_modifier.jump
3359 || current_templates->start->opcode_modifier.jumpbyte)
3361 /* Check for a branch hint. We allow ",pt" and ",pn" for
3362 predict taken and predict not taken respectively.
3363 I'm not sure that branch hints actually do anything on loop
3364 and jcxz insns (JumpByte) for current Pentium4 chips. They
3365 may work in the future and it doesn't hurt to accept them
3367 if (l[0] == ',' && l[1] == 'p')
3371 if (!add_prefix (DS_PREFIX_OPCODE))
3375 else if (l[2] == 'n')
3377 if (!add_prefix (CS_PREFIX_OPCODE))
3383 /* Any other comma loses. */
3386 as_bad (_("invalid character %s in mnemonic"),
3387 output_invalid (*l));
3391 /* Check if instruction is supported on specified architecture. */
3393 for (t = current_templates->start; t < current_templates->end; ++t)
3395 supported |= cpu_flags_match (t);
3396 if (supported == CPU_FLAGS_PERFECT_MATCH)
3400 if (!(supported & CPU_FLAGS_64BIT_MATCH))
3402 as_bad (flag_code == CODE_64BIT
3403 ? _("`%s' is not supported in 64-bit mode")
3404 : _("`%s' is only supported in 64-bit mode"),
3405 current_templates->start->name);
3408 if (supported != CPU_FLAGS_PERFECT_MATCH)
3410 as_bad (_("`%s' is not supported on `%s%s'"),
3411 current_templates->start->name,
3412 cpu_arch_name ? cpu_arch_name : default_arch,
3413 cpu_sub_arch_name ? cpu_sub_arch_name : "");
3418 if (!cpu_arch_flags.bitfield.cpui386
3419 && (flag_code != CODE_16BIT))
3421 as_warn (_("use .code16 to ensure correct addressing mode"));
3424 /* Check for rep/repne without a string instruction. */
3425 if (expecting_string_instruction)
3427 static templates override;
3429 for (t = current_templates->start; t < current_templates->end; ++t)
3430 if (t->opcode_modifier.isstring)
3432 if (t >= current_templates->end)
3434 as_bad (_("expecting string instruction after `%s'"),
3435 expecting_string_instruction);
3438 for (override.start = t; t < current_templates->end; ++t)
3439 if (!t->opcode_modifier.isstring)
3442 current_templates = &override;
3449 parse_operands (char *l, const char *mnemonic)
3453 /* 1 if operand is pending after ','. */
3454 unsigned int expecting_operand = 0;
3456 /* Non-zero if operand parens not balanced. */
3457 unsigned int paren_not_balanced;
3459 while (*l != END_OF_INSN)
3461 /* Skip optional white space before operand. */
3462 if (is_space_char (*l))
3464 if (!is_operand_char (*l) && *l != END_OF_INSN)
3466 as_bad (_("invalid character %s before operand %d"),
3467 output_invalid (*l),
3471 token_start = l; /* after white space */
3472 paren_not_balanced = 0;
3473 while (paren_not_balanced || *l != ',')
3475 if (*l == END_OF_INSN)
3477 if (paren_not_balanced)
3480 as_bad (_("unbalanced parenthesis in operand %d."),
3483 as_bad (_("unbalanced brackets in operand %d."),
3488 break; /* we are done */
3490 else if (!is_operand_char (*l) && !is_space_char (*l))
3492 as_bad (_("invalid character %s in operand %d"),
3493 output_invalid (*l),
3500 ++paren_not_balanced;
3502 --paren_not_balanced;
3507 ++paren_not_balanced;
3509 --paren_not_balanced;
3513 if (l != token_start)
3514 { /* Yes, we've read in another operand. */
3515 unsigned int operand_ok;
3516 this_operand = i.operands++;
3517 i.types[this_operand].bitfield.unspecified = 1;
3518 if (i.operands > MAX_OPERANDS)
3520 as_bad (_("spurious operands; (%d operands/instruction max)"),
3524 /* Now parse operand adding info to 'i' as we go along. */
3525 END_STRING_AND_SAVE (l);
3529 i386_intel_operand (token_start,
3530 intel_float_operand (mnemonic));
3532 operand_ok = i386_att_operand (token_start);
3534 RESTORE_END_STRING (l);
3540 if (expecting_operand)
3542 expecting_operand_after_comma:
3543 as_bad (_("expecting operand after ','; got nothing"));
3548 as_bad (_("expecting operand before ','; got nothing"));
3553 /* Now *l must be either ',' or END_OF_INSN. */
3556 if (*++l == END_OF_INSN)
3558 /* Just skip it, if it's \n complain. */
3559 goto expecting_operand_after_comma;
3561 expecting_operand = 1;
3568 swap_2_operands (int xchg1, int xchg2)
3570 union i386_op temp_op;
3571 i386_operand_type temp_type;
3572 enum bfd_reloc_code_real temp_reloc;
3574 temp_type = i.types[xchg2];
3575 i.types[xchg2] = i.types[xchg1];
3576 i.types[xchg1] = temp_type;
3577 temp_op = i.op[xchg2];
3578 i.op[xchg2] = i.op[xchg1];
3579 i.op[xchg1] = temp_op;
3580 temp_reloc = i.reloc[xchg2];
3581 i.reloc[xchg2] = i.reloc[xchg1];
3582 i.reloc[xchg1] = temp_reloc;
3586 swap_operands (void)
3592 swap_2_operands (1, i.operands - 2);
3595 swap_2_operands (0, i.operands - 1);
3601 if (i.mem_operands == 2)
3603 const seg_entry *temp_seg;
3604 temp_seg = i.seg[0];
3605 i.seg[0] = i.seg[1];
3606 i.seg[1] = temp_seg;
3610 /* Try to ensure constant immediates are represented in the smallest
3615 char guess_suffix = 0;
3619 guess_suffix = i.suffix;
3620 else if (i.reg_operands)
3622 /* Figure out a suffix from the last register operand specified.
3623 We can't do this properly yet, ie. excluding InOutPortReg,
3624 but the following works for instructions with immediates.
3625 In any case, we can't set i.suffix yet. */
3626 for (op = i.operands; --op >= 0;)
3627 if (i.types[op].bitfield.reg8)
3629 guess_suffix = BYTE_MNEM_SUFFIX;
3632 else if (i.types[op].bitfield.reg16)
3634 guess_suffix = WORD_MNEM_SUFFIX;
3637 else if (i.types[op].bitfield.reg32)
3639 guess_suffix = LONG_MNEM_SUFFIX;
3642 else if (i.types[op].bitfield.reg64)
3644 guess_suffix = QWORD_MNEM_SUFFIX;
3648 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
3649 guess_suffix = WORD_MNEM_SUFFIX;
3651 for (op = i.operands; --op >= 0;)
3652 if (operand_type_check (i.types[op], imm))
3654 switch (i.op[op].imms->X_op)
3657 /* If a suffix is given, this operand may be shortened. */
3658 switch (guess_suffix)
3660 case LONG_MNEM_SUFFIX:
3661 i.types[op].bitfield.imm32 = 1;
3662 i.types[op].bitfield.imm64 = 1;
3664 case WORD_MNEM_SUFFIX:
3665 i.types[op].bitfield.imm16 = 1;
3666 i.types[op].bitfield.imm32 = 1;
3667 i.types[op].bitfield.imm32s = 1;
3668 i.types[op].bitfield.imm64 = 1;
3670 case BYTE_MNEM_SUFFIX:
3671 i.types[op].bitfield.imm8 = 1;
3672 i.types[op].bitfield.imm8s = 1;
3673 i.types[op].bitfield.imm16 = 1;
3674 i.types[op].bitfield.imm32 = 1;
3675 i.types[op].bitfield.imm32s = 1;
3676 i.types[op].bitfield.imm64 = 1;
3680 /* If this operand is at most 16 bits, convert it
3681 to a signed 16 bit number before trying to see
3682 whether it will fit in an even smaller size.
3683 This allows a 16-bit operand such as $0xffe0 to
3684 be recognised as within Imm8S range. */
3685 if ((i.types[op].bitfield.imm16)
3686 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
3688 i.op[op].imms->X_add_number =
3689 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
3691 if ((i.types[op].bitfield.imm32)
3692 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
3695 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
3696 ^ ((offsetT) 1 << 31))
3697 - ((offsetT) 1 << 31));
3700 = operand_type_or (i.types[op],
3701 smallest_imm_type (i.op[op].imms->X_add_number));
3703 /* We must avoid matching of Imm32 templates when 64bit
3704 only immediate is available. */
3705 if (guess_suffix == QWORD_MNEM_SUFFIX)
3706 i.types[op].bitfield.imm32 = 0;
3713 /* Symbols and expressions. */
3715 /* Convert symbolic operand to proper sizes for matching, but don't
3716 prevent matching a set of insns that only supports sizes other
3717 than those matching the insn suffix. */
3719 i386_operand_type mask, allowed;
3720 const insn_template *t;
3722 operand_type_set (&mask, 0);
3723 operand_type_set (&allowed, 0);
3725 for (t = current_templates->start;
3726 t < current_templates->end;
3728 allowed = operand_type_or (allowed,
3729 t->operand_types[op]);
3730 switch (guess_suffix)
3732 case QWORD_MNEM_SUFFIX:
3733 mask.bitfield.imm64 = 1;
3734 mask.bitfield.imm32s = 1;
3736 case LONG_MNEM_SUFFIX:
3737 mask.bitfield.imm32 = 1;
3739 case WORD_MNEM_SUFFIX:
3740 mask.bitfield.imm16 = 1;
3742 case BYTE_MNEM_SUFFIX:
3743 mask.bitfield.imm8 = 1;
3748 allowed = operand_type_and (mask, allowed);
3749 if (!operand_type_all_zero (&allowed))
3750 i.types[op] = operand_type_and (i.types[op], mask);
3757 /* Try to use the smallest displacement type too. */
3759 optimize_disp (void)
3763 for (op = i.operands; --op >= 0;)
3764 if (operand_type_check (i.types[op], disp))
3766 if (i.op[op].disps->X_op == O_constant)
3768 offsetT op_disp = i.op[op].disps->X_add_number;
3770 if (i.types[op].bitfield.disp16
3771 && (op_disp & ~(offsetT) 0xffff) == 0)
3773 /* If this operand is at most 16 bits, convert
3774 to a signed 16 bit number and don't use 64bit
3776 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
3777 i.types[op].bitfield.disp64 = 0;
3779 if (i.types[op].bitfield.disp32
3780 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
3782 /* If this operand is at most 32 bits, convert
3783 to a signed 32 bit number and don't use 64bit
3785 op_disp &= (((offsetT) 2 << 31) - 1);
3786 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
3787 i.types[op].bitfield.disp64 = 0;
3789 if (!op_disp && i.types[op].bitfield.baseindex)
3791 i.types[op].bitfield.disp8 = 0;
3792 i.types[op].bitfield.disp16 = 0;
3793 i.types[op].bitfield.disp32 = 0;
3794 i.types[op].bitfield.disp32s = 0;
3795 i.types[op].bitfield.disp64 = 0;
3799 else if (flag_code == CODE_64BIT)
3801 if (fits_in_signed_long (op_disp))
3803 i.types[op].bitfield.disp64 = 0;
3804 i.types[op].bitfield.disp32s = 1;
3806 if (i.prefix[ADDR_PREFIX]
3807 && fits_in_unsigned_long (op_disp))
3808 i.types[op].bitfield.disp32 = 1;
3810 if ((i.types[op].bitfield.disp32
3811 || i.types[op].bitfield.disp32s
3812 || i.types[op].bitfield.disp16)
3813 && fits_in_signed_byte (op_disp))
3814 i.types[op].bitfield.disp8 = 1;
3816 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
3817 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
3819 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
3820 i.op[op].disps, 0, i.reloc[op]);
3821 i.types[op].bitfield.disp8 = 0;
3822 i.types[op].bitfield.disp16 = 0;
3823 i.types[op].bitfield.disp32 = 0;
3824 i.types[op].bitfield.disp32s = 0;
3825 i.types[op].bitfield.disp64 = 0;
3828 /* We only support 64bit displacement on constants. */
3829 i.types[op].bitfield.disp64 = 0;
3833 /* Check if operands are valid for the instruction. Update VEX
3837 VEX_check_operands (const insn_template *t)
3839 if (!t->opcode_modifier.vex)
3842 /* Only check VEX_Imm4, which must be the first operand. */
3843 if (t->operand_types[0].bitfield.vec_imm4)
3845 if (i.op[0].imms->X_op != O_constant
3846 || !fits_in_imm4 (i.op[0].imms->X_add_number))
3852 /* Turn off Imm8 so that update_imm won't complain. */
3853 i.types[0] = vec_imm4;
3859 static const insn_template *
3860 match_template (void)
3862 /* Points to template once we've found it. */
3863 const insn_template *t;
3864 i386_operand_type overlap0, overlap1, overlap2, overlap3;
3865 i386_operand_type overlap4;
3866 unsigned int found_reverse_match;
3867 i386_opcode_modifier suffix_check;
3868 i386_operand_type operand_types [MAX_OPERANDS];
3869 int addr_prefix_disp;
3871 unsigned int found_cpu_match;
3872 unsigned int check_register;
3874 #if MAX_OPERANDS != 5
3875 # error "MAX_OPERANDS must be 5."
3878 found_reverse_match = 0;
3879 addr_prefix_disp = -1;
3881 memset (&suffix_check, 0, sizeof (suffix_check));
3882 if (i.suffix == BYTE_MNEM_SUFFIX)
3883 suffix_check.no_bsuf = 1;
3884 else if (i.suffix == WORD_MNEM_SUFFIX)
3885 suffix_check.no_wsuf = 1;
3886 else if (i.suffix == SHORT_MNEM_SUFFIX)
3887 suffix_check.no_ssuf = 1;
3888 else if (i.suffix == LONG_MNEM_SUFFIX)
3889 suffix_check.no_lsuf = 1;
3890 else if (i.suffix == QWORD_MNEM_SUFFIX)
3891 suffix_check.no_qsuf = 1;
3892 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
3893 suffix_check.no_ldsuf = 1;
3895 /* Must have right number of operands. */
3896 i.error = number_of_operands_mismatch;
3898 for (t = current_templates->start; t < current_templates->end; t++)
3900 addr_prefix_disp = -1;
3902 if (i.operands != t->operands)
3905 /* Check processor support. */
3906 i.error = unsupported;
3907 found_cpu_match = (cpu_flags_match (t)
3908 == CPU_FLAGS_PERFECT_MATCH);
3909 if (!found_cpu_match)
3912 /* Check old gcc support. */
3913 i.error = old_gcc_only;
3914 if (!old_gcc && t->opcode_modifier.oldgcc)
3917 /* Check AT&T mnemonic. */
3918 i.error = unsupported_with_intel_mnemonic;
3919 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
3922 /* Check AT&T/Intel syntax. */
3923 i.error = unsupported_syntax;
3924 if ((intel_syntax && t->opcode_modifier.attsyntax)
3925 || (!intel_syntax && t->opcode_modifier.intelsyntax))
3928 /* Check the suffix, except for some instructions in intel mode. */
3929 i.error = invalid_instruction_suffix;
3930 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
3931 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
3932 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
3933 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
3934 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
3935 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
3936 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
3939 if (!operand_size_match (t))
3942 for (j = 0; j < MAX_OPERANDS; j++)
3943 operand_types[j] = t->operand_types[j];
3945 /* In general, don't allow 64-bit operands in 32-bit mode. */
3946 if (i.suffix == QWORD_MNEM_SUFFIX
3947 && flag_code != CODE_64BIT
3949 ? (!t->opcode_modifier.ignoresize
3950 && !intel_float_operand (t->name))
3951 : intel_float_operand (t->name) != 2)
3952 && ((!operand_types[0].bitfield.regmmx
3953 && !operand_types[0].bitfield.regxmm
3954 && !operand_types[0].bitfield.regymm)
3955 || (!operand_types[t->operands > 1].bitfield.regmmx
3956 && !!operand_types[t->operands > 1].bitfield.regxmm
3957 && !!operand_types[t->operands > 1].bitfield.regymm))
3958 && (t->base_opcode != 0x0fc7
3959 || t->extension_opcode != 1 /* cmpxchg8b */))
3962 /* In general, don't allow 32-bit operands on pre-386. */
3963 else if (i.suffix == LONG_MNEM_SUFFIX
3964 && !cpu_arch_flags.bitfield.cpui386
3966 ? (!t->opcode_modifier.ignoresize
3967 && !intel_float_operand (t->name))
3968 : intel_float_operand (t->name) != 2)
3969 && ((!operand_types[0].bitfield.regmmx
3970 && !operand_types[0].bitfield.regxmm)
3971 || (!operand_types[t->operands > 1].bitfield.regmmx
3972 && !!operand_types[t->operands > 1].bitfield.regxmm)))
3975 /* Do not verify operands when there are none. */
3979 /* We've found a match; break out of loop. */
3983 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
3984 into Disp32/Disp16/Disp32 operand. */
3985 if (i.prefix[ADDR_PREFIX] != 0)
3987 /* There should be only one Disp operand. */
3991 for (j = 0; j < MAX_OPERANDS; j++)
3993 if (operand_types[j].bitfield.disp16)
3995 addr_prefix_disp = j;
3996 operand_types[j].bitfield.disp32 = 1;
3997 operand_types[j].bitfield.disp16 = 0;
4003 for (j = 0; j < MAX_OPERANDS; j++)
4005 if (operand_types[j].bitfield.disp32)
4007 addr_prefix_disp = j;
4008 operand_types[j].bitfield.disp32 = 0;
4009 operand_types[j].bitfield.disp16 = 1;
4015 for (j = 0; j < MAX_OPERANDS; j++)
4017 if (operand_types[j].bitfield.disp64)
4019 addr_prefix_disp = j;
4020 operand_types[j].bitfield.disp64 = 0;
4021 operand_types[j].bitfield.disp32 = 1;
4029 /* We check register size if needed. */
4030 check_register = t->opcode_modifier.checkregsize;
4031 overlap0 = operand_type_and (i.types[0], operand_types[0]);
4032 switch (t->operands)
4035 if (!operand_type_match (overlap0, i.types[0]))
4039 /* xchg %eax, %eax is a special case. It is an aliase for nop
4040 only in 32bit mode and we can use opcode 0x90. In 64bit
4041 mode, we can't use 0x90 for xchg %eax, %eax since it should
4042 zero-extend %eax to %rax. */
4043 if (flag_code == CODE_64BIT
4044 && t->base_opcode == 0x90
4045 && operand_type_equal (&i.types [0], &acc32)
4046 && operand_type_equal (&i.types [1], &acc32))
4050 /* If we swap operand in encoding, we either match
4051 the next one or reverse direction of operands. */
4052 if (t->opcode_modifier.s)
4054 else if (t->opcode_modifier.d)
4059 /* If we swap operand in encoding, we match the next one. */
4060 if (i.swap_operand && t->opcode_modifier.s)
4064 overlap1 = operand_type_and (i.types[1], operand_types[1]);
4065 if (!operand_type_match (overlap0, i.types[0])
4066 || !operand_type_match (overlap1, i.types[1])
4068 && !operand_type_register_match (overlap0, i.types[0],
4070 overlap1, i.types[1],
4073 /* Check if other direction is valid ... */
4074 if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
4078 /* Try reversing direction of operands. */
4079 overlap0 = operand_type_and (i.types[0], operand_types[1]);
4080 overlap1 = operand_type_and (i.types[1], operand_types[0]);
4081 if (!operand_type_match (overlap0, i.types[0])
4082 || !operand_type_match (overlap1, i.types[1])
4084 && !operand_type_register_match (overlap0,
4091 /* Does not match either direction. */
4094 /* found_reverse_match holds which of D or FloatDR
4096 if (t->opcode_modifier.d)
4097 found_reverse_match = Opcode_D;
4098 else if (t->opcode_modifier.floatd)
4099 found_reverse_match = Opcode_FloatD;
4101 found_reverse_match = 0;
4102 if (t->opcode_modifier.floatr)
4103 found_reverse_match |= Opcode_FloatR;
4107 /* Found a forward 2 operand match here. */
4108 switch (t->operands)
4111 overlap4 = operand_type_and (i.types[4],
4114 overlap3 = operand_type_and (i.types[3],
4117 overlap2 = operand_type_and (i.types[2],
4122 switch (t->operands)
4125 if (!operand_type_match (overlap4, i.types[4])
4126 || !operand_type_register_match (overlap3,
4134 if (!operand_type_match (overlap3, i.types[3])
4136 && !operand_type_register_match (overlap2,
4144 /* Here we make use of the fact that there are no
4145 reverse match 3 operand instructions, and all 3
4146 operand instructions only need to be checked for
4147 register consistency between operands 2 and 3. */
4148 if (!operand_type_match (overlap2, i.types[2])
4150 && !operand_type_register_match (overlap1,
4160 /* Found either forward/reverse 2, 3 or 4 operand match here:
4161 slip through to break. */
4163 if (!found_cpu_match)
4165 found_reverse_match = 0;
4169 /* Check if VEX operands are valid. */
4170 if (VEX_check_operands (t))
4173 /* We've found a match; break out of loop. */
4177 if (t == current_templates->end)
4179 /* We found no match. */
4180 const char *err_msg;
4185 case operand_size_mismatch:
4186 err_msg = _("operand size mismatch");