1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64    WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
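/* An illustrative sketch, not part of the assembler itself: how a raw
   prefix byte could map to one of the slots above.  The helper name and
   the switch are hypothetical; the real prefix bookkeeping happens
   elsewhere in this file.  Emission walks the slots from 0 upwards, so
   FWAIT always comes out first.  */
#if 0
static int
example_prefix_slot (unsigned char byte)
{
  switch (byte)
    {
    case 0x9b: return WAIT_PREFIX;	/* fwait */
    case 0x66: return DATA_PREFIX;	/* operand size override */
    case 0x67: return ADDR_PREFIX;	/* address size override */
    case 0xf0: return LOCK_PREFIX;	/* lock */
    case 0xf2:
    case 0xf3: return REP_PREFIX;	/* repne/rep, also HLE/BND */
    default:   return SEG_PREFIX;	/* 0x26/0x2e/0x36/0x3e/0x64/0x65 */
    }
}
#endif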
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax.  Use a non-ASCII letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
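/* For illustration: the three fields pack into the final ModRM byte with
   mode in bits 7-6, reg in bits 5-3 and regmem in bits 2-0, so e.g.
   mode 3, reg 2, regmem 1 encodes as 0xd1.  A hypothetical packer:  */
#if 0
static unsigned char
example_pack_modrm (modrm_byte m)
{
  return (m.mode << 6) | (m.reg << 3) | m.regmem;
}
#endif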
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
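/* The SIB byte packs analogously: scale (as log2 of the factor) in bits
   7-6, index in bits 5-3 and base in bits 2-0.  */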
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
232
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235    whether a merging or a zeroing mask is used.  */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
245
246 /* The struct describes broadcasting, applied to OPERAND.  The
247    broadcast factor is encoded in TYPE below.  */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
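/* For reference: a 2-byte VEX prefix starts with 0xc5, a 3-byte VEX with
   0xc4 and the 4-byte EVEX prefix with 0x62; LENGTH records which form
   was built.  */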
271
272 /* 'md_assemble ()' gathers together information and puts it into an
273 i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_vsib_address,
294 invalid_vector_register_set,
295 unsupported_vector_index_register,
296 unsupported_broadcast,
297 broadcast_needed,
298 unsupported_masking,
299 mask_not_on_destination,
300 no_default_mask,
301 unsupported_rc_sae,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
304 };
305
306 struct _i386_insn
307 {
308   /* TM holds the template for the insn we're currently assembling.  */
309 insn_template tm;
310
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
313 char suffix;
314
315 /* OPERANDS gives the number of given operands. */
316 unsigned int operands;
317
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
320 operands. */
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
322
323 /* TYPES [i] is the type (see above #defines) which tells us how to
324 use OP[i] for the corresponding operand. */
325 i386_operand_type types[MAX_OPERANDS];
326
327 /* Displacement expression, immediate expression, or register for each
328 operand. */
329 union i386_op op[MAX_OPERANDS];
330
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333 #define Operand_PCrel 1
334 #define Operand_Mem 2
335
336 /* Relocation type for operand */
337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
338
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
344
345 /* SEG gives the seg_entries of this insn. They are zero unless
346 explicit segment overrides are given. */
347 const seg_entry *seg[2];
348
349 /* Copied first memory operand string, for re-checking. */
350 char *memop1_string;
351
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
356
357 /* Register is in low 3 bits of opcode. */
358 bfd_boolean short_form;
359
360 /* The operand to a branch insn indicates an absolute branch. */
361 bfd_boolean jumpabsolute;
362
363 /* Has MMX register operands. */
364 bfd_boolean has_regmmx;
365
366 /* Has XMM register operands. */
367 bfd_boolean has_regxmm;
368
369 /* Has YMM register operands. */
370 bfd_boolean has_regymm;
371
372 /* Has ZMM register operands. */
373 bfd_boolean has_regzmm;
374
375 /* Has GOTPC or TLS relocation. */
376 bfd_boolean has_gotpc_tls_reloc;
377
378 /* RM and SIB are the modrm byte and the sib byte where the
379 addressing modes of this insn are encoded. */
380 modrm_byte rm;
381 rex_byte rex;
382 rex_byte vrex;
383 sib_byte sib;
384 vex_prefix vex;
385
386 /* Masking attributes. */
387 struct Mask_Operation *mask;
388
389 /* Rounding control and SAE attributes. */
390 struct RC_Operation *rounding;
391
392 /* Broadcasting attributes. */
393 struct Broadcast_Operation *broadcast;
394
395 /* Compressed disp8*N attribute. */
396 unsigned int memshift;
397
398 /* Prefer load or store in encoding. */
399 enum
400 {
401 dir_encoding_default = 0,
402 dir_encoding_load,
403 dir_encoding_store,
404 dir_encoding_swap
405 } dir_encoding;
406
407 /* Prefer 8bit or 32bit displacement in encoding. */
408 enum
409 {
410 disp_encoding_default = 0,
411 disp_encoding_8bit,
412 disp_encoding_32bit
413 } disp_encoding;
414
415 /* Prefer the REX byte in encoding. */
416 bfd_boolean rex_encoding;
417
418 /* Disable instruction size optimization. */
419 bfd_boolean no_optimize;
420
421 /* How to encode vector instructions. */
422 enum
423 {
424 vex_encoding_default = 0,
425 vex_encoding_vex,
426 vex_encoding_vex3,
427 vex_encoding_evex,
428 vex_encoding_error
429 } vec_encoding;
430
431 /* REP prefix. */
432 const char *rep_prefix;
433
434 /* HLE prefix. */
435 const char *hle_prefix;
436
437 /* Have BND prefix. */
438 const char *bnd_prefix;
439
440 /* Have NOTRACK prefix. */
441 const char *notrack_prefix;
442
443 /* Error message. */
444 enum i386_error error;
445 };
446
447 typedef struct _i386_insn i386_insn;
448
449 /* Link an RC type with the corresponding string that is looked for
450    in the assembly source.  */
451 struct RC_name
452 {
453 enum rc_type type;
454 const char *name;
455 unsigned int len;
456 };
457
458 static const struct RC_name RC_NamesTable[] =
459 {
460 { rne, STRING_COMMA_LEN ("rn-sae") },
461 { rd, STRING_COMMA_LEN ("rd-sae") },
462 { ru, STRING_COMMA_LEN ("ru-sae") },
463 { rz, STRING_COMMA_LEN ("rz-sae") },
464 { saeonly, STRING_COMMA_LEN ("sae") },
465 };
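/* So an operand decoration such as "{rn-sae}" in the source, e.g.

	vaddss {rn-sae}, %xmm4, %xmm5, %xmm6

   is matched against this table and recorded as type rne in rc_op.  */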
466
467 /* List of chars besides those in app.c:symbol_chars that can start an
468 operand. Used to prevent the scrubber eating vital white-space. */
469 const char extra_symbol_chars[] = "*%-([{}"
470 #ifdef LEX_AT
471 "@"
472 #endif
473 #ifdef LEX_QM
474 "?"
475 #endif
476 ;
477
478 #if (defined (TE_I386AIX) \
479 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
480 && !defined (TE_GNU) \
481 && !defined (TE_LINUX) \
482 && !defined (TE_NACL) \
483 && !defined (TE_FreeBSD) \
484 && !defined (TE_DragonFly) \
485 && !defined (TE_NetBSD)))
486 /* This array holds the chars that always start a comment. If the
487 pre-processor is disabled, these aren't very useful. The option
488 --divide will remove '/' from this list. */
489 const char *i386_comment_chars = "#/";
490 #define SVR4_COMMENT_CHARS 1
491 #define PREFIX_SEPARATOR '\\'
492
493 #else
494 const char *i386_comment_chars = "#";
495 #define PREFIX_SEPARATOR '/'
496 #endif
497
498 /* This array holds the chars that only start a comment at the beginning of
499 a line. If the line seems to have the form '# 123 filename'
500 .line and .file directives will appear in the pre-processed output.
501 Note that input_file.c hand checks for '#' at the beginning of the
502 first line of the input file. This is because the compiler outputs
503 #NO_APP at the beginning of its output.
504 Also note that comments started like this one will always work if
505 '/' isn't otherwise defined. */
506 const char line_comment_chars[] = "#/";
507
508 const char line_separator_chars[] = ";";
509
510 /* Chars that can be used to separate mant from exp in floating point
511 nums. */
512 const char EXP_CHARS[] = "eE";
513
514 /* Chars that mean this number is a floating point constant
515 As in 0f12.456
516 or 0d1.2345e12. */
517 const char FLT_CHARS[] = "fFdDxX";
518
519 /* Tables for lexical analysis. */
520 static char mnemonic_chars[256];
521 static char register_chars[256];
522 static char operand_chars[256];
523 static char identifier_chars[256];
524 static char digit_chars[256];
525
526 /* Lexical macros. */
527 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
528 #define is_operand_char(x) (operand_chars[(unsigned char) x])
529 #define is_register_char(x) (register_chars[(unsigned char) x])
530 #define is_space_char(x) ((x) == ' ')
531 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
532 #define is_digit_char(x) (digit_chars[(unsigned char) x])
533
534 /* All non-digit non-letter characters that may occur in an operand. */
535 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
536
537 /* md_assemble() always leaves the strings it's passed unaltered. To
538 effect this we maintain a stack of saved characters that we've smashed
539 with '\0's (indicating end of strings for various sub-fields of the
540 assembler instruction). */
541 static char save_stack[32];
542 static char *save_stack_p;
543 #define END_STRING_AND_SAVE(s) \
544 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
545 #define RESTORE_END_STRING(s) \
546 do { *(s) = *--save_stack_p; } while (0)
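/* A sketch of the intended pairing (operand_string and process_field are
   hypothetical names): temporarily NUL-terminate a sub-field, parse it,
   then put the smashed character back.  Saves nest on save_stack, so
   restores must happen in reverse order.  */
#if 0
  char *comma = strchr (operand_string, ',');
  END_STRING_AND_SAVE (comma);
  process_field (operand_string);
  RESTORE_END_STRING (comma);
#endif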
547
548 /* The instruction we're assembling. */
549 static i386_insn i;
550
551 /* Possible templates for current insn. */
552 static const templates *current_templates;
553
554 /* Per instruction expressionS buffers: max displacements & immediates. */
555 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
556 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
557
558 /* Current operand we are working on. */
559 static int this_operand = -1;
560
561 /* We support four different modes (.code16gcc is a variant of 16-bit
562    mode).  The FLAG_CODE variable is used to distinguish these.  */
563
564 enum flag_code {
565 CODE_32BIT,
566 CODE_16BIT,
567 CODE_64BIT };
568
569 static enum flag_code flag_code;
570 static unsigned int object_64bit;
571 static unsigned int disallow_64bit_reloc;
572 static int use_rela_relocations = 0;
573 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
574 static const char *tls_get_addr;
575
576 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
577 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
578 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
579
580 /* The ELF ABI to use. */
581 enum x86_elf_abi
582 {
583 I386_ABI,
584 X86_64_ABI,
585 X86_64_X32_ABI
586 };
587
588 static enum x86_elf_abi x86_elf_abi = I386_ABI;
589 #endif
590
591 #if defined (TE_PE) || defined (TE_PEP)
592 /* Use big object file format. */
593 static int use_big_obj = 0;
594 #endif
595
596 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
597 /* 1 if generating code for a shared library. */
598 static int shared = 0;
599 #endif
600
601 /* 1 for intel syntax,
602 0 if att syntax. */
603 static int intel_syntax = 0;
604
605 static enum x86_64_isa
606 {
607 amd64 = 1, /* AMD64 ISA. */
608 intel64 /* Intel64 ISA. */
609 } isa64;
610
611 /* 1 for intel mnemonic,
612 0 if att mnemonic. */
613 static int intel_mnemonic = !SYSV386_COMPAT;
614
615 /* 1 if pseudo registers are permitted. */
616 static int allow_pseudo_reg = 0;
617
618 /* 1 if register prefix % not required. */
619 static int allow_naked_reg = 0;
620
621 /* 1 if the assembler should add BND prefix for all control-transferring
622 instructions supporting it, even if this prefix wasn't specified
623 explicitly. */
624 static int add_bnd_prefix = 0;
625
626 /* 1 if pseudo index register, eiz/riz, is allowed.  */
627 static int allow_index_reg = 0;
628
629 /* 1 if the assembler should ignore LOCK prefix, even if it was
630 specified explicitly. */
631 static int omit_lock_prefix = 0;
632
633 /* 1 if the assembler should encode lfence, mfence, and sfence as
634 "lock addl $0, (%{re}sp)". */
635 static int avoid_fence = 0;
636
637 /* 1 if lfence should be inserted after every load. */
638 static int lfence_after_load = 0;
639
640 /* Non-zero if lfence should be inserted before indirect branch. */
641 static enum lfence_before_indirect_branch_kind
642 {
643 lfence_branch_none = 0,
644 lfence_branch_register,
645 lfence_branch_memory,
646 lfence_branch_all
647 }
648 lfence_before_indirect_branch;
649
650 /* Non-zero if lfence should be inserted before ret. */
651 static enum lfence_before_ret_kind
652 {
653 lfence_before_ret_none = 0,
654 lfence_before_ret_not,
655 lfence_before_ret_or,
656 lfence_before_ret_shl
657 }
658 lfence_before_ret;
659
660 /* Kind and location of the previous instruction: an ordinary insn, a directive such as .byte, or a prefix.  */
661 static struct
662 {
663 segT seg;
664 const char *file;
665 const char *name;
666 unsigned int line;
667 enum last_insn_kind
668 {
669 last_insn_other = 0,
670 last_insn_directive,
671 last_insn_prefix
672 } kind;
673 } last_insn;
674
675 /* 1 if the assembler should generate relax relocations. */
676
677 static int generate_relax_relocations
678 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
679
680 static enum check_kind
681 {
682 check_none = 0,
683 check_warning,
684 check_error
685 }
686 sse_check, operand_check = check_warning;
687
688 /* Non-zero if branches should be aligned within a power-of-2 boundary.  */
689 static int align_branch_power = 0;
690
691 /* Types of branches to align. */
692 enum align_branch_kind
693 {
694 align_branch_none = 0,
695 align_branch_jcc = 1,
696 align_branch_fused = 2,
697 align_branch_jmp = 3,
698 align_branch_call = 4,
699 align_branch_indirect = 5,
700 align_branch_ret = 6
701 };
702
703 /* Type bits of branches to align. */
704 enum align_branch_bit
705 {
706 align_branch_jcc_bit = 1 << align_branch_jcc,
707 align_branch_fused_bit = 1 << align_branch_fused,
708 align_branch_jmp_bit = 1 << align_branch_jmp,
709 align_branch_call_bit = 1 << align_branch_call,
710 align_branch_indirect_bit = 1 << align_branch_indirect,
711 align_branch_ret_bit = 1 << align_branch_ret
712 };
713
714 static unsigned int align_branch = (align_branch_jcc_bit
715 | align_branch_fused_bit
716 | align_branch_jmp_bit);
717
718 /* Types of condition jump used by macro-fusion. */
719 enum mf_jcc_kind
720 {
721 mf_jcc_jo = 0, /* base opcode 0x70 */
722 mf_jcc_jc, /* base opcode 0x72 */
723 mf_jcc_je, /* base opcode 0x74 */
724 mf_jcc_jna, /* base opcode 0x76 */
725 mf_jcc_js, /* base opcode 0x78 */
726 mf_jcc_jp, /* base opcode 0x7a */
727 mf_jcc_jl, /* base opcode 0x7c */
728 mf_jcc_jle, /* base opcode 0x7e */
729 };
730
731 /* Types of compare flag-modifying instructions used by macro-fusion.  */
732 enum mf_cmp_kind
733 {
734 mf_cmp_test_and, /* test/cmp */
735 mf_cmp_alu_cmp, /* add/sub/cmp */
736 mf_cmp_incdec /* inc/dec */
737 };
738
739 /* The maximum padding size for a fused jcc.  A CMP-like instruction
740    can be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
741 prefixes. */
742 #define MAX_FUSED_JCC_PADDING_SIZE 20
743
744 /* The maximum number of prefixes added for an instruction. */
745 static unsigned int align_branch_prefix_size = 5;
746
747 /* Optimization:
748 1. Clear the REX_W bit with register operand if possible.
749 2. Above plus use 128bit vector instruction to clear the full vector
750 register.
751 */
752 static int optimize = 0;
753
754 /* Optimization:
755 1. Clear the REX_W bit with register operand if possible.
756 2. Above plus use 128bit vector instruction to clear the full vector
757 register.
758 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
759 "testb $imm7,%r8".
760 */
761 static int optimize_for_space = 0;
762
763 /* Register prefix used for error message. */
764 static const char *register_prefix = "%";
765
766 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
767 leave, push, and pop instructions so that gcc has the same stack
768 frame as in 32 bit mode. */
769 static char stackop_size = '\0';
770
771 /* Non-zero to optimize code alignment. */
772 int optimize_align_code = 1;
773
774 /* Non-zero to quieten some warnings. */
775 static int quiet_warnings = 0;
776
777 /* CPU name. */
778 static const char *cpu_arch_name = NULL;
779 static char *cpu_sub_arch_name = NULL;
780
781 /* CPU feature flags. */
782 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
783
784 /* If we have selected a cpu we are generating instructions for. */
785 static int cpu_arch_tune_set = 0;
786
787 /* Cpu we are generating instructions for. */
788 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
789
790 /* CPU feature flags of cpu we are generating instructions for. */
791 static i386_cpu_flags cpu_arch_tune_flags;
792
793 /* CPU instruction set architecture used. */
794 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
795
796 /* CPU feature flags of instruction set architecture used. */
797 i386_cpu_flags cpu_arch_isa_flags;
798
799 /* If set, conditional jumps are not automatically promoted to handle
800 larger than a byte offset. */
801 static unsigned int no_cond_jump_promotion = 0;
802
803 /* Encode SSE instructions with VEX prefix. */
804 static unsigned int sse2avx;
805
806 /* Encode scalar AVX instructions with specific vector length. */
807 static enum
808 {
809 vex128 = 0,
810 vex256
811 } avxscalar;
812
813 /* Encode VEX WIG instructions with specific vex.w. */
814 static enum
815 {
816 vexw0 = 0,
817 vexw1
818 } vexwig;
819
820 /* Encode scalar EVEX LIG instructions with specific vector length. */
821 static enum
822 {
823 evexl128 = 0,
824 evexl256,
825 evexl512
826 } evexlig;
827
828 /* Encode EVEX WIG instructions with specific evex.w. */
829 static enum
830 {
831 evexw0 = 0,
832 evexw1
833 } evexwig;
834
835 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
836 static enum rc_type evexrcig = rne;
837
838 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
839 static symbolS *GOT_symbol;
840
841 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
842 unsigned int x86_dwarf2_return_column;
843
844 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
845 int x86_cie_data_alignment;
846
847 /* Interface to relax_segment.
848 There are 3 major relax states for 386 jump insns because the
849 different types of jumps add different sizes to frags when we're
850 figuring out what sort of jump to choose to reach a given label.
851
852 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
853 branches which are handled by md_estimate_size_before_relax() and
854 i386_generic_table_relax_frag(). */
855
856 /* Types. */
857 #define UNCOND_JUMP 0
858 #define COND_JUMP 1
859 #define COND_JUMP86 2
860 #define BRANCH_PADDING 3
861 #define BRANCH_PREFIX 4
862 #define FUSED_JCC_PADDING 5
863
864 /* Sizes. */
865 #define CODE16 1
866 #define SMALL 0
867 #define SMALL16 (SMALL | CODE16)
868 #define BIG 2
869 #define BIG16 (BIG | CODE16)
870
871 #ifndef INLINE
872 #ifdef __GNUC__
873 #define INLINE __inline__
874 #else
875 #define INLINE
876 #endif
877 #endif
878
879 #define ENCODE_RELAX_STATE(type, size) \
880 ((relax_substateT) (((type) << 2) | (size)))
881 #define TYPE_FROM_RELAX_STATE(s) \
882 ((s) >> 2)
883 #define DISP_SIZE_FROM_RELAX_STATE(s) \
884 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
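/* Worked example: ENCODE_RELAX_STATE (COND_JUMP, BIG) is (1 << 2) | 2,
   i.e. substate 6; TYPE_FROM_RELAX_STATE (6) recovers COND_JUMP, and
   DISP_SIZE_FROM_RELAX_STATE (6) yields 4 displacement bytes.  */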
885
886 /* This table is used by relax_frag to promote short jumps to long
887 ones where necessary. SMALL (short) jumps may be promoted to BIG
888 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
889 don't allow a short jump in a 32 bit code segment to be promoted to
890 a 16 bit offset jump because it's slower (requires data size
891    prefix), and doesn't work unless the destination is in the bottom
892    64k of the code segment (the top 16 bits of eip are zeroed).  */
893
894 const relax_typeS md_relax_table[] =
895 {
896 /* The fields are:
897 1) most positive reach of this state,
898 2) most negative reach of this state,
899 3) how many bytes this mode will have in the variable part of the frag
900 4) which index into the table to try if we can't fit into this one. */
901
902 /* UNCOND_JUMP states. */
903 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
904 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
905 /* dword jmp adds 4 bytes to frag:
906 0 extra opcode bytes, 4 displacement bytes. */
907 {0, 0, 4, 0},
908   /* word jmp adds 2 bytes to frag:
909 0 extra opcode bytes, 2 displacement bytes. */
910 {0, 0, 2, 0},
911
912 /* COND_JUMP states. */
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
914 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
915   /* dword conditionals add 5 bytes to frag:
916 1 extra opcode byte, 4 displacement bytes. */
917 {0, 0, 5, 0},
918 /* word conditionals add 3 bytes to frag:
919 1 extra opcode byte, 2 displacement bytes. */
920 {0, 0, 3, 0},
921
922 /* COND_JUMP86 states. */
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
924 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
925   /* dword conditionals add 5 bytes to frag:
926 1 extra opcode byte, 4 displacement bytes. */
927 {0, 0, 5, 0},
928 /* word conditionals add 4 bytes to frag:
929 1 displacement byte and a 3 byte long branch insn. */
930 {0, 0, 4, 0}
931 };
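/* Reading the table: a conditional jump starts in state
   ENCODE_RELAX_STATE (COND_JUMP, SMALL), with a reach of -127..+128
   bytes; if the target is farther away, relax_frag follows field 4) to
   ENCODE_RELAX_STATE (COND_JUMP, BIG), whose entry says the frag grows
   by 5 bytes (1 extra opcode byte plus a 4-byte displacement).  */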
932
933 static const arch_entry cpu_arch[] =
934 {
935 /* Do not replace the first two entries - i386_target_format()
936 relies on them being there in this order. */
937 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
938 CPU_GENERIC32_FLAGS, 0 },
939 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
940 CPU_GENERIC64_FLAGS, 0 },
941 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
942 CPU_NONE_FLAGS, 0 },
943 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
944 CPU_I186_FLAGS, 0 },
945 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
946 CPU_I286_FLAGS, 0 },
947 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
948 CPU_I386_FLAGS, 0 },
949 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
950 CPU_I486_FLAGS, 0 },
951 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
952 CPU_I586_FLAGS, 0 },
953 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
954 CPU_I686_FLAGS, 0 },
955 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
956 CPU_I586_FLAGS, 0 },
957 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
958 CPU_PENTIUMPRO_FLAGS, 0 },
959 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
960 CPU_P2_FLAGS, 0 },
961 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
962 CPU_P3_FLAGS, 0 },
963 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
964 CPU_P4_FLAGS, 0 },
965 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
966 CPU_CORE_FLAGS, 0 },
967 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
968 CPU_NOCONA_FLAGS, 0 },
969 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
970 CPU_CORE_FLAGS, 1 },
971 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
972 CPU_CORE_FLAGS, 0 },
973 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
974 CPU_CORE2_FLAGS, 1 },
975 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
976 CPU_CORE2_FLAGS, 0 },
977 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
978 CPU_COREI7_FLAGS, 0 },
979 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
980 CPU_L1OM_FLAGS, 0 },
981 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
982 CPU_K1OM_FLAGS, 0 },
983 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
984 CPU_IAMCU_FLAGS, 0 },
985 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
986 CPU_K6_FLAGS, 0 },
987 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
988 CPU_K6_2_FLAGS, 0 },
989 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
990 CPU_ATHLON_FLAGS, 0 },
991 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
992 CPU_K8_FLAGS, 1 },
993 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
994 CPU_K8_FLAGS, 0 },
995 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
996 CPU_K8_FLAGS, 0 },
997 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
998 CPU_AMDFAM10_FLAGS, 0 },
999 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1000 CPU_BDVER1_FLAGS, 0 },
1001 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1002 CPU_BDVER2_FLAGS, 0 },
1003 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1004 CPU_BDVER3_FLAGS, 0 },
1005 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1006 CPU_BDVER4_FLAGS, 0 },
1007 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1008 CPU_ZNVER1_FLAGS, 0 },
1009 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1010 CPU_ZNVER2_FLAGS, 0 },
1011 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1012 CPU_BTVER1_FLAGS, 0 },
1013 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1014 CPU_BTVER2_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1016 CPU_8087_FLAGS, 0 },
1017 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1018 CPU_287_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1020 CPU_387_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1022 CPU_687_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1024 CPU_CMOV_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1026 CPU_FXSR_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1028 CPU_MMX_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1030 CPU_SSE_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1032 CPU_SSE2_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1034 CPU_SSE3_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1036 CPU_SSE4A_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1038 CPU_SSSE3_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1040 CPU_SSE4_1_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1042 CPU_SSE4_2_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1044 CPU_SSE4_2_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1046 CPU_AVX_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1048 CPU_AVX2_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1050 CPU_AVX512F_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1052 CPU_AVX512CD_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1054 CPU_AVX512ER_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1056 CPU_AVX512PF_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1058 CPU_AVX512DQ_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1060 CPU_AVX512BW_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1062 CPU_AVX512VL_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1064 CPU_VMX_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1066 CPU_VMFUNC_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1068 CPU_SMX_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1070 CPU_XSAVE_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1072 CPU_XSAVEOPT_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1074 CPU_XSAVEC_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1076 CPU_XSAVES_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1078 CPU_AES_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1080 CPU_PCLMUL_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1082 CPU_PCLMUL_FLAGS, 1 },
1083 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1084 CPU_FSGSBASE_FLAGS, 0 },
1085 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1086 CPU_RDRND_FLAGS, 0 },
1087 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1088 CPU_F16C_FLAGS, 0 },
1089 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1090 CPU_BMI2_FLAGS, 0 },
1091 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1092 CPU_FMA_FLAGS, 0 },
1093 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1094 CPU_FMA4_FLAGS, 0 },
1095 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1096 CPU_XOP_FLAGS, 0 },
1097 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1098 CPU_LWP_FLAGS, 0 },
1099 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1100 CPU_MOVBE_FLAGS, 0 },
1101 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1102 CPU_CX16_FLAGS, 0 },
1103 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1104 CPU_EPT_FLAGS, 0 },
1105 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1106 CPU_LZCNT_FLAGS, 0 },
1107 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1108 CPU_POPCNT_FLAGS, 0 },
1109 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1110 CPU_HLE_FLAGS, 0 },
1111 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1112 CPU_RTM_FLAGS, 0 },
1113 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1114 CPU_INVPCID_FLAGS, 0 },
1115 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1116 CPU_CLFLUSH_FLAGS, 0 },
1117 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1118 CPU_NOP_FLAGS, 0 },
1119 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1120 CPU_SYSCALL_FLAGS, 0 },
1121 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1122 CPU_RDTSCP_FLAGS, 0 },
1123 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1124 CPU_3DNOW_FLAGS, 0 },
1125 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1126 CPU_3DNOWA_FLAGS, 0 },
1127 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1128 CPU_PADLOCK_FLAGS, 0 },
1129 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1130 CPU_SVME_FLAGS, 1 },
1131 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1132 CPU_SVME_FLAGS, 0 },
1133 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1134 CPU_SSE4A_FLAGS, 0 },
1135 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1136 CPU_ABM_FLAGS, 0 },
1137 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1138 CPU_BMI_FLAGS, 0 },
1139 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1140 CPU_TBM_FLAGS, 0 },
1141 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1142 CPU_ADX_FLAGS, 0 },
1143 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1144 CPU_RDSEED_FLAGS, 0 },
1145 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1146 CPU_PRFCHW_FLAGS, 0 },
1147 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1148 CPU_SMAP_FLAGS, 0 },
1149 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1150 CPU_MPX_FLAGS, 0 },
1151 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1152 CPU_SHA_FLAGS, 0 },
1153 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1154 CPU_CLFLUSHOPT_FLAGS, 0 },
1155 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1156 CPU_PREFETCHWT1_FLAGS, 0 },
1157 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1158 CPU_SE1_FLAGS, 0 },
1159 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1160 CPU_CLWB_FLAGS, 0 },
1161 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1162 CPU_AVX512IFMA_FLAGS, 0 },
1163 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1164 CPU_AVX512VBMI_FLAGS, 0 },
1165 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512_4FMAPS_FLAGS, 0 },
1167 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512_4VNNIW_FLAGS, 0 },
1169 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1171 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_VBMI2_FLAGS, 0 },
1173 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VNNI_FLAGS, 0 },
1175 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_BITALG_FLAGS, 0 },
1177 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1178 CPU_CLZERO_FLAGS, 0 },
1179 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1180 CPU_MWAITX_FLAGS, 0 },
1181 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1182 CPU_OSPKE_FLAGS, 0 },
1183 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1184 CPU_RDPID_FLAGS, 0 },
1185 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1186 CPU_PTWRITE_FLAGS, 0 },
1187 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1188 CPU_IBT_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1190 CPU_SHSTK_FLAGS, 0 },
1191 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1192 CPU_GFNI_FLAGS, 0 },
1193 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1194 CPU_VAES_FLAGS, 0 },
1195 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1196 CPU_VPCLMULQDQ_FLAGS, 0 },
1197 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1198 CPU_WBNOINVD_FLAGS, 0 },
1199 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1200 CPU_PCONFIG_FLAGS, 0 },
1201 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1202 CPU_WAITPKG_FLAGS, 0 },
1203 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1204 CPU_CLDEMOTE_FLAGS, 0 },
1205 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1206 CPU_MOVDIRI_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1208 CPU_MOVDIR64B_FLAGS, 0 },
1209 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1210 CPU_AVX512_BF16_FLAGS, 0 },
1211 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1212 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1213 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1214 CPU_ENQCMD_FLAGS, 0 },
1215 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1216 CPU_SERIALIZE_FLAGS, 0 },
1217 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1218 CPU_RDPRU_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1220 CPU_MCOMMIT_FLAGS, 0 },
1221 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1222 CPU_SEV_ES_FLAGS, 0 },
1223 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1224 CPU_TSXLDTRK_FLAGS, 0 },
1225 };
1226
1227 static const noarch_entry cpu_noarch[] =
1228 {
1229 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1230 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1231 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1232 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1233 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1234 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1235 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1236 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1237 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1238 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1239 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1240 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1241 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1242 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1243 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1244 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1245 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1246 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1247 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1248 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1249 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1250 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1251 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1252 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1253 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1254 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1255 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1256 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1257 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1258 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1259 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1260 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1261 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1262 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1263 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1264 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1265 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1266 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1267 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1268 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1269 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1270 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1271 };
1272
1273 #ifdef I386COFF
1274 /* Like s_lcomm_internal in gas/read.c but the alignment argument
1275    may be omitted.  */
1276
1277 static symbolS *
1278 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1279 {
1280 addressT align = 0;
1281
1282 SKIP_WHITESPACE ();
1283
1284 if (needs_align
1285 && *input_line_pointer == ',')
1286 {
1287 align = parse_align (needs_align - 1);
1288
1289 if (align == (addressT) -1)
1290 return NULL;
1291 }
1292 else
1293 {
1294 if (size >= 8)
1295 align = 3;
1296 else if (size >= 4)
1297 align = 2;
1298 else if (size >= 2)
1299 align = 1;
1300 else
1301 align = 0;
1302 }
1303
1304 bss_alloc (symbolP, size, align);
1305 return symbolP;
1306 }
1307
1308 static void
1309 pe_lcomm (int needs_align)
1310 {
1311 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1312 }
1313 #endif
1314
1315 const pseudo_typeS md_pseudo_table[] =
1316 {
1317 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1318 {"align", s_align_bytes, 0},
1319 #else
1320 {"align", s_align_ptwo, 0},
1321 #endif
1322 {"arch", set_cpu_arch, 0},
1323 #ifndef I386COFF
1324 {"bss", s_bss, 0},
1325 #else
1326 {"lcomm", pe_lcomm, 1},
1327 #endif
1328 {"ffloat", float_cons, 'f'},
1329 {"dfloat", float_cons, 'd'},
1330 {"tfloat", float_cons, 'x'},
1331 {"value", cons, 2},
1332 {"slong", signed_cons, 4},
1333 {"noopt", s_ignore, 0},
1334 {"optim", s_ignore, 0},
1335 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1336 {"code16", set_code_flag, CODE_16BIT},
1337 {"code32", set_code_flag, CODE_32BIT},
1338 #ifdef BFD64
1339 {"code64", set_code_flag, CODE_64BIT},
1340 #endif
1341 {"intel_syntax", set_intel_syntax, 1},
1342 {"att_syntax", set_intel_syntax, 0},
1343 {"intel_mnemonic", set_intel_mnemonic, 1},
1344 {"att_mnemonic", set_intel_mnemonic, 0},
1345 {"allow_index_reg", set_allow_index_reg, 1},
1346 {"disallow_index_reg", set_allow_index_reg, 0},
1347 {"sse_check", set_check, 0},
1348 {"operand_check", set_check, 1},
1349 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1350 {"largecomm", handle_large_common, 0},
1351 #else
1352 {"file", dwarf2_directive_file, 0},
1353 {"loc", dwarf2_directive_loc, 0},
1354 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1355 #endif
1356 #ifdef TE_PE
1357 {"secrel32", pe_directive_secrel, 0},
1358 #endif
1359 {0, 0, 0}
1360 };
1361
1362 /* For interface with expression (). */
1363 extern char *input_line_pointer;
1364
1365 /* Hash table for instruction mnemonic lookup. */
1366 static struct hash_control *op_hash;
1367
1368 /* Hash table for register lookup. */
1369 static struct hash_control *reg_hash;
1370 \f
1371 /* Various efficient no-op patterns for aligning code labels.
1372 Note: Don't try to assemble the instructions in the comments.
1373 0L and 0w are not legal. */
1374 static const unsigned char f32_1[] =
1375 {0x90}; /* nop */
1376 static const unsigned char f32_2[] =
1377 {0x66,0x90}; /* xchg %ax,%ax */
1378 static const unsigned char f32_3[] =
1379 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1380 static const unsigned char f32_4[] =
1381 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1382 static const unsigned char f32_6[] =
1383 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1384 static const unsigned char f32_7[] =
1385 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1386 static const unsigned char f16_3[] =
1387 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1388 static const unsigned char f16_4[] =
1389 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1390 static const unsigned char jump_disp8[] =
1391 {0xeb}; /* jmp disp8 */
1392 static const unsigned char jump32_disp32[] =
1393 {0xe9}; /* jmp disp32 */
1394 static const unsigned char jump16_disp32[] =
1395 {0x66,0xe9}; /* jmp disp32 */
1396 /* 32-bit NOP patterns.  */
1397 static const unsigned char *const f32_patt[] = {
1398 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1399 };
1400 /* 16-bit NOP patterns.  */
1401 static const unsigned char *const f16_patt[] = {
1402 f32_1, f32_2, f16_3, f16_4
1403 };
1404 /* nopl (%[re]ax) */
1405 static const unsigned char alt_3[] =
1406 {0x0f,0x1f,0x00};
1407 /* nopl 0(%[re]ax) */
1408 static const unsigned char alt_4[] =
1409 {0x0f,0x1f,0x40,0x00};
1410 /* nopl 0(%[re]ax,%[re]ax,1) */
1411 static const unsigned char alt_5[] =
1412 {0x0f,0x1f,0x44,0x00,0x00};
1413 /* nopw 0(%[re]ax,%[re]ax,1) */
1414 static const unsigned char alt_6[] =
1415 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1416 /* nopl 0L(%[re]ax) */
1417 static const unsigned char alt_7[] =
1418 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1419 /* nopl 0L(%[re]ax,%[re]ax,1) */
1420 static const unsigned char alt_8[] =
1421 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1422 /* nopw 0L(%[re]ax,%[re]ax,1) */
1423 static const unsigned char alt_9[] =
1424 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1425 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1426 static const unsigned char alt_10[] =
1427 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1428 /* data16 nopw %cs:0L(%eax,%eax,1) */
1429 static const unsigned char alt_11[] =
1430 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1431 /* 32-bit and 64-bit NOP patterns.  */
1432 static const unsigned char *const alt_patt[] = {
1433 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1434 alt_9, alt_10, alt_11
1435 };
1436
1437 /* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
1438 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1439
1440 static void
1441 i386_output_nops (char *where, const unsigned char *const *patt,
1442 int count, int max_single_nop_size)
1444 {
1445 /* Place the longer NOP first. */
1446 int last;
1447 int offset;
1448 const unsigned char *nops;
1449
1450 if (max_single_nop_size < 1)
1451 {
1452 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1453 max_single_nop_size);
1454 return;
1455 }
1456
1457 nops = patt[max_single_nop_size - 1];
1458
1459   /* Use the smaller one if the requested one isn't available.  */
1460 if (nops == NULL)
1461 {
1462 max_single_nop_size--;
1463 nops = patt[max_single_nop_size - 1];
1464 }
1465
1466 last = count % max_single_nop_size;
1467
1468 count -= last;
1469 for (offset = 0; offset < count; offset += max_single_nop_size)
1470 memcpy (where + offset, nops, max_single_nop_size);
1471
1472 if (last)
1473 {
1474 nops = patt[last - 1];
1475 if (nops == NULL)
1476 {
1477 /* Use the smaller one plus one-byte NOP if the needed one
1478 isn't available. */
1479 last--;
1480 nops = patt[last - 1];
1481 memcpy (where + offset, nops, last);
1482 where[offset + last] = *patt[0];
1483 }
1484 else
1485 memcpy (where + offset, nops, last);
1486 }
1487 }
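/* Example: COUNT = 10 with MAX_SINGLE_NOP_SIZE = 4 emits two 4-byte NOPs
   followed by the 2-byte pattern.  When a requested length has no
   pattern (f32_patt[4] is NULL, as there is no 5-byte entry), the next
   smaller pattern is used, topped up with a one-byte NOP if needed.  */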
1488
1489 static INLINE int
1490 fits_in_imm7 (offsetT num)
1491 {
1492 return (num & 0x7f) == num;
1493 }
1494
1495 static INLINE int
1496 fits_in_imm31 (offsetT num)
1497 {
1498 return (num & 0x7fffffff) == num;
1499 }
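/* These are unsigned range checks: fits_in_imm7 (127) and
   fits_in_imm31 (0x7fffffff) hold, while negative values such as -1 do
   not, because masking strips the sign bits before the comparison.  */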
1500
1501 /* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
1502 single NOP instruction LIMIT. */
1503
1504 void
1505 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1506 {
1507 const unsigned char *const *patt = NULL;
1508 int max_single_nop_size;
1509 /* Maximum number of NOPs before switching to jump over NOPs. */
1510 int max_number_of_nops;
1511
1512 switch (fragP->fr_type)
1513 {
1514 case rs_fill_nop:
1515 case rs_align_code:
1516 break;
1517 case rs_machine_dependent:
1518 /* Allow NOP padding for jumps and calls. */
1519 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1520 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1521 break;
1522 /* Fall through. */
1523 default:
1524 return;
1525 }
1526
1527 /* We need to decide which NOP sequence to use for 32bit and
1528 64bit. When -mtune= is used:
1529
1530 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1531 PROCESSOR_GENERIC32, f32_patt will be used.
1532 2. For the rest, alt_patt will be used.
1533
1534 When -mtune= isn't used, alt_patt will be used if
1535 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1536 be used.
1537
1538 When -march= or .arch is used, we can't use anything beyond
1539 cpu_arch_isa_flags. */
1540
1541 if (flag_code == CODE_16BIT)
1542 {
1543 patt = f16_patt;
1544 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1545 /* Limit number of NOPs to 2 in 16-bit mode. */
1546 max_number_of_nops = 2;
1547 }
1548 else
1549 {
1550 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1551 {
1552 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1553 switch (cpu_arch_tune)
1554 {
1555 case PROCESSOR_UNKNOWN:
1556 /* We use cpu_arch_isa_flags to check if we SHOULD
1557 optimize with nops. */
1558 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1559 patt = alt_patt;
1560 else
1561 patt = f32_patt;
1562 break;
1563 case PROCESSOR_PENTIUM4:
1564 case PROCESSOR_NOCONA:
1565 case PROCESSOR_CORE:
1566 case PROCESSOR_CORE2:
1567 case PROCESSOR_COREI7:
1568 case PROCESSOR_L1OM:
1569 case PROCESSOR_K1OM:
1570 case PROCESSOR_GENERIC64:
1571 case PROCESSOR_K6:
1572 case PROCESSOR_ATHLON:
1573 case PROCESSOR_K8:
1574 case PROCESSOR_AMDFAM10:
1575 case PROCESSOR_BD:
1576 case PROCESSOR_ZNVER:
1577 case PROCESSOR_BT:
1578 patt = alt_patt;
1579 break;
1580 case PROCESSOR_I386:
1581 case PROCESSOR_I486:
1582 case PROCESSOR_PENTIUM:
1583 case PROCESSOR_PENTIUMPRO:
1584 case PROCESSOR_IAMCU:
1585 case PROCESSOR_GENERIC32:
1586 patt = f32_patt;
1587 break;
1588 }
1589 }
1590 else
1591 {
1592 switch (fragP->tc_frag_data.tune)
1593 {
1594 case PROCESSOR_UNKNOWN:
1595 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1596 PROCESSOR_UNKNOWN. */
1597 abort ();
1598 break;
1599
1600 case PROCESSOR_I386:
1601 case PROCESSOR_I486:
1602 case PROCESSOR_PENTIUM:
1603 case PROCESSOR_IAMCU:
1604 case PROCESSOR_K6:
1605 case PROCESSOR_ATHLON:
1606 case PROCESSOR_K8:
1607 case PROCESSOR_AMDFAM10:
1608 case PROCESSOR_BD:
1609 case PROCESSOR_ZNVER:
1610 case PROCESSOR_BT:
1611 case PROCESSOR_GENERIC32:
1612 /* We use cpu_arch_isa_flags to check if we CAN optimize
1613 with nops. */
1614 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1615 patt = alt_patt;
1616 else
1617 patt = f32_patt;
1618 break;
1619 case PROCESSOR_PENTIUMPRO:
1620 case PROCESSOR_PENTIUM4:
1621 case PROCESSOR_NOCONA:
1622 case PROCESSOR_CORE:
1623 case PROCESSOR_CORE2:
1624 case PROCESSOR_COREI7:
1625 case PROCESSOR_L1OM:
1626 case PROCESSOR_K1OM:
1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1628 patt = alt_patt;
1629 else
1630 patt = f32_patt;
1631 break;
1632 case PROCESSOR_GENERIC64:
1633 patt = alt_patt;
1634 break;
1635 }
1636 }
1637
1638 if (patt == f32_patt)
1639 {
1640 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1641 /* Limit number of NOPs to 2 for older processors. */
1642 max_number_of_nops = 2;
1643 }
1644 else
1645 {
1646 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1647 /* Limit number of NOPs to 7 for newer processors. */
1648 max_number_of_nops = 7;
1649 }
1650 }
1651
1652 if (limit == 0)
1653 limit = max_single_nop_size;
1654
1655 if (fragP->fr_type == rs_fill_nop)
1656 {
1657 /* Output NOPs for .nop directive. */
1658 if (limit > max_single_nop_size)
1659 {
1660 as_bad_where (fragP->fr_file, fragP->fr_line,
1661 _("invalid single nop size: %d "
1662 "(expect within [0, %d])"),
1663 limit, max_single_nop_size);
1664 return;
1665 }
1666 }
1667 else if (fragP->fr_type != rs_machine_dependent)
1668 fragP->fr_var = count;
1669
1670 if ((count / max_single_nop_size) > max_number_of_nops)
1671 {
1672 /* Generate jump over NOPs. */
1673 offsetT disp = count - 2;
1674 if (fits_in_imm7 (disp))
1675 {
1676 /* Use "jmp disp8" if possible. */
1677 count = disp;
1678 where[0] = jump_disp8[0];
1679 where[1] = count;
1680 where += 2;
1681 }
1682 else
1683 {
1684 unsigned int size_of_jump;
1685
1686 if (flag_code == CODE_16BIT)
1687 {
1688 where[0] = jump16_disp32[0];
1689 where[1] = jump16_disp32[1];
1690 size_of_jump = 2;
1691 }
1692 else
1693 {
1694 where[0] = jump32_disp32[0];
1695 size_of_jump = 1;
1696 }
1697
1698 count -= size_of_jump + 4;
1699 if (!fits_in_imm31 (count))
1700 {
1701 as_bad_where (fragP->fr_file, fragP->fr_line,
1702 _("jump over nop padding out of range"));
1703 return;
1704 }
1705
1706 md_number_to_chars (where + size_of_jump, count, 4);
1707 where += size_of_jump + 4;
1708 }
1709 }
1710
1711 /* Generate multiple NOPs. */
1712 i386_output_nops (where, patt, count, limit);
1713 }
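/* Example of the jump-over path: with alt_patt (11-byte maximum, at most
   7 NOPs), a request for 100 bytes exceeds 7 * 11, so a two-byte
   "jmp disp8" (0xeb 0x62) is emitted first and the remaining 98 bytes
   are filled with NOPs that are never executed.  */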
1714
1715 static INLINE int
1716 operand_type_all_zero (const union i386_operand_type *x)
1717 {
1718 switch (ARRAY_SIZE(x->array))
1719 {
1720 case 3:
1721 if (x->array[2])
1722 return 0;
1723 /* Fall through. */
1724 case 2:
1725 if (x->array[1])
1726 return 0;
1727 /* Fall through. */
1728 case 1:
1729 return !x->array[0];
1730 default:
1731 abort ();
1732 }
1733 }
1734
1735 static INLINE void
1736 operand_type_set (union i386_operand_type *x, unsigned int v)
1737 {
1738 switch (ARRAY_SIZE(x->array))
1739 {
1740 case 3:
1741 x->array[2] = v;
1742 /* Fall through. */
1743 case 2:
1744 x->array[1] = v;
1745 /* Fall through. */
1746 case 1:
1747 x->array[0] = v;
1749       break;
1750 default:
1751 abort ();
1752 }
1753
1754 x->bitfield.class = ClassNone;
1755 x->bitfield.instance = InstanceNone;
1756 }
1757
1758 static INLINE int
1759 operand_type_equal (const union i386_operand_type *x,
1760 const union i386_operand_type *y)
1761 {
1762 switch (ARRAY_SIZE(x->array))
1763 {
1764 case 3:
1765 if (x->array[2] != y->array[2])
1766 return 0;
1767 /* Fall through. */
1768 case 2:
1769 if (x->array[1] != y->array[1])
1770 return 0;
1771 /* Fall through. */
1772 case 1:
1773 return x->array[0] == y->array[0];
1775 default:
1776 abort ();
1777 }
1778 }
1779
1780 static INLINE int
1781 cpu_flags_all_zero (const union i386_cpu_flags *x)
1782 {
1783 switch (ARRAY_SIZE(x->array))
1784 {
1785 case 4:
1786 if (x->array[3])
1787 return 0;
1788 /* Fall through. */
1789 case 3:
1790 if (x->array[2])
1791 return 0;
1792 /* Fall through. */
1793 case 2:
1794 if (x->array[1])
1795 return 0;
1796 /* Fall through. */
1797 case 1:
1798 return !x->array[0];
1799 default:
1800 abort ();
1801 }
1802 }
1803
1804 static INLINE int
1805 cpu_flags_equal (const union i386_cpu_flags *x,
1806 const union i386_cpu_flags *y)
1807 {
1808 switch (ARRAY_SIZE(x->array))
1809 {
1810 case 4:
1811 if (x->array[3] != y->array[3])
1812 return 0;
1813 /* Fall through. */
1814 case 3:
1815 if (x->array[2] != y->array[2])
1816 return 0;
1817 /* Fall through. */
1818 case 2:
1819 if (x->array[1] != y->array[1])
1820 return 0;
1821 /* Fall through. */
1822 case 1:
1823 return x->array[0] == y->array[0];
1825 default:
1826 abort ();
1827 }
1828 }
1829
1830 static INLINE int
1831 cpu_flags_check_cpu64 (i386_cpu_flags f)
1832 {
1833 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1834 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1835 }
1836
1837 static INLINE i386_cpu_flags
1838 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1839 {
1840 switch (ARRAY_SIZE (x.array))
1841 {
1842 case 4:
1843 x.array [3] &= y.array [3];
1844 /* Fall through. */
1845 case 3:
1846 x.array [2] &= y.array [2];
1847 /* Fall through. */
1848 case 2:
1849 x.array [1] &= y.array [1];
1850 /* Fall through. */
1851 case 1:
1852 x.array [0] &= y.array [0];
1853 break;
1854 default:
1855 abort ();
1856 }
1857 return x;
1858 }
1859
1860 static INLINE i386_cpu_flags
1861 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1862 {
1863 switch (ARRAY_SIZE (x.array))
1864 {
1865 case 4:
1866 x.array [3] |= y.array [3];
1867 /* Fall through. */
1868 case 3:
1869 x.array [2] |= y.array [2];
1870 /* Fall through. */
1871 case 2:
1872 x.array [1] |= y.array [1];
1873 /* Fall through. */
1874 case 1:
1875 x.array [0] |= y.array [0];
1876 break;
1877 default:
1878 abort ();
1879 }
1880 return x;
1881 }
1882
1883 static INLINE i386_cpu_flags
1884 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1885 {
1886 switch (ARRAY_SIZE (x.array))
1887 {
1888 case 4:
1889 x.array [3] &= ~y.array [3];
1890 /* Fall through. */
1891 case 3:
1892 x.array [2] &= ~y.array [2];
1893 /* Fall through. */
1894 case 2:
1895 x.array [1] &= ~y.array [1];
1896 /* Fall through. */
1897 case 1:
1898 x.array [0] &= ~y.array [0];
1899 break;
1900 default:
1901 abort ();
1902 }
1903 return x;
1904 }
1905
1906 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1907
1908 #define CPU_FLAGS_ARCH_MATCH 0x1
1909 #define CPU_FLAGS_64BIT_MATCH 0x2
1910
1911 #define CPU_FLAGS_PERFECT_MATCH \
1912 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1913
1914 /* Return CPU flags match bits. */
1915
1916 static int
1917 cpu_flags_match (const insn_template *t)
1918 {
1919 i386_cpu_flags x = t->cpu_flags;
1920 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1921
1922 x.bitfield.cpu64 = 0;
1923 x.bitfield.cpuno64 = 0;
1924
1925 if (cpu_flags_all_zero (&x))
1926 {
1927 /* This instruction is available on all archs. */
1928 match |= CPU_FLAGS_ARCH_MATCH;
1929 }
1930 else
1931 {
1932 /* This instruction is available only on some archs. */
1933 i386_cpu_flags cpu = cpu_arch_flags;
1934
1935 /* AVX512VL is not a standalone feature - match it and then strip it. */
1936 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1937 return match;
1938 x.bitfield.cpuavx512vl = 0;
1939
1940 cpu = cpu_flags_and (x, cpu);
1941 if (!cpu_flags_all_zero (&cpu))
1942 {
1943 if (x.bitfield.cpuavx)
1944 {
1945 /* We need to check a few extra flags with AVX. */
1946 if (cpu.bitfield.cpuavx
1947 && (!t->opcode_modifier.sse2avx
1948 || (sse2avx && !i.prefix[DATA_PREFIX]))
1949 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1950 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1951 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1952 match |= CPU_FLAGS_ARCH_MATCH;
1953 }
1954 else if (x.bitfield.cpuavx512f)
1955 {
1956 /* We need to check a few extra flags with AVX512F. */
1957 if (cpu.bitfield.cpuavx512f
1958 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1959 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1960 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
1963 else
1964 match |= CPU_FLAGS_ARCH_MATCH;
1965 }
1966 }
1967 return match;
1968 }
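
/* For example (hypothetical invocations): a template requiring CpuAVX
matched under -march=core2 yields only CPU_FLAGS_64BIT_MATCH, while
the same template under -march=sandybridge in 64-bit mode yields
CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH, i.e.
CPU_FLAGS_PERFECT_MATCH. */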
1969
1970 static INLINE i386_operand_type
1971 operand_type_and (i386_operand_type x, i386_operand_type y)
1972 {
1973 if (x.bitfield.class != y.bitfield.class)
1974 x.bitfield.class = ClassNone;
1975 if (x.bitfield.instance != y.bitfield.instance)
1976 x.bitfield.instance = InstanceNone;
1977
1978 switch (ARRAY_SIZE (x.array))
1979 {
1980 case 3:
1981 x.array [2] &= y.array [2];
1982 /* Fall through. */
1983 case 2:
1984 x.array [1] &= y.array [1];
1985 /* Fall through. */
1986 case 1:
1987 x.array [0] &= y.array [0];
1988 break;
1989 default:
1990 abort ();
1991 }
1992 return x;
1993 }
1994
1995 static INLINE i386_operand_type
1996 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1997 {
1998 gas_assert (y.bitfield.class == ClassNone);
1999 gas_assert (y.bitfield.instance == InstanceNone);
2000
2001 switch (ARRAY_SIZE (x.array))
2002 {
2003 case 3:
2004 x.array [2] &= ~y.array [2];
2005 /* Fall through. */
2006 case 2:
2007 x.array [1] &= ~y.array [1];
2008 /* Fall through. */
2009 case 1:
2010 x.array [0] &= ~y.array [0];
2011 break;
2012 default:
2013 abort ();
2014 }
2015 return x;
2016 }
2017
2018 static INLINE i386_operand_type
2019 operand_type_or (i386_operand_type x, i386_operand_type y)
2020 {
2021 gas_assert (x.bitfield.class == ClassNone ||
2022 y.bitfield.class == ClassNone ||
2023 x.bitfield.class == y.bitfield.class);
2024 gas_assert (x.bitfield.instance == InstanceNone ||
2025 y.bitfield.instance == InstanceNone ||
2026 x.bitfield.instance == y.bitfield.instance);
2027
2028 switch (ARRAY_SIZE (x.array))
2029 {
2030 case 3:
2031 x.array [2] |= y.array [2];
2032 /* Fall through. */
2033 case 2:
2034 x.array [1] |= y.array [1];
2035 /* Fall through. */
2036 case 1:
2037 x.array [0] |= y.array [0];
2038 break;
2039 default:
2040 abort ();
2041 }
2042 return x;
2043 }
2044
2045 static INLINE i386_operand_type
2046 operand_type_xor (i386_operand_type x, i386_operand_type y)
2047 {
2048 gas_assert (y.bitfield.class == ClassNone);
2049 gas_assert (y.bitfield.instance == InstanceNone);
2050
2051 switch (ARRAY_SIZE (x.array))
2052 {
2053 case 3:
2054 x.array [2] ^= y.array [2];
2055 /* Fall through. */
2056 case 2:
2057 x.array [1] ^= y.array [1];
2058 /* Fall through. */
2059 case 1:
2060 x.array [0] ^= y.array [0];
2061 break;
2062 default:
2063 abort ();
2064 }
2065 return x;
2066 }
2067
2068 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2069 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2070 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2071 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2072 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2073 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2074 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2075 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2076 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2077 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2078 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2079 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2080 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2081 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2082 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2083 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2084 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2085
2086 enum operand_type
2087 {
2088 reg,
2089 imm,
2090 disp,
2091 anymem
2092 };
2093
2094 static INLINE int
2095 operand_type_check (i386_operand_type t, enum operand_type c)
2096 {
2097 switch (c)
2098 {
2099 case reg:
2100 return t.bitfield.class == Reg;
2101
2102 case imm:
2103 return (t.bitfield.imm8
2104 || t.bitfield.imm8s
2105 || t.bitfield.imm16
2106 || t.bitfield.imm32
2107 || t.bitfield.imm32s
2108 || t.bitfield.imm64);
2109
2110 case disp:
2111 return (t.bitfield.disp8
2112 || t.bitfield.disp16
2113 || t.bitfield.disp32
2114 || t.bitfield.disp32s
2115 || t.bitfield.disp64);
2116
2117 case anymem:
2118 return (t.bitfield.disp8
2119 || t.bitfield.disp16
2120 || t.bitfield.disp32
2121 || t.bitfield.disp32s
2122 || t.bitfield.disp64
2123 || t.bitfield.baseindex);
2124
2125 default:
2126 abort ();
2127 }
2128
2129 return 0;
2130 }
2131
2132 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133 between operand GIVEN and operand WANTED for instruction template T. */
2134
2135 static INLINE int
2136 match_operand_size (const insn_template *t, unsigned int wanted,
2137 unsigned int given)
2138 {
2139 return !((i.types[given].bitfield.byte
2140 && !t->operand_types[wanted].bitfield.byte)
2141 || (i.types[given].bitfield.word
2142 && !t->operand_types[wanted].bitfield.word)
2143 || (i.types[given].bitfield.dword
2144 && !t->operand_types[wanted].bitfield.dword)
2145 || (i.types[given].bitfield.qword
2146 && !t->operand_types[wanted].bitfield.qword)
2147 || (i.types[given].bitfield.tbyte
2148 && !t->operand_types[wanted].bitfield.tbyte));
2149 }
2150
2151 /* Return 1 if there is no conflict in SIMD register between operand
2152 GIVEN and operand WANTED for instruction template T. */
2153
2154 static INLINE int
2155 match_simd_size (const insn_template *t, unsigned int wanted,
2156 unsigned int given)
2157 {
2158 return !((i.types[given].bitfield.xmmword
2159 && !t->operand_types[wanted].bitfield.xmmword)
2160 || (i.types[given].bitfield.ymmword
2161 && !t->operand_types[wanted].bitfield.ymmword)
2162 || (i.types[given].bitfield.zmmword
2163 && !t->operand_types[wanted].bitfield.zmmword));
2164 }
2165
2166 /* Return 1 if there is no conflict in any size between operand GIVEN
2167 and operand WANTED for instruction template T. */
2168
2169 static INLINE int
2170 match_mem_size (const insn_template *t, unsigned int wanted,
2171 unsigned int given)
2172 {
2173 return (match_operand_size (t, wanted, given)
2174 && !((i.types[given].bitfield.unspecified
2175 && !i.broadcast
2176 && !t->operand_types[wanted].bitfield.unspecified)
2177 || (i.types[given].bitfield.fword
2178 && !t->operand_types[wanted].bitfield.fword)
2179 /* For scalar opcode templates to allow register and memory
2180 operands at the same time, some special casing is needed
2181 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2182 down-conversion vpmov*. */
2183 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2184 && t->operand_types[wanted].bitfield.byte
2185 + t->operand_types[wanted].bitfield.word
2186 + t->operand_types[wanted].bitfield.dword
2187 + t->operand_types[wanted].bitfield.qword
2188 > !!t->opcode_modifier.broadcast)
2189 ? (i.types[given].bitfield.xmmword
2190 || i.types[given].bitfield.ymmword
2191 || i.types[given].bitfield.zmmword)
2192 : !match_simd_size(t, wanted, given))));
2193 }
2194
2195 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2196 operands for instruction template T, and it has MATCH_REVERSE set if there
2197 is no size conflict on any operands for the template with operands reversed
2198 (and the template allows for reversing in the first place). */
2199
2200 #define MATCH_STRAIGHT 1
2201 #define MATCH_REVERSE 2
2202
2203 static INLINE unsigned int
2204 operand_size_match (const insn_template *t)
2205 {
2206 unsigned int j, match = MATCH_STRAIGHT;
2207
2208 /* Don't check non-absolute jump instructions. */
2209 if (t->opcode_modifier.jump
2210 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2211 return match;
2212
2213 /* Check memory and accumulator operand size. */
2214 for (j = 0; j < i.operands; j++)
2215 {
2216 if (i.types[j].bitfield.class != Reg
2217 && i.types[j].bitfield.class != RegSIMD
2218 && t->opcode_modifier.anysize)
2219 continue;
2220
2221 if (t->operand_types[j].bitfield.class == Reg
2222 && !match_operand_size (t, j, j))
2223 {
2224 match = 0;
2225 break;
2226 }
2227
2228 if (t->operand_types[j].bitfield.class == RegSIMD
2229 && !match_simd_size (t, j, j))
2230 {
2231 match = 0;
2232 break;
2233 }
2234
2235 if (t->operand_types[j].bitfield.instance == Accum
2236 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2237 {
2238 match = 0;
2239 break;
2240 }
2241
2242 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2243 {
2244 match = 0;
2245 break;
2246 }
2247 }
2248
2249 if (!t->opcode_modifier.d)
2250 {
2251 mismatch:
2252 if (!match)
2253 i.error = operand_size_mismatch;
2254 return match;
2255 }
2256
2257 /* Check reverse. */
2258 gas_assert (i.operands >= 2 && i.operands <= 3);
2259
2260 for (j = 0; j < i.operands; j++)
2261 {
2262 unsigned int given = i.operands - j - 1;
2263
2264 if (t->operand_types[j].bitfield.class == Reg
2265 && !match_operand_size (t, j, given))
2266 goto mismatch;
2267
2268 if (t->operand_types[j].bitfield.class == RegSIMD
2269 && !match_simd_size (t, j, given))
2270 goto mismatch;
2271
2272 if (t->operand_types[j].bitfield.instance == Accum
2273 && (!match_operand_size (t, j, given)
2274 || !match_simd_size (t, j, given)))
2275 goto mismatch;
2276
2277 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2278 goto mismatch;
2279 }
2280
2281 return match | MATCH_REVERSE;
2282 }
2283
2284 static INLINE int
2285 operand_type_match (i386_operand_type overlap,
2286 i386_operand_type given)
2287 {
2288 i386_operand_type temp = overlap;
2289
2290 temp.bitfield.unspecified = 0;
2291 temp.bitfield.byte = 0;
2292 temp.bitfield.word = 0;
2293 temp.bitfield.dword = 0;
2294 temp.bitfield.fword = 0;
2295 temp.bitfield.qword = 0;
2296 temp.bitfield.tbyte = 0;
2297 temp.bitfield.xmmword = 0;
2298 temp.bitfield.ymmword = 0;
2299 temp.bitfield.zmmword = 0;
2300 if (operand_type_all_zero (&temp))
2301 goto mismatch;
2302
2303 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2304 return 1;
2305
2306 mismatch:
2307 i.error = operand_type_mismatch;
2308 return 0;
2309 }
2310
2311 /* If given types g0 and g1 are registers they must be of the same type
2312 unless the expected operand type register overlap is null.
2313 Some Intel syntax memory operand size checking also happens here. */
2314
2315 static INLINE int
2316 operand_type_register_match (i386_operand_type g0,
2317 i386_operand_type t0,
2318 i386_operand_type g1,
2319 i386_operand_type t1)
2320 {
2321 if (g0.bitfield.class != Reg
2322 && g0.bitfield.class != RegSIMD
2323 && (!operand_type_check (g0, anymem)
2324 || g0.bitfield.unspecified
2325 || (t0.bitfield.class != Reg
2326 && t0.bitfield.class != RegSIMD)))
2327 return 1;
2328
2329 if (g1.bitfield.class != Reg
2330 && g1.bitfield.class != RegSIMD
2331 && (!operand_type_check (g1, anymem)
2332 || g1.bitfield.unspecified
2333 || (t1.bitfield.class != Reg
2334 && t1.bitfield.class != RegSIMD)))
2335 return 1;
2336
2337 if (g0.bitfield.byte == g1.bitfield.byte
2338 && g0.bitfield.word == g1.bitfield.word
2339 && g0.bitfield.dword == g1.bitfield.dword
2340 && g0.bitfield.qword == g1.bitfield.qword
2341 && g0.bitfield.xmmword == g1.bitfield.xmmword
2342 && g0.bitfield.ymmword == g1.bitfield.ymmword
2343 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2344 return 1;
2345
2346 if (!(t0.bitfield.byte & t1.bitfield.byte)
2347 && !(t0.bitfield.word & t1.bitfield.word)
2348 && !(t0.bitfield.dword & t1.bitfield.dword)
2349 && !(t0.bitfield.qword & t1.bitfield.qword)
2350 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2351 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2352 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2353 return 1;
2354
2355 i.error = register_type_mismatch;
2356
2357 return 0;
2358 }
2359
2360 static INLINE unsigned int
2361 register_number (const reg_entry *r)
2362 {
2363 unsigned int nr = r->reg_num;
2364
2365 if (r->reg_flags & RegRex)
2366 nr += 8;
2367
2368 if (r->reg_flags & RegVRex)
2369 nr += 16;
2370
2371 return nr;
2372 }
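
/* For example, %r12 is stored as reg_num 4 with RegRex set and maps
to 12, while %xmm20 is stored as reg_num 4 with RegVRex set and
maps to 20. */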
2373
2374 static INLINE unsigned int
2375 mode_from_disp_size (i386_operand_type t)
2376 {
2377 if (t.bitfield.disp8)
2378 return 1;
2379 else if (t.bitfield.disp16
2380 || t.bitfield.disp32
2381 || t.bitfield.disp32s)
2382 return 2;
2383 else
2384 return 0;
2385 }
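
/* The value is the initial ModRM.mode guess: a Disp8 operand yields 1
(one trailing displacement byte), Disp16/Disp32/Disp32S yield 2 (a
two- or four-byte displacement, depending on address size), and 0
means no displacement at all. */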
2386
2387 static INLINE int
2388 fits_in_signed_byte (addressT num)
2389 {
2390 return num + 0x80 <= 0xff;
2391 }
2392
2393 static INLINE int
2394 fits_in_unsigned_byte (addressT num)
2395 {
2396 return num <= 0xff;
2397 }
2398
2399 static INLINE int
2400 fits_in_unsigned_word (addressT num)
2401 {
2402 return num <= 0xffff;
2403 }
2404
2405 static INLINE int
2406 fits_in_signed_word (addressT num)
2407 {
2408 return num + 0x8000 <= 0xffff;
2409 }
2410
2411 static INLINE int
2412 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2413 {
2414 #ifndef BFD64
2415 return 1;
2416 #else
2417 return num + 0x80000000 <= 0xffffffff;
2418 #endif
2419 } /* fits_in_signed_long() */
2420
2421 static INLINE int
2422 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2423 {
2424 #ifndef BFD64
2425 return 1;
2426 #else
2427 return num <= 0xffffffff;
2428 #endif
2429 } /* fits_in_unsigned_long() */
2430
2431 static INLINE int
2432 fits_in_disp8 (offsetT num)
2433 {
2434 int shift = i.memshift;
2435 unsigned int mask;
2436
2437 if (shift == -1)
2438 abort ();
2439
2440 mask = (1 << shift) - 1;
2441
2442 /* Return 0 if NUM isn't properly aligned. */
2443 if ((num & mask))
2444 return 0;
2445
2446 /* Check if NUM will fit in 8bit after shift. */
2447 return fits_in_signed_byte (num >> shift);
2448 }
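
/* Worked example: for an EVEX insn whose memory operand covers 64
bytes, i.memshift is 6. A displacement of 256 is aligned
(256 & 63 == 0) and 256 >> 6 == 4 fits in a signed byte, so it can
be emitted as the compressed disp8 value 4; a displacement of 260
fails the alignment check and needs a full disp32. */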
2449
2450 static INLINE int
2451 fits_in_imm4 (offsetT num)
2452 {
2453 return (num & 0xf) == num;
2454 }
2455
2456 static i386_operand_type
2457 smallest_imm_type (offsetT num)
2458 {
2459 i386_operand_type t;
2460
2461 operand_type_set (&t, 0);
2462 t.bitfield.imm64 = 1;
2463
2464 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2465 {
2466 /* This code is disabled on the 486 because all the Imm1 forms
2467 in the opcode table are slower on the i486. They're the
2468 versions with the implicitly specified single-position
2469 displacement, which has another syntax if you really want to
2470 use that form. */
2471 t.bitfield.imm1 = 1;
2472 t.bitfield.imm8 = 1;
2473 t.bitfield.imm8s = 1;
2474 t.bitfield.imm16 = 1;
2475 t.bitfield.imm32 = 1;
2476 t.bitfield.imm32s = 1;
2477 }
2478 else if (fits_in_signed_byte (num))
2479 {
2480 t.bitfield.imm8 = 1;
2481 t.bitfield.imm8s = 1;
2482 t.bitfield.imm16 = 1;
2483 t.bitfield.imm32 = 1;
2484 t.bitfield.imm32s = 1;
2485 }
2486 else if (fits_in_unsigned_byte (num))
2487 {
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm16 = 1;
2490 t.bitfield.imm32 = 1;
2491 t.bitfield.imm32s = 1;
2492 }
2493 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2494 {
2495 t.bitfield.imm16 = 1;
2496 t.bitfield.imm32 = 1;
2497 t.bitfield.imm32s = 1;
2498 }
2499 else if (fits_in_signed_long (num))
2500 {
2501 t.bitfield.imm32 = 1;
2502 t.bitfield.imm32s = 1;
2503 }
2504 else if (fits_in_unsigned_long (num))
2505 t.bitfield.imm32 = 1;
2506
2507 return t;
2508 }
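
/* Sample classifications: 1 additionally gets Imm1 (except when
tuning for the i486); 0x80 fits an unsigned but not a signed byte,
so it gets imm8/imm16/imm32/imm32s but not imm8s; and 0x123456789
fits no 32-bit type and keeps only the initial imm64 bit. */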
2509
2510 static offsetT
2511 offset_in_range (offsetT val, int size)
2512 {
2513 addressT mask;
2514
2515 switch (size)
2516 {
2517 case 1: mask = ((addressT) 1 << 8) - 1; break;
2518 case 2: mask = ((addressT) 1 << 16) - 1; break;
2519 case 4: mask = ((addressT) 2 << 31) - 1; break;
2520 #ifdef BFD64
2521 case 8: mask = ((addressT) 2 << 63) - 1; break;
2522 #endif
2523 default: abort ();
2524 }
2525
2526 #ifdef BFD64
2527 /* If BFD64, sign extend val for 32bit address mode. */
2528 if (flag_code != CODE_64BIT
2529 || i.prefix[ADDR_PREFIX])
2530 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2531 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2532 #endif
2533
2534 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2535 {
2536 char buf1[40], buf2[40];
2537
2538 sprint_value (buf1, val);
2539 sprint_value (buf2, val & mask);
2540 as_warn (_("%s shortened to %s"), buf1, buf2);
2541 }
2542 return val & mask;
2543 }
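
/* For instance, offset_in_range (0x1234, 1) warns that 0x1234 was
shortened and returns 0x34, whereas offset_in_range (-1, 2) returns
0xffff silently because every discarded bit is a copy of the sign
bit. */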
2544
2545 enum PREFIX_GROUP
2546 {
2547 PREFIX_EXIST = 0,
2548 PREFIX_LOCK,
2549 PREFIX_REP,
2550 PREFIX_DS,
2551 PREFIX_OTHER
2552 };
2553
2554 /* Returns
2555 a. PREFIX_EXIST if attempting to add a prefix where one from the
2556 same class already exists.
2557 b. PREFIX_LOCK if lock prefix is added.
2558 c. PREFIX_REP if rep/repne prefix is added.
2559 d. PREFIX_DS if ds prefix is added.
2560 e. PREFIX_OTHER if other prefix is added.
2561 */
2562
2563 static enum PREFIX_GROUP
2564 add_prefix (unsigned int prefix)
2565 {
2566 enum PREFIX_GROUP ret = PREFIX_OTHER;
2567 unsigned int q;
2568
2569 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2570 && flag_code == CODE_64BIT)
2571 {
2572 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2573 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2574 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2575 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2576 ret = PREFIX_EXIST;
2577 q = REX_PREFIX;
2578 }
2579 else
2580 {
2581 switch (prefix)
2582 {
2583 default:
2584 abort ();
2585
2586 case DS_PREFIX_OPCODE:
2587 ret = PREFIX_DS;
2588 /* Fall through. */
2589 case CS_PREFIX_OPCODE:
2590 case ES_PREFIX_OPCODE:
2591 case FS_PREFIX_OPCODE:
2592 case GS_PREFIX_OPCODE:
2593 case SS_PREFIX_OPCODE:
2594 q = SEG_PREFIX;
2595 break;
2596
2597 case REPNE_PREFIX_OPCODE:
2598 case REPE_PREFIX_OPCODE:
2599 q = REP_PREFIX;
2600 ret = PREFIX_REP;
2601 break;
2602
2603 case LOCK_PREFIX_OPCODE:
2604 q = LOCK_PREFIX;
2605 ret = PREFIX_LOCK;
2606 break;
2607
2608 case FWAIT_OPCODE:
2609 q = WAIT_PREFIX;
2610 break;
2611
2612 case ADDR_PREFIX_OPCODE:
2613 q = ADDR_PREFIX;
2614 break;
2615
2616 case DATA_PREFIX_OPCODE:
2617 q = DATA_PREFIX;
2618 break;
2619 }
2620 if (i.prefix[q] != 0)
2621 ret = PREFIX_EXIST;
2622 }
2623
2624 if (ret)
2625 {
2626 if (!i.prefix[q])
2627 ++i.prefixes;
2628 i.prefix[q] |= prefix;
2629 }
2630 else
2631 as_bad (_("same type of prefix used twice"));
2632
2633 return ret;
2634 }
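
/* Usage sketch: add_prefix (LOCK_PREFIX_OPCODE) stores 0xf0 in
i.prefix[LOCK_PREFIX] and returns PREFIX_LOCK; a second call for
the same insn finds that slot occupied, emits "same type of prefix
used twice" and returns PREFIX_EXIST. */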
2635
2636 static void
2637 update_code_flag (int value, int check)
2638 {
2639 PRINTF_LIKE ((*as_error));
2640
2641 flag_code = (enum flag_code) value;
2642 if (flag_code == CODE_64BIT)
2643 {
2644 cpu_arch_flags.bitfield.cpu64 = 1;
2645 cpu_arch_flags.bitfield.cpuno64 = 0;
2646 }
2647 else
2648 {
2649 cpu_arch_flags.bitfield.cpu64 = 0;
2650 cpu_arch_flags.bitfield.cpuno64 = 1;
2651 }
2652 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2653 {
2654 if (check)
2655 as_error = as_fatal;
2656 else
2657 as_error = as_bad;
2658 (*as_error) (_("64bit mode not supported on `%s'."),
2659 cpu_arch_name ? cpu_arch_name : default_arch);
2660 }
2661 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2662 {
2663 if (check)
2664 as_error = as_fatal;
2665 else
2666 as_error = as_bad;
2667 (*as_error) (_("32bit mode not supported on `%s'."),
2668 cpu_arch_name ? cpu_arch_name : default_arch);
2669 }
2670 stackop_size = '\0';
2671 }
2672
2673 static void
2674 set_code_flag (int value)
2675 {
2676 update_code_flag (value, 0);
2677 }
2678
2679 static void
2680 set_16bit_gcc_code_flag (int new_code_flag)
2681 {
2682 flag_code = (enum flag_code) new_code_flag;
2683 if (flag_code != CODE_16BIT)
2684 abort ();
2685 cpu_arch_flags.bitfield.cpu64 = 0;
2686 cpu_arch_flags.bitfield.cpuno64 = 1;
2687 stackop_size = LONG_MNEM_SUFFIX;
2688 }
2689
2690 static void
2691 set_intel_syntax (int syntax_flag)
2692 {
2693 /* Find out if register prefixing is specified. */
2694 int ask_naked_reg = 0;
2695
2696 SKIP_WHITESPACE ();
2697 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2698 {
2699 char *string;
2700 int e = get_symbol_name (&string);
2701
2702 if (strcmp (string, "prefix") == 0)
2703 ask_naked_reg = 1;
2704 else if (strcmp (string, "noprefix") == 0)
2705 ask_naked_reg = -1;
2706 else
2707 as_bad (_("bad argument to syntax directive."));
2708 (void) restore_line_pointer (e);
2709 }
2710 demand_empty_rest_of_line ();
2711
2712 intel_syntax = syntax_flag;
2713
2714 if (ask_naked_reg == 0)
2715 allow_naked_reg = (intel_syntax
2716 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2717 else
2718 allow_naked_reg = (ask_naked_reg < 0);
2719
2720 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2721
2722 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2723 identifier_chars['$'] = intel_syntax ? '$' : 0;
2724 register_prefix = allow_naked_reg ? "" : "%";
2725 }
2726
2727 static void
2728 set_intel_mnemonic (int mnemonic_flag)
2729 {
2730 intel_mnemonic = mnemonic_flag;
2731 }
2732
2733 static void
2734 set_allow_index_reg (int flag)
2735 {
2736 allow_index_reg = flag;
2737 }
2738
2739 static void
2740 set_check (int what)
2741 {
2742 enum check_kind *kind;
2743 const char *str;
2744
2745 if (what)
2746 {
2747 kind = &operand_check;
2748 str = "operand";
2749 }
2750 else
2751 {
2752 kind = &sse_check;
2753 str = "sse";
2754 }
2755
2756 SKIP_WHITESPACE ();
2757
2758 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759 {
2760 char *string;
2761 int e = get_symbol_name (&string);
2762
2763 if (strcmp (string, "none") == 0)
2764 *kind = check_none;
2765 else if (strcmp (string, "warning") == 0)
2766 *kind = check_warning;
2767 else if (strcmp (string, "error") == 0)
2768 *kind = check_error;
2769 else
2770 as_bad (_("bad argument to %s_check directive."), str);
2771 (void) restore_line_pointer (e);
2772 }
2773 else
2774 as_bad (_("missing argument for %s_check directive"), str);
2775
2776 demand_empty_rest_of_line ();
2777 }
2778
2779 static void
2780 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2781 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2782 {
2783 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784 static const char *arch;
2785
2786 /* Intel L1OM is only supported on ELF. */
2787 if (!IS_ELF)
2788 return;
2789
2790 if (!arch)
2791 {
2792 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2793 use default_arch. */
2794 arch = cpu_arch_name;
2795 if (!arch)
2796 arch = default_arch;
2797 }
2798
2799 /* If we are targeting Intel MCU, we must enable it. */
2800 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2801 || new_flag.bitfield.cpuiamcu)
2802 return;
2803
2804 /* If we are targeting Intel L1OM, we must enable it. */
2805 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2806 || new_flag.bitfield.cpul1om)
2807 return;
2808
2809 /* If we are targeting Intel K1OM, we must enable it. */
2810 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2811 || new_flag.bitfield.cpuk1om)
2812 return;
2813
2814 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2815 #endif
2816 }
2817
2818 static void
2819 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2820 {
2821 SKIP_WHITESPACE ();
2822
2823 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2824 {
2825 char *string;
2826 int e = get_symbol_name (&string);
2827 unsigned int j;
2828 i386_cpu_flags flags;
2829
2830 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2831 {
2832 if (strcmp (string, cpu_arch[j].name) == 0)
2833 {
2834 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2835
2836 if (*string != '.')
2837 {
2838 cpu_arch_name = cpu_arch[j].name;
2839 cpu_sub_arch_name = NULL;
2840 cpu_arch_flags = cpu_arch[j].flags;
2841 if (flag_code == CODE_64BIT)
2842 {
2843 cpu_arch_flags.bitfield.cpu64 = 1;
2844 cpu_arch_flags.bitfield.cpuno64 = 0;
2845 }
2846 else
2847 {
2848 cpu_arch_flags.bitfield.cpu64 = 0;
2849 cpu_arch_flags.bitfield.cpuno64 = 1;
2850 }
2851 cpu_arch_isa = cpu_arch[j].type;
2852 cpu_arch_isa_flags = cpu_arch[j].flags;
2853 if (!cpu_arch_tune_set)
2854 {
2855 cpu_arch_tune = cpu_arch_isa;
2856 cpu_arch_tune_flags = cpu_arch_isa_flags;
2857 }
2858 break;
2859 }
2860
2861 flags = cpu_flags_or (cpu_arch_flags,
2862 cpu_arch[j].flags);
2863
2864 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2865 {
2866 if (cpu_sub_arch_name)
2867 {
2868 char *name = cpu_sub_arch_name;
2869 cpu_sub_arch_name = concat (name,
2870 cpu_arch[j].name,
2871 (const char *) NULL);
2872 free (name);
2873 }
2874 else
2875 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2876 cpu_arch_flags = flags;
2877 cpu_arch_isa_flags = flags;
2878 }
2879 else
2880 cpu_arch_isa_flags
2881 = cpu_flags_or (cpu_arch_isa_flags,
2882 cpu_arch[j].flags);
2883 (void) restore_line_pointer (e);
2884 demand_empty_rest_of_line ();
2885 return;
2886 }
2887 }
2888
2889 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2890 {
2891 /* Disable an ISA extension. */
2892 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2893 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2894 {
2895 flags = cpu_flags_and_not (cpu_arch_flags,
2896 cpu_noarch[j].flags);
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
2899 if (cpu_sub_arch_name)
2900 {
2901 char *name = cpu_sub_arch_name;
2902 cpu_sub_arch_name = concat (name, string,
2903 (const char *) NULL);
2904 free (name);
2905 }
2906 else
2907 cpu_sub_arch_name = xstrdup (string);
2908 cpu_arch_flags = flags;
2909 cpu_arch_isa_flags = flags;
2910 }
2911 (void) restore_line_pointer (e);
2912 demand_empty_rest_of_line ();
2913 return;
2914 }
2915
2916 j = ARRAY_SIZE (cpu_arch);
2917 }
2918
2919 if (j >= ARRAY_SIZE (cpu_arch))
2920 as_bad (_("no such architecture: `%s'"), string);
2921
2922 *input_line_pointer = e;
2923 }
2924 else
2925 as_bad (_("missing cpu architecture"));
2926
2927 no_cond_jump_promotion = 0;
2928 if (*input_line_pointer == ','
2929 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2930 {
2931 char *string;
2932 char e;
2933
2934 ++input_line_pointer;
2935 e = get_symbol_name (&string);
2936
2937 if (strcmp (string, "nojumps") == 0)
2938 no_cond_jump_promotion = 1;
2939 else if (strcmp (string, "jumps") == 0)
2940 ;
2941 else
2942 as_bad (_("no such architecture modifier: `%s'"), string);
2943
2944 (void) restore_line_pointer (e);
2945 }
2946
2947 demand_empty_rest_of_line ();
2948 }
2949
2950 enum bfd_architecture
2951 i386_arch (void)
2952 {
2953 if (cpu_arch_isa == PROCESSOR_L1OM)
2954 {
2955 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2956 || flag_code != CODE_64BIT)
2957 as_fatal (_("Intel L1OM is 64bit ELF only"));
2958 return bfd_arch_l1om;
2959 }
2960 else if (cpu_arch_isa == PROCESSOR_K1OM)
2961 {
2962 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2963 || flag_code != CODE_64BIT)
2964 as_fatal (_("Intel K1OM is 64bit ELF only"));
2965 return bfd_arch_k1om;
2966 }
2967 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2968 {
2969 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2970 || flag_code == CODE_64BIT)
2971 as_fatal (_("Intel MCU is 32bit ELF only"));
2972 return bfd_arch_iamcu;
2973 }
2974 else
2975 return bfd_arch_i386;
2976 }
2977
2978 unsigned long
2979 i386_mach (void)
2980 {
2981 if (!strncmp (default_arch, "x86_64", 6))
2982 {
2983 if (cpu_arch_isa == PROCESSOR_L1OM)
2984 {
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || default_arch[6] != '\0')
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_mach_l1om;
2989 }
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || default_arch[6] != '\0')
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_mach_k1om;
2996 }
2997 else if (default_arch[6] == '\0')
2998 return bfd_mach_x86_64;
2999 else
3000 return bfd_mach_x64_32;
3001 }
3002 else if (!strcmp (default_arch, "i386")
3003 || !strcmp (default_arch, "iamcu"))
3004 {
3005 if (cpu_arch_isa == PROCESSOR_IAMCU)
3006 {
3007 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3008 as_fatal (_("Intel MCU is 32bit ELF only"));
3009 return bfd_mach_i386_iamcu;
3010 }
3011 else
3012 return bfd_mach_i386_i386;
3013 }
3014 else
3015 as_fatal (_("unknown architecture"));
3016 }
3017 \f
3018 void
3019 md_begin (void)
3020 {
3021 const char *hash_err;
3022
3023 /* Support pseudo prefixes like {disp32}. */
3024 lex_type ['{'] = LEX_BEGIN_NAME;
3025
3026 /* Initialize op_hash hash table. */
3027 op_hash = hash_new ();
3028
3029 {
3030 const insn_template *optab;
3031 templates *core_optab;
3032
3033 /* Setup for loop. */
3034 optab = i386_optab;
3035 core_optab = XNEW (templates);
3036 core_optab->start = optab;
3037
3038 while (1)
3039 {
3040 ++optab;
3041 if (optab->name == NULL
3042 || strcmp (optab->name, (optab - 1)->name) != 0)
3043 {
3044 /* different name --> ship out current template list;
3045 add to hash table; & begin anew. */
3046 core_optab->end = optab;
3047 hash_err = hash_insert (op_hash,
3048 (optab - 1)->name,
3049 (void *) core_optab);
3050 if (hash_err)
3051 {
3052 as_fatal (_("can't hash %s: %s"),
3053 (optab - 1)->name,
3054 hash_err);
3055 }
3056 if (optab->name == NULL)
3057 break;
3058 core_optab = XNEW (templates);
3059 core_optab->start = optab;
3060 }
3061 }
3062 }
3063
3064 /* Initialize reg_hash hash table. */
3065 reg_hash = hash_new ();
3066 {
3067 const reg_entry *regtab;
3068 unsigned int regtab_size = i386_regtab_size;
3069
3070 for (regtab = i386_regtab; regtab_size--; regtab++)
3071 {
3072 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3073 if (hash_err)
3074 as_fatal (_("can't hash %s: %s"),
3075 regtab->reg_name,
3076 hash_err);
3077 }
3078 }
3079
3080 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3081 {
3082 int c;
3083 char *p;
3084
3085 for (c = 0; c < 256; c++)
3086 {
3087 if (ISDIGIT (c))
3088 {
3089 digit_chars[c] = c;
3090 mnemonic_chars[c] = c;
3091 register_chars[c] = c;
3092 operand_chars[c] = c;
3093 }
3094 else if (ISLOWER (c))
3095 {
3096 mnemonic_chars[c] = c;
3097 register_chars[c] = c;
3098 operand_chars[c] = c;
3099 }
3100 else if (ISUPPER (c))
3101 {
3102 mnemonic_chars[c] = TOLOWER (c);
3103 register_chars[c] = mnemonic_chars[c];
3104 operand_chars[c] = c;
3105 }
3106 else if (c == '{' || c == '}')
3107 {
3108 mnemonic_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
3111
3112 if (ISALPHA (c) || ISDIGIT (c))
3113 identifier_chars[c] = c;
3114 else if (c >= 128)
3115 {
3116 identifier_chars[c] = c;
3117 operand_chars[c] = c;
3118 }
3119 }
3120
3121 #ifdef LEX_AT
3122 identifier_chars['@'] = '@';
3123 #endif
3124 #ifdef LEX_QM
3125 identifier_chars['?'] = '?';
3126 operand_chars['?'] = '?';
3127 #endif
3128 digit_chars['-'] = '-';
3129 mnemonic_chars['_'] = '_';
3130 mnemonic_chars['-'] = '-';
3131 mnemonic_chars['.'] = '.';
3132 identifier_chars['_'] = '_';
3133 identifier_chars['.'] = '.';
3134
3135 for (p = operand_special_chars; *p != '\0'; p++)
3136 operand_chars[(unsigned char) *p] = *p;
3137 }
3138
3139 if (flag_code == CODE_64BIT)
3140 {
3141 #if defined (OBJ_COFF) && defined (TE_PE)
3142 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3143 ? 32 : 16);
3144 #else
3145 x86_dwarf2_return_column = 16;
3146 #endif
3147 x86_cie_data_alignment = -8;
3148 }
3149 else
3150 {
3151 x86_dwarf2_return_column = 8;
3152 x86_cie_data_alignment = -4;
3153 }
3154
3155 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3156 can be turned into BRANCH_PREFIX frag. */
3157 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3158 abort ();
3159 }
3160
3161 void
3162 i386_print_statistics (FILE *file)
3163 {
3164 hash_print_statistics (file, "i386 opcode", op_hash);
3165 hash_print_statistics (file, "i386 register", reg_hash);
3166 }
3167 \f
3168 #ifdef DEBUG386
3169
3170 /* Debugging routines for md_assemble. */
3171 static void pte (insn_template *);
3172 static void pt (i386_operand_type);
3173 static void pe (expressionS *);
3174 static void ps (symbolS *);
3175
3176 static void
3177 pi (const char *line, i386_insn *x)
3178 {
3179 unsigned int j;
3180
3181 fprintf (stdout, "%s: template ", line);
3182 pte (&x->tm);
3183 fprintf (stdout, " address: base %s index %s scale %x\n",
3184 x->base_reg ? x->base_reg->reg_name : "none",
3185 x->index_reg ? x->index_reg->reg_name : "none",
3186 x->log2_scale_factor);
3187 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3188 x->rm.mode, x->rm.reg, x->rm.regmem);
3189 fprintf (stdout, " sib: base %x index %x scale %x\n",
3190 x->sib.base, x->sib.index, x->sib.scale);
3191 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3192 (x->rex & REX_W) != 0,
3193 (x->rex & REX_R) != 0,
3194 (x->rex & REX_X) != 0,
3195 (x->rex & REX_B) != 0);
3196 for (j = 0; j < x->operands; j++)
3197 {
3198 fprintf (stdout, " #%d: ", j + 1);
3199 pt (x->types[j]);
3200 fprintf (stdout, "\n");
3201 if (x->types[j].bitfield.class == Reg
3202 || x->types[j].bitfield.class == RegMMX
3203 || x->types[j].bitfield.class == RegSIMD
3204 || x->types[j].bitfield.class == RegMask
3205 || x->types[j].bitfield.class == SReg
3206 || x->types[j].bitfield.class == RegCR
3207 || x->types[j].bitfield.class == RegDR
3208 || x->types[j].bitfield.class == RegTR
3209 || x->types[j].bitfield.class == RegBND)
3210 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3211 if (operand_type_check (x->types[j], imm))
3212 pe (x->op[j].imms);
3213 if (operand_type_check (x->types[j], disp))
3214 pe (x->op[j].disps);
3215 }
3216 }
3217
3218 static void
3219 pte (insn_template *t)
3220 {
3221 unsigned int j;
3222 fprintf (stdout, " %d operands ", t->operands);
3223 fprintf (stdout, "opcode %x ", t->base_opcode);
3224 if (t->extension_opcode != None)
3225 fprintf (stdout, "ext %x ", t->extension_opcode);
3226 if (t->opcode_modifier.d)
3227 fprintf (stdout, "D");
3228 if (t->opcode_modifier.w)
3229 fprintf (stdout, "W");
3230 fprintf (stdout, "\n");
3231 for (j = 0; j < t->operands; j++)
3232 {
3233 fprintf (stdout, " #%d type ", j + 1);
3234 pt (t->operand_types[j]);
3235 fprintf (stdout, "\n");
3236 }
3237 }
3238
3239 static void
3240 pe (expressionS *e)
3241 {
3242 fprintf (stdout, " operation %d\n", e->X_op);
3243 fprintf (stdout, " add_number %ld (%lx)\n",
3244 (long) e->X_add_number, (long) e->X_add_number);
3245 if (e->X_add_symbol)
3246 {
3247 fprintf (stdout, " add_symbol ");
3248 ps (e->X_add_symbol);
3249 fprintf (stdout, "\n");
3250 }
3251 if (e->X_op_symbol)
3252 {
3253 fprintf (stdout, " op_symbol ");
3254 ps (e->X_op_symbol);
3255 fprintf (stdout, "\n");
3256 }
3257 }
3258
3259 static void
3260 ps (symbolS *s)
3261 {
3262 fprintf (stdout, "%s type %s%s",
3263 S_GET_NAME (s),
3264 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3265 segment_name (S_GET_SEGMENT (s)));
3266 }
3267
3268 static struct type_name
3269 {
3270 i386_operand_type mask;
3271 const char *name;
3272 }
3273 const type_names[] =
3274 {
3275 { OPERAND_TYPE_REG8, "r8" },
3276 { OPERAND_TYPE_REG16, "r16" },
3277 { OPERAND_TYPE_REG32, "r32" },
3278 { OPERAND_TYPE_REG64, "r64" },
3279 { OPERAND_TYPE_ACC8, "acc8" },
3280 { OPERAND_TYPE_ACC16, "acc16" },
3281 { OPERAND_TYPE_ACC32, "acc32" },
3282 { OPERAND_TYPE_ACC64, "acc64" },
3283 { OPERAND_TYPE_IMM8, "i8" },
3284 { OPERAND_TYPE_IMM8S, "i8s" },
3285 { OPERAND_TYPE_IMM16, "i16" },
3286 { OPERAND_TYPE_IMM32, "i32" },
3287 { OPERAND_TYPE_IMM32S, "i32s" },
3288 { OPERAND_TYPE_IMM64, "i64" },
3289 { OPERAND_TYPE_IMM1, "i1" },
3290 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3291 { OPERAND_TYPE_DISP8, "d8" },
3292 { OPERAND_TYPE_DISP16, "d16" },
3293 { OPERAND_TYPE_DISP32, "d32" },
3294 { OPERAND_TYPE_DISP32S, "d32s" },
3295 { OPERAND_TYPE_DISP64, "d64" },
3296 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3297 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3298 { OPERAND_TYPE_CONTROL, "control reg" },
3299 { OPERAND_TYPE_TEST, "test reg" },
3300 { OPERAND_TYPE_DEBUG, "debug reg" },
3301 { OPERAND_TYPE_FLOATREG, "FReg" },
3302 { OPERAND_TYPE_FLOATACC, "FAcc" },
3303 { OPERAND_TYPE_SREG, "SReg" },
3304 { OPERAND_TYPE_REGMMX, "rMMX" },
3305 { OPERAND_TYPE_REGXMM, "rXMM" },
3306 { OPERAND_TYPE_REGYMM, "rYMM" },
3307 { OPERAND_TYPE_REGZMM, "rZMM" },
3308 { OPERAND_TYPE_REGMASK, "Mask reg" },
3309 };
3310
3311 static void
3312 pt (i386_operand_type t)
3313 {
3314 unsigned int j;
3315 i386_operand_type a;
3316
3317 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3318 {
3319 a = operand_type_and (t, type_names[j].mask);
3320 if (operand_type_equal (&a, &type_names[j].mask))
3321 fprintf (stdout, "%s, ", type_names[j].name);
3322 }
3323 fflush (stdout);
3324 }
3325
3326 #endif /* DEBUG386 */
3327 \f
3328 static bfd_reloc_code_real_type
3329 reloc (unsigned int size,
3330 int pcrel,
3331 int sign,
3332 bfd_reloc_code_real_type other)
3333 {
3334 if (other != NO_RELOC)
3335 {
3336 reloc_howto_type *rel;
3337
3338 if (size == 8)
3339 switch (other)
3340 {
3341 case BFD_RELOC_X86_64_GOT32:
3342 return BFD_RELOC_X86_64_GOT64;
3344 case BFD_RELOC_X86_64_GOTPLT64:
3345 return BFD_RELOC_X86_64_GOTPLT64;
3347 case BFD_RELOC_X86_64_PLTOFF64:
3348 return BFD_RELOC_X86_64_PLTOFF64;
3350 case BFD_RELOC_X86_64_GOTPC32:
3351 other = BFD_RELOC_X86_64_GOTPC64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPCREL:
3354 other = BFD_RELOC_X86_64_GOTPCREL64;
3355 break;
3356 case BFD_RELOC_X86_64_TPOFF32:
3357 other = BFD_RELOC_X86_64_TPOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_DTPOFF32:
3360 other = BFD_RELOC_X86_64_DTPOFF64;
3361 break;
3362 default:
3363 break;
3364 }
3365
3366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3367 if (other == BFD_RELOC_SIZE32)
3368 {
3369 if (size == 8)
3370 other = BFD_RELOC_SIZE64;
3371 if (pcrel)
3372 {
3373 as_bad (_("there are no pc-relative size relocations"));
3374 return NO_RELOC;
3375 }
3376 }
3377 #endif
3378
3379 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3380 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3381 sign = -1;
3382
3383 rel = bfd_reloc_type_lookup (stdoutput, other);
3384 if (!rel)
3385 as_bad (_("unknown relocation (%u)"), other);
3386 else if (size != bfd_get_reloc_size (rel))
3387 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3388 bfd_get_reloc_size (rel),
3389 size);
3390 else if (pcrel && !rel->pc_relative)
3391 as_bad (_("non-pc-relative relocation for pc-relative field"));
3392 else if ((rel->complain_on_overflow == complain_overflow_signed
3393 && !sign)
3394 || (rel->complain_on_overflow == complain_overflow_unsigned
3395 && sign > 0))
3396 as_bad (_("relocated field and relocation type differ in signedness"));
3397 else
3398 return other;
3399 return NO_RELOC;
3400 }
3401
3402 if (pcrel)
3403 {
3404 if (!sign)
3405 as_bad (_("there are no unsigned pc-relative relocations"));
3406 switch (size)
3407 {
3408 case 1: return BFD_RELOC_8_PCREL;
3409 case 2: return BFD_RELOC_16_PCREL;
3410 case 4: return BFD_RELOC_32_PCREL;
3411 case 8: return BFD_RELOC_64_PCREL;
3412 }
3413 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3414 }
3415 else
3416 {
3417 if (sign > 0)
3418 switch (size)
3419 {
3420 case 4: return BFD_RELOC_X86_64_32S;
3421 }
3422 else
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8;
3426 case 2: return BFD_RELOC_16;
3427 case 4: return BFD_RELOC_32;
3428 case 8: return BFD_RELOC_64;
3429 }
3430 as_bad (_("cannot do %s %u byte relocation"),
3431 sign > 0 ? "signed" : "unsigned", size);
3432 }
3433
3434 return NO_RELOC;
3435 }
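
/* Examples of the fallback mapping when OTHER is NO_RELOC: a signed
4-byte pc-relative fixup becomes BFD_RELOC_32_PCREL, a signed
4-byte absolute fixup becomes BFD_RELOC_X86_64_32S, and an unsigned
4-byte absolute fixup becomes BFD_RELOC_32. */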
3436
3437 /* Here we decide which fixups can be adjusted to make them relative to
3438 the beginning of the section instead of the symbol. Basically we need
3439 to make sure that the dynamic relocations are done correctly, so in
3440 some cases we force the original symbol to be used. */
3441
3442 int
3443 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3444 {
3445 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3446 if (!IS_ELF)
3447 return 1;
3448
3449 /* Don't adjust pc-relative references to merge sections in 64-bit
3450 mode. */
3451 if (use_rela_relocations
3452 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453 && fixP->fx_pcrel)
3454 return 0;
3455
3456 /* x86_64 GOTPCREL relocations are represented as 32bit PCrel
3457 relocations and changed later by validate_fix. */
3458 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460 return 0;
3461
3462 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3463 for size relocations. */
3464 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465 || fixP->fx_r_type == BFD_RELOC_SIZE64
3466 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3467 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3468 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3475 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3477 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3480 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3486 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3493 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495 return 0;
3496 #endif
3497 return 1;
3498 }
3499
3500 static int
3501 intel_float_operand (const char *mnemonic)
3502 {
3503 /* Note that the value returned is meaningful only for opcodes with (memory)
3504 operands, hence the code here is free to improperly handle opcodes that
3505 have no operands (for better performance and smaller code). */
3506
3507 if (mnemonic[0] != 'f')
3508 return 0; /* non-math */
3509
3510 switch (mnemonic[1])
3511 {
3512 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513 the fs segment override prefix are not currently handled because
3514 no call path can make opcodes without operands get here. */
3515 case 'i':
3516 return 2 /* integer op */;
3517 case 'l':
3518 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519 return 3; /* fldcw/fldenv */
3520 break;
3521 case 'n':
3522 if (mnemonic[2] != 'o' /* fnop */)
3523 return 3; /* non-waiting control op */
3524 break;
3525 case 'r':
3526 if (mnemonic[2] == 's')
3527 return 3; /* frstor/frstpm */
3528 break;
3529 case 's':
3530 if (mnemonic[2] == 'a')
3531 return 3; /* fsave */
3532 if (mnemonic[2] == 't')
3533 {
3534 switch (mnemonic[3])
3535 {
3536 case 'c': /* fstcw */
3537 case 'd': /* fstdw */
3538 case 'e': /* fstenv */
3539 case 's': /* fsts[gw] */
3540 return 3;
3541 }
3542 }
3543 break;
3544 case 'x':
3545 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546 return 0; /* fxsave/fxrstor are not really math ops */
3547 break;
3548 }
3549
3550 return 1;
3551 }
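
/* Sample classifications: "fadd" returns 1 (plain FPU math op),
"fiadd" returns 2 (integer operand), "fldcw" returns 3 (control
op), and "fxsave" returns 0 since it is not treated as a math
op. */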
3552
3553 /* Build the VEX prefix. */
3554
3555 static void
3556 build_vex_prefix (const insn_template *t)
3557 {
3558 unsigned int register_specifier;
3559 unsigned int implied_prefix;
3560 unsigned int vector_length;
3561 unsigned int w;
3562
3563 /* Check register specifier. */
3564 if (i.vex.register_specifier)
3565 {
3566 register_specifier =
3567 ~register_number (i.vex.register_specifier) & 0xf;
3568 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569 }
3570 else
3571 register_specifier = 0xf;
3572
3573 /* Use 2-byte VEX prefix by swapping destination and source operand
3574 if there is more than one register operand. */
3575 if (i.reg_operands > 1
3576 && i.vec_encoding != vex_encoding_vex3
3577 && i.dir_encoding == dir_encoding_default
3578 && i.operands == i.reg_operands
3579 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3580 && i.tm.opcode_modifier.vexopcode == VEX0F
3581 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3582 && i.rex == REX_B)
3583 {
3584 unsigned int xchg = i.operands - 1;
3585 union i386_op temp_op;
3586 i386_operand_type temp_type;
3587
3588 temp_type = i.types[xchg];
3589 i.types[xchg] = i.types[0];
3590 i.types[0] = temp_type;
3591 temp_op = i.op[xchg];
3592 i.op[xchg] = i.op[0];
3593 i.op[0] = temp_op;
3594
3595 gas_assert (i.rm.mode == 3);
3596
3597 i.rex = REX_R;
3598 xchg = i.rm.regmem;
3599 i.rm.regmem = i.rm.reg;
3600 i.rm.reg = xchg;
3601
3602 if (i.tm.opcode_modifier.d)
3603 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605 else /* Use the next insn. */
3606 i.tm = t[1];
3607 }
3608
3609 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610 are no memory operands and at least 3 register ones. */
3611 if (i.reg_operands >= 3
3612 && i.vec_encoding != vex_encoding_vex3
3613 && i.reg_operands == i.operands - i.imm_operands
3614 && i.tm.opcode_modifier.vex
3615 && i.tm.opcode_modifier.commutative
3616 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617 && i.rex == REX_B
3618 && i.vex.register_specifier
3619 && !(i.vex.register_specifier->reg_flags & RegRex))
3620 {
3621 unsigned int xchg = i.operands - i.reg_operands;
3622 union i386_op temp_op;
3623 i386_operand_type temp_type;
3624
3625 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626 gas_assert (!i.tm.opcode_modifier.sae);
3627 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628 &i.types[i.operands - 3]));
3629 gas_assert (i.rm.mode == 3);
3630
3631 temp_type = i.types[xchg];
3632 i.types[xchg] = i.types[xchg + 1];
3633 i.types[xchg + 1] = temp_type;
3634 temp_op = i.op[xchg];
3635 i.op[xchg] = i.op[xchg + 1];
3636 i.op[xchg + 1] = temp_op;
3637
3638 i.rex = 0;
3639 xchg = i.rm.regmem | 8;
3640 i.rm.regmem = ~register_specifier & 0xf;
3641 gas_assert (!(i.rm.regmem & 8));
3642 i.vex.register_specifier += xchg - i.rm.regmem;
3643 register_specifier = ~xchg & 0xf;
3644 }
3645
3646 if (i.tm.opcode_modifier.vex == VEXScalar)
3647 vector_length = avxscalar;
3648 else if (i.tm.opcode_modifier.vex == VEX256)
3649 vector_length = 1;
3650 else
3651 {
3652 unsigned int op;
3653
3654 /* Determine vector length from the last multi-length vector
3655 operand. */
3656 vector_length = 0;
3657 for (op = t->operands; op--;)
3658 if (t->operand_types[op].bitfield.xmmword
3659 && t->operand_types[op].bitfield.ymmword
3660 && i.types[op].bitfield.ymmword)
3661 {
3662 vector_length = 1;
3663 break;
3664 }
3665 }
3666
3667 switch ((i.tm.base_opcode >> 8) & 0xff)
3668 {
3669 case 0:
3670 implied_prefix = 0;
3671 break;
3672 case DATA_PREFIX_OPCODE:
3673 implied_prefix = 1;
3674 break;
3675 case REPE_PREFIX_OPCODE:
3676 implied_prefix = 2;
3677 break;
3678 case REPNE_PREFIX_OPCODE:
3679 implied_prefix = 3;
3680 break;
3681 default:
3682 abort ();
3683 }
3684
3685 /* Check the REX.W bit and VEXW. */
3686 if (i.tm.opcode_modifier.vexw == VEXWIG)
3687 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688 else if (i.tm.opcode_modifier.vexw)
3689 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690 else
3691 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3692
3693 /* Use 2-byte VEX prefix if possible. */
3694 if (w == 0
3695 && i.vec_encoding != vex_encoding_vex3
3696 && i.tm.opcode_modifier.vexopcode == VEX0F
3697 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698 {
3699 /* 2-byte VEX prefix. */
3700 unsigned int r;
3701
3702 i.vex.length = 2;
3703 i.vex.bytes[0] = 0xc5;
3704
3705 /* Check the REX.R bit. */
3706 r = (i.rex & REX_R) ? 0 : 1;
3707 i.vex.bytes[1] = (r << 7
3708 | register_specifier << 3
3709 | vector_length << 2
3710 | implied_prefix);
3711 }
3712 else
3713 {
3714 /* 3-byte VEX prefix. */
3715 unsigned int m;
3716
3717 i.vex.length = 3;
3718
3719 switch (i.tm.opcode_modifier.vexopcode)
3720 {
3721 case VEX0F:
3722 m = 0x1;
3723 i.vex.bytes[0] = 0xc4;
3724 break;
3725 case VEX0F38:
3726 m = 0x2;
3727 i.vex.bytes[0] = 0xc4;
3728 break;
3729 case VEX0F3A:
3730 m = 0x3;
3731 i.vex.bytes[0] = 0xc4;
3732 break;
3733 case XOP08:
3734 m = 0x8;
3735 i.vex.bytes[0] = 0x8f;
3736 break;
3737 case XOP09:
3738 m = 0x9;
3739 i.vex.bytes[0] = 0x8f;
3740 break;
3741 case XOP0A:
3742 m = 0xa;
3743 i.vex.bytes[0] = 0x8f;
3744 break;
3745 default:
3746 abort ();
3747 }
3748
3749 /* The high 3 bits of the second VEX byte are the one's complement
3750 of the RXB bits from REX. */
3751 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
3753 i.vex.bytes[2] = (w << 7
3754 | register_specifier << 3
3755 | vector_length << 2
3756 | implied_prefix);
3757 }
3758 }
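
/* Worked 2-byte VEX encoding (for illustration): vaddps %ymm2, %ymm1,
%ymm0 assembles to C5 F4 58 C2. C5 selects the 2-byte form; F4 is
R=1 (no REX.R, stored inverted), vvvv=1110 (one's complement of
register 1, %ymm1), L=1 (256-bit) and pp=00 (no implied prefix);
58 is the VADDPS opcode and C2 the ModRM byte. */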
3759
3760 static INLINE bfd_boolean
3761 is_evex_encoding (const insn_template *t)
3762 {
3763 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3764 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3765 || t->opcode_modifier.sae;
3766 }
3767
3768 static INLINE bfd_boolean
3769 is_any_vex_encoding (const insn_template *t)
3770 {
3771 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772 || is_evex_encoding (t);
3773 }
3774
3775 /* Build the EVEX prefix. */
3776
3777 static void
3778 build_evex_prefix (void)
3779 {
3780 unsigned int register_specifier;
3781 unsigned int implied_prefix;
3782 unsigned int m, w;
3783 rex_byte vrex_used = 0;
3784
3785 /* Check register specifier. */
3786 if (i.vex.register_specifier)
3787 {
3788 gas_assert ((i.vrex & REX_X) == 0);
3789
3790 register_specifier = i.vex.register_specifier->reg_num;
3791 if ((i.vex.register_specifier->reg_flags & RegRex))
3792 register_specifier += 8;
3793 /* The upper 16 registers are encoded in the fourth byte of the
3794 EVEX prefix. */
3795 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796 i.vex.bytes[3] = 0x8;
3797 register_specifier = ~register_specifier & 0xf;
3798 }
3799 else
3800 {
3801 register_specifier = 0xf;
3802
3803 /* Encode upper 16 vector index register in the fourth byte of
3804 the EVEX prefix. */
3805 if (!(i.vrex & REX_X))
3806 i.vex.bytes[3] = 0x8;
3807 else
3808 vrex_used |= REX_X;
3809 }
3810
3811 switch ((i.tm.base_opcode >> 8) & 0xff)
3812 {
3813 case 0:
3814 implied_prefix = 0;
3815 break;
3816 case DATA_PREFIX_OPCODE:
3817 implied_prefix = 1;
3818 break;
3819 case REPE_PREFIX_OPCODE:
3820 implied_prefix = 2;
3821 break;
3822 case REPNE_PREFIX_OPCODE:
3823 implied_prefix = 3;
3824 break;
3825 default:
3826 abort ();
3827 }
3828
3829 /* 4 byte EVEX prefix. */
3830 i.vex.length = 4;
3831 i.vex.bytes[0] = 0x62;
3832
3833 /* mmmm bits. */
3834 switch (i.tm.opcode_modifier.vexopcode)
3835 {
3836 case VEX0F:
3837 m = 1;
3838 break;
3839 case VEX0F38:
3840 m = 2;
3841 break;
3842 case VEX0F3A:
3843 m = 3;
3844 break;
3845 default:
3846 abort ();
3847 break;
3848 }
3849
3850 /* The high 3 bits of the second EVEX byte are the one's complement
3851 of the RXB bits from REX. */
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854 /* The fifth bit of the second EVEX byte is the one's complement of
3855 the REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as the one's complement. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3885
3886 /* Encode the U bit. */
3887 implied_prefix |= 0x4;
3888
3889 /* The third byte of the EVEX prefix. */
3890 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
3894 if (i.mask && i.mask->zeroing)
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Encode the vector length and broadcast bit only if there is no RC. */
3898 if (!i.rounding)
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
3906 unsigned int op;
3907
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
3910 for (op = i.operands; op--;)
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
3920 else if (i.types[op].bitfield.ymmword)
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
3925 else if (i.types[op].bitfield.xmmword)
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
3930 else if (i.broadcast && (int) op == i.broadcast->operand)
3931 {
3932 switch (i.broadcast->bytes)
3933 {
3934 case 64:
3935 i.tm.opcode_modifier.evex = EVEX512;
3936 break;
3937 case 32:
3938 i.tm.opcode_modifier.evex = EVEX256;
3939 break;
3940 case 16:
3941 i.tm.opcode_modifier.evex = EVEX128;
3942 break;
3943 default:
3944 abort ();
3945 }
3946 break;
3947 }
3948 }
3949
3950 if (op >= MAX_OPERANDS)
3951 abort ();
3952 }
3953
3954 switch (i.tm.opcode_modifier.evex)
3955 {
3956 case EVEXLIG: /* LL' is ignored */
3957 vec_length = evexlig << 5;
3958 break;
3959 case EVEX128:
3960 vec_length = 0 << 5;
3961 break;
3962 case EVEX256:
3963 vec_length = 1 << 5;
3964 break;
3965 case EVEX512:
3966 vec_length = 2 << 5;
3967 break;
3968 default:
3969 abort ();
3970 break;
3971 }
3972 i.vex.bytes[3] |= vec_length;
3973 /* Encode the broadcast bit. */
3974 if (i.broadcast)
3975 i.vex.bytes[3] |= 0x10;
3976 }
3977 else
3978 {
3979 if (i.rounding->type != saeonly)
3980 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981 else
3982 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3983 }
3984
3985 if (i.mask && i.mask->mask)
3986 i.vex.bytes[3] |= i.mask->mask->reg_num;
3987 }
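
/* Illustrative worked example (a reader's sketch, not code the
   assembler runs): assuming the AT&T input "vaddps %zmm1, %zmm2,
   %zmm3", the four EVEX bytes built above come out as
     0x62   fixed first byte
     0xf1   RXB=111 R'=1 mm=01 (0F map), REX bits in inverted form
     0x6c   W=0 vvvv=1101 (inverted %zmm2) fixed-1 pp=00
     0x48   z=0 L'L=10 (512-bit) b=0 V'=1 aaa=000
   followed by the opcode 0x58 and ModRM 0xd9 for %zmm3, %zmm1.  */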
3988
3989 static void
3990 process_immext (void)
3991 {
3992 expressionS *exp;
3993
3994 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3995 which is coded in the same place as an 8-bit immediate field
3996 would be. Here we fake an 8-bit immediate operand from the
3997 opcode suffix stored in tm.extension_opcode.
3998
3999 AVX instructions also use this encoding, for some of the
4000 3-argument instructions. */
4001
4002 gas_assert (i.imm_operands <= 1
4003 && (i.operands <= 2
4004 || (is_any_vex_encoding (&i.tm)
4005 && i.operands <= 4)));
4006
4007 exp = &im_expressions[i.imm_operands++];
4008 i.op[i.operands].imms = exp;
4009 i.types[i.operands] = imm8;
4010 i.operands++;
4011 exp->X_op = O_constant;
4012 exp->X_add_number = i.tm.extension_opcode;
4013 i.tm.extension_opcode = None;
4014 }
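
/* For instance (illustrative only): the 3DNow! insn "pswapd %mm1, %mm0"
   has the fixed opcode 0x0f0f and keeps its real opcode byte, 0xbb, in
   tm.extension_opcode, so after the fake imm8 operand is attached above
   it is emitted as 0f 0f c1 bb.  */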
4015
4016
4017 static int
4018 check_hle (void)
4019 {
4020 switch (i.tm.opcode_modifier.hleprefixok)
4021 {
4022 default:
4023 abort ();
4024 case HLEPrefixNone:
4025 as_bad (_("invalid instruction `%s' after `%s'"),
4026 i.tm.name, i.hle_prefix);
4027 return 0;
4028 case HLEPrefixLock:
4029 if (i.prefix[LOCK_PREFIX])
4030 return 1;
4031 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4032 return 0;
4033 case HLEPrefixAny:
4034 return 1;
4035 case HLEPrefixRelease:
4036 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037 {
4038 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039 i.tm.name);
4040 return 0;
4041 }
4042 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4043 {
4044 as_bad (_("memory destination needed for instruction `%s'"
4045 " after `xrelease'"), i.tm.name);
4046 return 0;
4047 }
4048 return 1;
4049 }
4050 }
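
/* A few illustrative inputs for the checks above (not exhaustive):
     xacquire lock incl (%rax)    accepted (HLEPrefixLock, lock present)
     xacquire incl (%rax)         rejected, missing `lock'
     xrelease movl $1, (%rax)     accepted (HLEPrefixRelease, memory
                                  destination)
     xrelease movl (%rax), %eax   rejected, no memory destination  */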
4051
4052 /* Try the shortest encoding by shortening operand size. */
4053
4054 static void
4055 optimize_encoding (void)
4056 {
4057 unsigned int j;
4058
4059 if (optimize_for_space
4060 && !is_any_vex_encoding (&i.tm)
4061 && i.reg_operands == 1
4062 && i.imm_operands == 1
4063 && !i.types[1].bitfield.byte
4064 && i.op[0].imms->X_op == O_constant
4065 && fits_in_imm7 (i.op[0].imms->X_add_number)
4066 && (i.tm.base_opcode == 0xa8
4067 || (i.tm.base_opcode == 0xf6
4068 && i.tm.extension_opcode == 0x0)))
4069 {
4070 /* Optimize: -Os:
4071 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4072 */
4073 unsigned int base_regnum = i.op[1].regs->reg_num;
4074 if (flag_code == CODE_64BIT || base_regnum < 4)
4075 {
4076 i.types[1].bitfield.byte = 1;
4077 /* Ignore the suffix. */
4078 i.suffix = 0;
4079 /* Convert to byte registers. */
4080 if (i.types[1].bitfield.word)
4081 j = 16;
4082 else if (i.types[1].bitfield.dword)
4083 j = 32;
4084 else
4085 j = 48;
4086 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087 j += 8;
4088 i.op[1].regs -= j;
4089 }
4090 }
4091 else if (flag_code == CODE_64BIT
4092 && !is_any_vex_encoding (&i.tm)
4093 && ((i.types[1].bitfield.qword
4094 && i.reg_operands == 1
4095 && i.imm_operands == 1
4096 && i.op[0].imms->X_op == O_constant
4097 && ((i.tm.base_opcode == 0xb8
4098 && i.tm.extension_opcode == None
4099 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4101 && ((i.tm.base_opcode == 0x24
4102 || i.tm.base_opcode == 0xa8)
4103 || (i.tm.base_opcode == 0x80
4104 && i.tm.extension_opcode == 0x4)
4105 || ((i.tm.base_opcode == 0xf6
4106 || (i.tm.base_opcode | 1) == 0xc7)
4107 && i.tm.extension_opcode == 0x0)))
4108 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109 && i.tm.base_opcode == 0x83
4110 && i.tm.extension_opcode == 0x4)))
4111 || (i.types[0].bitfield.qword
4112 && ((i.reg_operands == 2
4113 && i.op[0].regs == i.op[1].regs
4114 && (i.tm.base_opcode == 0x30
4115 || i.tm.base_opcode == 0x28))
4116 || (i.reg_operands == 1
4117 && i.operands == 1
4118 && i.tm.base_opcode == 0x30)))))
4119 {
4120 /* Optimize: -O:
4121 andq $imm31, %r64 -> andl $imm31, %r32
4122 andq $imm7, %r64 -> andl $imm7, %r32
4123 testq $imm31, %r64 -> testl $imm31, %r32
4124 xorq %r64, %r64 -> xorl %r32, %r32
4125 subq %r64, %r64 -> subl %r32, %r32
4126 movq $imm31, %r64 -> movl $imm31, %r32
4127 movq $imm32, %r64 -> movl $imm32, %r32
4128 */
4129 i.tm.opcode_modifier.norex64 = 1;
4130 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4131 {
4132 /* Handle
4133 movq $imm31, %r64 -> movl $imm31, %r32
4134 movq $imm32, %r64 -> movl $imm32, %r32
4135 */
4136 i.tm.operand_types[0].bitfield.imm32 = 1;
4137 i.tm.operand_types[0].bitfield.imm32s = 0;
4138 i.tm.operand_types[0].bitfield.imm64 = 0;
4139 i.types[0].bitfield.imm32 = 1;
4140 i.types[0].bitfield.imm32s = 0;
4141 i.types[0].bitfield.imm64 = 0;
4142 i.types[1].bitfield.dword = 1;
4143 i.types[1].bitfield.qword = 0;
4144 if ((i.tm.base_opcode | 1) == 0xc7)
4145 {
4146 /* Handle
4147 movq $imm31, %r64 -> movl $imm31, %r32
4148 */
4149 i.tm.base_opcode = 0xb8;
4150 i.tm.extension_opcode = None;
4151 i.tm.opcode_modifier.w = 0;
4152 i.tm.opcode_modifier.modrm = 0;
4153 }
4154 }
4155 }
4156 else if (optimize > 1
4157 && !optimize_for_space
4158 && !is_any_vex_encoding (&i.tm)
4159 && i.reg_operands == 2
4160 && i.op[0].regs == i.op[1].regs
4161 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164 {
4165 /* Optimize: -O2:
4166 andb %rN, %rN -> testb %rN, %rN
4167 andw %rN, %rN -> testw %rN, %rN
4168 andq %rN, %rN -> testq %rN, %rN
4169 orb %rN, %rN -> testb %rN, %rN
4170 orw %rN, %rN -> testw %rN, %rN
4171 orq %rN, %rN -> testq %rN, %rN
4172
4173 and outside of 64-bit mode
4174
4175 andl %rN, %rN -> testl %rN, %rN
4176 orl %rN, %rN -> testl %rN, %rN
4177 */
4178 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179 }
4180 else if (i.reg_operands == 3
4181 && i.op[0].regs == i.op[1].regs
4182 && !i.types[2].bitfield.xmmword
4183 && (i.tm.opcode_modifier.vex
4184 || ((!i.mask || i.mask->zeroing)
4185 && !i.rounding
4186 && is_evex_encoding (&i.tm)
4187 && (i.vec_encoding != vex_encoding_evex
4188 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4189 || i.tm.cpu_flags.bitfield.cpuavx512vl
4190 || (i.tm.operand_types[2].bitfield.zmmword
4191 && i.types[2].bitfield.ymmword))))
4192 && ((i.tm.base_opcode == 0x55
4193 || i.tm.base_opcode == 0x6655
4194 || i.tm.base_opcode == 0x66df
4195 || i.tm.base_opcode == 0x57
4196 || i.tm.base_opcode == 0x6657
4197 || i.tm.base_opcode == 0x66ef
4198 || i.tm.base_opcode == 0x66f8
4199 || i.tm.base_opcode == 0x66f9
4200 || i.tm.base_opcode == 0x66fa
4201 || i.tm.base_opcode == 0x66fb
4202 || i.tm.base_opcode == 0x42
4203 || i.tm.base_opcode == 0x6642
4204 || i.tm.base_opcode == 0x47
4205 || i.tm.base_opcode == 0x6647)
4206 && i.tm.extension_opcode == None))
4207 {
4208 /* Optimize: -O1:
4209 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210 vpsubq and vpsubw:
4211 EVEX VOP %zmmM, %zmmM, %zmmN
4212 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4213 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4214 EVEX VOP %ymmM, %ymmM, %ymmN
4215 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4216 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4217 VEX VOP %ymmM, %ymmM, %ymmN
4218 -> VEX VOP %xmmM, %xmmM, %xmmN
4219 VOP, one of vpandn and vpxor:
4220 VEX VOP %ymmM, %ymmM, %ymmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN
4222 VOP, one of vpandnd and vpandnq:
4223 EVEX VOP %zmmM, %zmmM, %zmmN
4224 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4226 EVEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229 VOP, one of vpxord and vpxorq:
4230 EVEX VOP %zmmM, %zmmM, %zmmN
4231 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4232 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4233 EVEX VOP %ymmM, %ymmM, %ymmN
4234 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4235 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4236 VOP, one of kxord and kxorq:
4237 VEX VOP %kM, %kM, %kN
4238 -> VEX kxorw %kM, %kM, %kN
4239 VOP, one of kandnd and kandnq:
4240 VEX VOP %kM, %kM, %kN
4241 -> VEX kandnw %kM, %kM, %kN
4242 */
4243 if (is_evex_encoding (&i.tm))
4244 {
4245 if (i.vec_encoding != vex_encoding_evex)
4246 {
4247 i.tm.opcode_modifier.vex = VEX128;
4248 i.tm.opcode_modifier.vexw = VEXW0;
4249 i.tm.opcode_modifier.evex = 0;
4250 }
4251 else if (optimize > 1)
4252 i.tm.opcode_modifier.evex = EVEX128;
4253 else
4254 return;
4255 }
4256 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4257 {
4258 i.tm.base_opcode &= 0xff;
4259 i.tm.opcode_modifier.vexw = VEXW0;
4260 }
4261 else
4262 i.tm.opcode_modifier.vex = VEX128;
4263
4264 if (i.tm.opcode_modifier.vex)
4265 for (j = 0; j < 3; j++)
4266 {
4267 i.types[j].bitfield.xmmword = 1;
4268 i.types[j].bitfield.ymmword = 0;
4269 }
4270 }
4271 else if (i.vec_encoding != vex_encoding_evex
4272 && !i.types[0].bitfield.zmmword
4273 && !i.types[1].bitfield.zmmword
4274 && !i.mask
4275 && !i.broadcast
4276 && is_evex_encoding (&i.tm)
4277 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4279 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280 || (i.tm.base_opcode & ~4) == 0x66db
4281 || (i.tm.base_opcode & ~4) == 0x66eb)
4282 && i.tm.extension_opcode == None)
4283 {
4284 /* Optimize: -O1:
4285 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286 vmovdqu32 and vmovdqu64:
4287 EVEX VOP %xmmM, %xmmN
4288 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289 EVEX VOP %ymmM, %ymmN
4290 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291 EVEX VOP %xmmM, mem
4292 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293 EVEX VOP %ymmM, mem
4294 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295 EVEX VOP mem, %xmmN
4296 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4297 EVEX VOP mem, %ymmN
4298 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4299 VOP, one of vpand, vpandn, vpor, vpxor:
4300 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304 EVEX VOP{d,q} mem, %xmmM, %xmmN
4305 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP{d,q} mem, %ymmM, %ymmN
4307 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4308 */
4309 for (j = 0; j < i.operands; j++)
4310 if (operand_type_check (i.types[j], disp)
4311 && i.op[j].disps->X_op == O_constant)
4312 {
4313 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315 bytes, we choose EVEX Disp8 over VEX Disp32. */
4316 int evex_disp8, vex_disp8;
4317 unsigned int memshift = i.memshift;
4318 offsetT n = i.op[j].disps->X_add_number;
4319
4320 evex_disp8 = fits_in_disp8 (n);
4321 i.memshift = 0;
4322 vex_disp8 = fits_in_disp8 (n);
4323 if (evex_disp8 != vex_disp8)
4324 {
4325 i.memshift = memshift;
4326 return;
4327 }
4328
4329 i.types[j].bitfield.disp8 = vex_disp8;
4330 break;
4331 }
4332 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4334 i.tm.opcode_modifier.vex
4335 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336 i.tm.opcode_modifier.vexw = VEXW0;
4337 /* VPAND, VPOR, and VPXOR are commutative. */
4338 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339 i.tm.opcode_modifier.commutative = 1;
4340 i.tm.opcode_modifier.evex = 0;
4341 i.tm.opcode_modifier.masking = 0;
4342 i.tm.opcode_modifier.broadcast = 0;
4343 i.tm.opcode_modifier.disp8memshift = 0;
4344 i.memshift = 0;
4345 if (j < i.operands)
4346 i.types[j].bitfield.disp8
4347 = fits_in_disp8 (i.op[j].disps->X_add_number);
4348 }
4349 }
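
/* Byte counts for one of the transforms above, as a sanity check
   (sketch, 64-bit mode):
     xorq %rax, %rax    48 31 c0    3 bytes
     xorl %eax, %eax       31 c0    2 bytes
   Dropping REX.W is safe because a write to %eax zero-extends into
   %rax anyway.  */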
4350
4351 /* Return non-zero for load instruction. */
4352
4353 static int
4354 load_insn_p (void)
4355 {
4356 unsigned int dest;
4357 int any_vex_p = is_any_vex_encoding (&i.tm);
4358 unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360 if (!any_vex_p)
4361 {
4362 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4364 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4365 if (i.tm.opcode_modifier.anysize)
4366 return 0;
4367
4368 /* pop, popf, popa. */
4369 if (strcmp (i.tm.name, "pop") == 0
4370 || i.tm.base_opcode == 0x9d
4371 || i.tm.base_opcode == 0x61)
4372 return 1;
4373
4374 /* movs, cmps, lods, scas. */
4375 if ((i.tm.base_opcode | 0xb) == 0xaf)
4376 return 1;
4377
4378 /* outs, xlatb. */
4379 if (base_opcode == 0x6f
4380 || i.tm.base_opcode == 0xd7)
4381 return 1;
4382 /* NB: AMD-specific insns with implicit memory operands are
4383 intentionally not covered. */
4384 }
4385
4386 /* No memory operand. */
4387 if (!i.mem_operands)
4388 return 0;
4389
4390 if (any_vex_p)
4391 {
4392 /* vldmxcsr. */
4393 if (i.tm.base_opcode == 0xae
4394 && i.tm.opcode_modifier.vex
4395 && i.tm.opcode_modifier.vexopcode == VEX0F
4396 && i.tm.extension_opcode == 2)
4397 return 1;
4398 }
4399 else
4400 {
4401 /* test, not, neg, mul, imul, div, idiv. */
4402 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403 && i.tm.extension_opcode != 1)
4404 return 1;
4405
4406 /* inc, dec. */
4407 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408 return 1;
4409
4410 /* add, or, adc, sbb, and, sub, xor, cmp. */
4411 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412 return 1;
4413
4414 /* bt, bts, btr, btc. */
4415 if (i.tm.base_opcode == 0xfba
4416 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417 return 1;
4418
4419 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420 if ((base_opcode == 0xc1
4421 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422 && i.tm.extension_opcode != 6)
4423 return 1;
4424
4425 /* cmpxchg8b, cmpxchg16b, xrstors. */
4426 if (i.tm.base_opcode == 0xfc7
4427 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428 return 1;
4429
4430 /* fxrstor, ldmxcsr, xrstor. */
4431 if (i.tm.base_opcode == 0xfae
4432 && (i.tm.extension_opcode == 1
4433 || i.tm.extension_opcode == 2
4434 || i.tm.extension_opcode == 5))
4435 return 1;
4436
4437 /* lgdt, lidt, lmsw. */
4438 if (i.tm.base_opcode == 0xf01
4439 && (i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 6))
4442 return 1;
4443
4444 /* vmptrld */
4445 if (i.tm.base_opcode == 0xfc7
4446 && i.tm.extension_opcode == 6)
4447 return 1;
4448
4449 /* Check for x87 instructions. */
4450 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451 {
4452 /* Skip fst, fstp, fstenv, fstcw. */
4453 if (i.tm.base_opcode == 0xd9
4454 && (i.tm.extension_opcode == 2
4455 || i.tm.extension_opcode == 3
4456 || i.tm.extension_opcode == 6
4457 || i.tm.extension_opcode == 7))
4458 return 0;
4459
4460 /* Skip fisttp, fist, fistp, fstp. */
4461 if (i.tm.base_opcode == 0xdb
4462 && (i.tm.extension_opcode == 1
4463 || i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 7))
4466 return 0;
4467
4468 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4469 if (i.tm.base_opcode == 0xdd
4470 && (i.tm.extension_opcode == 1
4471 || i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4478 if (i.tm.base_opcode == 0xdf
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 return 1;
4487 }
4488 }
4489
4490 dest = i.operands - 1;
4491
4492 /* Check fake imm8 operand and 3 source operands. */
4493 if ((i.tm.opcode_modifier.immext
4494 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495 && i.types[dest].bitfield.imm8)
4496 dest--;
4497
4498 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4499 if (!any_vex_p
4500 && (base_opcode == 0x1
4501 || base_opcode == 0x9
4502 || base_opcode == 0x11
4503 || base_opcode == 0x19
4504 || base_opcode == 0x21
4505 || base_opcode == 0x29
4506 || base_opcode == 0x31
4507 || base_opcode == 0x39
4508 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509 || base_opcode == 0xfc1))
4510 return 1;
4511
4512 /* Check for load instruction. */
4513 return (i.types[dest].bitfield.class != ClassNone
4514 || i.types[dest].bitfield.instance == Accum);
4515 }
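
/* Illustrative classifications from the logic above:
     movl (%rax), %ebx    load (register destination)
     addl %ebx, (%rax)    load (read-modify-write on memory)
     movl %ebx, (%rax)    not a load (plain store)  */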
4516
4517 /* Output lfence, 0xfaee8, after instruction. */
4518
4519 static void
4520 insert_lfence_after (void)
4521 {
4522 if (lfence_after_load && load_insn_p ())
4523 {
4524 /* There are also two REP string instructions that require
4525 special treatment. Specifically, the compare string (CMPS)
4526 and scan string (SCAS) instructions set EFLAGS in a manner
4527 that depends on the data being compared/scanned. When used
4528 with a REP prefix, the number of iterations may therefore
4529 vary depending on this data. If the data is a program secret
4530 chosen by the adversary using an LVI method,
4531 then this data-dependent behavior may leak some aspect
4532 of the secret. */
4533 if (((i.tm.base_opcode | 0x1) == 0xa7
4534 || (i.tm.base_opcode | 0x1) == 0xaf)
4535 && i.prefix[REP_PREFIX])
4536 {
4537 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538 i.tm.name);
4539 }
4540 char *p = frag_more (3);
4541 *p++ = 0xf;
4542 *p++ = 0xae;
4543 *p = 0xe8;
4544 }
4545 }
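
/* E.g. with -mlfence-after-load=yes, "movl (%rax), %ebx" is followed
   by the three lfence bytes (sketch):
     8b 18       movl (%rax), %ebx
     0f ae e8    lfence  */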
4546
4547 /* Output lfence, 0xfaee8, before instruction. */
4548
4549 static void
4550 insert_lfence_before (void)
4551 {
4552 char *p;
4553
4554 if (is_any_vex_encoding (&i.tm))
4555 return;
4556
4557 if (i.tm.base_opcode == 0xff
4558 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559 {
4560 /* Insert lfence before indirect branch if needed. */
4561
4562 if (lfence_before_indirect_branch == lfence_branch_none)
4563 return;
4564
4565 if (i.operands != 1)
4566 abort ();
4567
4568 if (i.reg_operands == 1)
4569 {
4570 /* Indirect branch via register. Don't insert lfence with
4571 -mlfence-after-load=yes. */
4572 if (lfence_after_load
4573 || lfence_before_indirect_branch == lfence_branch_memory)
4574 return;
4575 }
4576 else if (i.mem_operands == 1
4577 && lfence_before_indirect_branch != lfence_branch_register)
4578 {
4579 as_warn (_("indirect `%s` with memory operand should be avoided"),
4580 i.tm.name);
4581 return;
4582 }
4583 else
4584 return;
4585
4586 if (last_insn.kind != last_insn_other
4587 && last_insn.seg == now_seg)
4588 {
4589 as_warn_where (last_insn.file, last_insn.line,
4590 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591 last_insn.name, i.tm.name);
4592 return;
4593 }
4594
4595 p = frag_more (3);
4596 *p++ = 0xf;
4597 *p++ = 0xae;
4598 *p = 0xe8;
4599 return;
4600 }
4601
4602 /* Output or/not/shl and lfence before near ret. */
4603 if (lfence_before_ret != lfence_before_ret_none
4604 && (i.tm.base_opcode == 0xc2
4605 || i.tm.base_opcode == 0xc3))
4606 {
4607 if (last_insn.kind != last_insn_other
4608 && last_insn.seg == now_seg)
4609 {
4610 as_warn_where (last_insn.file, last_insn.line,
4611 _("`%s` skips -mlfence-before-ret on `%s`"),
4612 last_insn.name, i.tm.name);
4613 return;
4614 }
4615
4616 /* A near ret ignores the operand size override under CPU64. */
4617 char prefix = flag_code == CODE_64BIT
4618 ? 0x48
4619 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4620
4621 if (lfence_before_ret == lfence_before_ret_not)
4622 {
4623 /* not: 0xf71424, may add prefix
4624 for operand size override or 64-bit code. */
4625 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626 if (prefix)
4627 *p++ = prefix;
4628 *p++ = 0xf7;
4629 *p++ = 0x14;
4630 *p++ = 0x24;
4631 if (prefix)
4632 *p++ = prefix;
4633 *p++ = 0xf7;
4634 *p++ = 0x14;
4635 *p++ = 0x24;
4636 }
4637 else
4638 {
4639 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640 if (prefix)
4641 *p++ = prefix;
4642 if (lfence_before_ret == lfence_before_ret_or)
4643 {
4644 /* or: 0x830c2400, may add prefix
4645 for operand size override or 64-bit code. */
4646 *p++ = 0x83;
4647 *p++ = 0x0c;
4648 }
4649 else
4650 {
4651 /* shl: 0xc1242400, may add prefix
4652 for operand size override or 64-bit code. */
4653 *p++ = 0xc1;
4654 *p++ = 0x24;
4655 }
4656
4657 *p++ = 0x24;
4658 *p++ = 0x0;
4659 }
4660
4661 *p++ = 0xf;
4662 *p++ = 0xae;
4663 *p = 0xe8;
4664 }
4665 }
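
/* Example output (sketch, 64-bit mode, -mlfence-before-ret=or): a
   plain "ret" is emitted as
     48 83 0c 24 00    orq $0x0, (%rsp)
     0f ae e8          lfence
     c3                ret
   so the return address is refreshed on the stack and an lfence is
   placed immediately before the ret that consumes it.  */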
4666
4667 /* This is the guts of the machine-dependent assembler. LINE points to a
4668 machine dependent instruction. This function is supposed to emit
4669 the frags/bytes it assembles to. */
4670
4671 void
4672 md_assemble (char *line)
4673 {
4674 unsigned int j;
4675 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4676 const insn_template *t;
4677
4678 /* Initialize globals. */
4679 memset (&i, '\0', sizeof (i));
4680 for (j = 0; j < MAX_OPERANDS; j++)
4681 i.reloc[j] = NO_RELOC;
4682 memset (disp_expressions, '\0', sizeof (disp_expressions));
4683 memset (im_expressions, '\0', sizeof (im_expressions));
4684 save_stack_p = save_stack;
4685
4686 /* First parse an instruction mnemonic & call i386_operand for the operands.
4687 We assume that the scrubber has arranged it so that line[0] is the valid
4688 start of a (possibly prefixed) mnemonic. */
4689
4690 line = parse_insn (line, mnemonic);
4691 if (line == NULL)
4692 return;
4693 mnem_suffix = i.suffix;
4694
4695 line = parse_operands (line, mnemonic);
4696 this_operand = -1;
4697 xfree (i.memop1_string);
4698 i.memop1_string = NULL;
4699 if (line == NULL)
4700 return;
4701
4702 /* Now we've parsed the mnemonic into a set of templates, and have the
4703 operands at hand. */
4704
4705 /* All Intel opcodes have reversed operands except for "bound", "enter",
4706 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4707 intersegment "jmp" and "call" instructions with 2 immediate operands so
4708 that the immediate segment precedes the offset, as it does when in AT&T
4709 mode. */
4710 if (intel_syntax
4711 && i.operands > 1
4712 && (strcmp (mnemonic, "bound") != 0)
4713 && (strcmp (mnemonic, "invlpga") != 0)
4714 && (strncmp (mnemonic, "monitor", 7) != 0)
4715 && (strncmp (mnemonic, "mwait", 5) != 0)
4716 && (strcmp (mnemonic, "tpause") != 0)
4717 && (strcmp (mnemonic, "umwait") != 0)
4718 && !(operand_type_check (i.types[0], imm)
4719 && operand_type_check (i.types[1], imm)))
4720 swap_operands ();
4721
4722 /* The order of the immediates should be reversed
4723 for 2 immediates extrq and insertq instructions */
4724 if (i.imm_operands == 2
4725 && (strcmp (mnemonic, "extrq") == 0
4726 || strcmp (mnemonic, "insertq") == 0))
4727 swap_2_operands (0, 1);
4728
4729 if (i.imm_operands)
4730 optimize_imm ();
4731
4732 /* Don't optimize displacement for movabs since it only takes 64bit
4733 displacement. */
4734 if (i.disp_operands
4735 && i.disp_encoding != disp_encoding_32bit
4736 && (flag_code != CODE_64BIT
4737 || strcmp (mnemonic, "movabs") != 0))
4738 optimize_disp ();
4739
4740 /* Next, we find a template that matches the given insn,
4741 making sure the overlap of the given operands types is consistent
4742 with the template operand types. */
4743
4744 if (!(t = match_template (mnem_suffix)))
4745 return;
4746
4747 if (sse_check != check_none
4748 && !i.tm.opcode_modifier.noavx
4749 && !i.tm.cpu_flags.bitfield.cpuavx
4750 && !i.tm.cpu_flags.bitfield.cpuavx512f
4751 && (i.tm.cpu_flags.bitfield.cpusse
4752 || i.tm.cpu_flags.bitfield.cpusse2
4753 || i.tm.cpu_flags.bitfield.cpusse3
4754 || i.tm.cpu_flags.bitfield.cpussse3
4755 || i.tm.cpu_flags.bitfield.cpusse4_1
4756 || i.tm.cpu_flags.bitfield.cpusse4_2
4757 || i.tm.cpu_flags.bitfield.cpupclmul
4758 || i.tm.cpu_flags.bitfield.cpuaes
4759 || i.tm.cpu_flags.bitfield.cpusha
4760 || i.tm.cpu_flags.bitfield.cpugfni))
4761 {
4762 (sse_check == check_warning
4763 ? as_warn
4764 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765 }
4766
4767 if (i.tm.opcode_modifier.fwait)
4768 if (!add_prefix (FWAIT_OPCODE))
4769 return;
4770
4771 /* Check if REP prefix is OK. */
4772 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773 {
4774 as_bad (_("invalid instruction `%s' after `%s'"),
4775 i.tm.name, i.rep_prefix);
4776 return;
4777 }
4778
4779 /* Check for lock without a lockable instruction. Destination operand
4780 must be memory unless it is xchg (0x86). */
4781 if (i.prefix[LOCK_PREFIX]
4782 && (!i.tm.opcode_modifier.islockable
4783 || i.mem_operands == 0
4784 || (i.tm.base_opcode != 0x86
4785 && !(i.flags[i.operands - 1] & Operand_Mem))))
4786 {
4787 as_bad (_("expecting lockable instruction after `lock'"));
4788 return;
4789 }
4790
4791 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4792 if (i.prefix[DATA_PREFIX]
4793 && (is_any_vex_encoding (&i.tm)
4794 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4796 {
4797 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798 return;
4799 }
4800
4801 /* Check if HLE prefix is OK. */
4802 if (i.hle_prefix && !check_hle ())
4803 return;
4804
4805 /* Check BND prefix. */
4806 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807 as_bad (_("expecting valid branch instruction after `bnd'"));
4808
4809 /* Check NOTRACK prefix. */
4810 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811 as_bad (_("expecting indirect branch instruction after `notrack'"));
4812
4813 if (i.tm.cpu_flags.bitfield.cpumpx)
4814 {
4815 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817 else if (flag_code != CODE_16BIT
4818 ? i.prefix[ADDR_PREFIX]
4819 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821 }
4822
4823 /* Insert BND prefix. */
4824 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825 {
4826 if (!i.prefix[BND_PREFIX])
4827 add_prefix (BND_PREFIX_OPCODE);
4828 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829 {
4830 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832 }
4833 }
4834
4835 /* Check string instruction segment overrides. */
4836 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4837 {
4838 gas_assert (i.mem_operands);
4839 if (!check_string ())
4840 return;
4841 i.disp_operands = 0;
4842 }
4843
4844 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845 optimize_encoding ();
4846
4847 if (!process_suffix ())
4848 return;
4849
4850 /* Update operand types. */
4851 for (j = 0; j < i.operands; j++)
4852 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853
4854 /* Make still unresolved immediate matches conform to size of immediate
4855 given in i.suffix. */
4856 if (!finalize_imm ())
4857 return;
4858
4859 if (i.types[0].bitfield.imm1)
4860 i.imm_operands = 0; /* kludge for shift insns. */
4861
4862 /* We only need to check those implicit registers for instructions
4863 with 3 operands or less. */
4864 if (i.operands <= 3)
4865 for (j = 0; j < i.operands; j++)
4866 if (i.types[j].bitfield.instance != InstanceNone
4867 && !i.types[j].bitfield.xmmword)
4868 i.reg_operands--;
4869
4870 /* For insns with operands there are more diddles to do to the opcode. */
4871 if (i.operands)
4872 {
4873 if (!process_operands ())
4874 return;
4875 }
4876 else
4877 {
4878 if (i.tm.opcode_modifier.immext)
4879 process_immext ();
4880
4881 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4882 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4883 as_warn (_("translating to `%sp'"), i.tm.name);
4884 }
4885
4886 if (is_any_vex_encoding (&i.tm))
4887 {
4888 if (!cpu_arch_flags.bitfield.cpui286)
4889 {
4890 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4891 i.tm.name);
4892 return;
4893 }
4894
4895 /* Check for explicit REX prefix. */
4896 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4897 {
4898 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4899 return;
4900 }
4901
4902 if (i.tm.opcode_modifier.vex)
4903 build_vex_prefix (t);
4904 else
4905 build_evex_prefix ();
4906
4907 /* The individual REX.RXBW bits got consumed. */
4908 i.rex &= REX_OPCODE;
4909 }
4910
4911 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4912 instructions may define INT_OPCODE as well, so avoid this corner
4913 case for those instructions that use MODRM. */
4914 if (i.tm.base_opcode == INT_OPCODE
4915 && !i.tm.opcode_modifier.modrm
4916 && i.op[0].imms->X_add_number == 3)
4917 {
4918 i.tm.base_opcode = INT3_OPCODE;
4919 i.imm_operands = 0;
4920 }
4921
4922 if ((i.tm.opcode_modifier.jump == JUMP
4923 || i.tm.opcode_modifier.jump == JUMP_BYTE
4924 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4925 && i.op[0].disps->X_op == O_constant)
4926 {
4927 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4928 the absolute address given by the constant. Since ix86 jumps and
4929 calls are pc relative, we need to generate a reloc. */
4930 i.op[0].disps->X_add_symbol = &abs_symbol;
4931 i.op[0].disps->X_op = O_symbol;
4932 }
4933
4934 /* For 8 bit registers we need an empty rex prefix. Also if the
4935 instruction already has a prefix, we need to convert old
4936 registers to new ones. */
4937
4938 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4939 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4940 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4941 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4942 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4943 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4944 && i.rex != 0))
4945 {
4946 int x;
4947
4948 i.rex |= REX_OPCODE;
4949 for (x = 0; x < 2; x++)
4950 {
4951 /* Look for 8 bit operand that uses old registers. */
4952 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4953 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4954 {
4955 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4956 /* In case it is a "hi" register, give up. */
4957 if (i.op[x].regs->reg_num > 3)
4958 as_bad (_("can't encode register '%s%s' in an "
4959 "instruction requiring REX prefix."),
4960 register_prefix, i.op[x].regs->reg_name);
4961
4962 /* Otherwise it is equivalent to the extended register.
4963 Since the encoding doesn't change this is merely
4964 cosmetic cleanup for debug output. */
4965
4966 i.op[x].regs = i.op[x].regs + 8;
4967 }
4968 }
4969 }
4970
4971 if (i.rex == 0 && i.rex_encoding)
4972 {
4973 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4974 that uses legacy register. If it is "hi" register, don't add
4975 the REX_OPCODE byte. */
4976 int x;
4977 for (x = 0; x < 2; x++)
4978 if (i.types[x].bitfield.class == Reg
4979 && i.types[x].bitfield.byte
4980 && (i.op[x].regs->reg_flags & RegRex64) == 0
4981 && i.op[x].regs->reg_num > 3)
4982 {
4983 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4984 i.rex_encoding = FALSE;
4985 break;
4986 }
4987
4988 if (i.rex_encoding)
4989 i.rex = REX_OPCODE;
4990 }
4991
4992 if (i.rex != 0)
4993 add_prefix (REX_OPCODE | i.rex);
4994
4995 insert_lfence_before ();
4996
4997 /* We are ready to output the insn. */
4998 output_insn ();
4999
5000 insert_lfence_after ();
5001
5002 last_insn.seg = now_seg;
5003
5004 if (i.tm.opcode_modifier.isprefix)
5005 {
5006 last_insn.kind = last_insn_prefix;
5007 last_insn.name = i.tm.name;
5008 last_insn.file = as_where (&last_insn.line);
5009 }
5010 else
5011 last_insn.kind = last_insn_other;
5012 }
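
/* Rough pass order driven by md_assemble above: parse_insn,
   parse_operands, optimize_imm / optimize_disp, match_template, the
   prefix and operand checks, optional optimize_encoding,
   process_suffix, process_operands, VEX/EVEX prefix building, and
   finally output_insn bracketed by the lfence insertion hooks.  */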
5013
5014 static char *
5015 parse_insn (char *line, char *mnemonic)
5016 {
5017 char *l = line;
5018 char *token_start = l;
5019 char *mnem_p;
5020 int supported;
5021 const insn_template *t;
5022 char *dot_p = NULL;
5023
5024 while (1)
5025 {
5026 mnem_p = mnemonic;
5027 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5028 {
5029 if (*mnem_p == '.')
5030 dot_p = mnem_p;
5031 mnem_p++;
5032 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5033 {
5034 as_bad (_("no such instruction: `%s'"), token_start);
5035 return NULL;
5036 }
5037 l++;
5038 }
5039 if (!is_space_char (*l)
5040 && *l != END_OF_INSN
5041 && (intel_syntax
5042 || (*l != PREFIX_SEPARATOR
5043 && *l != ',')))
5044 {
5045 as_bad (_("invalid character %s in mnemonic"),
5046 output_invalid (*l));
5047 return NULL;
5048 }
5049 if (token_start == l)
5050 {
5051 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5052 as_bad (_("expecting prefix; got nothing"));
5053 else
5054 as_bad (_("expecting mnemonic; got nothing"));
5055 return NULL;
5056 }
5057
5058 /* Look up instruction (or prefix) via hash table. */
5059 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5060
5061 if (*l != END_OF_INSN
5062 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5063 && current_templates
5064 && current_templates->start->opcode_modifier.isprefix)
5065 {
5066 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5067 {
5068 as_bad ((flag_code != CODE_64BIT
5069 ? _("`%s' is only supported in 64-bit mode")
5070 : _("`%s' is not supported in 64-bit mode")),
5071 current_templates->start->name);
5072 return NULL;
5073 }
5074 /* If we are in 16-bit mode, do not allow addr16 or data16.
5075 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5076 if ((current_templates->start->opcode_modifier.size == SIZE16
5077 || current_templates->start->opcode_modifier.size == SIZE32)
5078 && flag_code != CODE_64BIT
5079 && ((current_templates->start->opcode_modifier.size == SIZE32)
5080 ^ (flag_code == CODE_16BIT)))
5081 {
5082 as_bad (_("redundant %s prefix"),
5083 current_templates->start->name);
5084 return NULL;
5085 }
5086 if (current_templates->start->opcode_length == 0)
5087 {
5088 /* Handle pseudo prefixes. */
5089 switch (current_templates->start->base_opcode)
5090 {
5091 case 0x0:
5092 /* {disp8} */
5093 i.disp_encoding = disp_encoding_8bit;
5094 break;
5095 case 0x1:
5096 /* {disp32} */
5097 i.disp_encoding = disp_encoding_32bit;
5098 break;
5099 case 0x2:
5100 /* {load} */
5101 i.dir_encoding = dir_encoding_load;
5102 break;
5103 case 0x3:
5104 /* {store} */
5105 i.dir_encoding = dir_encoding_store;
5106 break;
5107 case 0x4:
5108 /* {vex} */
5109 i.vec_encoding = vex_encoding_vex;
5110 break;
5111 case 0x5:
5112 /* {vex3} */
5113 i.vec_encoding = vex_encoding_vex3;
5114 break;
5115 case 0x6:
5116 /* {evex} */
5117 i.vec_encoding = vex_encoding_evex;
5118 break;
5119 case 0x7:
5120 /* {rex} */
5121 i.rex_encoding = TRUE;
5122 break;
5123 case 0x8:
5124 /* {nooptimize} */
5125 i.no_optimize = TRUE;
5126 break;
5127 default:
5128 abort ();
5129 }
5130 }
5131 else
5132 {
5133 /* Add prefix, checking for repeated prefixes. */
5134 switch (add_prefix (current_templates->start->base_opcode))
5135 {
5136 case PREFIX_EXIST:
5137 return NULL;
5138 case PREFIX_DS:
5139 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5140 i.notrack_prefix = current_templates->start->name;
5141 break;
5142 case PREFIX_REP:
5143 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5144 i.hle_prefix = current_templates->start->name;
5145 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5146 i.bnd_prefix = current_templates->start->name;
5147 else
5148 i.rep_prefix = current_templates->start->name;
5149 break;
5150 default:
5151 break;
5152 }
5153 }
5154 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5155 token_start = ++l;
5156 }
5157 else
5158 break;
5159 }
5160
5161 if (!current_templates)
5162 {
5163 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5164 Check if we should swap operands or force a 32bit displacement in
5165 encoding. */
5166 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5167 i.dir_encoding = dir_encoding_swap;
5168 else if (mnem_p - 3 == dot_p
5169 && dot_p[1] == 'd'
5170 && dot_p[2] == '8')
5171 i.disp_encoding = disp_encoding_8bit;
5172 else if (mnem_p - 4 == dot_p
5173 && dot_p[1] == 'd'
5174 && dot_p[2] == '3'
5175 && dot_p[3] == '2')
5176 i.disp_encoding = disp_encoding_32bit;
5177 else
5178 goto check_suffix;
5179 mnem_p = dot_p;
5180 *dot_p = '\0';
5181 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5182 }
5183
5184 if (!current_templates)
5185 {
5186 check_suffix:
5187 if (mnem_p > mnemonic)
5188 {
5189 /* See if we can get a match by trimming off a suffix. */
5190 switch (mnem_p[-1])
5191 {
5192 case WORD_MNEM_SUFFIX:
5193 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5194 i.suffix = SHORT_MNEM_SUFFIX;
5195 else
5196 /* Fall through. */
5197 case BYTE_MNEM_SUFFIX:
5198 case QWORD_MNEM_SUFFIX:
5199 i.suffix = mnem_p[-1];
5200 mnem_p[-1] = '\0';
5201 current_templates = (const templates *) hash_find (op_hash,
5202 mnemonic);
5203 break;
5204 case SHORT_MNEM_SUFFIX:
5205 case LONG_MNEM_SUFFIX:
5206 if (!intel_syntax)
5207 {
5208 i.suffix = mnem_p[-1];
5209 mnem_p[-1] = '\0';
5210 current_templates = (const templates *) hash_find (op_hash,
5211 mnemonic);
5212 }
5213 break;
5214
5215 /* Intel Syntax. */
5216 case 'd':
5217 if (intel_syntax)
5218 {
5219 if (intel_float_operand (mnemonic) == 1)
5220 i.suffix = SHORT_MNEM_SUFFIX;
5221 else
5222 i.suffix = LONG_MNEM_SUFFIX;
5223 mnem_p[-1] = '\0';
5224 current_templates = (const templates *) hash_find (op_hash,
5225 mnemonic);
5226 }
5227 break;
5228 }
5229 }
5230
5231 if (!current_templates)
5232 {
5233 as_bad (_("no such instruction: `%s'"), token_start);
5234 return NULL;
5235 }
5236 }
5237
5238 if (current_templates->start->opcode_modifier.jump == JUMP
5239 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5240 {
5241 /* Check for a branch hint. We allow ",pt" and ",pn" for
5242 predict taken and predict not taken respectively.
5243 I'm not sure that branch hints actually do anything on loop
5244 and jcxz insns (JumpByte) for current Pentium4 chips. They
5245 may work in the future and it doesn't hurt to accept them
5246 now. */
5247 if (l[0] == ',' && l[1] == 'p')
5248 {
5249 if (l[2] == 't')
5250 {
5251 if (!add_prefix (DS_PREFIX_OPCODE))
5252 return NULL;
5253 l += 3;
5254 }
5255 else if (l[2] == 'n')
5256 {
5257 if (!add_prefix (CS_PREFIX_OPCODE))
5258 return NULL;
5259 l += 3;
5260 }
5261 }
5262 }
5263 /* Any other comma loses. */
5264 if (*l == ',')
5265 {
5266 as_bad (_("invalid character %s in mnemonic"),
5267 output_invalid (*l));
5268 return NULL;
5269 }
5270
5271 /* Check if instruction is supported on specified architecture. */
5272 supported = 0;
5273 for (t = current_templates->start; t < current_templates->end; ++t)
5274 {
5275 supported |= cpu_flags_match (t);
5276 if (supported == CPU_FLAGS_PERFECT_MATCH)
5277 {
5278 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5279 as_warn (_("use .code16 to ensure correct addressing mode"));
5280
5281 return l;
5282 }
5283 }
5284
5285 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5286 as_bad (flag_code == CODE_64BIT
5287 ? _("`%s' is not supported in 64-bit mode")
5288 : _("`%s' is only supported in 64-bit mode"),
5289 current_templates->start->name);
5290 else
5291 as_bad (_("`%s' is not supported on `%s%s'"),
5292 current_templates->start->name,
5293 cpu_arch_name ? cpu_arch_name : default_arch,
5294 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5295
5296 return NULL;
5297 }
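
/* Illustrative inputs handled by parse_insn:
     rep movsb          `rep' matched as a prefix template
     {vex} vpaddd ...   pseudo prefix, sets i.vec_encoding
     addl $1, %eax      `add' found after trimming the `l' suffix
     jz,pt target       branch hint, adds the DS segment prefix  */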
5298
5299 static char *
5300 parse_operands (char *l, const char *mnemonic)
5301 {
5302 char *token_start;
5303
5304 /* 1 if operand is pending after ','. */
5305 unsigned int expecting_operand = 0;
5306
5307 /* Non-zero if operand parens not balanced. */
5308 unsigned int paren_not_balanced;
5309
5310 while (*l != END_OF_INSN)
5311 {
5312 /* Skip optional white space before operand. */
5313 if (is_space_char (*l))
5314 ++l;
5315 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5316 {
5317 as_bad (_("invalid character %s before operand %d"),
5318 output_invalid (*l),
5319 i.operands + 1);
5320 return NULL;
5321 }
5322 token_start = l; /* After white space. */
5323 paren_not_balanced = 0;
5324 while (paren_not_balanced || *l != ',')
5325 {
5326 if (*l == END_OF_INSN)
5327 {
5328 if (paren_not_balanced)
5329 {
5330 if (!intel_syntax)
5331 as_bad (_("unbalanced parenthesis in operand %d."),
5332 i.operands + 1);
5333 else
5334 as_bad (_("unbalanced brackets in operand %d."),
5335 i.operands + 1);
5336 return NULL;
5337 }
5338 else
5339 break; /* we are done */
5340 }
5341 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5342 {
5343 as_bad (_("invalid character %s in operand %d"),
5344 output_invalid (*l),
5345 i.operands + 1);
5346 return NULL;
5347 }
5348 if (!intel_syntax)
5349 {
5350 if (*l == '(')
5351 ++paren_not_balanced;
5352 if (*l == ')')
5353 --paren_not_balanced;
5354 }
5355 else
5356 {
5357 if (*l == '[')
5358 ++paren_not_balanced;
5359 if (*l == ']')
5360 --paren_not_balanced;
5361 }
5362 l++;
5363 }
5364 if (l != token_start)
5365 { /* Yes, we've read in another operand. */
5366 unsigned int operand_ok;
5367 this_operand = i.operands++;
5368 if (i.operands > MAX_OPERANDS)
5369 {
5370 as_bad (_("spurious operands; (%d operands/instruction max)"),
5371 MAX_OPERANDS);
5372 return NULL;
5373 }
5374 i.types[this_operand].bitfield.unspecified = 1;
5375 /* Now parse operand adding info to 'i' as we go along. */
5376 END_STRING_AND_SAVE (l);
5377
5378 if (i.mem_operands > 1)
5379 {
5380 as_bad (_("too many memory references for `%s'"),
5381 mnemonic);
5382 return 0;
5383 }
5384
5385 if (intel_syntax)
5386 operand_ok =
5387 i386_intel_operand (token_start,
5388 intel_float_operand (mnemonic));
5389 else
5390 operand_ok = i386_att_operand (token_start);
5391
5392 RESTORE_END_STRING (l);
5393 if (!operand_ok)
5394 return NULL;
5395 }
5396 else
5397 {
5398 if (expecting_operand)
5399 {
5400 expecting_operand_after_comma:
5401 as_bad (_("expecting operand after ','; got nothing"));
5402 return NULL;
5403 }
5404 if (*l == ',')
5405 {
5406 as_bad (_("expecting operand before ','; got nothing"));
5407 return NULL;
5408 }
5409 }
5410
5411 /* Now *l must be either ',' or END_OF_INSN. */
5412 if (*l == ',')
5413 {
5414 if (*++l == END_OF_INSN)
5415 {
5416 /* Just skip it; if it's \n, complain. */
5417 goto expecting_operand_after_comma;
5418 }
5419 expecting_operand = 1;
5420 }
5421 }
5422 return l;
5423 }
5424
5425 static void
5426 swap_2_operands (int xchg1, int xchg2)
5427 {
5428 union i386_op temp_op;
5429 i386_operand_type temp_type;
5430 unsigned int temp_flags;
5431 enum bfd_reloc_code_real temp_reloc;
5432
5433 temp_type = i.types[xchg2];
5434 i.types[xchg2] = i.types[xchg1];
5435 i.types[xchg1] = temp_type;
5436
5437 temp_flags = i.flags[xchg2];
5438 i.flags[xchg2] = i.flags[xchg1];
5439 i.flags[xchg1] = temp_flags;
5440
5441 temp_op = i.op[xchg2];
5442 i.op[xchg2] = i.op[xchg1];
5443 i.op[xchg1] = temp_op;
5444
5445 temp_reloc = i.reloc[xchg2];
5446 i.reloc[xchg2] = i.reloc[xchg1];
5447 i.reloc[xchg1] = temp_reloc;
5448
5449 if (i.mask)
5450 {
5451 if (i.mask->operand == xchg1)
5452 i.mask->operand = xchg2;
5453 else if (i.mask->operand == xchg2)
5454 i.mask->operand = xchg1;
5455 }
5456 if (i.broadcast)
5457 {
5458 if (i.broadcast->operand == xchg1)
5459 i.broadcast->operand = xchg2;
5460 else if (i.broadcast->operand == xchg2)
5461 i.broadcast->operand = xchg1;
5462 }
5463 if (i.rounding)
5464 {
5465 if (i.rounding->operand == xchg1)
5466 i.rounding->operand = xchg2;
5467 else if (i.rounding->operand == xchg2)
5468 i.rounding->operand = xchg1;
5469 }
5470 }
5471
5472 static void
5473 swap_operands (void)
5474 {
5475 switch (i.operands)
5476 {
5477 case 5:
5478 case 4:
5479 swap_2_operands (1, i.operands - 2);
5480 /* Fall through. */
5481 case 3:
5482 case 2:
5483 swap_2_operands (0, i.operands - 1);
5484 break;
5485 default:
5486 abort ();
5487 }
5488
5489 if (i.mem_operands == 2)
5490 {
5491 const seg_entry *temp_seg;
5492 temp_seg = i.seg[0];
5493 i.seg[0] = i.seg[1];
5494 i.seg[1] = temp_seg;
5495 }
5496 }
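
/* E.g. in Intel mode "add eax, ebx" is parsed destination-first and
   then swapped here, so internally operand 0 is the %ebx source and
   operand 1 the %eax destination, the same order AT&T
   "addl %ebx, %eax" yields directly (illustrative).  */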
5497
5498 /* Try to ensure constant immediates are represented in the smallest
5499 opcode possible. */
5500 static void
5501 optimize_imm (void)
5502 {
5503 char guess_suffix = 0;
5504 int op;
5505
5506 if (i.suffix)
5507 guess_suffix = i.suffix;
5508 else if (i.reg_operands)
5509 {
5510 /* Figure out a suffix from the last register operand specified.
5511 We can't do this properly yet, i.e. excluding special register
5512 instances, but the following works for instructions with
5513 immediates. In any case, we can't set i.suffix yet. */
5514 for (op = i.operands; --op >= 0;)
5515 if (i.types[op].bitfield.class != Reg)
5516 continue;
5517 else if (i.types[op].bitfield.byte)
5518 {
5519 guess_suffix = BYTE_MNEM_SUFFIX;
5520 break;
5521 }
5522 else if (i.types[op].bitfield.word)
5523 {
5524 guess_suffix = WORD_MNEM_SUFFIX;
5525 break;
5526 }
5527 else if (i.types[op].bitfield.dword)
5528 {
5529 guess_suffix = LONG_MNEM_SUFFIX;
5530 break;
5531 }
5532 else if (i.types[op].bitfield.qword)
5533 {
5534 guess_suffix = QWORD_MNEM_SUFFIX;
5535 break;
5536 }
5537 }
5538 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5539 guess_suffix = WORD_MNEM_SUFFIX;
5540
5541 for (op = i.operands; --op >= 0;)
5542 if (operand_type_check (i.types[op], imm))
5543 {
5544 switch (i.op[op].imms->X_op)
5545 {
5546 case O_constant:
5547 /* If a suffix is given, this operand may be shortened. */
5548 switch (guess_suffix)
5549 {
5550 case LONG_MNEM_SUFFIX:
5551 i.types[op].bitfield.imm32 = 1;
5552 i.types[op].bitfield.imm64 = 1;
5553 break;
5554 case WORD_MNEM_SUFFIX:
5555 i.types[op].bitfield.imm16 = 1;
5556 i.types[op].bitfield.imm32 = 1;
5557 i.types[op].bitfield.imm32s = 1;
5558 i.types[op].bitfield.imm64 = 1;
5559 break;
5560 case BYTE_MNEM_SUFFIX:
5561 i.types[op].bitfield.imm8 = 1;
5562 i.types[op].bitfield.imm8s = 1;
5563 i.types[op].bitfield.imm16 = 1;
5564 i.types[op].bitfield.imm32 = 1;
5565 i.types[op].bitfield.imm32s = 1;
5566 i.types[op].bitfield.imm64 = 1;
5567 break;
5568 }
5569
5570 /* If this operand is at most 16 bits, convert it
5571 to a signed 16 bit number before trying to see
5572 whether it will fit in an even smaller size.
5573 This allows a 16-bit operand such as $0xffe0 to
5574 be recognised as within Imm8S range. */
5575 if ((i.types[op].bitfield.imm16)
5576 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5577 {
5578 i.op[op].imms->X_add_number =
5579 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5580 }
5581 #ifdef BFD64
5582 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5583 if ((i.types[op].bitfield.imm32)
5584 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5585 == 0))
5586 {
5587 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5588 ^ ((offsetT) 1 << 31))
5589 - ((offsetT) 1 << 31));
5590 }
5591 #endif
5592 i.types[op]
5593 = operand_type_or (i.types[op],
5594 smallest_imm_type (i.op[op].imms->X_add_number));
5595
5596 /* We must avoid matching of Imm32 templates when 64bit
5597 only immediate is available. */
5598 if (guess_suffix == QWORD_MNEM_SUFFIX)
5599 i.types[op].bitfield.imm32 = 0;
5600 break;
5601
5602 case O_absent:
5603 case O_register:
5604 abort ();
5605
5606 /* Symbols and expressions. */
5607 default:
5608 /* Convert symbolic operand to proper sizes for matching, but don't
5609 prevent matching a set of insns that only supports sizes other
5610 than those matching the insn suffix. */
5611 {
5612 i386_operand_type mask, allowed;
5613 const insn_template *t;
5614
5615 operand_type_set (&mask, 0);
5616 operand_type_set (&allowed, 0);
5617
5618 for (t = current_templates->start;
5619 t < current_templates->end;
5620 ++t)
5621 {
5622 allowed = operand_type_or (allowed, t->operand_types[op]);
5623 allowed = operand_type_and (allowed, anyimm);
5624 }
5625 switch (guess_suffix)
5626 {
5627 case QWORD_MNEM_SUFFIX:
5628 mask.bitfield.imm64 = 1;
5629 mask.bitfield.imm32s = 1;
5630 break;
5631 case LONG_MNEM_SUFFIX:
5632 mask.bitfield.imm32 = 1;
5633 break;
5634 case WORD_MNEM_SUFFIX:
5635 mask.bitfield.imm16 = 1;
5636 break;
5637 case BYTE_MNEM_SUFFIX:
5638 mask.bitfield.imm8 = 1;
5639 break;
5640 default:
5641 break;
5642 }
5643 allowed = operand_type_and (mask, allowed);
5644 if (!operand_type_all_zero (&allowed))
5645 i.types[op] = operand_type_and (i.types[op], mask);
5646 }
5647 break;
5648 }
5649 }
5650 }
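
/* Worked example for the 16-bit sign conversion above (sketch, 32-
   or 64-bit code): in "addw $0xffe0, %bx" the immediate becomes the
   signed value -0x20, which also fits Imm8S, so the 4-byte form
   66 83 c3 e0 can be chosen over the 5-byte 66 81 c3 e0 ff.  */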
5651
5652 /* Try to use the smallest displacement type too. */
5653 static void
5654 optimize_disp (void)
5655 {
5656 int op;
5657
5658 for (op = i.operands; --op >= 0;)
5659 if (operand_type_check (i.types[op], disp))
5660 {
5661 if (i.op[op].disps->X_op == O_constant)
5662 {
5663 offsetT op_disp = i.op[op].disps->X_add_number;
5664
5665 if (i.types[op].bitfield.disp16
5666 && (op_disp & ~(offsetT) 0xffff) == 0)
5667 {
5668 /* If this operand is at most 16 bits, convert
5669 to a signed 16 bit number and don't use 64bit
5670 displacement. */
5671 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5672 i.types[op].bitfield.disp64 = 0;
5673 }
5674 #ifdef BFD64
5675 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5676 if (i.types[op].bitfield.disp32
5677 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5678 {
5679 /* If this operand is at most 32 bits, convert
5680 to a signed 32 bit number and don't use 64bit
5681 displacement. */
5682 op_disp &= (((offsetT) 2 << 31) - 1);
5683 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5684 i.types[op].bitfield.disp64 = 0;
5685 }
5686 #endif
5687 if (!op_disp && i.types[op].bitfield.baseindex)
5688 {
5689 i.types[op].bitfield.disp8 = 0;
5690 i.types[op].bitfield.disp16 = 0;
5691 i.types[op].bitfield.disp32 = 0;
5692 i.types[op].bitfield.disp32s = 0;
5693 i.types[op].bitfield.disp64 = 0;
5694 i.op[op].disps = 0;
5695 i.disp_operands--;
5696 }
5697 else if (flag_code == CODE_64BIT)
5698 {
5699 if (fits_in_signed_long (op_disp))
5700 {
5701 i.types[op].bitfield.disp64 = 0;
5702 i.types[op].bitfield.disp32s = 1;
5703 }
5704 if (i.prefix[ADDR_PREFIX]
5705 && fits_in_unsigned_long (op_disp))
5706 i.types[op].bitfield.disp32 = 1;
5707 }
5708 if ((i.types[op].bitfield.disp32
5709 || i.types[op].bitfield.disp32s
5710 || i.types[op].bitfield.disp16)
5711 && fits_in_disp8 (op_disp))
5712 i.types[op].bitfield.disp8 = 1;
5713 }
5714 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5715 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5716 {
5717 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5718 i.op[op].disps, 0, i.reloc[op]);
5719 i.types[op].bitfield.disp8 = 0;
5720 i.types[op].bitfield.disp16 = 0;
5721 i.types[op].bitfield.disp32 = 0;
5722 i.types[op].bitfield.disp32s = 0;
5723 i.types[op].bitfield.disp64 = 0;
5724 }
5725 else
5726 /* We only support 64bit displacement on constants. */
5727 i.types[op].bitfield.disp64 = 0;
5728 }
5729 }
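
/* E.g. for "movl 4(%rax), %ebx" the constant displacement passes
   fits_in_disp8, so disp8 is set and the insn can be emitted as
   8b 58 04 instead of using a 4-byte displacement (illustrative).  */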
5730
5731 /* Return 1 if there is a match in broadcast bytes between operand
5732 GIVEN and instruction template T. */
5733
5734 static INLINE int
5735 match_broadcast_size (const insn_template *t, unsigned int given)
5736 {
5737 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5738 && i.types[given].bitfield.byte)
5739 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5740 && i.types[given].bitfield.word)
5741 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5742 && i.types[given].bitfield.dword)
5743 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5744 && i.types[given].bitfield.qword));
5745 }
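
/* E.g. a DWORD_BROADCAST template matches the dword memory operand in
   "vaddps (%rax){1to16}, %zmm1, %zmm2", where one dword is replicated
   across all sixteen elements (illustrative).  */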
5746
5747 /* Check if operands are valid for the instruction. */
5748
5749 static int
5750 check_VecOperands (const insn_template *t)
5751 {
5752 unsigned int op;
5753 i386_cpu_flags cpu;
5754
5755 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5756 any one operand implicitly require AVX512VL support if the actual
5757 operand size is YMMword or XMMword. Since this function runs after
5758 template matching, there's no need to check for YMMword/XMMword in
5759 the template. */
5760 cpu = cpu_flags_and (t->cpu_flags, avx512);
5761 if (!cpu_flags_all_zero (&cpu)
5762 && !t->cpu_flags.bitfield.cpuavx512vl
5763 && !cpu_arch_flags.bitfield.cpuavx512vl)
5764 {
5765 for (op = 0; op < t->operands; ++op)
5766 {
5767 if (t->operand_types[op].bitfield.zmmword
5768 && (i.types[op].bitfield.ymmword
5769 || i.types[op].bitfield.xmmword))
5770 {
5771 i.error = unsupported;
5772 return 1;
5773 }
5774 }
5775 }
5776
5777 /* Without VSIB byte, we can't have a vector register for index. */
5778 if (!t->opcode_modifier.sib
5779 && i.index_reg
5780 && (i.index_reg->reg_type.bitfield.xmmword
5781 || i.index_reg->reg_type.bitfield.ymmword
5782 || i.index_reg->reg_type.bitfield.zmmword))
5783 {
5784 i.error = unsupported_vector_index_register;
5785 return 1;
5786 }
5787
5788 /* Check if default mask is allowed. */
5789 if (t->opcode_modifier.nodefmask
5790 && (!i.mask || i.mask->mask->reg_num == 0))
5791 {
5792 i.error = no_default_mask;
5793 return 1;
5794 }
5795
5796 /* For VSIB byte, we need a vector register for index, and all vector
5797 registers must be distinct. */
5798 if (t->opcode_modifier.sib)
5799 {
5800 if (!i.index_reg
5801 || !((t->opcode_modifier.sib == VECSIB128
5802 && i.index_reg->reg_type.bitfield.xmmword)
5803 || (t->opcode_modifier.sib == VECSIB256
5804 && i.index_reg->reg_type.bitfield.ymmword)
5805 || (t->opcode_modifier.sib == VECSIB512
5806 && i.index_reg->reg_type.bitfield.zmmword)))
5807 {
5808 i.error = invalid_vsib_address;
5809 return 1;
5810 }
5811
5812 gas_assert (i.reg_operands == 2 || i.mask);
5813 if (i.reg_operands == 2 && !i.mask)
5814 {
5815 gas_assert (i.types[0].bitfield.class == RegSIMD);
5816 gas_assert (i.types[0].bitfield.xmmword
5817 || i.types[0].bitfield.ymmword);
5818 gas_assert (i.types[2].bitfield.class == RegSIMD);
5819 gas_assert (i.types[2].bitfield.xmmword
5820 || i.types[2].bitfield.ymmword);
5821 if (operand_check == check_none)
5822 return 0;
5823 if (register_number (i.op[0].regs)
5824 != register_number (i.index_reg)
5825 && register_number (i.op[2].regs)
5826 != register_number (i.index_reg)
5827 && register_number (i.op[0].regs)
5828 != register_number (i.op[2].regs))
5829 return 0;
5830 if (operand_check == check_error)
5831 {
5832 i.error = invalid_vector_register_set;
5833 return 1;
5834 }
5835 as_warn (_("mask, index, and destination registers should be distinct"));
5836 }
5837 else if (i.reg_operands == 1 && i.mask)
5838 {
5839 if (i.types[1].bitfield.class == RegSIMD
5840 && (i.types[1].bitfield.xmmword
5841 || i.types[1].bitfield.ymmword
5842 || i.types[1].bitfield.zmmword)
5843 && (register_number (i.op[1].regs)
5844 == register_number (i.index_reg)))
5845 {
5846 if (operand_check == check_error)
5847 {
5848 i.error = invalid_vector_register_set;
5849 return 1;
5850 }
5851 if (operand_check != check_none)
5852 as_warn (_("index and destination registers should be distinct"));
5853 }
5854 }
5855 }
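/* Illustration (example ours): in `vgatherdps %xmm1, (%rax,%xmm1,4),
%xmm2' the mask register equals the index register, so the checks
above warn or error depending on the operand-check setting. */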
5856
5857 /* Check if broadcast is supported by the instruction and is applied
5858 to the memory operand. */
5859 if (i.broadcast)
5860 {
5861 i386_operand_type type, overlap;
5862
5863 /* Check if specified broadcast is supported in this instruction,
5864 and its broadcast bytes match the memory operand. */
5865 op = i.broadcast->operand;
5866 if (!t->opcode_modifier.broadcast
5867 || !(i.flags[op] & Operand_Mem)
5868 || (!i.types[op].bitfield.unspecified
5869 && !match_broadcast_size (t, op)))
5870 {
5871 bad_broadcast:
5872 i.error = unsupported_broadcast;
5873 return 1;
5874 }
5875
5876 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5877 * i.broadcast->type);
5878 operand_type_set (&type, 0);
5879 switch (i.broadcast->bytes)
5880 {
5881 case 2:
5882 type.bitfield.word = 1;
5883 break;
5884 case 4:
5885 type.bitfield.dword = 1;
5886 break;
5887 case 8:
5888 type.bitfield.qword = 1;
5889 break;
5890 case 16:
5891 type.bitfield.xmmword = 1;
5892 break;
5893 case 32:
5894 type.bitfield.ymmword = 1;
5895 break;
5896 case 64:
5897 type.bitfield.zmmword = 1;
5898 break;
5899 default:
5900 goto bad_broadcast;
5901 }
5902
5903 overlap = operand_type_and (type, t->operand_types[op]);
5904 if (t->operand_types[op].bitfield.class == RegSIMD
5905 && t->operand_types[op].bitfield.byte
5906 + t->operand_types[op].bitfield.word
5907 + t->operand_types[op].bitfield.dword
5908 + t->operand_types[op].bitfield.qword > 1)
5909 {
5910 overlap.bitfield.xmmword = 0;
5911 overlap.bitfield.ymmword = 0;
5912 overlap.bitfield.zmmword = 0;
5913 }
5914 if (operand_type_all_zero (&overlap))
5915 goto bad_broadcast;
5916
5917 if (t->opcode_modifier.checkregsize)
5918 {
5919 unsigned int j;
5920
5921 type.bitfield.baseindex = 1;
5922 for (j = 0; j < i.operands; ++j)
5923 {
5924 if (j != op
5925 && !operand_type_register_match(i.types[j],
5926 t->operand_types[j],
5927 type,
5928 t->operand_types[op]))
5929 goto bad_broadcast;
5930 }
5931 }
5932 }
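/* Worked example: `vaddps (%rax){1to16}, %zmm1, %zmm2' broadcasts a
dword element, so i.broadcast->bytes is 4 * 16 == 64 and the type
computed above is ZMMword. */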
5933 /* If broadcast is supported in this instruction, we need to check that
5934 an operand of one-element size isn't specified without broadcast. */
5935 else if (t->opcode_modifier.broadcast && i.mem_operands)
5936 {
5937 /* Find memory operand. */
5938 for (op = 0; op < i.operands; op++)
5939 if (i.flags[op] & Operand_Mem)
5940 break;
5941 gas_assert (op < i.operands);
5942 /* Check size of the memory operand. */
5943 if (match_broadcast_size (t, op))
5944 {
5945 i.error = broadcast_needed;
5946 return 1;
5947 }
5948 }
5949 else
5950 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5951
5952 /* Check if requested masking is supported. */
5953 if (i.mask)
5954 {
5955 switch (t->opcode_modifier.masking)
5956 {
5957 case BOTH_MASKING:
5958 break;
5959 case MERGING_MASKING:
5960 if (i.mask->zeroing)
5961 {
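/* N.B.: the `case 0' label below deliberately jumps into this block,
so templates supporting no masking at all share this error path. */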
5962 case 0:
5963 i.error = unsupported_masking;
5964 return 1;
5965 }
5966 break;
5967 case DYNAMIC_MASKING:
5968 /* Memory destinations allow only merging masking. */
5969 if (i.mask->zeroing && i.mem_operands)
5970 {
5971 /* Find memory operand. */
5972 for (op = 0; op < i.operands; op++)
5973 if (i.flags[op] & Operand_Mem)
5974 break;
5975 gas_assert (op < i.operands);
5976 if (op == i.operands - 1)
5977 {
5978 i.error = unsupported_masking;
5979 return 1;
5980 }
5981 }
5982 break;
5983 default:
5984 abort ();
5985 }
5986 }
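/* Illustration (example ours): `vmovdqu32 %zmm0, (%rax){%k1}{z}' is
rejected by the DYNAMIC_MASKING case above, since a memory destination
permits only merging masking. */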
5987
5988 /* Check if masking is applied to dest operand. */
5989 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5990 {
5991 i.error = mask_not_on_destination;
5992 return 1;
5993 }
5994
5995 /* Check RC/SAE. */
5996 if (i.rounding)
5997 {
5998 if (!t->opcode_modifier.sae
5999 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6000 {
6001 i.error = unsupported_rc_sae;
6002 return 1;
6003 }
6004 /* If the instruction has several immediate operands and one of
6005 them is the rounding operand, it must be the last
6006 immediate operand. */
6007 if (i.imm_operands > 1
6008 && i.rounding->operand != (int) (i.imm_operands - 1))
6009 {
6010 i.error = rc_sae_operand_not_last_imm;
6011 return 1;
6012 }
6013 }
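/* In AT&T syntax the RC/SAE operand comes first, e.g.
`vaddps {rn-sae}, %zmm1, %zmm2, %zmm3'; templates with SAE but without
StaticRounding accept only the plain `{sae}' form. */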
6014
6015 /* Check the special Imm4 cases; the immediate must be the first operand. */
6016 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6017 {
6018 if (i.op[0].imms->X_op != O_constant
6019 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6020 {
6021 i.error = bad_imm4;
6022 return 1;
6023 }
6024
6025 /* Turn off Imm<N> so that update_imm won't complain. */
6026 operand_type_set (&i.types[0], 0);
6027 }
6028
6029 /* Check vector Disp8 operand. */
6030 if (t->opcode_modifier.disp8memshift
6031 && i.disp_encoding != disp_encoding_32bit)
6032 {
6033 if (i.broadcast)
6034 i.memshift = t->opcode_modifier.broadcast - 1;
6035 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6036 i.memshift = t->opcode_modifier.disp8memshift;
6037 else
6038 {
6039 const i386_operand_type *type = NULL;
6040
6041 i.memshift = 0;
6042 for (op = 0; op < i.operands; op++)
6043 if (i.flags[op] & Operand_Mem)
6044 {
6045 if (t->opcode_modifier.evex == EVEXLIG)
6046 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6047 else if (t->operand_types[op].bitfield.xmmword
6048 + t->operand_types[op].bitfield.ymmword
6049 + t->operand_types[op].bitfield.zmmword <= 1)
6050 type = &t->operand_types[op];
6051 else if (!i.types[op].bitfield.unspecified)
6052 type = &i.types[op];
6053 }
6054 else if (i.types[op].bitfield.class == RegSIMD
6055 && t->opcode_modifier.evex != EVEXLIG)
6056 {
6057 if (i.types[op].bitfield.zmmword)
6058 i.memshift = 6;
6059 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6060 i.memshift = 5;
6061 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6062 i.memshift = 4;
6063 }
6064
6065 if (type)
6066 {
6067 if (type->bitfield.zmmword)
6068 i.memshift = 6;
6069 else if (type->bitfield.ymmword)
6070 i.memshift = 5;
6071 else if (type->bitfield.xmmword)
6072 i.memshift = 4;
6073 }
6074
6075 /* For the check in fits_in_disp8(). */
6076 if (i.memshift == 0)
6077 i.memshift = -1;
6078 }
6079
6080 for (op = 0; op < i.operands; op++)
6081 if (operand_type_check (i.types[op], disp)
6082 && i.op[op].disps->X_op == O_constant)
6083 {
6084 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6085 {
6086 i.types[op].bitfield.disp8 = 1;
6087 return 0;
6088 }
6089 i.types[op].bitfield.disp8 = 0;
6090 }
6091 }
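/* The EVEX compressed displacement divides the byte displacement by
2**memshift; e.g. a 128-byte displacement on a ZMMword access
(memshift == 6) is emitted as disp8 == 2. */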
6092
6093 i.memshift = 0;
6094
6095 return 0;
6096 }
6097
6098 /* Check if encoding requirements are met by the instruction. */
6099
6100 static int
6101 VEX_check_encoding (const insn_template *t)
6102 {
6103 if (i.vec_encoding == vex_encoding_error)
6104 {
6105 i.error = unsupported;
6106 return 1;
6107 }
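/* i.vec_encoding is set from the {vex}/{vex3}/{evex} pseudo prefixes;
e.g. `{evex} vaddpd %xmm1, %xmm2, %xmm3' fails the VEX-only AVX
template below, steering template matching to the AVX512VL one. */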
6108
6109 if (i.vec_encoding == vex_encoding_evex)
6110 {
6111 /* This instruction must be encoded with EVEX prefix. */
6112 if (!is_evex_encoding (t))
6113 {
6114 i.error = unsupported;
6115 return 1;
6116 }
6117 return 0;
6118 }
6119
6120 if (!t->opcode_modifier.vex)
6121 {
6122 /* This instruction template doesn't have VEX prefix. */
6123 if (i.vec_encoding != vex_encoding_default)
6124 {
6125 i.error = unsupported;
6126 return 1;
6127 }
6128 return 0;
6129 }
6130
6131 return 0;
6132 }
6133
6134 static const insn_template *
6135 match_template (char mnem_suffix)
6136 {
6137 /* Points to template once we've found it. */
6138 const insn_template *t;
6139 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6140 i386_operand_type overlap4;
6141 unsigned int found_reverse_match;
6142 i386_opcode_modifier suffix_check;
6143 i386_operand_type operand_types [MAX_OPERANDS];
6144 int addr_prefix_disp;
6145 unsigned int j, size_match, check_register;
6146 enum i386_error specific_error = 0;
6147
6148 #if MAX_OPERANDS != 5
6149 # error "MAX_OPERANDS must be 5."
6150 #endif
6151
6152 found_reverse_match = 0;
6153 addr_prefix_disp = -1;
6154
6155 /* Prepare for mnemonic suffix check. */
6156 memset (&suffix_check, 0, sizeof (suffix_check));
6157 switch (mnem_suffix)
6158 {
6159 case BYTE_MNEM_SUFFIX:
6160 suffix_check.no_bsuf = 1;
6161 break;
6162 case WORD_MNEM_SUFFIX:
6163 suffix_check.no_wsuf = 1;
6164 break;
6165 case SHORT_MNEM_SUFFIX:
6166 suffix_check.no_ssuf = 1;
6167 break;
6168 case LONG_MNEM_SUFFIX:
6169 suffix_check.no_lsuf = 1;
6170 break;
6171 case QWORD_MNEM_SUFFIX:
6172 suffix_check.no_qsuf = 1;
6173 break;
6174 default:
6175 /* NB: In Intel syntax, normally we can check for memory operand
6176 size when there is no mnemonic suffix. But jmp and call have
6177 2 different encodings with Dword memory operand size, one with
6178 No_ldSuf and the other without. i.suffix is set to
6179 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6180 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6181 suffix_check.no_ldsuf = 1;
6182 }
6183
6184 /* Must have right number of operands. */
6185 i.error = number_of_operands_mismatch;
6186
6187 for (t = current_templates->start; t < current_templates->end; t++)
6188 {
6189 addr_prefix_disp = -1;
6190 found_reverse_match = 0;
6191
6192 if (i.operands != t->operands)
6193 continue;
6194
6195 /* Check processor support. */
6196 i.error = unsupported;
6197 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6198 continue;
6199
6200 /* Check AT&T mnemonic. */
6201 i.error = unsupported_with_intel_mnemonic;
6202 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6203 continue;
6204
6205 /* Check AT&T/Intel syntax. */
6206 i.error = unsupported_syntax;
6207 if ((intel_syntax && t->opcode_modifier.attsyntax)
6208 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6209 continue;
6210
6211 /* Check Intel64/AMD64 ISA. */
6212 switch (isa64)
6213 {
6214 default:
6215 /* Default: Don't accept Intel64. */
6216 if (t->opcode_modifier.isa64 == INTEL64)
6217 continue;
6218 break;
6219 case amd64:
6220 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6221 if (t->opcode_modifier.isa64 >= INTEL64)
6222 continue;
6223 break;
6224 case intel64:
6225 /* -mintel64: Don't accept AMD64. */
6226 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6227 continue;
6228 break;
6229 }
6230
6231 /* Check the suffix. */
6232 i.error = invalid_instruction_suffix;
6233 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6234 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6235 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6236 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6237 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6238 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6239 continue;
6240
6241 size_match = operand_size_match (t);
6242 if (!size_match)
6243 continue;
6244
6245 /* This is intentionally not
6246
6247 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6248
6249 as the case of a missing * on the operand is accepted (perhaps with
6250 a warning, issued further down). */
6251 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6252 {
6253 i.error = operand_type_mismatch;
6254 continue;
6255 }
6256
6257 for (j = 0; j < MAX_OPERANDS; j++)
6258 operand_types[j] = t->operand_types[j];
6259
6260 /* In general, don't allow
6261 - 64-bit operands outside of 64-bit mode,
6262 - 32-bit operands on pre-386. */
6263 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6264 if (((i.suffix == QWORD_MNEM_SUFFIX
6265 && flag_code != CODE_64BIT
6266 && (t->base_opcode != 0x0fc7
6267 || t->extension_opcode != 1 /* cmpxchg8b */))
6268 || (i.suffix == LONG_MNEM_SUFFIX
6269 && !cpu_arch_flags.bitfield.cpui386))
6270 && (intel_syntax
6271 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6272 && !intel_float_operand (t->name))
6273 : intel_float_operand (t->name) != 2)
6274 && (t->operands == i.imm_operands
6275 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6276 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6277 && operand_types[i.imm_operands].bitfield.class != RegMask)
6278 || (operand_types[j].bitfield.class != RegMMX
6279 && operand_types[j].bitfield.class != RegSIMD
6280 && operand_types[j].bitfield.class != RegMask))
6281 && !t->opcode_modifier.sib)
6282 continue;
6283
6284 /* Do not verify operands when there are none. */
6285 if (!t->operands)
6286 {
6287 if (VEX_check_encoding (t))
6288 {
6289 specific_error = i.error;
6290 continue;
6291 }
6292
6293 /* We've found a match; break out of loop. */
6294 break;
6295 }
6296
6297 if (!t->opcode_modifier.jump
6298 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6299 {
6300 /* There should be only one Disp operand. */
6301 for (j = 0; j < MAX_OPERANDS; j++)
6302 if (operand_type_check (operand_types[j], disp))
6303 break;
6304 if (j < MAX_OPERANDS)
6305 {
6306 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6307
6308 addr_prefix_disp = j;
6309
6310 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6311 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6312 switch (flag_code)
6313 {
6314 case CODE_16BIT:
6315 override = !override;
6316 /* Fall through. */
6317 case CODE_32BIT:
6318 if (operand_types[j].bitfield.disp32
6319 && operand_types[j].bitfield.disp16)
6320 {
6321 operand_types[j].bitfield.disp16 = override;
6322 operand_types[j].bitfield.disp32 = !override;
6323 }
6324 operand_types[j].bitfield.disp32s = 0;
6325 operand_types[j].bitfield.disp64 = 0;
6326 break;
6327
6328 case CODE_64BIT:
6329 if (operand_types[j].bitfield.disp32s
6330 || operand_types[j].bitfield.disp64)
6331 {
6332 operand_types[j].bitfield.disp64 &= !override;
6333 operand_types[j].bitfield.disp32s &= !override;
6334 operand_types[j].bitfield.disp32 = override;
6335 }
6336 operand_types[j].bitfield.disp16 = 0;
6337 break;
6338 }
6339 }
6340 }
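/* Illustration: in 32-bit code, `addr16 mov foo, %eax' flips the
template's Disp32 to Disp16 here, so the displacement is emitted in
two bytes. */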
6341
6342 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6343 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6344 continue;
6345
6346 /* We check register size if needed. */
6347 if (t->opcode_modifier.checkregsize)
6348 {
6349 check_register = (1 << t->operands) - 1;
6350 if (i.broadcast)
6351 check_register &= ~(1 << i.broadcast->operand);
6352 }
6353 else
6354 check_register = 0;
6355
6356 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6357 switch (t->operands)
6358 {
6359 case 1:
6360 if (!operand_type_match (overlap0, i.types[0]))
6361 continue;
6362 break;
6363 case 2:
6364 /* xchg %eax, %eax is a special case. It is an alias for nop
6365 only in 32bit mode and we can use opcode 0x90. In 64bit
6366 mode, we can't use 0x90 for xchg %eax, %eax since it should
6367 zero-extend %eax to %rax. */
6368 if (flag_code == CODE_64BIT
6369 && t->base_opcode == 0x90
6370 && i.types[0].bitfield.instance == Accum
6371 && i.types[0].bitfield.dword
6372 && i.types[1].bitfield.instance == Accum
6373 && i.types[1].bitfield.dword)
6374 continue;
6375 /* xrelease mov %eax, <disp> is another special case. It must not
6376 match the accumulator-only encoding of mov. */
6377 if (flag_code != CODE_64BIT
6378 && i.hle_prefix
6379 && t->base_opcode == 0xa0
6380 && i.types[0].bitfield.instance == Accum
6381 && (i.flags[1] & Operand_Mem))
6382 continue;
6383 /* Fall through. */
6384
6385 case 3:
6386 if (!(size_match & MATCH_STRAIGHT))
6387 goto check_reverse;
6388 /* Reverse direction of operands if swapping is possible in the first
6389 place (operands need to be symmetric) and
6390 - the load form is requested, and the template is a store form,
6391 - the store form is requested, and the template is a load form,
6392 - the non-default (swapped) form is requested. */
6393 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6394 if (t->opcode_modifier.d && i.reg_operands == i.operands
6395 && !operand_type_all_zero (&overlap1))
6396 switch (i.dir_encoding)
6397 {
6398 case dir_encoding_load:
6399 if (operand_type_check (operand_types[i.operands - 1], anymem)
6400 || t->opcode_modifier.regmem)
6401 goto check_reverse;
6402 break;
6403
6404 case dir_encoding_store:
6405 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6406 && !t->opcode_modifier.regmem)
6407 goto check_reverse;
6408 break;
6409
6410 case dir_encoding_swap:
6411 goto check_reverse;
6412
6413 case dir_encoding_default:
6414 break;
6415 }
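/* i.dir_encoding reflects the {load}/{store} pseudo prefixes (or the
`.s' suffix for swapping); e.g. `{store} mov %eax, %edx' selects the
0x89 form of MOV while `{load} mov %eax, %edx' selects 0x8b. */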
6416 /* If we want the store form, we skip the current load template. */
6417 if ((i.dir_encoding == dir_encoding_store
6418 || i.dir_encoding == dir_encoding_swap)
6419 && i.mem_operands == 0
6420 && t->opcode_modifier.load)
6421 continue;
6422 /* Fall through. */
6423 case 4:
6424 case 5:
6425 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6426 if (!operand_type_match (overlap0, i.types[0])
6427 || !operand_type_match (overlap1, i.types[1])
6428 || ((check_register & 3) == 3
6429 && !operand_type_register_match (i.types[0],
6430 operand_types[0],
6431 i.types[1],
6432 operand_types[1])))
6433 {
6434 /* Check if other direction is valid ... */
6435 if (!t->opcode_modifier.d)
6436 continue;
6437
6438 check_reverse:
6439 if (!(size_match & MATCH_REVERSE))
6440 continue;
6441 /* Try reversing direction of operands. */
6442 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6443 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6444 if (!operand_type_match (overlap0, i.types[0])
6445 || !operand_type_match (overlap1, i.types[i.operands - 1])
6446 || (check_register
6447 && !operand_type_register_match (i.types[0],
6448 operand_types[i.operands - 1],
6449 i.types[i.operands - 1],
6450 operand_types[0])))
6451 {
6452 /* Does not match either direction. */
6453 continue;
6454 }
6455 /* found_reverse_match holds which of D or FloatR
6456 we've found. */
6457 if (!t->opcode_modifier.d)
6458 found_reverse_match = 0;
6459 else if (operand_types[0].bitfield.tbyte)
6460 found_reverse_match = Opcode_FloatD;
6461 else if (operand_types[0].bitfield.xmmword
6462 || operand_types[i.operands - 1].bitfield.xmmword
6463 || operand_types[0].bitfield.class == RegMMX
6464 || operand_types[i.operands - 1].bitfield.class == RegMMX
6465 || is_any_vex_encoding(t))
6466 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6467 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6468 else
6469 found_reverse_match = Opcode_D;
6470 if (t->opcode_modifier.floatr)
6471 found_reverse_match |= Opcode_FloatR;
6472 }
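/* E.g. plain GPR MOV toggles 0x88 <-> 0x8a via Opcode_D, MOVAPS
toggles 0x0f28 <-> 0x0f29 via the SIMD float direction bit, and the
0x6e/0x7e MOVD-style opcodes singled out by the 0xee mask toggle via
the SIMD integer direction bit (0x10). */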
6473 else
6474 {
6475 /* Found a forward 2 operand match here. */
6476 switch (t->operands)
6477 {
6478 case 5:
6479 overlap4 = operand_type_and (i.types[4],
6480 operand_types[4]);
6481 /* Fall through. */
6482 case 4:
6483 overlap3 = operand_type_and (i.types[3],
6484 operand_types[3]);
6485 /* Fall through. */
6486 case 3:
6487 overlap2 = operand_type_and (i.types[2],
6488 operand_types[2]);
6489 break;
6490 }
6491
6492 switch (t->operands)
6493 {
6494 case 5:
6495 if (!operand_type_match (overlap4, i.types[4])
6496 || !operand_type_register_match (i.types[3],
6497 operand_types[3],
6498 i.types[4],
6499 operand_types[4]))
6500 continue;
6501 /* Fall through. */
6502 case 4:
6503 if (!operand_type_match (overlap3, i.types[3])
6504 || ((check_register & 0xa) == 0xa
6505 && !operand_type_register_match (i.types[1],
6506 operand_types[1],
6507 i.types[3],
6508 operand_types[3]))
6509 || ((check_register & 0xc) == 0xc
6510 && !operand_type_register_match (i.types[2],
6511 operand_types[2],
6512 i.types[3],
6513 operand_types[3])))
6514 continue;
6515 /* Fall through. */
6516 case 3:
6517 /* Here we make use of the fact that there are no
6518 reverse match 3 operand instructions. */
6519 if (!operand_type_match (overlap2, i.types[2])
6520 || ((check_register & 5) == 5
6521 && !operand_type_register_match (i.types[0],
6522 operand_types[0],
6523 i.types[2],
6524 operand_types[2]))
6525 || ((check_register & 6) == 6
6526 && !operand_type_register_match (i.types[1],
6527 operand_types[1],
6528 i.types[2],
6529 operand_types[2])))
6530 continue;
6531 break;
6532 }
6533 }
6534 /* Found either forward/reverse 2, 3 or 4 operand match here:
6535 slip through to break. */
6536 }
6537
6538 /* Check if vector operands are valid. */
6539 if (check_VecOperands (t))
6540 {
6541 specific_error = i.error;
6542 continue;
6543 }
6544
6545 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6546 if (VEX_check_encoding (t))
6547 {
6548 specific_error = i.error;
6549 continue;
6550 }
6551
6552 /* We've found a match; break out of loop. */
6553 break;
6554 }
6555
6556 if (t == current_templates->end)
6557 {
6558 /* We found no match. */
6559 const char *err_msg;
6560 switch (specific_error ? specific_error : i.error)
6561 {
6562 default:
6563 abort ();
6564 case operand_size_mismatch:
6565 err_msg = _("operand size mismatch");
6566 break;
6567 case operand_type_mismatch:
6568 err_msg = _("operand type mismatch");
6569 break;
6570 case register_type_mismatch:
6571 err_msg = _("register type mismatch");
6572 break;
6573 case number_of_operands_mismatch:
6574 err_msg = _("number of operands mismatch");
6575 break;
6576 case invalid_instruction_suffix:
6577 err_msg = _("invalid instruction suffix");
6578 break;
6579 case bad_imm4:
6580 err_msg = _("constant doesn't fit in 4 bits");
6581 break;
6582 case unsupported_with_intel_mnemonic:
6583 err_msg = _("unsupported with Intel mnemonic");
6584 break;
6585 case unsupported_syntax:
6586 err_msg = _("unsupported syntax");
6587 break;
6588 case unsupported:
6589 as_bad (_("unsupported instruction `%s'"),
6590 current_templates->start->name);
6591 return NULL;
6592 case invalid_vsib_address:
6593 err_msg = _("invalid VSIB address");
6594 break;
6595 case invalid_vector_register_set:
6596 err_msg = _("mask, index, and destination registers must be distinct");
6597 break;
6598 case unsupported_vector_index_register:
6599 err_msg = _("unsupported vector index register");
6600 break;
6601 case unsupported_broadcast:
6602 err_msg = _("unsupported broadcast");
6603 break;
6604 case broadcast_needed:
6605 err_msg = _("broadcast is needed for operand of such type");
6606 break;
6607 case unsupported_masking:
6608 err_msg = _("unsupported masking");
6609 break;
6610 case mask_not_on_destination:
6611 err_msg = _("mask not on destination operand");
6612 break;
6613 case no_default_mask:
6614 err_msg = _("default mask isn't allowed");
6615 break;
6616 case unsupported_rc_sae:
6617 err_msg = _("unsupported static rounding/sae");
6618 break;
6619 case rc_sae_operand_not_last_imm:
6620 if (intel_syntax)
6621 err_msg = _("RC/SAE operand must precede immediate operands");
6622 else
6623 err_msg = _("RC/SAE operand must follow immediate operands");
6624 break;
6625 case invalid_register_operand:
6626 err_msg = _("invalid register operand");
6627 break;
6628 }
6629 as_bad (_("%s for `%s'"), err_msg,
6630 current_templates->start->name);
6631 return NULL;
6632 }
6633
6634 if (!quiet_warnings)
6635 {
6636 if (!intel_syntax
6637 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6638 as_warn (_("indirect %s without `*'"), t->name);
6639
6640 if (t->opcode_modifier.isprefix
6641 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6642 {
6643 /* Warn them that a data or address size prefix doesn't
6644 affect assembly of the next line of code. */
6645 as_warn (_("stand-alone `%s' prefix"), t->name);
6646 }
6647 }
6648
6649 /* Copy the template we found. */
6650 i.tm = *t;
6651
6652 if (addr_prefix_disp != -1)
6653 i.tm.operand_types[addr_prefix_disp]
6654 = operand_types[addr_prefix_disp];
6655
6656 if (found_reverse_match)
6657 {
6658 /* If we found a reverse match we must alter the opcode direction
6659 bit and clear/flip the regmem modifier one. found_reverse_match
6660 holds bits to change (different for int & float insns). */
6661
6662 i.tm.base_opcode ^= found_reverse_match;
6663
6664 i.tm.operand_types[0] = operand_types[i.operands - 1];
6665 i.tm.operand_types[i.operands - 1] = operand_types[0];
6666
6667 /* Certain SIMD insns have their load forms specified in the opcode
6668 table, and hence we need to _set_ RegMem instead of clearing it.
6669 We need to avoid setting the bit though on insns like KMOVW. */
6670 i.tm.opcode_modifier.regmem
6671 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6672 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6673 && !i.tm.opcode_modifier.regmem;
6674 }
6675
6676 return t;
6677 }
6678
6679 static int
6680 check_string (void)
6681 {
6682 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6683 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6684
6685 if (i.seg[op] != NULL && i.seg[op] != &es)
6686 {
6687 as_bad (_("`%s' operand %u must use `%ses' segment"),
6688 i.tm.name,
6689 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6690 register_prefix);
6691 return 0;
6692 }
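/* Illustration: `stos %eax, %fs:(%edi)' fails above, since the
destination of a string store is architecturally fixed to
%es:(%edi). */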
6693
6694 /* There's only ever one segment override allowed per instruction.
6695 This instruction possibly has a legal segment override on the
6696 second operand, so copy the segment to where non-string
6697 instructions store it, allowing common code. */
6698 i.seg[op] = i.seg[1];
6699
6700 return 1;
6701 }
6702
6703 static int
6704 process_suffix (void)
6705 {
6706 /* If matched instruction specifies an explicit instruction mnemonic
6707 suffix, use it. */
6708 if (i.tm.opcode_modifier.size == SIZE16)
6709 i.suffix = WORD_MNEM_SUFFIX;
6710 else if (i.tm.opcode_modifier.size == SIZE32)
6711 i.suffix = LONG_MNEM_SUFFIX;
6712 else if (i.tm.opcode_modifier.size == SIZE64)
6713 i.suffix = QWORD_MNEM_SUFFIX;
6714 else if (i.reg_operands
6715 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6716 && !i.tm.opcode_modifier.addrprefixopreg)
6717 {
6718 unsigned int numop = i.operands;
6719
6720 /* movsx/movzx want only their source operand considered here, for the
6721 ambiguity checking below. The suffix will be replaced afterwards
6722 to represent the destination (register). */
6723 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6724 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6725 --i.operands;
6726
6727 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6728 if (i.tm.base_opcode == 0xf20f38f0
6729 && i.tm.operand_types[1].bitfield.qword)
6730 i.rex |= REX_W;
6731
6732 /* If there's no instruction mnemonic suffix we try to invent one
6733 based on GPR operands. */
6734 if (!i.suffix)
6735 {
6736 /* We take i.suffix from the last register operand specified.
6737 Destination register type is more significant than source
6738 register type. crc32 in SSE4.2 prefers source register
6739 type. */
6740 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6741
6742 while (op--)
6743 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6744 || i.tm.operand_types[op].bitfield.instance == Accum)
6745 {
6746 if (i.types[op].bitfield.class != Reg)
6747 continue;
6748 if (i.types[op].bitfield.byte)
6749 i.suffix = BYTE_MNEM_SUFFIX;
6750 else if (i.types[op].bitfield.word)
6751 i.suffix = WORD_MNEM_SUFFIX;
6752 else if (i.types[op].bitfield.dword)
6753 i.suffix = LONG_MNEM_SUFFIX;
6754 else if (i.types[op].bitfield.qword)
6755 i.suffix = QWORD_MNEM_SUFFIX;
6756 else
6757 continue;
6758 break;
6759 }
6760
6761 /* As an exception, movsx/movzx silently default to a byte source
6762 in AT&T mode. */
6763 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6764 && !i.suffix && !intel_syntax)
6765 i.suffix = BYTE_MNEM_SUFFIX;
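/* Hence a bare `movzx (%rax), %eax' in AT&T mode assembles as
`movzbl' instead of being rejected as ambiguous. */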
6766 }
6767 else if (i.suffix == BYTE_MNEM_SUFFIX)
6768 {
6769 if (intel_syntax
6770 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6771 && i.tm.opcode_modifier.no_bsuf)
6772 i.suffix = 0;
6773 else if (!check_byte_reg ())
6774 return 0;
6775 }
6776 else if (i.suffix == LONG_MNEM_SUFFIX)
6777 {
6778 if (intel_syntax
6779 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6780 && i.tm.opcode_modifier.no_lsuf
6781 && !i.tm.opcode_modifier.todword
6782 && !i.tm.opcode_modifier.toqword)
6783 i.suffix = 0;
6784 else if (!check_long_reg ())
6785 return 0;
6786 }
6787 else if (i.suffix == QWORD_MNEM_SUFFIX)
6788 {
6789 if (intel_syntax
6790 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6791 && i.tm.opcode_modifier.no_qsuf
6792 && !i.tm.opcode_modifier.todword
6793 && !i.tm.opcode_modifier.toqword)
6794 i.suffix = 0;
6795 else if (!check_qword_reg ())
6796 return 0;
6797 }
6798 else if (i.suffix == WORD_MNEM_SUFFIX)
6799 {
6800 if (intel_syntax
6801 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6802 && i.tm.opcode_modifier.no_wsuf)
6803 i.suffix = 0;
6804 else if (!check_word_reg ())
6805 return 0;
6806 }
6807 else if (intel_syntax
6808 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6809 /* Do nothing if the instruction is going to ignore the prefix. */
6810 ;
6811 else
6812 abort ();
6813
6814 /* Undo the movsx/movzx change done above. */
6815 i.operands = numop;
6816 }
6817 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6818 && !i.suffix)
6819 {
6820 i.suffix = stackop_size;
6821 if (stackop_size == LONG_MNEM_SUFFIX)
6822 {
6823 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6824 .code16gcc directive to support 16-bit mode with
6825 32-bit address. For IRET without a suffix, generate
6826 16-bit IRET (opcode 0xcf) to return from an interrupt
6827 handler. */
6828 if (i.tm.base_opcode == 0xcf)
6829 {
6830 i.suffix = WORD_MNEM_SUFFIX;
6831 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6832 }
6833 /* Warn about changed behavior for segment register push/pop. */
6834 else if ((i.tm.base_opcode | 1) == 0x07)
6835 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6836 i.tm.name);
6837 }
6838 }
6839 else if (!i.suffix
6840 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6841 || i.tm.opcode_modifier.jump == JUMP_BYTE
6842 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6843 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6844 && i.tm.extension_opcode <= 3)))
6845 {
6846 switch (flag_code)
6847 {
6848 case CODE_64BIT:
6849 if (!i.tm.opcode_modifier.no_qsuf)
6850 {
6851 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6852 || i.tm.opcode_modifier.no_lsuf)
6853 i.suffix = QWORD_MNEM_SUFFIX;
6854 break;
6855 }
6856 /* Fall through. */
6857 case CODE_32BIT:
6858 if (!i.tm.opcode_modifier.no_lsuf)
6859 i.suffix = LONG_MNEM_SUFFIX;
6860 break;
6861 case CODE_16BIT:
6862 if (!i.tm.opcode_modifier.no_wsuf)
6863 i.suffix = WORD_MNEM_SUFFIX;
6864 break;
6865 }
6866 }
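/* E.g. a suffix-less indirect `jmp *(%rax)' defaults to the `q' form
in 64-bit code and to the `l' form in 32-bit code. */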
6867
6868 if (!i.suffix
6869 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6870 /* Also cover lret/retf/iret in 64-bit mode. */
6871 || (flag_code == CODE_64BIT
6872 && !i.tm.opcode_modifier.no_lsuf
6873 && !i.tm.opcode_modifier.no_qsuf))
6874 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6875 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6876 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6877 /* Accept FLDENV et al without suffix. */
6878 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6879 {
6880 unsigned int suffixes, evex = 0;
6881
6882 suffixes = !i.tm.opcode_modifier.no_bsuf;
6883 if (!i.tm.opcode_modifier.no_wsuf)
6884 suffixes |= 1 << 1;
6885 if (!i.tm.opcode_modifier.no_lsuf)
6886 suffixes |= 1 << 2;
6887 if (!i.tm.opcode_modifier.no_ldsuf)
6888 suffixes |= 1 << 3;
6889 if (!i.tm.opcode_modifier.no_ssuf)
6890 suffixes |= 1 << 4;
6891 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6892 suffixes |= 1 << 5;
6893
6894 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6895 also suitable for AT&T syntax mode, it was requested that this be
6896 restricted to just Intel syntax. */
6897 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6898 {
6899 unsigned int op;
6900
6901 for (op = 0; op < i.tm.operands; ++op)
6902 {
6903 if (is_evex_encoding (&i.tm)
6904 && !cpu_arch_flags.bitfield.cpuavx512vl)
6905 {
6906 if (i.tm.operand_types[op].bitfield.ymmword)
6907 i.tm.operand_types[op].bitfield.xmmword = 0;
6908 if (i.tm.operand_types[op].bitfield.zmmword)
6909 i.tm.operand_types[op].bitfield.ymmword = 0;
6910 if (!i.tm.opcode_modifier.evex
6911 || i.tm.opcode_modifier.evex == EVEXDYN)
6912 i.tm.opcode_modifier.evex = EVEX512;
6913 }
6914
6915 if (i.tm.operand_types[op].bitfield.xmmword
6916 + i.tm.operand_types[op].bitfield.ymmword
6917 + i.tm.operand_types[op].bitfield.zmmword < 2)
6918 continue;
6919
6920 /* Any properly sized operand disambiguates the insn. */
6921 if (i.types[op].bitfield.xmmword
6922 || i.types[op].bitfield.ymmword
6923 || i.types[op].bitfield.zmmword)
6924 {
6925 suffixes &= ~(7 << 6);
6926 evex = 0;
6927 break;
6928 }
6929
6930 if ((i.flags[op] & Operand_Mem)
6931 && i.tm.operand_types[op].bitfield.unspecified)
6932 {
6933 if (i.tm.operand_types[op].bitfield.xmmword)
6934 suffixes |= 1 << 6;
6935 if (i.tm.operand_types[op].bitfield.ymmword)
6936 suffixes |= 1 << 7;
6937 if (i.tm.operand_types[op].bitfield.zmmword)
6938 suffixes |= 1 << 8;
6939 if (is_evex_encoding (&i.tm))
6940 evex = EVEX512;
6941 }
6942 }
6943 }
6944
6945 /* Are multiple suffixes / operand sizes allowed? */
6946 if (suffixes & (suffixes - 1))
6947 {
6948 if (intel_syntax
6949 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6950 || operand_check == check_error))
6951 {
6952 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6953 return 0;
6954 }
6955 if (operand_check == check_error)
6956 {
6957 as_bad (_("no instruction mnemonic suffix given and "
6958 "no register operands; can't size `%s'"), i.tm.name);
6959 return 0;
6960 }
6961 if (operand_check == check_warning)
6962 as_warn (_("%s; using default for `%s'"),
6963 intel_syntax
6964 ? _("ambiguous operand size")
6965 : _("no instruction mnemonic suffix given and "
6966 "no register operands"),
6967 i.tm.name);
6968
6969 if (i.tm.opcode_modifier.floatmf)
6970 i.suffix = SHORT_MNEM_SUFFIX;
6971 else if ((i.tm.base_opcode | 8) == 0xfbe
6972 || (i.tm.base_opcode == 0x63
6973 && i.tm.cpu_flags.bitfield.cpu64))
6974 /* handled below */;
6975 else if (evex)
6976 i.tm.opcode_modifier.evex = evex;
6977 else if (flag_code == CODE_16BIT)
6978 i.suffix = WORD_MNEM_SUFFIX;
6979 else if (!i.tm.opcode_modifier.no_lsuf)
6980 i.suffix = LONG_MNEM_SUFFIX;
6981 else
6982 i.suffix = QWORD_MNEM_SUFFIX;
6983 }
6984 }
6985
6986 if ((i.tm.base_opcode | 8) == 0xfbe
6987 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6988 {
6989 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6990 In AT&T syntax, if there is no suffix (warned about above), the default
6991 will be byte extension. */
6992 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6993 i.tm.base_opcode |= 1;
6994
6995 /* For further processing, the suffix should represent the destination
6996 (register). This is already the case when one was used with
6997 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6998 no suffix to begin with. */
6999 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7000 {
7001 if (i.types[1].bitfield.word)
7002 i.suffix = WORD_MNEM_SUFFIX;
7003 else if (i.types[1].bitfield.qword)
7004 i.suffix = QWORD_MNEM_SUFFIX;
7005 else
7006 i.suffix = LONG_MNEM_SUFFIX;
7007
7008 i.tm.opcode_modifier.w = 0;
7009 }
7010 }
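/* E.g. `movzx %ax, %rcx' was matched using the `w' (source) size;
from here on i.suffix is `q', the destination size, so REX.W is
derived correctly below. */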
7011
7012 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7013 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7014 != (i.tm.operand_types[1].bitfield.class == Reg);
7015
7016 /* Change the opcode based on the operand size given by i.suffix. */
7017 switch (i.suffix)
7018 {
7019 /* Size floating point instruction. */
7020 case LONG_MNEM_SUFFIX:
7021 if (i.tm.opcode_modifier.floatmf)
7022 {
7023 i.tm.base_opcode ^= 4;
7024 break;
7025 }
7026 /* fall through */
7027 case WORD_MNEM_SUFFIX:
7028 case QWORD_MNEM_SUFFIX:
7029 /* It's not a byte, select word/dword operation. */
7030 if (i.tm.opcode_modifier.w)
7031 {
7032 if (i.short_form)
7033 i.tm.base_opcode |= 8;
7034 else
7035 i.tm.base_opcode |= 1;
7036 }
7037 /* fall through */
7038 case SHORT_MNEM_SUFFIX:
7039 /* Now select between word & dword operations via the operand
7040 size prefix, except for instructions that will ignore this
7041 prefix anyway. */
7042 if (i.suffix != QWORD_MNEM_SUFFIX
7043 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7044 && !i.tm.opcode_modifier.floatmf
7045 && !is_any_vex_encoding (&i.tm)
7046 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7047 || (flag_code == CODE_64BIT
7048 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7049 {
7050 unsigned int prefix = DATA_PREFIX_OPCODE;
7051
7052 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7053 prefix = ADDR_PREFIX_OPCODE;
7054
7055 if (!add_prefix (prefix))
7056 return 0;
7057 }
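/* E.g. `addw %ax, %bx' in 32-bit code receives the 0x66 data size
prefix here, while a sized `loop' gets 0x67 instead: it is the address
size prefix that selects between %cx/%ecx/%rcx as the count
register. */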
7058
7059 /* Set REX.W (64-bit operand size) for the operand. */
7060 if (i.suffix == QWORD_MNEM_SUFFIX
7061 && flag_code == CODE_64BIT
7062 && !i.tm.opcode_modifier.norex64
7063 && !i.tm.opcode_modifier.vexw
7064 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7065 need rex64. */
7066 && ! (i.operands == 2
7067 && i.tm.base_opcode == 0x90
7068 && i.tm.extension_opcode == None
7069 && i.types[0].bitfield.instance == Accum
7070 && i.types[0].bitfield.qword
7071 && i.types[1].bitfield.instance == Accum
7072 && i.types[1].bitfield.qword))
7073 i.rex |= REX_W;
7074
7075 break;
7076
7077 case 0:
7078 /* Select word/dword/qword operation with explicit data sizing prefix
7079 when there are no suitable register operands. */
7080 if (i.tm.opcode_modifier.w
7081 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7082 && (!i.reg_operands
7083 || (i.reg_operands == 1
7084 /* ShiftCount */
7085 && (i.tm.operand_types[0].bitfield.instance == RegC
7086 /* InOutPortReg */
7087 || i.tm.operand_types[0].bitfield.instance == RegD
7088 || i.tm.operand_types[1].bitfield.instance == RegD
7089 /* CRC32 */
7090 || i.tm.base_opcode == 0xf20f38f0))))
7091 i.tm.base_opcode |= 1;
7092 break;
7093 }
7094
7095 if (i.tm.opcode_modifier.addrprefixopreg)
7096 {
7097 gas_assert (!i.suffix);
7098 gas_assert (i.reg_operands);
7099
7100 if (i.tm.operand_types[0].bitfield.instance == Accum
7101 || i.operands == 1)
7102 {
7103 /* The address size override prefix changes the size of the
7104 first operand. */
7105 if (flag_code == CODE_64BIT
7106 && i.op[0].regs->reg_type.bitfield.word)
7107 {
7108 as_bad (_("16-bit addressing unavailable for `%s'"),
7109 i.tm.name);
7110 return 0;
7111 }
7112
7113 if ((flag_code == CODE_32BIT
7114 ? i.op[0].regs->reg_type.bitfield.word
7115 : i.op[0].regs->reg_type.bitfield.dword)
7116 && !add_prefix (ADDR_PREFIX_OPCODE))
7117 return 0;
7118 }
7119 else
7120 {
7121 /* Check for invalid register operands when the address size override
7122 prefix changes the size of register operands. */
7123 unsigned int op;
7124 enum { need_word, need_dword, need_qword } need;
7125
7126 if (flag_code == CODE_32BIT)
7127 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7128 else if (i.prefix[ADDR_PREFIX])
7129 need = need_dword;
7130 else
7131 need = flag_code == CODE_64BIT ? need_qword : need_word;
7132
7133 for (op = 0; op < i.operands; op++)
7134 {
7135 if (i.types[op].bitfield.class != Reg)
7136 continue;
7137
7138 switch (need)
7139 {
7140 case need_word:
7141 if (i.op[op].regs->reg_type.bitfield.word)
7142 continue;
7143 break;
7144 case need_dword:
7145 if (i.op[op].regs->reg_type.bitfield.dword)
7146 continue;
7147 break;
7148 case need_qword:
7149 if (i.op[op].regs->reg_type.bitfield.qword)
7150 continue;
7151 break;
7152 }
7153
7154 as_bad (_("invalid register operand size for `%s'"),
7155 i.tm.name);
7156 return 0;
7157 }
7158 }
7159 }
7160
7161 return 1;
7162 }
7163
7164 static int
7165 check_byte_reg (void)
7166 {
7167 int op;
7168
7169 for (op = i.operands; --op >= 0;)
7170 {
7171 /* Skip non-register operands. */
7172 if (i.types[op].bitfield.class != Reg)
7173 continue;
7174
7175 /* If this is an eight bit register, it's OK. If it's the 16 or
7176 32 bit version of an eight bit register, we will just use the
7177 low portion, and that's OK too. */
7178 if (i.types[op].bitfield.byte)
7179 continue;
7180
7181 /* I/O port address operands are OK too. */
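/* (E.g. the %dx of `inb %dx, %al'.) */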
7182 if (i.tm.operand_types[op].bitfield.instance == RegD
7183 && i.tm.operand_types[op].bitfield.word)
7184 continue;
7185
7186 /* crc32 only wants its source operand checked here. */
7187 if (i.tm.base_opcode == 0xf20f38f0 && op)
7188 continue;
7189
7190 /* Any other register is bad. */
7191 as_bad (_("`%s%s' not allowed with `%s%c'"),
7192 register_prefix, i.op[op].regs->reg_name,
7193 i.tm.name, i.suffix);
7194 return 0;
7195 }
7196 return 1;
7197 }
7198
7199 static int
7200 check_long_reg (void)
7201 {
7202 int op;
7203
7204 for (op = i.operands; --op >= 0;)
7205 /* Skip non-register operands. */
7206 if (i.types[op].bitfield.class != Reg)
7207 continue;
7208 /* Reject eight bit registers, except where the template requires
7209 them. (e.g. movzb) */
7210 else if (i.types[op].bitfield.byte
7211 && (i.tm.operand_types[op].bitfield.class == Reg
7212 || i.tm.operand_types[op].bitfield.instance == Accum)
7213 && (i.tm.operand_types[op].bitfield.word
7214 || i.tm.operand_types[op].bitfield.dword))
7215 {
7216 as_bad (_("`%s%s' not allowed with `%s%c'"),
7217 register_prefix,
7218 i.op[op].regs->reg_name,
7219 i.tm.name,
7220 i.suffix);
7221 return 0;
7222 }
7223 /* Error if the e prefix on a general reg is missing. */
7224 else if (i.types[op].bitfield.word
7225 && (i.tm.operand_types[op].bitfield.class == Reg
7226 || i.tm.operand_types[op].bitfield.instance == Accum)
7227 && i.tm.operand_types[op].bitfield.dword)
7228 {
7229 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7230 register_prefix, i.op[op].regs->reg_name,
7231 i.suffix);
7232 return 0;
7233 }
7234 /* Warn if the r prefix on a general reg is present. */
7235 else if (i.types[op].bitfield.qword
7236 && (i.tm.operand_types[op].bitfield.class == Reg
7237 || i.tm.operand_types[op].bitfield.instance == Accum)
7238 && i.tm.operand_types[op].bitfield.dword)
7239 {
7240 if (intel_syntax
7241 && i.tm.opcode_modifier.toqword
7242 && i.types[0].bitfield.class != RegSIMD)
7243 {
7244 /* Convert to QWORD. We want REX byte. */
7245 i.suffix = QWORD_MNEM_SUFFIX;
7246 }
7247 else
7248 {
7249 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7250 register_prefix, i.op[op].regs->reg_name,
7251 i.suffix);
7252 return 0;
7253 }
7254 }
7255 return 1;
7256 }
7257
7258 static int
7259 check_qword_reg (void)
7260 {
7261 int op;
7262
7263 for (op = i.operands; --op >= 0; )
7264 /* Skip non-register operands. */
7265 if (i.types[op].bitfield.class != Reg)
7266 continue;
7267 /* Reject eight bit registers, except where the template requires
7268 them. (e.g. movzb) */
7269 else if (i.types[op].bitfield.byte
7270 && (i.tm.operand_types[op].bitfield.class == Reg
7271 || i.tm.operand_types[op].bitfield.instance == Accum)
7272 && (i.tm.operand_types[op].bitfield.word
7273 || i.tm.operand_types[op].bitfield.dword))
7274 {
7275 as_bad (_("`%s%s' not allowed with `%s%c'"),
7276 register_prefix,
7277 i.op[op].regs->reg_name,
7278 i.tm.name,
7279 i.suffix);
7280 return 0;
7281 }
7282 /* Warn if the r prefix on a general reg is missing. */
7283 else if ((i.types[op].bitfield.word
7284 || i.types[op].bitfield.dword)
7285 && (i.tm.operand_types[op].bitfield.class == Reg
7286 || i.tm.operand_types[op].bitfield.instance == Accum)
7287 && i.tm.operand_types[op].bitfield.qword)
7288 {
7289 /* Prohibit these changes in 64bit mode, since the
7290 lowering is more complicated. */
7291 if (intel_syntax
7292 && i.tm.opcode_modifier.todword
7293 && i.types[0].bitfield.class != RegSIMD)
7294 {
7295 /* Convert to DWORD. We don't want REX byte. */
7296 i.suffix = LONG_MNEM_SUFFIX;
7297 }
7298 else
7299 {
7300 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7301 register_prefix, i.op[op].regs->reg_name,
7302 i.suffix);
7303 return 0;
7304 }
7305 }
7306 return 1;
7307 }
7308
7309 static int
7310 check_word_reg (void)
7311 {
7312 int op;
7313 for (op = i.operands; --op >= 0;)
7314 /* Skip non-register operands. */
7315 if (i.types[op].bitfield.class != Reg)
7316 continue;
7317 /* Reject eight bit registers, except where the template requires
7318 them. (e.g. movzb) */
7319 else if (i.types[op].bitfield.byte
7320 && (i.tm.operand_types[op].bitfield.class == Reg
7321 || i.tm.operand_types[op].bitfield.instance == Accum)
7322 && (i.tm.operand_types[op].bitfield.word
7323 || i.tm.operand_types[op].bitfield.dword))
7324 {
7325 as_bad (_("`%s%s' not allowed with `%s%c'"),
7326 register_prefix,
7327 i.op[op].regs->reg_name,
7328 i.tm.name,
7329 i.suffix);
7330 return 0;
7331 }
7332 /* Error if the e or r prefix on a general reg is present. */
7333 else if ((i.types[op].bitfield.dword
7334 || i.types[op].bitfield.qword)
7335 && (i.tm.operand_types[op].bitfield.class == Reg
7336 || i.tm.operand_types[op].bitfield.instance == Accum)
7337 && i.tm.operand_types[op].bitfield.word)
7338 {
7339 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7340 register_prefix, i.op[op].regs->reg_name,
7341 i.suffix);
7342 return 0;
7343 }
7344 return 1;
7345 }
7346
7347 static int
7348 update_imm (unsigned int j)
7349 {
7350 i386_operand_type overlap = i.types[j];
7351 if ((overlap.bitfield.imm8
7352 || overlap.bitfield.imm8s
7353 || overlap.bitfield.imm16
7354 || overlap.bitfield.imm32
7355 || overlap.bitfield.imm32s
7356 || overlap.bitfield.imm64)
7357 && !operand_type_equal (&overlap, &imm8)
7358 && !operand_type_equal (&overlap, &imm8s)
7359 && !operand_type_equal (&overlap, &imm16)
7360 && !operand_type_equal (&overlap, &imm32)
7361 && !operand_type_equal (&overlap, &imm32s)
7362 && !operand_type_equal (&overlap, &imm64))
7363 {
7364 if (i.suffix)
7365 {
7366 i386_operand_type temp;
7367
7368 operand_type_set (&temp, 0);
7369 if (i.suffix == BYTE_MNEM_SUFFIX)
7370 {
7371 temp.bitfield.imm8 = overlap.bitfield.imm8;
7372 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7373 }
7374 else if (i.suffix == WORD_MNEM_SUFFIX)
7375 temp.bitfield.imm16 = overlap.bitfield.imm16;
7376 else if (i.suffix == QWORD_MNEM_SUFFIX)
7377 {
7378 temp.bitfield.imm64 = overlap.bitfield.imm64;
7379 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7380 }
7381 else
7382 temp.bitfield.imm32 = overlap.bitfield.imm32;
7383 overlap = temp;
7384 }
7385 else if (operand_type_equal (&overlap, &imm16_32_32s)
7386 || operand_type_equal (&overlap, &imm16_32)
7387 || operand_type_equal (&overlap, &imm16_32s))
7388 {
7389 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7390 overlap = imm16;
7391 else
7392 overlap = imm32s;
7393 }
7394 else if (i.prefix[REX_PREFIX] & REX_W)
7395 overlap = operand_type_and (overlap, imm32s);
7396 else if (i.prefix[DATA_PREFIX])
7397 overlap = operand_type_and (overlap,
7398 flag_code != CODE_16BIT ? imm16 : imm32);
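/* Illustration (example ours): an explicit `data16 push $imm' outside
16-bit mode takes the branch above, narrowing the immediate to 16
bits. */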
7399 if (!operand_type_equal (&overlap, &imm8)
7400 && !operand_type_equal (&overlap, &imm8s)
7401 && !operand_type_equal (&overlap, &imm16)
7402 && !operand_type_equal (&overlap, &imm32)
7403 && !operand_type_equal (&overlap, &imm32s)
7404 && !operand_type_equal (&overlap, &imm64))
7405 {
7406 as_bad (_("no instruction mnemonic suffix given; "
7407 "can't determine immediate size"));
7408 return 0;
7409 }
7410 }
7411 i.types[j] = overlap;
7412
7413 return 1;
7414 }
7415
7416 static int
7417 finalize_imm (void)
7418 {
7419 unsigned int j, n;
7420
7421 /* Update the first 2 immediate operands. */
7422 n = i.operands > 2 ? 2 : i.operands;
7423 if (n)
7424 {
7425 for (j = 0; j < n; j++)
7426 if (update_imm (j) == 0)
7427 return 0;
7428
7429 /* The 3rd operand can't be an immediate operand. */
7430 gas_assert (operand_type_check (i.types[2], imm) == 0);
7431 }
7432
7433 return 1;
7434 }
7435
7436 static int
7437 process_operands (void)
7438 {
7439 /* Default segment register this instruction will use for memory
7440 accesses. 0 means unknown. This is only for optimizing out
7441 unnecessary segment overrides. */
7442 const seg_entry *default_seg = 0;
7443
7444 if (i.tm.opcode_modifier.sse2avx)
7445 {
7446 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7447 need converting. */
7448 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7449 i.prefix[REX_PREFIX] = 0;
7450 i.rex_encoding = 0;
7451 }
7452 /* ImmExt should be processed after SSE2AVX. */
7453 else if (i.tm.opcode_modifier.immext)
7454 process_immext ();
7455
7456 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7457 {
7458 unsigned int dupl = i.operands;
7459 unsigned int dest = dupl - 1;
7460 unsigned int j;
7461
7462 /* The destination must be an xmm register. */
7463 gas_assert (i.reg_operands
7464 && MAX_OPERANDS > dupl
7465 && operand_type_equal (&i.types[dest], &regxmm));
7466
7467 if (i.tm.operand_types[0].bitfield.instance == Accum
7468 && i.tm.operand_types[0].bitfield.xmmword)
7469 {
7470 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7471 {
7472 /* Keep xmm0 for instructions with VEX prefix and 3
7473 sources. */
7474 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7475 i.tm.operand_types[0].bitfield.class = RegSIMD;
7476 goto duplicate;
7477 }
7478 else
7479 {
7480 /* We drop the explicit first xmm0 by shifting the remaining
7481 operands down one slot while keeping i.operands unchanged,
7482 which in effect duplicates the destination in the top slot. */
7483 for (j = 1; j < i.operands; j++)
7484 {
7485 i.op[j - 1] = i.op[j];
7486 i.types[j - 1] = i.types[j];
7487 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7488 i.flags[j - 1] = i.flags[j];
7489 }
7490 }
7491 }
7492 else if (i.tm.opcode_modifier.implicit1stxmm0)
7493 {
7494 gas_assert ((MAX_OPERANDS - 1) > dupl
7495 && (i.tm.opcode_modifier.vexsources
7496 == VEX3SOURCES));
7497
7498 /* Add the implicit xmm0 for instructions with VEX prefix
7499 and 3 sources. */
7500 for (j = i.operands; j > 0; j--)
7501 {
7502 i.op[j] = i.op[j - 1];
7503 i.types[j] = i.types[j - 1];
7504 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7505 i.flags[j] = i.flags[j - 1];
7506 }
7507 i.op[0].regs
7508 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7509 i.types[0] = regxmm;
7510 i.tm.operand_types[0] = regxmm;
7511
7512 i.operands += 2;
7513 i.reg_operands += 2;
7514 i.tm.operands += 2;
7515
7516 dupl++;
7517 dest++;
7518 i.op[dupl] = i.op[dest];
7519 i.types[dupl] = i.types[dest];
7520 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7521 i.flags[dupl] = i.flags[dest];
7522 }
7523 else
7524 {
7525 duplicate:
7526 i.operands++;
7527 i.reg_operands++;
7528 i.tm.operands++;
7529
7530 i.op[dupl] = i.op[dest];
7531 i.types[dupl] = i.types[dest];
7532 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7533 i.flags[dupl] = i.flags[dest];
7534 }
7535
7536 if (i.tm.opcode_modifier.immext)
7537 process_immext ();
7538 }
7539 else if (i.tm.operand_types[0].bitfield.instance == Accum
7540 && i.tm.operand_types[0].bitfield.xmmword)
7541 {
7542 unsigned int j;
7543
7544 for (j = 1; j < i.operands; j++)
7545 {
7546 i.op[j - 1] = i.op[j];
7547 i.types[j - 1] = i.types[j];
7548
7549 /* We need to adjust fields in i.tm since they are used by
7550 build_modrm_byte. */
7551 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7552
7553 i.flags[j - 1] = i.flags[j];
7554 }
7555
7556 i.operands--;
7557 i.reg_operands--;
7558 i.tm.operands--;
7559 }
7560 else if (i.tm.opcode_modifier.implicitquadgroup)
7561 {
7562 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7563
7564 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7565 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7566 regnum = register_number (i.op[1].regs);
7567 first_reg_in_group = regnum & ~3;
7568 last_reg_in_group = first_reg_in_group + 3;
7569 if (regnum != first_reg_in_group)
7570 as_warn (_("source register `%s%s' implicitly denotes"
7571 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7572 register_prefix, i.op[1].regs->reg_name,
7573 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7574 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7575 i.tm.name);
7576 }
7577 else if (i.tm.opcode_modifier.regkludge)
7578 {
7579 /* The imul $imm, %reg instruction is converted into
7580 imul $imm, %reg, %reg, and the clr %reg instruction
7581 is converted into xor %reg, %reg. */
7582
7583 unsigned int first_reg_op;
7584
7585 if (operand_type_check (i.types[0], reg))
7586 first_reg_op = 0;
7587 else
7588 first_reg_op = 1;
7589 /* Pretend we saw the extra register operand. */
7590 gas_assert (i.reg_operands == 1
7591 && i.op[first_reg_op + 1].regs == 0);
7592 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7593 i.types[first_reg_op + 1] = i.types[first_reg_op];
7594 i.operands++;
7595 i.reg_operands++;
7596 }
7597
7598 if (i.tm.opcode_modifier.modrm)
7599 {
7600 /* The opcode is completed (modulo i.tm.extension_opcode which
7601 must be put into the modrm byte). Now, we make the modrm and
7602 index base bytes based on all the info we've collected. */
7603
7604 default_seg = build_modrm_byte ();
7605 }
7606 else if (i.types[0].bitfield.class == SReg)
7607 {
7608 if (flag_code != CODE_64BIT
7609 ? i.tm.base_opcode == POP_SEG_SHORT
7610 && i.op[0].regs->reg_num == 1
7611 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7612 && i.op[0].regs->reg_num < 4)
7613 {
7614 as_bad (_("you can't `%s %s%s'"),
7615 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7616 return 0;
7617 }
7618 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7619 {
7620 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7621 i.tm.opcode_length = 2;
7622 }
7623 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7624 }
7625 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7626 {
7627 default_seg = &ds;
7628 }
7629 else if (i.tm.opcode_modifier.isstring)
7630 {
7631 /* For the string instructions that allow a segment override
7632 on one of their operands, the default segment is ds. */
7633 default_seg = &ds;
7634 }
7635 else if (i.short_form)
7636 {
7637 /* The register or float register operand is in operand
7638 0 or 1. */
7639 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7640
7641 /* Register goes in low 3 bits of opcode. */
7642 i.tm.base_opcode |= i.op[op].regs->reg_num;
7643 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7644 i.rex |= REX_B;
7645 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7646 {
7647 /* Warn about some common errors, but press on regardless.
7648 The first case can be generated by gcc (<= 2.8.1). */
7649 if (i.operands == 2)
7650 {
7651 /* Reversed arguments on faddp, fsubp, etc. */
7652 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7653 register_prefix, i.op[!intel_syntax].regs->reg_name,
7654 register_prefix, i.op[intel_syntax].regs->reg_name);
7655 }
7656 else
7657 {
7658 /* Extraneous `l' suffix on fp insn. */
7659 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7660 register_prefix, i.op[0].regs->reg_name);
7661 }
7662 }
7663 }
7664
7665 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7666 && i.tm.base_opcode == 0x8d /* lea */
7667 && !is_any_vex_encoding(&i.tm))
7668 {
7669 if (!quiet_warnings)
7670 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7671 if (optimize)
7672 {
7673 i.seg[0] = NULL;
7674 i.prefix[SEG_PREFIX] = 0;
7675 }
7676 }
7677
7678 /* If a segment was explicitly specified, and the specified segment
7679 is neither the default nor the one already recorded from a prefix,
7680 use an opcode prefix to select it. If we never figured out what
7681 the default segment is, then default_seg will be zero at this
7682 point, and the specified segment prefix will always be used. */
7683 if (i.seg[0]
7684 && i.seg[0] != default_seg
7685 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7686 {
7687 if (!add_prefix (i.seg[0]->seg_prefix))
7688 return 0;
7689 }
7690 return 1;
7691 }
7692
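/* Record the REX/VREX extension bit for register R: diagnose a doubled
explicit REX prefix, and, when converting under SSE2AVX with the bit
already supplied by an explicit REX prefix, redirect the VEX register
specifier to its REX-extended counterpart (reg_entry + 8). */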
7693 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7694 bfd_boolean do_sse2avx)
7695 {
7696 if (r->reg_flags & RegRex)
7697 {
7698 if (i.rex & rex_bit)
7699 as_bad (_("same type of prefix used twice"));
7700 i.rex |= rex_bit;
7701 }
7702 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7703 {
7704 gas_assert (i.vex.register_specifier == r);
7705 i.vex.register_specifier += 8;
7706 }
7707
7708 if (r->reg_flags & RegVRex)
7709 i.vrex |= rex_bit;
7710 }
7711
7712 static const seg_entry *
7713 build_modrm_byte (void)
7714 {
7715 const seg_entry *default_seg = 0;
7716 unsigned int source, dest;
7717 int vex_3_sources;
7718
7719 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7720 if (vex_3_sources)
7721 {
7722 unsigned int nds, reg_slot;
7723 expressionS *exp;
7724
7725 dest = i.operands - 1;
7726 nds = dest - 1;
7727
7728 /* There are 2 kinds of instructions:
7729 1. 5 operands: 4 register operands or 3 register operands
7730 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7731 VexW0 or VexW1. The destination must be either XMM, YMM or
7732 ZMM register.
7733 2. 4 operands: 4 register operands or 3 register operands
7734 plus 1 memory operand, with VexXDS. */
7735 gas_assert ((i.reg_operands == 4
7736 || (i.reg_operands == 3 && i.mem_operands == 1))
7737 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7738 && i.tm.opcode_modifier.vexw
7739 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7740
7741 /* If VexW1 is set, the first non-immediate operand is the source and
7742 the second non-immediate one is encoded in the immediate operand. */
7743 if (i.tm.opcode_modifier.vexw == VEXW1)
7744 {
7745 source = i.imm_operands;
7746 reg_slot = i.imm_operands + 1;
7747 }
7748 else
7749 {
7750 source = i.imm_operands + 1;
7751 reg_slot = i.imm_operands;
7752 }
7753
7754 if (i.imm_operands == 0)
7755 {
7756 /* When there is no immediate operand, generate an 8bit
7757 immediate operand to encode the first operand. */
7758 exp = &im_expressions[i.imm_operands++];
7759 i.op[i.operands].imms = exp;
7760 i.types[i.operands] = imm8;
7761 i.operands++;
7762
7763 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7764 exp->X_op = O_constant;
7765 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7766 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7767 }
7768 else
7769 {
7770 gas_assert (i.imm_operands == 1);
7771 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7772 gas_assert (!i.tm.opcode_modifier.immext);
7773
7774 /* Turn on Imm8 again so that output_imm will generate it. */
7775 i.types[0].bitfield.imm8 = 1;
7776
7777 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7778 i.op[0].imms->X_add_number
7779 |= register_number (i.op[reg_slot].regs) << 4;
7780 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7781 }
7782
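      /* Either way the register from REG_SLOT ends up in bits 7:4 of
	 the immediate byte, the usual "is4" encoding used by, e.g.,
	 vblendvps.  */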
7783 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7784 i.vex.register_specifier = i.op[nds].regs;
7785 }
7786 else
7787 source = dest = 0;
7788
7789 /* i.reg_operands MUST be the number of real register operands;
7790 implicit registers do not count. If there are 3 register
7791 	 operands, it must be an instruction with VexNDS.  For an
7792 	 instruction with VexNDD, the destination register is encoded
7793 	 in the VEX prefix.  If there are 4 register operands, it must
7794 	 be an instruction with a VEX prefix and 3 sources.  */
7795 if (i.mem_operands == 0
7796 && ((i.reg_operands == 2
7797 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7798 || (i.reg_operands == 3
7799 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7800 || (i.reg_operands == 4 && vex_3_sources)))
7801 {
7802 switch (i.operands)
7803 {
7804 case 2:
7805 source = 0;
7806 break;
7807 case 3:
7808 	  /* When there are 3 operands, one of them may be immediate,
7809 	     which may be the first or the last operand.  Otherwise,
7810 	     the first operand must be the shift count register (%cl),
7811 	     or it is an instruction with VexNDS.  */
7812 gas_assert (i.imm_operands == 1
7813 || (i.imm_operands == 0
7814 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7815 || (i.types[0].bitfield.instance == RegC
7816 && i.types[0].bitfield.byte))));
7817 if (operand_type_check (i.types[0], imm)
7818 || (i.types[0].bitfield.instance == RegC
7819 && i.types[0].bitfield.byte))
7820 source = 1;
7821 else
7822 source = 0;
7823 break;
7824 case 4:
7825 /* When there are 4 operands, the first two must be 8bit
7826 immediate operands. The source operand will be the 3rd
7827 one.
7828
7829 	     For instructions with VexNDS, if the first operand is an
7830 	     imm8, the source operand is the 2nd one.  If the last
7831 	     operand is imm8, the source operand is the first one.  */
7832 gas_assert ((i.imm_operands == 2
7833 && i.types[0].bitfield.imm8
7834 && i.types[1].bitfield.imm8)
7835 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7836 && i.imm_operands == 1
7837 && (i.types[0].bitfield.imm8
7838 || i.types[i.operands - 1].bitfield.imm8
7839 || i.rounding)));
7840 if (i.imm_operands == 2)
7841 source = 2;
7842 else
7843 {
7844 if (i.types[0].bitfield.imm8)
7845 source = 1;
7846 else
7847 source = 0;
7848 }
7849 break;
7850 case 5:
7851 if (is_evex_encoding (&i.tm))
7852 {
7853 	      /* For EVEX instructions, when there are 5 operands, the
7854 		 first one must be an immediate operand.  If the second
7855 		 one is an immediate operand, the source operand is the
7856 		 3rd one.  If the last one is an immediate operand, the
7857 		 source operand is the 2nd one.  */
7858 gas_assert (i.imm_operands == 2
7859 && i.tm.opcode_modifier.sae
7860 && operand_type_check (i.types[0], imm));
7861 if (operand_type_check (i.types[1], imm))
7862 source = 2;
7863 else if (operand_type_check (i.types[4], imm))
7864 source = 1;
7865 else
7866 abort ();
7867 }
7868 break;
7869 default:
7870 abort ();
7871 }
7872
7873 if (!vex_3_sources)
7874 {
7875 dest = source + 1;
7876
7877 /* RC/SAE operand could be between DEST and SRC. That happens
7878 when one operand is GPR and the other one is XMM/YMM/ZMM
7879 register. */
7880 if (i.rounding && i.rounding->operand == (int) dest)
7881 dest++;
7882
7883 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7884 {
7885 /* For instructions with VexNDS, the register-only source
7886 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7887 register. It is encoded in VEX prefix. */
7888
7889 i386_operand_type op;
7890 unsigned int vvvv;
7891
7892 /* Check register-only source operand when two source
7893 operands are swapped. */
7894 if (!i.tm.operand_types[source].bitfield.baseindex
7895 && i.tm.operand_types[dest].bitfield.baseindex)
7896 {
7897 vvvv = source;
7898 source = dest;
7899 }
7900 else
7901 vvvv = dest;
7902
7903 op = i.tm.operand_types[vvvv];
7904 if ((dest + 1) >= i.operands
7905 || ((op.bitfield.class != Reg
7906 || (!op.bitfield.dword && !op.bitfield.qword))
7907 && op.bitfield.class != RegSIMD
7908 && !operand_type_equal (&op, &regmask)))
7909 abort ();
7910 i.vex.register_specifier = i.op[vvvv].regs;
7911 dest++;
7912 }
7913 }
7914
7915 i.rm.mode = 3;
7916 /* One of the register operands will be encoded in the i.rm.reg
7917 field, the other in the combined i.rm.mode and i.rm.regmem
7918 fields. If no form of this instruction supports a memory
7919 destination operand, then we assume the source operand may
7920 sometimes be a memory operand and so we need to store the
7921 destination in the i.rm.reg field. */
7922 if (!i.tm.opcode_modifier.regmem
7923 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7924 {
7925 i.rm.reg = i.op[dest].regs->reg_num;
7926 i.rm.regmem = i.op[source].regs->reg_num;
7927 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7928 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7929 i.has_regmmx = TRUE;
7930 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7931 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7932 {
7933 if (i.types[dest].bitfield.zmmword
7934 || i.types[source].bitfield.zmmword)
7935 i.has_regzmm = TRUE;
7936 else if (i.types[dest].bitfield.ymmword
7937 || i.types[source].bitfield.ymmword)
7938 i.has_regymm = TRUE;
7939 else
7940 i.has_regxmm = TRUE;
7941 }
7942 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7943 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7944 }
7945 else
7946 {
7947 i.rm.reg = i.op[source].regs->reg_num;
7948 i.rm.regmem = i.op[dest].regs->reg_num;
7949 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7950 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
7951 }
7952 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7953 {
7954 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7955 abort ();
7956 i.rex &= ~REX_R;
7957 add_prefix (LOCK_PREFIX_OPCODE);
7958 }
7959 }
7960 else
7961 { /* If it's not 2 reg operands... */
7962 unsigned int mem;
7963
7964 if (i.mem_operands)
7965 {
7966 unsigned int fake_zero_displacement = 0;
7967 unsigned int op;
7968
7969 for (op = 0; op < i.operands; op++)
7970 if (i.flags[op] & Operand_Mem)
7971 break;
7972 gas_assert (op < i.operands);
7973
7974 if (i.tm.opcode_modifier.sib)
7975 {
7976 if (i.index_reg->reg_num == RegIZ)
7977 abort ();
7978
7979 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7980 if (!i.base_reg)
7981 {
7982 i.sib.base = NO_BASE_REGISTER;
7983 i.sib.scale = i.log2_scale_factor;
7984 i.types[op].bitfield.disp8 = 0;
7985 i.types[op].bitfield.disp16 = 0;
7986 i.types[op].bitfield.disp64 = 0;
7987 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7988 {
7989 /* Must be 32 bit */
7990 i.types[op].bitfield.disp32 = 1;
7991 i.types[op].bitfield.disp32s = 0;
7992 }
7993 else
7994 {
7995 i.types[op].bitfield.disp32 = 0;
7996 i.types[op].bitfield.disp32s = 1;
7997 }
7998 }
7999 i.sib.index = i.index_reg->reg_num;
8000 set_rex_vrex (i.index_reg, REX_X, FALSE);
8001 }
8002
8003 default_seg = &ds;
8004
8005 if (i.base_reg == 0)
8006 {
8007 i.rm.mode = 0;
8008 if (!i.disp_operands)
8009 fake_zero_displacement = 1;
8010 if (i.index_reg == 0)
8011 {
8012 i386_operand_type newdisp;
8013
8014 gas_assert (!i.tm.opcode_modifier.sib);
8015 /* Operand is just <disp> */
8016 if (flag_code == CODE_64BIT)
8017 {
8018 		      /* In 64-bit mode RIP-relative addressing replaces
8019 			 the 32-bit absolute form, so absolute addressing
8020 			 has to be encoded by one of the redundant SIB
8021 			 forms.  */
8022 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8023 i.sib.base = NO_BASE_REGISTER;
8024 i.sib.index = NO_INDEX_REGISTER;
8025 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8026 }
8027 else if ((flag_code == CODE_16BIT)
8028 ^ (i.prefix[ADDR_PREFIX] != 0))
8029 {
8030 i.rm.regmem = NO_BASE_REGISTER_16;
8031 newdisp = disp16;
8032 }
8033 else
8034 {
8035 i.rm.regmem = NO_BASE_REGISTER;
8036 newdisp = disp32;
8037 }
8038 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8039 i.types[op] = operand_type_or (i.types[op], newdisp);
8040 }
8041 else if (!i.tm.opcode_modifier.sib)
8042 {
8043 /* !i.base_reg && i.index_reg */
8044 if (i.index_reg->reg_num == RegIZ)
8045 i.sib.index = NO_INDEX_REGISTER;
8046 else
8047 i.sib.index = i.index_reg->reg_num;
8048 i.sib.base = NO_BASE_REGISTER;
8049 i.sib.scale = i.log2_scale_factor;
8050 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8051 i.types[op].bitfield.disp8 = 0;
8052 i.types[op].bitfield.disp16 = 0;
8053 i.types[op].bitfield.disp64 = 0;
8054 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8055 {
8056 /* Must be 32 bit */
8057 i.types[op].bitfield.disp32 = 1;
8058 i.types[op].bitfield.disp32s = 0;
8059 }
8060 else
8061 {
8062 i.types[op].bitfield.disp32 = 0;
8063 i.types[op].bitfield.disp32s = 1;
8064 }
8065 if ((i.index_reg->reg_flags & RegRex) != 0)
8066 i.rex |= REX_X;
8067 }
8068 }
8069 /* RIP addressing for 64bit mode. */
8070 else if (i.base_reg->reg_num == RegIP)
8071 {
8072 gas_assert (!i.tm.opcode_modifier.sib);
8073 i.rm.regmem = NO_BASE_REGISTER;
8074 i.types[op].bitfield.disp8 = 0;
8075 i.types[op].bitfield.disp16 = 0;
8076 i.types[op].bitfield.disp32 = 0;
8077 i.types[op].bitfield.disp32s = 1;
8078 i.types[op].bitfield.disp64 = 0;
8079 i.flags[op] |= Operand_PCrel;
8080 if (! i.disp_operands)
8081 fake_zero_displacement = 1;
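	      /* For example, "mov foo(%rip), %rax" uses mode 00 with
		 regmem 101 and a 32-bit displacement; a bare "(%rip)"
		 operand gets the fake zero displacement added below.  */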
8082 }
8083 else if (i.base_reg->reg_type.bitfield.word)
8084 {
8085 gas_assert (!i.tm.opcode_modifier.sib);
8086 switch (i.base_reg->reg_num)
8087 {
8088 case 3: /* (%bx) */
8089 if (i.index_reg == 0)
8090 i.rm.regmem = 7;
8091 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8092 i.rm.regmem = i.index_reg->reg_num - 6;
8093 break;
8094 case 5: /* (%bp) */
8095 default_seg = &ss;
8096 if (i.index_reg == 0)
8097 {
8098 i.rm.regmem = 6;
8099 if (operand_type_check (i.types[op], disp) == 0)
8100 {
8101 /* fake (%bp) into 0(%bp) */
8102 i.types[op].bitfield.disp8 = 1;
8103 fake_zero_displacement = 1;
8104 }
8105 }
8106 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8107 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8108 break;
8109 default: /* (%si) -> 4 or (%di) -> 5 */
8110 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8111 }
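	      /* The cases above reproduce the 16-bit r/m table:
		 0 (%bx,%si), 1 (%bx,%di), 2 (%bp,%si), 3 (%bp,%di),
		 4 (%si), 5 (%di), 6 disp16 or disp(%bp), 7 (%bx).  */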
8112 i.rm.mode = mode_from_disp_size (i.types[op]);
8113 }
8114 else /* i.base_reg and 32/64 bit mode */
8115 {
8116 if (flag_code == CODE_64BIT
8117 && operand_type_check (i.types[op], disp))
8118 {
8119 i.types[op].bitfield.disp16 = 0;
8120 i.types[op].bitfield.disp64 = 0;
8121 if (i.prefix[ADDR_PREFIX] == 0)
8122 {
8123 i.types[op].bitfield.disp32 = 0;
8124 i.types[op].bitfield.disp32s = 1;
8125 }
8126 else
8127 {
8128 i.types[op].bitfield.disp32 = 1;
8129 i.types[op].bitfield.disp32s = 0;
8130 }
8131 }
8132
8133 if (!i.tm.opcode_modifier.sib)
8134 i.rm.regmem = i.base_reg->reg_num;
8135 if ((i.base_reg->reg_flags & RegRex) != 0)
8136 i.rex |= REX_B;
8137 i.sib.base = i.base_reg->reg_num;
8138 /* x86-64 ignores REX prefix bit here to avoid decoder
8139 complications. */
8140 if (!(i.base_reg->reg_flags & RegRex)
8141 && (i.base_reg->reg_num == EBP_REG_NUM
8142 || i.base_reg->reg_num == ESP_REG_NUM))
8143 default_seg = &ss;
8144 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8145 {
8146 fake_zero_displacement = 1;
8147 i.types[op].bitfield.disp8 = 1;
8148 }
8149 i.sib.scale = i.log2_scale_factor;
8150 if (i.index_reg == 0)
8151 {
8152 gas_assert (!i.tm.opcode_modifier.sib);
8153 /* <disp>(%esp) becomes two byte modrm with no index
8154 register. We've already stored the code for esp
8155 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8156 Any base register besides %esp will not use the
8157 extra modrm byte. */
8158 i.sib.index = NO_INDEX_REGISTER;
8159 }
8160 else if (!i.tm.opcode_modifier.sib)
8161 {
8162 if (i.index_reg->reg_num == RegIZ)
8163 i.sib.index = NO_INDEX_REGISTER;
8164 else
8165 i.sib.index = i.index_reg->reg_num;
8166 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8167 if ((i.index_reg->reg_flags & RegRex) != 0)
8168 i.rex |= REX_X;
8169 }
8170
8171 if (i.disp_operands
8172 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8173 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8174 i.rm.mode = 0;
8175 else
8176 {
8177 if (!fake_zero_displacement
8178 && !i.disp_operands
8179 && i.disp_encoding)
8180 {
8181 fake_zero_displacement = 1;
8182 if (i.disp_encoding == disp_encoding_8bit)
8183 i.types[op].bitfield.disp8 = 1;
8184 else
8185 i.types[op].bitfield.disp32 = 1;
8186 }
8187 i.rm.mode = mode_from_disp_size (i.types[op]);
8188 }
8189 }
8190
8191 if (fake_zero_displacement)
8192 {
8193 /* Fakes a zero displacement assuming that i.types[op]
8194 holds the correct displacement size. */
8195 expressionS *exp;
8196
8197 gas_assert (i.op[op].disps == 0);
8198 exp = &disp_expressions[i.disp_operands++];
8199 i.op[op].disps = exp;
8200 exp->X_op = O_constant;
8201 exp->X_add_number = 0;
8202 exp->X_add_symbol = (symbolS *) 0;
8203 exp->X_op_symbol = (symbolS *) 0;
8204 }
8205
8206 mem = op;
8207 }
8208 else
8209 mem = ~0;
8210
8211 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8212 {
8213 if (operand_type_check (i.types[0], imm))
8214 i.vex.register_specifier = NULL;
8215 else
8216 {
8217 /* VEX.vvvv encodes one of the sources when the first
8218 operand is not an immediate. */
8219 if (i.tm.opcode_modifier.vexw == VEXW0)
8220 i.vex.register_specifier = i.op[0].regs;
8221 else
8222 i.vex.register_specifier = i.op[1].regs;
8223 }
8224
8225 /* Destination is a XMM register encoded in the ModRM.reg
8226 and VEX.R bit. */
8227 i.rm.reg = i.op[2].regs->reg_num;
8228 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8229 i.rex |= REX_R;
8230
8231 /* ModRM.rm and VEX.B encodes the other source. */
8232 if (!i.mem_operands)
8233 {
8234 i.rm.mode = 3;
8235
8236 if (i.tm.opcode_modifier.vexw == VEXW0)
8237 i.rm.regmem = i.op[1].regs->reg_num;
8238 else
8239 i.rm.regmem = i.op[0].regs->reg_num;
8240
8241 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8242 i.rex |= REX_B;
8243 }
8244 }
8245 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8246 {
8247 i.vex.register_specifier = i.op[2].regs;
8248 if (!i.mem_operands)
8249 {
8250 i.rm.mode = 3;
8251 i.rm.regmem = i.op[1].regs->reg_num;
8252 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8253 i.rex |= REX_B;
8254 }
8255 }
8256 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8257 (if any) based on i.tm.extension_opcode. Again, we must be
8258 careful to make sure that segment/control/debug/test/MMX
8259 registers are coded into the i.rm.reg field. */
8260 else if (i.reg_operands)
8261 {
8262 unsigned int op;
8263 unsigned int vex_reg = ~0;
8264
8265 for (op = 0; op < i.operands; op++)
8266 {
8267 if (i.types[op].bitfield.class == Reg
8268 || i.types[op].bitfield.class == RegBND
8269 || i.types[op].bitfield.class == RegMask
8270 || i.types[op].bitfield.class == SReg
8271 || i.types[op].bitfield.class == RegCR
8272 || i.types[op].bitfield.class == RegDR
8273 || i.types[op].bitfield.class == RegTR)
8274 break;
8275 if (i.types[op].bitfield.class == RegSIMD)
8276 {
8277 if (i.types[op].bitfield.zmmword)
8278 i.has_regzmm = TRUE;
8279 else if (i.types[op].bitfield.ymmword)
8280 i.has_regymm = TRUE;
8281 else
8282 i.has_regxmm = TRUE;
8283 break;
8284 }
8285 if (i.types[op].bitfield.class == RegMMX)
8286 {
8287 i.has_regmmx = TRUE;
8288 break;
8289 }
8290 }
8291
8292 if (vex_3_sources)
8293 op = dest;
8294 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8295 {
8296 /* For instructions with VexNDS, the register-only
8297 source operand is encoded in VEX prefix. */
8298 gas_assert (mem != (unsigned int) ~0);
8299
8300 if (op > mem)
8301 {
8302 vex_reg = op++;
8303 gas_assert (op < i.operands);
8304 }
8305 else
8306 {
8307 /* Check register-only source operand when two source
8308 operands are swapped. */
8309 if (!i.tm.operand_types[op].bitfield.baseindex
8310 && i.tm.operand_types[op + 1].bitfield.baseindex)
8311 {
8312 vex_reg = op;
8313 op += 2;
8314 gas_assert (mem == (vex_reg + 1)
8315 && op < i.operands);
8316 }
8317 else
8318 {
8319 vex_reg = op + 1;
8320 gas_assert (vex_reg < i.operands);
8321 }
8322 }
8323 }
8324 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8325 {
8326 /* For instructions with VexNDD, the register destination
8327 is encoded in VEX prefix. */
8328 if (i.mem_operands == 0)
8329 {
8330 /* There is no memory operand. */
8331 gas_assert ((op + 2) == i.operands);
8332 vex_reg = op + 1;
8333 }
8334 else
8335 {
8336 /* There are only 2 non-immediate operands. */
8337 gas_assert (op < i.imm_operands + 2
8338 && i.operands == i.imm_operands + 2);
8339 vex_reg = i.imm_operands + 1;
8340 }
8341 }
8342 else
8343 gas_assert (op < i.operands);
8344
8345 if (vex_reg != (unsigned int) ~0)
8346 {
8347 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8348
8349 if ((type->bitfield.class != Reg
8350 || (!type->bitfield.dword && !type->bitfield.qword))
8351 && type->bitfield.class != RegSIMD
8352 && !operand_type_equal (type, &regmask))
8353 abort ();
8354
8355 i.vex.register_specifier = i.op[vex_reg].regs;
8356 }
8357
8358 /* Don't set OP operand twice. */
8359 if (vex_reg != op)
8360 {
8361 /* If there is an extension opcode to put here, the
8362 register number must be put into the regmem field. */
8363 if (i.tm.extension_opcode != None)
8364 {
8365 i.rm.regmem = i.op[op].regs->reg_num;
8366 set_rex_vrex (i.op[op].regs, REX_B,
8367 i.tm.opcode_modifier.sse2avx);
8368 }
8369 else
8370 {
8371 i.rm.reg = i.op[op].regs->reg_num;
8372 set_rex_vrex (i.op[op].regs, REX_R,
8373 i.tm.opcode_modifier.sse2avx);
8374 }
8375 }
8376
8377 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8378 must set it to 3 to indicate this is a register operand
8379 in the regmem field. */
8380 if (!i.mem_operands)
8381 i.rm.mode = 3;
8382 }
8383
8384 /* Fill in i.rm.reg field with extension opcode (if any). */
8385 if (i.tm.extension_opcode != None)
8386 i.rm.reg = i.tm.extension_opcode;
8387 }
8388 return default_seg;
8389 }
8390
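/* Return CODE16 if an operand-size prefix actually flips the branch
   displacement between 16 and 32 bits for this template; REX.W pins
   the displacement to 32 bits, so no flip happens then.  */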
8391 static unsigned int
8392 flip_code16 (unsigned int code16)
8393 {
8394 gas_assert (i.tm.operands == 1);
8395
8396 return !(i.prefix[REX_PREFIX] & REX_W)
8397 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8398 || i.tm.operand_types[0].bitfield.disp32s
8399 : i.tm.operand_types[0].bitfield.disp16)
8400 ? CODE16 : 0;
8401 }
8402
8403 static void
8404 output_branch (void)
8405 {
8406 char *p;
8407 int size;
8408 int code16;
8409 int prefix;
8410 relax_substateT subtype;
8411 symbolS *sym;
8412 offsetT off;
8413
8414 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8415 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8416
8417 prefix = 0;
8418 if (i.prefix[DATA_PREFIX] != 0)
8419 {
8420 prefix = 1;
8421 i.prefixes -= 1;
8422 code16 ^= flip_code16(code16);
8423 }
8424 /* Pentium4 branch hints. */
8425 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8426 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8427 {
8428 prefix++;
8429 i.prefixes--;
8430 }
8431 if (i.prefix[REX_PREFIX] != 0)
8432 {
8433 prefix++;
8434 i.prefixes--;
8435 }
8436
8437 /* BND prefixed jump. */
8438 if (i.prefix[BND_PREFIX] != 0)
8439 {
8440 prefix++;
8441 i.prefixes--;
8442 }
8443
8444 if (i.prefixes != 0)
8445 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8446
8447   /* It's always a symbol; end the frag & set up for relax.
8448 Make sure there is enough room in this frag for the largest
8449 instruction we may generate in md_convert_frag. This is 2
8450 bytes for the opcode and room for the prefix and largest
8451 displacement. */
8452 frag_grow (prefix + 2 + 4);
8453 /* Prefix and 1 opcode byte go in fr_fix. */
8454 p = frag_more (prefix + 1);
8455 if (i.prefix[DATA_PREFIX] != 0)
8456 *p++ = DATA_PREFIX_OPCODE;
8457 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8458 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8459 *p++ = i.prefix[SEG_PREFIX];
8460 if (i.prefix[BND_PREFIX] != 0)
8461 *p++ = BND_PREFIX_OPCODE;
8462 if (i.prefix[REX_PREFIX] != 0)
8463 *p++ = i.prefix[REX_PREFIX];
8464 *p = i.tm.base_opcode;
8465
8466 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8467 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8468 else if (cpu_arch_flags.bitfield.cpui386)
8469 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8470 else
8471 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8472 subtype |= code16;
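  /* For example, a "je target" comes through here as the short form
     0x74 with an 8-bit displacement; if the target turns out to be too
     far away, md_convert_frag relaxes it to 0x0f 0x84 with a 32-bit
     displacement (or a 16-bit one with CODE16).  */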
8473
8474 sym = i.op[0].disps->X_add_symbol;
8475 off = i.op[0].disps->X_add_number;
8476
8477 if (i.op[0].disps->X_op != O_constant
8478 && i.op[0].disps->X_op != O_symbol)
8479 {
8480 /* Handle complex expressions. */
8481 sym = make_expr_symbol (i.op[0].disps);
8482 off = 0;
8483 }
8484
8485 /* 1 possible extra opcode + 4 byte displacement go in var part.
8486 Pass reloc in fr_var. */
8487 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8488 }
8489
8490 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8491 /* Return TRUE iff PLT32 relocation should be used for branching to
8492 symbol S. */
8493
8494 static bfd_boolean
8495 need_plt32_p (symbolS *s)
8496 {
8497 /* PLT32 relocation is ELF only. */
8498 if (!IS_ELF)
8499 return FALSE;
8500
8501 #ifdef TE_SOLARIS
8502 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8503 krtld support it. */
8504 return FALSE;
8505 #endif
8506
8507 /* Since there is no need to prepare for PLT branch on x86-64, we
8508 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8509 be used as a marker for 32-bit PC-relative branches. */
8510 if (!object_64bit)
8511 return FALSE;
8512
8513   /* Weak or undefined symbols need a PLT32 relocation.  */
8514 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8515 return TRUE;
8516
8517   /* A non-global symbol doesn't need a PLT32 relocation.  */
8518 if (! S_IS_EXTERNAL (s))
8519 return FALSE;
8520
8521   /* Other global symbols need a PLT32 relocation.  NB: Symbols with
8522      non-default visibility are treated as normal global symbols so
8523      that PLT32 relocation can be used as a marker for 32-bit
8524      PC-relative branches.  This is useful for linker relaxation.  */
8525 return TRUE;
8526 }
8527 #endif
8528
8529 static void
8530 output_jump (void)
8531 {
8532 char *p;
8533 int size;
8534 fixS *fixP;
8535 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8536
8537 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8538 {
8539 /* This is a loop or jecxz type instruction. */
8540 size = 1;
8541 if (i.prefix[ADDR_PREFIX] != 0)
8542 {
8543 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8544 i.prefixes -= 1;
8545 }
8546 /* Pentium4 branch hints. */
8547 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8548 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8549 {
8550 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8551 i.prefixes--;
8552 }
8553 }
8554 else
8555 {
8556 int code16;
8557
8558 code16 = 0;
8559 if (flag_code == CODE_16BIT)
8560 code16 = CODE16;
8561
8562 if (i.prefix[DATA_PREFIX] != 0)
8563 {
8564 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8565 i.prefixes -= 1;
8566 code16 ^= flip_code16(code16);
8567 }
8568
8569 size = 4;
8570 if (code16)
8571 size = 2;
8572 }
8573
8574 /* BND prefixed jump. */
8575 if (i.prefix[BND_PREFIX] != 0)
8576 {
8577 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8578 i.prefixes -= 1;
8579 }
8580
8581 if (i.prefix[REX_PREFIX] != 0)
8582 {
8583 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8584 i.prefixes -= 1;
8585 }
8586
8587 if (i.prefixes != 0)
8588 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8589
8590 p = frag_more (i.tm.opcode_length + size);
8591 switch (i.tm.opcode_length)
8592 {
8593 case 2:
8594 *p++ = i.tm.base_opcode >> 8;
8595 /* Fall through. */
8596 case 1:
8597 *p++ = i.tm.base_opcode;
8598 break;
8599 default:
8600 abort ();
8601 }
8602
8603 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8604 if (size == 4
8605 && jump_reloc == NO_RELOC
8606 && need_plt32_p (i.op[0].disps->X_add_symbol))
8607 jump_reloc = BFD_RELOC_X86_64_PLT32;
8608 #endif
8609
8610 jump_reloc = reloc (size, 1, 1, jump_reloc);
8611
8612 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8613 i.op[0].disps, 1, jump_reloc);
8614
8615 /* All jumps handled here are signed, but don't use a signed limit
8616 check for 32 and 16 bit jumps as we want to allow wrap around at
8617 4G and 64k respectively. */
8618 if (size == 1)
8619 fixP->fx_signed = 1;
8620 }
8621
8622 static void
8623 output_interseg_jump (void)
8624 {
8625 char *p;
8626 int size;
8627 int prefix;
8628 int code16;
8629
8630 code16 = 0;
8631 if (flag_code == CODE_16BIT)
8632 code16 = CODE16;
8633
8634 prefix = 0;
8635 if (i.prefix[DATA_PREFIX] != 0)
8636 {
8637 prefix = 1;
8638 i.prefixes -= 1;
8639 code16 ^= CODE16;
8640 }
8641
8642 gas_assert (!i.prefix[REX_PREFIX]);
8643
8644 size = 4;
8645 if (code16)
8646 size = 2;
8647
8648 if (i.prefixes != 0)
8649 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8650
8651 /* 1 opcode; 2 segment; offset */
8652 p = frag_more (prefix + 1 + 2 + size);
8653
8654 if (i.prefix[DATA_PREFIX] != 0)
8655 *p++ = DATA_PREFIX_OPCODE;
8656
8657 if (i.prefix[REX_PREFIX] != 0)
8658 *p++ = i.prefix[REX_PREFIX];
8659
8660 *p++ = i.tm.base_opcode;
8661 if (i.op[1].imms->X_op == O_constant)
8662 {
8663 offsetT n = i.op[1].imms->X_add_number;
8664
8665 if (size == 2
8666 && !fits_in_unsigned_word (n)
8667 && !fits_in_signed_word (n))
8668 {
8669 as_bad (_("16-bit jump out of range"));
8670 return;
8671 }
8672 md_number_to_chars (p, n, size);
8673 }
8674 else
8675 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8676 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8677 if (i.op[0].imms->X_op != O_constant)
8678 as_bad (_("can't handle non absolute segment in `%s'"),
8679 i.tm.name);
8680 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8681 }
8682
8683 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8684 void
8685 x86_cleanup (void)
8686 {
8687 char *p;
8688 asection *seg = now_seg;
8689 subsegT subseg = now_subseg;
8690 asection *sec;
8691 unsigned int alignment, align_size_1;
8692 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8693 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8694 unsigned int padding;
8695
8696 if (!IS_ELF || !x86_used_note)
8697 return;
8698
8699 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8700
8701 /* The .note.gnu.property section layout:
8702
8703 Field Length Contents
8704 ---- ---- ----
8705 n_namsz 4 4
8706 n_descsz 4 The note descriptor size
8707 n_type 4 NT_GNU_PROPERTY_TYPE_0
8708 n_name 4 "GNU"
8709 n_desc n_descsz The program property array
8710 .... .... ....
8711 */
8712
8713 /* Create the .note.gnu.property section. */
8714 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8715 bfd_set_section_flags (sec,
8716 (SEC_ALLOC
8717 | SEC_LOAD
8718 | SEC_DATA
8719 | SEC_HAS_CONTENTS
8720 | SEC_READONLY));
8721
8722 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8723 {
8724 align_size_1 = 7;
8725 alignment = 3;
8726 }
8727 else
8728 {
8729 align_size_1 = 3;
8730 alignment = 2;
8731 }
8732
8733 bfd_set_section_alignment (sec, alignment);
8734 elf_section_type (sec) = SHT_NOTE;
8735
8736 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8737 + 4-byte data */
8738 isa_1_descsz_raw = 4 + 4 + 4;
8739 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8740 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8741
8742 feature_2_descsz_raw = isa_1_descsz;
8743 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8744 + 4-byte data */
8745 feature_2_descsz_raw += 4 + 4 + 4;
8746 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8747 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8748 & ~align_size_1);
8749
8750 descsz = feature_2_descsz;
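  /* With ELFCLASS64 alignment (8 bytes) this works out to descsz 32
     (two 16-byte properties); with ELFCLASS32 (4 bytes) to descsz 24
     (two 12-byte properties).  */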
8751 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8752 p = frag_more (4 + 4 + 4 + 4 + descsz);
8753
8754 /* Write n_namsz. */
8755 md_number_to_chars (p, (valueT) 4, 4);
8756
8757 /* Write n_descsz. */
8758 md_number_to_chars (p + 4, (valueT) descsz, 4);
8759
8760 /* Write n_type. */
8761 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8762
8763 /* Write n_name. */
8764 memcpy (p + 4 * 3, "GNU", 4);
8765
8766 /* Write 4-byte type. */
8767 md_number_to_chars (p + 4 * 4,
8768 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8769
8770 /* Write 4-byte data size. */
8771 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8772
8773 /* Write 4-byte data. */
8774 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8775
8776 /* Zero out paddings. */
8777 padding = isa_1_descsz - isa_1_descsz_raw;
8778 if (padding)
8779 memset (p + 4 * 7, 0, padding);
8780
8781 /* Write 4-byte type. */
8782 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8783 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8784
8785 /* Write 4-byte data size. */
8786 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8787
8788 /* Write 4-byte data. */
8789 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8790 (valueT) x86_feature_2_used, 4);
8791
8792 /* Zero out paddings. */
8793 padding = feature_2_descsz - feature_2_descsz_raw;
8794 if (padding)
8795 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8796
8797 /* We probably can't restore the current segment, for there likely
8798 isn't one yet... */
8799 if (seg && subseg)
8800 subseg_set (seg, subseg);
8801 }
8802 #endif
8803
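/* Return the number of instruction bytes emitted so far: everything
   from START_OFF in START_FRAG up to FRAG_NOW_PTR in the current frag,
   including the fixed parts of any frags in between.  */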
8804 static unsigned int
8805 encoding_length (const fragS *start_frag, offsetT start_off,
8806 const char *frag_now_ptr)
8807 {
8808 unsigned int len = 0;
8809
8810 if (start_frag != frag_now)
8811 {
8812 const fragS *fr = start_frag;
8813
8814 do {
8815 len += fr->fr_fix;
8816 fr = fr->fr_next;
8817 } while (fr && fr != frag_now);
8818 }
8819
8820 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8821 }
8822
8823 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8824 be macro-fused with conditional jumps.
8825    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8826    or has one of the following formats:
8827
8828 cmp m, imm
8829 add m, imm
8830 sub m, imm
8831 test m, imm
8832 and m, imm
8833 inc m
8834 dec m
8835
8836    it cannot be fused.  */
8837
8838 static int
8839 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8840 {
8841 /* No RIP address. */
8842 if (i.base_reg && i.base_reg->reg_num == RegIP)
8843 return 0;
8844
8845 /* No VEX/EVEX encoding. */
8846 if (is_any_vex_encoding (&i.tm))
8847 return 0;
8848
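  /* In the checks below, (base_opcode | 3) == 0x83 matches the whole
     immediate group 1 (opcodes 0x80..0x83); the extension opcode then
     picks add (/0), and (/4), sub (/5) or cmp (/7).  */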
8849 /* add, sub without add/sub m, imm. */
8850 if (i.tm.base_opcode <= 5
8851 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8852 || ((i.tm.base_opcode | 3) == 0x83
8853 && (i.tm.extension_opcode == 0x5
8854 || i.tm.extension_opcode == 0x0)))
8855 {
8856 *mf_cmp_p = mf_cmp_alu_cmp;
8857 return !(i.mem_operands && i.imm_operands);
8858 }
8859
8860 /* and without and m, imm. */
8861 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8862 || ((i.tm.base_opcode | 3) == 0x83
8863 && i.tm.extension_opcode == 0x4))
8864 {
8865 *mf_cmp_p = mf_cmp_test_and;
8866 return !(i.mem_operands && i.imm_operands);
8867 }
8868
8869   /* test without test m, imm.  */
8870 if ((i.tm.base_opcode | 1) == 0x85
8871 || (i.tm.base_opcode | 1) == 0xa9
8872 || ((i.tm.base_opcode | 1) == 0xf7
8873 && i.tm.extension_opcode == 0))
8874 {
8875 *mf_cmp_p = mf_cmp_test_and;
8876 return !(i.mem_operands && i.imm_operands);
8877 }
8878
8879 /* cmp without cmp m, imm. */
8880 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8881 || ((i.tm.base_opcode | 3) == 0x83
8882 && (i.tm.extension_opcode == 0x7)))
8883 {
8884 *mf_cmp_p = mf_cmp_alu_cmp;
8885 return !(i.mem_operands && i.imm_operands);
8886 }
8887
8888 /* inc, dec without inc/dec m. */
8889 if ((i.tm.cpu_flags.bitfield.cpuno64
8890 && (i.tm.base_opcode | 0xf) == 0x4f)
8891 || ((i.tm.base_opcode | 1) == 0xff
8892 && i.tm.extension_opcode <= 0x1))
8893 {
8894 *mf_cmp_p = mf_cmp_incdec;
8895 return !i.mem_operands;
8896 }
8897
8898 return 0;
8899 }
8900
8901 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8902
8903 static int
8904 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8905 {
8906   /* NB: This does not work with COND_JUMP86 without i386.  */
8907 if (!align_branch_power
8908 || now_seg == absolute_section
8909 || !cpu_arch_flags.bitfield.cpui386
8910 || !(align_branch & align_branch_fused_bit))
8911 return 0;
8912
8913 if (maybe_fused_with_jcc_p (mf_cmp_p))
8914 {
8915 if (last_insn.kind == last_insn_other
8916 || last_insn.seg != now_seg)
8917 return 1;
8918 if (flag_debug)
8919 as_warn_where (last_insn.file, last_insn.line,
8920 _("`%s` skips -malign-branch-boundary on `%s`"),
8921 last_insn.name, i.tm.name);
8922 }
8923
8924 return 0;
8925 }
8926
8927 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8928
8929 static int
8930 add_branch_prefix_frag_p (void)
8931 {
8932   /* NB: This does not work with COND_JUMP86 without i386.  Don't add
8933      a prefix to PadLock instructions since they include prefixes in
8934      the opcode.  */
8934 if (!align_branch_power
8935 || !align_branch_prefix_size
8936 || now_seg == absolute_section
8937 || i.tm.cpu_flags.bitfield.cpupadlock
8938 || !cpu_arch_flags.bitfield.cpui386)
8939 return 0;
8940
8941   /* Don't add a prefix if the instruction is itself a prefix, or if
8942      there is no operand, in case the segment prefix is special.  */
8943 if (!i.operands || i.tm.opcode_modifier.isprefix)
8944 return 0;
8945
8946 if (last_insn.kind == last_insn_other
8947 || last_insn.seg != now_seg)
8948 return 1;
8949
8950 if (flag_debug)
8951 as_warn_where (last_insn.file, last_insn.line,
8952 _("`%s` skips -malign-branch-boundary on `%s`"),
8953 last_insn.name, i.tm.name);
8954
8955 return 0;
8956 }
8957
8958 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8959
8960 static int
8961 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8962 enum mf_jcc_kind *mf_jcc_p)
8963 {
8964 int add_padding;
8965
8966   /* NB: This does not work with COND_JUMP86 without i386.  */
8967 if (!align_branch_power
8968 || now_seg == absolute_section
8969 || !cpu_arch_flags.bitfield.cpui386)
8970 return 0;
8971
8972 add_padding = 0;
8973
8974 /* Check for jcc and direct jmp. */
8975 if (i.tm.opcode_modifier.jump == JUMP)
8976 {
8977 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8978 {
8979 *branch_p = align_branch_jmp;
8980 add_padding = align_branch & align_branch_jmp_bit;
8981 }
8982 else
8983 {
8984 	  /* Because J<cc> and JN<cc> share the same group in the
8985 	     macro-fusible table, ignore the lowest bit.  */
8986 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
8987 *branch_p = align_branch_jcc;
8988 if ((align_branch & align_branch_jcc_bit))
8989 add_padding = 1;
8990 }
8991 }
8992 else if (is_any_vex_encoding (&i.tm))
8993 return 0;
8994 else if ((i.tm.base_opcode | 1) == 0xc3)
8995 {
8996 /* Near ret. */
8997 *branch_p = align_branch_ret;
8998 if ((align_branch & align_branch_ret_bit))
8999 add_padding = 1;
9000 }
9001 else
9002 {
9003 /* Check for indirect jmp, direct and indirect calls. */
9004 if (i.tm.base_opcode == 0xe8)
9005 {
9006 /* Direct call. */
9007 *branch_p = align_branch_call;
9008 if ((align_branch & align_branch_call_bit))
9009 add_padding = 1;
9010 }
9011 else if (i.tm.base_opcode == 0xff
9012 && (i.tm.extension_opcode == 2
9013 || i.tm.extension_opcode == 4))
9014 {
9015 /* Indirect call and jmp. */
9016 *branch_p = align_branch_indirect;
9017 if ((align_branch & align_branch_indirect_bit))
9018 add_padding = 1;
9019 }
9020
9021 if (add_padding
9022 && i.disp_operands
9023 && tls_get_addr
9024 && (i.op[0].disps->X_op == O_symbol
9025 || (i.op[0].disps->X_op == O_subtract
9026 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9027 {
9028 symbolS *s = i.op[0].disps->X_add_symbol;
9029 /* No padding to call to global or undefined tls_get_addr. */
9030 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9031 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9032 return 0;
9033 }
9034 }
9035
9036 if (add_padding
9037 && last_insn.kind != last_insn_other
9038 && last_insn.seg == now_seg)
9039 {
9040 if (flag_debug)
9041 as_warn_where (last_insn.file, last_insn.line,
9042 _("`%s` skips -malign-branch-boundary on `%s`"),
9043 last_insn.name, i.tm.name);
9044 return 0;
9045 }
9046
9047 return add_padding;
9048 }
9049
9050 static void
9051 output_insn (void)
9052 {
9053 fragS *insn_start_frag;
9054 offsetT insn_start_off;
9055 fragS *fragP = NULL;
9056 enum align_branch_kind branch = align_branch_none;
9057   /* The initializer is arbitrary, just to avoid an uninitialized-use
9058      error; it's actually either assigned in add_branch_padding_frag_p
9059      or never used.  */
9060 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9061
9062 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9063 if (IS_ELF && x86_used_note)
9064 {
9065 if (i.tm.cpu_flags.bitfield.cpucmov)
9066 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9067 if (i.tm.cpu_flags.bitfield.cpusse)
9068 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9069 if (i.tm.cpu_flags.bitfield.cpusse2)
9070 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9071 if (i.tm.cpu_flags.bitfield.cpusse3)
9072 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9073 if (i.tm.cpu_flags.bitfield.cpussse3)
9074 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9075 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9076 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9077 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9078 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9079 if (i.tm.cpu_flags.bitfield.cpuavx)
9080 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9081 if (i.tm.cpu_flags.bitfield.cpuavx2)
9082 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9083 if (i.tm.cpu_flags.bitfield.cpufma)
9084 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9085 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9086 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9087 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9088 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9089 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9090 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9091 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9092 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9093 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9094 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9095 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9096 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9097 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9098 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9099 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9100 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9101 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9102 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9103 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9104 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9105 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9106 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9107 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9108 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9109 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9110 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9111 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9112 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9113 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9114 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9115
9116 if (i.tm.cpu_flags.bitfield.cpu8087
9117 || i.tm.cpu_flags.bitfield.cpu287
9118 || i.tm.cpu_flags.bitfield.cpu387
9119 || i.tm.cpu_flags.bitfield.cpu687
9120 || i.tm.cpu_flags.bitfield.cpufisttp)
9121 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9122 if (i.has_regmmx
9123 || i.tm.base_opcode == 0xf77 /* emms */
9124 || i.tm.base_opcode == 0xf0e /* femms */
9125 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9126 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
9127 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9128 if (i.has_regxmm)
9129 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9130 if (i.has_regymm)
9131 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9132 if (i.has_regzmm)
9133 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9134 if (i.tm.cpu_flags.bitfield.cpufxsr)
9135 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9136 if (i.tm.cpu_flags.bitfield.cpuxsave)
9137 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9138 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9139 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9140 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9141 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9142 }
9143 #endif
9144
9145 /* Tie dwarf2 debug info to the address at the start of the insn.
9146 We can't do this after the insn has been output as the current
9147      frag may have been closed off, e.g. by frag_var.  */
9148 dwarf2_emit_insn (0);
9149
9150 insn_start_frag = frag_now;
9151 insn_start_off = frag_now_fix ();
9152
9153 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9154 {
9155 char *p;
9156 /* Branch can be 8 bytes. Leave some room for prefixes. */
9157 unsigned int max_branch_padding_size = 14;
9158
9159 /* Align section to boundary. */
9160 record_alignment (now_seg, align_branch_power);
9161
9162 /* Make room for padding. */
9163 frag_grow (max_branch_padding_size);
9164
9165 /* Start of the padding. */
9166 p = frag_more (0);
9167
9168 fragP = frag_now;
9169
9170 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9171 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9172 NULL, 0, p);
9173
9174 fragP->tc_frag_data.mf_type = mf_jcc;
9175 fragP->tc_frag_data.branch_type = branch;
9176 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9177 }
9178
9179 /* Output jumps. */
9180 if (i.tm.opcode_modifier.jump == JUMP)
9181 output_branch ();
9182 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9183 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9184 output_jump ();
9185 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9186 output_interseg_jump ();
9187 else
9188 {
9189 /* Output normal instructions here. */
9190 char *p;
9191 unsigned char *q;
9192 unsigned int j;
9193 unsigned int prefix;
9194 enum mf_cmp_kind mf_cmp;
9195
9196 if (avoid_fence
9197 && (i.tm.base_opcode == 0xfaee8
9198 || i.tm.base_opcode == 0xfaef0
9199 || i.tm.base_opcode == 0xfaef8))
9200 {
9201 /* Encode lfence, mfence, and sfence as
9202 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9203 offsetT val = 0x240483f0ULL;
9204 p = frag_more (5);
9205 md_number_to_chars (p, val, 5);
9206 return;
9207 }
9208
9209       /* Some processors fail on the LOCK prefix.  This option makes
9210 	 the assembler ignore the LOCK prefix and serves as a workaround.  */
9211 if (omit_lock_prefix)
9212 {
9213 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9214 return;
9215 i.prefix[LOCK_PREFIX] = 0;
9216 }
9217
9218 if (branch)
9219 /* Skip if this is a branch. */
9220 ;
9221 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9222 {
9223 /* Make room for padding. */
9224 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9225 p = frag_more (0);
9226
9227 fragP = frag_now;
9228
9229 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9230 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9231 NULL, 0, p);
9232
9233 fragP->tc_frag_data.mf_type = mf_cmp;
9234 fragP->tc_frag_data.branch_type = align_branch_fused;
9235 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9236 }
9237 else if (add_branch_prefix_frag_p ())
9238 {
9239 unsigned int max_prefix_size = align_branch_prefix_size;
9240
9241 /* Make room for padding. */
9242 frag_grow (max_prefix_size);
9243 p = frag_more (0);
9244
9245 fragP = frag_now;
9246
9247 frag_var (rs_machine_dependent, max_prefix_size, 0,
9248 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9249 NULL, 0, p);
9250
9251 fragP->tc_frag_data.max_bytes = max_prefix_size;
9252 }
9253
9254 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9255 don't need the explicit prefix. */
9256 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9257 {
9258 switch (i.tm.opcode_length)
9259 {
9260 case 3:
9261 if (i.tm.base_opcode & 0xff000000)
9262 {
9263 prefix = (i.tm.base_opcode >> 24) & 0xff;
9264 if (!i.tm.cpu_flags.bitfield.cpupadlock
9265 || prefix != REPE_PREFIX_OPCODE
9266 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9267 add_prefix (prefix);
9268 }
9269 break;
9270 case 2:
9271 if ((i.tm.base_opcode & 0xff0000) != 0)
9272 {
9273 prefix = (i.tm.base_opcode >> 16) & 0xff;
9274 add_prefix (prefix);
9275 }
9276 break;
9277 case 1:
9278 break;
9279 case 0:
9280 /* Check for pseudo prefixes. */
9281 as_bad_where (insn_start_frag->fr_file,
9282 insn_start_frag->fr_line,
9283 _("pseudo prefix without instruction"));
9284 return;
9285 default:
9286 abort ();
9287 }
9288
9289 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9290 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9291 R_X86_64_GOTTPOFF relocation so that linker can safely
9292 perform IE->LE optimization. A dummy REX_OPCODE prefix
9293 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9294 relocation for GDesc -> IE/LE optimization. */
9295 if (x86_elf_abi == X86_64_X32_ABI
9296 && i.operands == 2
9297 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9298 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9299 && i.prefix[REX_PREFIX] == 0)
9300 add_prefix (REX_OPCODE);
9301 #endif
9302
9303 /* The prefix bytes. */
9304 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9305 if (*q)
9306 FRAG_APPEND_1_CHAR (*q);
9307 }
9308 else
9309 {
9310 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9311 if (*q)
9312 switch (j)
9313 {
9314 case SEG_PREFIX:
9315 case ADDR_PREFIX:
9316 FRAG_APPEND_1_CHAR (*q);
9317 break;
9318 default:
9319 /* There should be no other prefixes for instructions
9320 with VEX prefix. */
9321 abort ();
9322 }
9323
9324 /* For EVEX instructions i.vrex should become 0 after
9325 build_evex_prefix. For VEX instructions upper 16 registers
9326 aren't available, so VREX should be 0. */
9327 if (i.vrex)
9328 abort ();
9329 /* Now the VEX prefix. */
9330 p = frag_more (i.vex.length);
9331 for (j = 0; j < i.vex.length; j++)
9332 p[j] = i.vex.bytes[j];
9333 }
9334
9335 /* Now the opcode; be careful about word order here! */
9336 if (i.tm.opcode_length == 1)
9337 {
9338 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9339 }
9340 else
9341 {
9342 switch (i.tm.opcode_length)
9343 {
9344 case 4:
9345 p = frag_more (4);
9346 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9347 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9348 break;
9349 case 3:
9350 p = frag_more (3);
9351 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9352 break;
9353 case 2:
9354 p = frag_more (2);
9355 break;
9356 default:
9357 abort ();
9358 break;
9359 }
9360
9361 /* Put out high byte first: can't use md_number_to_chars! */
9362 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9363 *p = i.tm.base_opcode & 0xff;
9364 }
9365
9366 /* Now the modrm byte and sib byte (if present). */
9367 if (i.tm.opcode_modifier.modrm)
9368 {
9369 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9370 | i.rm.reg << 3
9371 | i.rm.mode << 6));
9372 /* If i.rm.regmem == ESP (4)
9373 && i.rm.mode != (Register mode)
9374 && not 16 bit
9375 ==> need second modrm byte. */
9376 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9377 && i.rm.mode != 3
9378 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9379 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9380 | i.sib.index << 3
9381 | i.sib.scale << 6));
9382 }
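      /* As a concrete example, "movl %eax, (%ebx,%esi,4)" emits opcode
	 0x89, ModRM 0x04 (mode 00, reg 000 = %eax, regmem 100 = SIB
	 follows) and SIB 0xb3 (scale 10 = *4, index 110 = %esi,
	 base 011 = %ebx).  */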
9383
9384 if (i.disp_operands)
9385 output_disp (insn_start_frag, insn_start_off);
9386
9387 if (i.imm_operands)
9388 output_imm (insn_start_frag, insn_start_off);
9389
9390       /*
9391        * frag_now_fix () returns plain abs_section_offset when we're in
9392        * the absolute section, and abs_section_offset does not get
9393        * updated as data gets added to the frag; that would break the
9394        * logic below.
9395        */
9395 if (now_seg != absolute_section)
9396 {
9397 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9398 if (j > 15)
9399 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9400 j);
9401 else if (fragP)
9402 {
9403 /* NB: Don't add prefix with GOTPC relocation since
9404 output_disp() above depends on the fixed encoding
9405 length. Can't add prefix with TLS relocation since
9406 it breaks TLS linker optimization. */
9407 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9408 /* Prefix count on the current instruction. */
9409 unsigned int count = i.vex.length;
9410 unsigned int k;
9411 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9412 /* REX byte is encoded in VEX/EVEX prefix. */
9413 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9414 count++;
9415
9416 /* Count prefixes for extended opcode maps. */
9417 if (!i.vex.length)
9418 switch (i.tm.opcode_length)
9419 {
9420 case 3:
9421 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9422 {
9423 count++;
9424 switch ((i.tm.base_opcode >> 8) & 0xff)
9425 {
9426 case 0x38:
9427 case 0x3a:
9428 count++;
9429 break;
9430 default:
9431 break;
9432 }
9433 }
9434 break;
9435 case 2:
9436 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9437 count++;
9438 break;
9439 case 1:
9440 break;
9441 default:
9442 abort ();
9443 }
9444
9445 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9446 == BRANCH_PREFIX)
9447 {
9448 /* Set the maximum prefix size in BRANCH_PREFIX
9449 frag. */
9450 if (fragP->tc_frag_data.max_bytes > max)
9451 fragP->tc_frag_data.max_bytes = max;
9452 if (fragP->tc_frag_data.max_bytes > count)
9453 fragP->tc_frag_data.max_bytes -= count;
9454 else
9455 fragP->tc_frag_data.max_bytes = 0;
9456 }
9457 else
9458 {
9459 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9460 frag. */
9461 unsigned int max_prefix_size;
9462 if (align_branch_prefix_size > max)
9463 max_prefix_size = max;
9464 else
9465 max_prefix_size = align_branch_prefix_size;
9466 if (max_prefix_size > count)
9467 fragP->tc_frag_data.max_prefix_length
9468 = max_prefix_size - count;
9469 }
9470
9471 /* Use existing segment prefix if possible. Use CS
9472 segment prefix in 64-bit mode. In 32-bit mode, use SS
9473 segment prefix with ESP/EBP base register and use DS
9474 segment prefix without ESP/EBP base register. */
9475 if (i.prefix[SEG_PREFIX])
9476 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9477 else if (flag_code == CODE_64BIT)
9478 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9479 else if (i.base_reg
9480 && (i.base_reg->reg_num == 4
9481 || i.base_reg->reg_num == 5))
9482 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9483 else
9484 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9485 }
9486 }
9487 }
9488
9489   /* NB: This does not work with COND_JUMP86 without i386.  */
9490 if (align_branch_power
9491 && now_seg != absolute_section
9492 && cpu_arch_flags.bitfield.cpui386)
9493 {
9494 /* Terminate each frag so that we can add prefix and check for
9495 fused jcc. */
9496 frag_wane (frag_now);
9497 frag_new (0);
9498 }
9499
9500 #ifdef DEBUG386
9501 if (flag_debug)
9502 {
9503 pi ("" /*line*/, &i);
9504 }
9505 #endif /* DEBUG386 */
9506 }
9507
9508 /* Return the size of the displacement operand N. */
9509
9510 static int
9511 disp_size (unsigned int n)
9512 {
9513 int size = 4;
9514
9515 if (i.types[n].bitfield.disp64)
9516 size = 8;
9517 else if (i.types[n].bitfield.disp8)
9518 size = 1;
9519 else if (i.types[n].bitfield.disp16)
9520 size = 2;
9521 return size;
9522 }
9523
9524 /* Return the size of the immediate operand N. */
9525
9526 static int
9527 imm_size (unsigned int n)
9528 {
9529 int size = 4;
9530 if (i.types[n].bitfield.imm64)
9531 size = 8;
9532 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9533 size = 1;
9534 else if (i.types[n].bitfield.imm16)
9535 size = 2;
9536 return size;
9537 }
9538
9539 static void
9540 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9541 {
9542 char *p;
9543 unsigned int n;
9544
9545 for (n = 0; n < i.operands; n++)
9546 {
9547 if (operand_type_check (i.types[n], disp))
9548 {
9549 if (i.op[n].disps->X_op == O_constant)
9550 {
9551 int size = disp_size (n);
9552 offsetT val = i.op[n].disps->X_add_number;
9553
9554 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9555 size);
9556 p = frag_more (size);
9557 md_number_to_chars (p, val, size);
9558 }
9559 else
9560 {
9561 enum bfd_reloc_code_real reloc_type;
9562 int size = disp_size (n);
9563 int sign = i.types[n].bitfield.disp32s;
9564 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9565 fixS *fixP;
9566
9567 /* We can't have 8 bit displacement here. */
9568 gas_assert (!i.types[n].bitfield.disp8);
9569
9570 	      /* The PC relative address is computed relative
9571 		 to the instruction boundary, so if immediate
9572 		 fields follow, we need to adjust the value.  */
9573 if (pcrel && i.imm_operands)
9574 {
9575 unsigned int n1;
9576 int sz = 0;
9577
9578 for (n1 = 0; n1 < i.operands; n1++)
9579 if (operand_type_check (i.types[n1], imm))
9580 {
9581 		      /* Only one immediate is allowed for a
9582 			 PC-relative address.  */
9583 gas_assert (sz == 0);
9584 sz = imm_size (n1);
9585 i.op[n].disps->X_add_number -= sz;
9586 }
9587 /* We should find the immediate. */
9588 gas_assert (sz != 0);
9589 }
9590
9591 p = frag_more (size);
9592 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9593 if (GOT_symbol
9594 && GOT_symbol == i.op[n].disps->X_add_symbol
9595 && (((reloc_type == BFD_RELOC_32
9596 || reloc_type == BFD_RELOC_X86_64_32S
9597 || (reloc_type == BFD_RELOC_64
9598 && object_64bit))
9599 && (i.op[n].disps->X_op == O_symbol
9600 || (i.op[n].disps->X_op == O_add
9601 && ((symbol_get_value_expression
9602 (i.op[n].disps->X_op_symbol)->X_op)
9603 == O_subtract))))
9604 || reloc_type == BFD_RELOC_32_PCREL))
9605 {
9606 if (!object_64bit)
9607 {
9608 reloc_type = BFD_RELOC_386_GOTPC;
9609 i.has_gotpc_tls_reloc = TRUE;
9610 i.op[n].imms->X_add_number +=
9611 encoding_length (insn_start_frag, insn_start_off, p);
9612 }
9613 else if (reloc_type == BFD_RELOC_64)
9614 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9615 else
9616 /* Don't do the adjustment for x86-64, as there
9617 the pcrel addressing is relative to the _next_
9618 insn, and that is taken care of in other code. */
9619 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9620 }
9621 else if (align_branch_power)
9622 {
9623 switch (reloc_type)
9624 {
9625 case BFD_RELOC_386_TLS_GD:
9626 case BFD_RELOC_386_TLS_LDM:
9627 case BFD_RELOC_386_TLS_IE:
9628 case BFD_RELOC_386_TLS_IE_32:
9629 case BFD_RELOC_386_TLS_GOTIE:
9630 case BFD_RELOC_386_TLS_GOTDESC:
9631 case BFD_RELOC_386_TLS_DESC_CALL:
9632 case BFD_RELOC_X86_64_TLSGD:
9633 case BFD_RELOC_X86_64_TLSLD:
9634 case BFD_RELOC_X86_64_GOTTPOFF:
9635 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9636 case BFD_RELOC_X86_64_TLSDESC_CALL:
9637 i.has_gotpc_tls_reloc = TRUE;
9638 default:
9639 break;
9640 }
9641 }
9642 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9643 size, i.op[n].disps, pcrel,
9644 reloc_type);
9645 /* Check for "call/jmp *mem", "mov mem, %reg",
9646 "test %reg, mem" and "binop mem, %reg" where binop
9647 is one of adc, add, and, cmp, or, sbb, sub, xor
9648 instructions without data prefix. Always generate
9649 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9650 if (i.prefix[DATA_PREFIX] == 0
9651 && (generate_relax_relocations
9652 || (!object_64bit
9653 && i.rm.mode == 0
9654 && i.rm.regmem == 5))
9655 && (i.rm.mode == 2
9656 || (i.rm.mode == 0 && i.rm.regmem == 5))
9657 && !is_any_vex_encoding(&i.tm)
9658 && ((i.operands == 1
9659 && i.tm.base_opcode == 0xff
9660 && (i.rm.reg == 2 || i.rm.reg == 4))
9661 || (i.operands == 2
9662 && (i.tm.base_opcode == 0x8b
9663 || i.tm.base_opcode == 0x85
9664 || (i.tm.base_opcode & ~0x38) == 0x03))))
9665 {
9666 if (object_64bit)
9667 {
9668 fixP->fx_tcbit = i.rex != 0;
9669 if (i.base_reg
9670 && (i.base_reg->reg_num == RegIP))
9671 fixP->fx_tcbit2 = 1;
9672 }
9673 else
9674 fixP->fx_tcbit2 = 1;
9675 }
9676 }
9677 }
9678 }
9679 }
9680
9681 static void
9682 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9683 {
9684 char *p;
9685 unsigned int n;
9686
9687 for (n = 0; n < i.operands; n++)
9688 {
9689      /* Skip the SAE/RC immediate operand in EVEX; it has already been handled.  */
9690 if (i.rounding && (int) n == i.rounding->operand)
9691 continue;
9692
9693 if (operand_type_check (i.types[n], imm))
9694 {
9695 if (i.op[n].imms->X_op == O_constant)
9696 {
9697 int size = imm_size (n);
9698 offsetT val;
9699
9700 val = offset_in_range (i.op[n].imms->X_add_number,
9701 size);
9702 p = frag_more (size);
9703 md_number_to_chars (p, val, size);
9704 }
9705 else
9706 {
9707 /* Not absolute_section.
9708 Need a 32-bit fixup (don't support 8bit
9709 non-absolute imms). Try to support other
9710 sizes ... */
9711 enum bfd_reloc_code_real reloc_type;
9712 int size = imm_size (n);
9713 int sign;
9714
9715 if (i.types[n].bitfield.imm32s
9716 && (i.suffix == QWORD_MNEM_SUFFIX
9717 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9718 sign = 1;
9719 else
9720 sign = 0;
9721
9722 p = frag_more (size);
9723 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9724
9725 /* This is tough to explain. We end up with this one if we
9726 * have operands that look like
9727 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9728 * obtain the absolute address of the GOT, and it is strongly
9729 * preferable from a performance point of view to avoid using
9730 * a runtime relocation for this. The actual sequence of
9731		 * instructions often looks something like:
9732 *
9733 * call .L66
9734 * .L66:
9735 * popl %ebx
9736 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9737 *
9738 * The call and pop essentially return the absolute address
9739 * of the label .L66 and store it in %ebx. The linker itself
9740 * will ultimately change the first operand of the addl so
9741 * that %ebx points to the GOT, but to keep things simple, the
9742 * .o file must have this operand set so that it generates not
9743 * the absolute address of .L66, but the absolute address of
9744		 * itself.  This allows the linker to simply treat a GOTPC
9745 * relocation as asking for a pcrel offset to the GOT to be
9746 * added in, and the addend of the relocation is stored in the
9747 * operand field for the instruction itself.
9748 *
9749 * Our job here is to fix the operand so that it would add
9750 * the correct offset so that %ebx would point to itself. The
9751 * thing that is tricky is that .-.L66 will point to the
9752 * beginning of the instruction, so we need to further modify
9753 * the operand so that it will point to itself. There are
9754 * other cases where you have something like:
9755 *
9756 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9757 *
9758 * and here no correction would be required. Internally in
9759 * the assembler we treat operands of this form as not being
9760 * pcrel since the '.' is explicitly mentioned, and I wonder
9761 * whether it would simplify matters to do it this way. Who
9762 * knows. In earlier versions of the PIC patches, the
9763 * pcrel_adjust field was used to store the correction, but
9764 * since the expression is not pcrel, I felt it would be
9765 * confusing to do it this way. */
9766
9767 if ((reloc_type == BFD_RELOC_32
9768 || reloc_type == BFD_RELOC_X86_64_32S
9769 || reloc_type == BFD_RELOC_64)
9770 && GOT_symbol
9771 && GOT_symbol == i.op[n].imms->X_add_symbol
9772 && (i.op[n].imms->X_op == O_symbol
9773 || (i.op[n].imms->X_op == O_add
9774 && ((symbol_get_value_expression
9775 (i.op[n].imms->X_op_symbol)->X_op)
9776 == O_subtract))))
9777 {
9778 if (!object_64bit)
9779 reloc_type = BFD_RELOC_386_GOTPC;
9780 else if (size == 4)
9781 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9782 else if (size == 8)
9783 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9784 i.has_gotpc_tls_reloc = TRUE;
9785 i.op[n].imms->X_add_number +=
9786 encoding_length (insn_start_frag, insn_start_off, p);
9787 }
9788 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9789 i.op[n].imms, 0, reloc_type);
9790 }
9791 }
9792 }
9793 }
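
/* Editorial aside: a sketch (not GAS code) of the GOTPC addend bias
   applied above.  Assuming encoding_length () returns the number of
   bytes of the current insn already emitted before the immediate
   field, the bias makes "addl $_GLOBAL_OFFSET_TABLE_+[.-.L66], %ebx"
   store an addend relative to the immediate field itself rather than
   to the insn start -- for the 81 /0 form, two opcode/modrm bytes
   precede the imm32.  */
#if 0 /* Illustration only.  */
static long
gotpc_addend (long dot_minus_l66, long bytes_before_imm)
{
  /* ".-.L66" evaluates to the insn start; the immediate field lives
     bytes_before_imm further on.  */
  return dot_minus_l66 + bytes_before_imm;
}
#endif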
9794 \f
9795 /* x86_cons_fix_new is called via the expression parsing code when a
9796 reloc is needed. We use this hook to get the correct .got reloc. */
9797 static int cons_sign = -1;
9798
9799 void
9800 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9801 expressionS *exp, bfd_reloc_code_real_type r)
9802 {
9803 r = reloc (len, 0, cons_sign, r);
9804
9805 #ifdef TE_PE
9806 if (exp->X_op == O_secrel)
9807 {
9808 exp->X_op = O_symbol;
9809 r = BFD_RELOC_32_SECREL;
9810 }
9811 #endif
9812
9813 fix_new_exp (frag, off, len, exp, 0, r);
9814 }
9815
9816 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9817 purpose of the `.dc.a' internal pseudo-op. */
9818
9819 int
9820 x86_address_bytes (void)
9821 {
9822 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9823 return 4;
9824 return stdoutput->arch_info->bits_per_address / 8;
9825 }
9826
9827 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9828 || defined (LEX_AT)
9829 # define lex_got(reloc, adjust, types) NULL
9830 #else
9831 /* Parse operands of the form
9832 <symbol>@GOTOFF+<nnn>
9833 and similar .plt or .got references.
9834
9835 If we find one, set up the correct relocation in RELOC and copy the
9836 input string, minus the `@GOTOFF' into a malloc'd buffer for
9837 parsing by the calling routine. Return this buffer, and if ADJUST
9838 is non-null set it to the length of the string we removed from the
9839 input line. Otherwise return NULL. */
9840 static char *
9841 lex_got (enum bfd_reloc_code_real *rel,
9842 int *adjust,
9843 i386_operand_type *types)
9844 {
9845   /* Some of the relocations depend on the size of the field to be
9846      relocated.  But in our callers i386_immediate and i386_displacement
9847 we don't yet know the operand size (this will be set by insn
9848 matching). Hence we record the word32 relocation here,
9849 and adjust the reloc according to the real size in reloc(). */
9850 static const struct {
9851 const char *str;
9852 int len;
9853 const enum bfd_reloc_code_real rel[2];
9854 const i386_operand_type types64;
9855 } gotrel[] = {
9856 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9857 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9858 BFD_RELOC_SIZE32 },
9859 OPERAND_TYPE_IMM32_64 },
9860 #endif
9861 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9862 BFD_RELOC_X86_64_PLTOFF64 },
9863 OPERAND_TYPE_IMM64 },
9864 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9865 BFD_RELOC_X86_64_PLT32 },
9866 OPERAND_TYPE_IMM32_32S_DISP32 },
9867 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9868 BFD_RELOC_X86_64_GOTPLT64 },
9869 OPERAND_TYPE_IMM64_DISP64 },
9870 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9871 BFD_RELOC_X86_64_GOTOFF64 },
9872 OPERAND_TYPE_IMM64_DISP64 },
9873 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9874 BFD_RELOC_X86_64_GOTPCREL },
9875 OPERAND_TYPE_IMM32_32S_DISP32 },
9876 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9877 BFD_RELOC_X86_64_TLSGD },
9878 OPERAND_TYPE_IMM32_32S_DISP32 },
9879 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9880 _dummy_first_bfd_reloc_code_real },
9881 OPERAND_TYPE_NONE },
9882 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9883 BFD_RELOC_X86_64_TLSLD },
9884 OPERAND_TYPE_IMM32_32S_DISP32 },
9885 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9886 BFD_RELOC_X86_64_GOTTPOFF },
9887 OPERAND_TYPE_IMM32_32S_DISP32 },
9888 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9889 BFD_RELOC_X86_64_TPOFF32 },
9890 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9891 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9892 _dummy_first_bfd_reloc_code_real },
9893 OPERAND_TYPE_NONE },
9894 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9895 BFD_RELOC_X86_64_DTPOFF32 },
9896 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9897 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9898 _dummy_first_bfd_reloc_code_real },
9899 OPERAND_TYPE_NONE },
9900 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9901 _dummy_first_bfd_reloc_code_real },
9902 OPERAND_TYPE_NONE },
9903 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9904 BFD_RELOC_X86_64_GOT32 },
9905 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9906 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9907 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9908 OPERAND_TYPE_IMM32_32S_DISP32 },
9909 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9910 BFD_RELOC_X86_64_TLSDESC_CALL },
9911 OPERAND_TYPE_IMM32_32S_DISP32 },
9912 };
9913 char *cp;
9914 unsigned int j;
9915
9916 #if defined (OBJ_MAYBE_ELF)
9917 if (!IS_ELF)
9918 return NULL;
9919 #endif
9920
9921 for (cp = input_line_pointer; *cp != '@'; cp++)
9922 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9923 return NULL;
9924
9925 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9926 {
9927 int len = gotrel[j].len;
9928 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9929 {
9930 if (gotrel[j].rel[object_64bit] != 0)
9931 {
9932 int first, second;
9933 char *tmpbuf, *past_reloc;
9934
9935 *rel = gotrel[j].rel[object_64bit];
9936
9937 if (types)
9938 {
9939 if (flag_code != CODE_64BIT)
9940 {
9941 types->bitfield.imm32 = 1;
9942 types->bitfield.disp32 = 1;
9943 }
9944 else
9945 *types = gotrel[j].types64;
9946 }
9947
9948 if (j != 0 && GOT_symbol == NULL)
9949 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9950
9951 /* The length of the first part of our input line. */
9952 first = cp - input_line_pointer;
9953
9954 /* The second part goes from after the reloc token until
9955 (and including) an end_of_line char or comma. */
9956 past_reloc = cp + 1 + len;
9957 cp = past_reloc;
9958 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9959 ++cp;
9960 second = cp + 1 - past_reloc;
9961
9962 /* Allocate and copy string. The trailing NUL shouldn't
9963 be necessary, but be safe. */
9964 tmpbuf = XNEWVEC (char, first + second + 2);
9965 memcpy (tmpbuf, input_line_pointer, first);
9966 if (second != 0 && *past_reloc != ' ')
9967 /* Replace the relocation token with ' ', so that
9968 errors like foo@GOTOFF1 will be detected. */
9969 tmpbuf[first++] = ' ';
9970 else
9971 /* Increment length by 1 if the relocation token is
9972 removed. */
9973 len++;
9974 if (adjust)
9975 *adjust = len;
9976 memcpy (tmpbuf + first, past_reloc, second);
9977 tmpbuf[first + second] = '\0';
9978 return tmpbuf;
9979 }
9980
9981 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9982 gotrel[j].str, 1 << (5 + object_64bit));
9983 return NULL;
9984 }
9985 }
9986
9987 /* Might be a symbol version string. Don't as_bad here. */
9988 return NULL;
9989 }
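
/* Editorial aside: the buffer surgery above, reduced to a standalone
   sketch (not GAS code; simplified -- the real routine also handles a
   space already following the token).  Given "foo@GOTOFF+4" it yields
   "foo +4": the reloc token becomes a single space, so junk such as
   "foo@GOTOFF1" still fails to parse later.  */
#if 0 /* Illustration only.  */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <strings.h>

static char *
strip_reloc_token (const char *line, const char *token)
{
  const char *at = strchr (line, '@');
  size_t first, tlen = strlen (token), second;
  char *buf;

  if (at == NULL || strncasecmp (at + 1, token, tlen) != 0)
    return NULL;
  first = at - line;
  second = strlen (at + 1 + tlen);
  buf = malloc (first + second + 2);
  memcpy (buf, line, first);
  buf[first++] = ' ';
  memcpy (buf + first, at + 1 + tlen, second + 1);
  return buf;
}

int
main (void)
{
  char *s = strip_reloc_token ("foo@GOTOFF+4", "GOTOFF");
  puts (s ? s : "(no reloc)");	/* prints "foo +4" */
  free (s);
  return 0;
}
#endif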
9990 #endif
9991
9992 #ifdef TE_PE
9993 #ifdef lex_got
9994 #undef lex_got
9995 #endif
9996 /* Parse operands of the form
9997 <symbol>@SECREL32+<nnn>
9998
9999 If we find one, set up the correct relocation in RELOC and copy the
10000 input string, minus the `@SECREL32' into a malloc'd buffer for
10001 parsing by the calling routine. Return this buffer, and if ADJUST
10002 is non-null set it to the length of the string we removed from the
10003 input line. Otherwise return NULL.
10004
10005    This function is copied from the ELF version above, adjusted for PE targets.  */
10006
10007 static char *
10008 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10009 int *adjust ATTRIBUTE_UNUSED,
10010 i386_operand_type *types)
10011 {
10012 static const struct
10013 {
10014 const char *str;
10015 int len;
10016 const enum bfd_reloc_code_real rel[2];
10017 const i386_operand_type types64;
10018 }
10019 gotrel[] =
10020 {
10021 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10022 BFD_RELOC_32_SECREL },
10023 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10024 };
10025
10026 char *cp;
10027 unsigned j;
10028
10029 for (cp = input_line_pointer; *cp != '@'; cp++)
10030 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10031 return NULL;
10032
10033 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10034 {
10035 int len = gotrel[j].len;
10036
10037 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10038 {
10039 if (gotrel[j].rel[object_64bit] != 0)
10040 {
10041 int first, second;
10042 char *tmpbuf, *past_reloc;
10043
10044 *rel = gotrel[j].rel[object_64bit];
10045 if (adjust)
10046 *adjust = len;
10047
10048 if (types)
10049 {
10050 if (flag_code != CODE_64BIT)
10051 {
10052 types->bitfield.imm32 = 1;
10053 types->bitfield.disp32 = 1;
10054 }
10055 else
10056 *types = gotrel[j].types64;
10057 }
10058
10059 /* The length of the first part of our input line. */
10060 first = cp - input_line_pointer;
10061
10062 /* The second part goes from after the reloc token until
10063 (and including) an end_of_line char or comma. */
10064 past_reloc = cp + 1 + len;
10065 cp = past_reloc;
10066 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10067 ++cp;
10068 second = cp + 1 - past_reloc;
10069
10070 /* Allocate and copy string. The trailing NUL shouldn't
10071 be necessary, but be safe. */
10072 tmpbuf = XNEWVEC (char, first + second + 2);
10073 memcpy (tmpbuf, input_line_pointer, first);
10074 if (second != 0 && *past_reloc != ' ')
10075 /* Replace the relocation token with ' ', so that
10076		     errors like foo@SECREL321 will be detected.  */
10077 tmpbuf[first++] = ' ';
10078 memcpy (tmpbuf + first, past_reloc, second);
10079 tmpbuf[first + second] = '\0';
10080 return tmpbuf;
10081 }
10082
10083 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10084 gotrel[j].str, 1 << (5 + object_64bit));
10085 return NULL;
10086 }
10087 }
10088
10089 /* Might be a symbol version string. Don't as_bad here. */
10090 return NULL;
10091 }
10092
10093 #endif /* TE_PE */
10094
10095 bfd_reloc_code_real_type
10096 x86_cons (expressionS *exp, int size)
10097 {
10098 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10099
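  /* Negate intel_syntax around expression parsing: its sign lets the
     Intel-mode expression helpers tell a data directive like .long
     apart from an insn operand (the matching un-negation follows
     below).  */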
10100 intel_syntax = -intel_syntax;
10101
10102 exp->X_md = 0;
10103 if (size == 4 || (object_64bit && size == 8))
10104 {
10105 /* Handle @GOTOFF and the like in an expression. */
10106 char *save;
10107 char *gotfree_input_line;
10108 int adjust = 0;
10109
10110 save = input_line_pointer;
10111 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10112 if (gotfree_input_line)
10113 input_line_pointer = gotfree_input_line;
10114
10115 expression (exp);
10116
10117 if (gotfree_input_line)
10118 {
10119 /* expression () has merrily parsed up to the end of line,
10120 or a comma - in the wrong buffer. Transfer how far
10121 input_line_pointer has moved to the right buffer. */
10122 input_line_pointer = (save
10123 + (input_line_pointer - gotfree_input_line)
10124 + adjust);
10125 free (gotfree_input_line);
10126 if (exp->X_op == O_constant
10127 || exp->X_op == O_absent
10128 || exp->X_op == O_illegal
10129 || exp->X_op == O_register
10130 || exp->X_op == O_big)
10131 {
10132 char c = *input_line_pointer;
10133 *input_line_pointer = 0;
10134 as_bad (_("missing or invalid expression `%s'"), save);
10135 *input_line_pointer = c;
10136 }
10137 else if ((got_reloc == BFD_RELOC_386_PLT32
10138 || got_reloc == BFD_RELOC_X86_64_PLT32)
10139 && exp->X_op != O_symbol)
10140 {
10141 char c = *input_line_pointer;
10142 *input_line_pointer = 0;
10143 as_bad (_("invalid PLT expression `%s'"), save);
10144 *input_line_pointer = c;
10145 }
10146 }
10147 }
10148 else
10149 expression (exp);
10150
10151 intel_syntax = -intel_syntax;
10152
10153 if (intel_syntax)
10154 i386_intel_simplify (exp);
10155
10156 return got_reloc;
10157 }
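
/* Editorial aside: the pointer transfer in x86_cons above, in
   isolation (not GAS code).  expression () advanced input_line_pointer
   inside the temporary reloc-stripped copy; the same distance, plus
   the bytes removed together with the @RELOC token, must be skipped in
   the original buffer.  */
#if 0 /* Illustration only.  */
static char *
transfer_pointer (char *save, const char *copy_start,
		  const char *copy_pos, int adjust)
{
  return save + (copy_pos - copy_start) + adjust;
}
#endif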
10158
10159 static void
10160 signed_cons (int size)
10161 {
10162 if (flag_code == CODE_64BIT)
10163 cons_sign = 1;
10164 cons (size);
10165 cons_sign = -1;
10166 }
10167
10168 #ifdef TE_PE
10169 static void
10170 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10171 {
10172 expressionS exp;
10173
10174 do
10175 {
10176 expression (&exp);
10177 if (exp.X_op == O_symbol)
10178 exp.X_op = O_secrel;
10179
10180 emit_expr (&exp, 4);
10181 }
10182 while (*input_line_pointer++ == ',');
10183
10184 input_line_pointer--;
10185 demand_empty_rest_of_line ();
10186 }
10187 #endif
10188
10189 /* Handle Vector operations. */
10190
10191 static char *
10192 check_VecOperations (char *op_string, char *op_end)
10193 {
10194 const reg_entry *mask;
10195 const char *saved;
10196 char *end_op;
10197
10198 while (*op_string
10199 && (op_end == NULL || op_string < op_end))
10200 {
10201 saved = op_string;
10202 if (*op_string == '{')
10203 {
10204 op_string++;
10205
10206 /* Check broadcasts. */
10207 if (strncmp (op_string, "1to", 3) == 0)
10208 {
10209 int bcst_type;
10210
10211 if (i.broadcast)
10212 goto duplicated_vec_op;
10213
10214 op_string += 3;
10215 if (*op_string == '8')
10216 bcst_type = 8;
10217 else if (*op_string == '4')
10218 bcst_type = 4;
10219 else if (*op_string == '2')
10220 bcst_type = 2;
10221 else if (*op_string == '1'
10222 && *(op_string+1) == '6')
10223 {
10224 bcst_type = 16;
10225 op_string++;
10226 }
10227 else
10228 {
10229 as_bad (_("Unsupported broadcast: `%s'"), saved);
10230 return NULL;
10231 }
10232 op_string++;
10233
10234 broadcast_op.type = bcst_type;
10235 broadcast_op.operand = this_operand;
10236 broadcast_op.bytes = 0;
10237 i.broadcast = &broadcast_op;
10238 }
10239 /* Check masking operation. */
10240 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10241 {
10242 if (mask == &bad_reg)
10243 return NULL;
10244
10245 /* k0 can't be used for write mask. */
10246 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10247 {
10248 as_bad (_("`%s%s' can't be used for write mask"),
10249 register_prefix, mask->reg_name);
10250 return NULL;
10251 }
10252
10253 if (!i.mask)
10254 {
10255 mask_op.mask = mask;
10256 mask_op.zeroing = 0;
10257 mask_op.operand = this_operand;
10258 i.mask = &mask_op;
10259 }
10260 else
10261 {
10262 if (i.mask->mask)
10263 goto duplicated_vec_op;
10264
10265 i.mask->mask = mask;
10266
10267 /* Only "{z}" is allowed here. No need to check
10268 zeroing mask explicitly. */
10269 if (i.mask->operand != this_operand)
10270 {
10271 as_bad (_("invalid write mask `%s'"), saved);
10272 return NULL;
10273 }
10274 }
10275
10276 op_string = end_op;
10277 }
10278 /* Check zeroing-flag for masking operation. */
10279 else if (*op_string == 'z')
10280 {
10281 if (!i.mask)
10282 {
10283 mask_op.mask = NULL;
10284 mask_op.zeroing = 1;
10285 mask_op.operand = this_operand;
10286 i.mask = &mask_op;
10287 }
10288 else
10289 {
10290 if (i.mask->zeroing)
10291 {
10292 duplicated_vec_op:
10293 as_bad (_("duplicated `%s'"), saved);
10294 return NULL;
10295 }
10296
10297 i.mask->zeroing = 1;
10298
10299 /* Only "{%k}" is allowed here. No need to check mask
10300 register explicitly. */
10301 if (i.mask->operand != this_operand)
10302 {
10303 as_bad (_("invalid zeroing-masking `%s'"),
10304 saved);
10305 return NULL;
10306 }
10307 }
10308
10309 op_string++;
10310 }
10311 else
10312 goto unknown_vec_op;
10313
10314 if (*op_string != '}')
10315 {
10316 as_bad (_("missing `}' in `%s'"), saved);
10317 return NULL;
10318 }
10319 op_string++;
10320
10321 /* Strip whitespace since the addition of pseudo prefixes
10322 changed how the scrubber treats '{'. */
10323 if (is_space_char (*op_string))
10324 ++op_string;
10325
10326 continue;
10327 }
10328 unknown_vec_op:
10329 /* We don't know this one. */
10330 as_bad (_("unknown vector operation: `%s'"), saved);
10331 return NULL;
10332 }
10333
10334 if (i.mask && i.mask->zeroing && !i.mask->mask)
10335 {
10336 as_bad (_("zeroing-masking only allowed with write mask"));
10337 return NULL;
10338 }
10339
10340 return op_string;
10341 }
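
/* Editorial aside: a standalone sketch (not GAS code) of the
   broadcast-token recognition above.  In AT&T input the tokens appear
   as e.g. "vaddps (%rax){1to16}, %zmm1, %zmm2".  */
#if 0 /* Illustration only.  */
#include <string.h>

static int
parse_1to (const char *s)
{
  /* Longest token first, so "1to16" isn't taken as "1to1" plus junk.  */
  static const struct { const char *tok; int n; } tab[] = {
    { "1to16", 16 }, { "1to8", 8 }, { "1to4", 4 }, { "1to2", 2 },
  };
  unsigned int j;

  for (j = 0; j < sizeof tab / sizeof tab[0]; j++)
    if (strncmp (s, tab[j].tok, strlen (tab[j].tok)) == 0)
      return tab[j].n;
  return 0;
}
#endif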
10342
10343 static int
10344 i386_immediate (char *imm_start)
10345 {
10346 char *save_input_line_pointer;
10347 char *gotfree_input_line;
10348 segT exp_seg = 0;
10349 expressionS *exp;
10350 i386_operand_type types;
10351
10352 operand_type_set (&types, ~0);
10353
10354 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10355 {
10356 as_bad (_("at most %d immediate operands are allowed"),
10357 MAX_IMMEDIATE_OPERANDS);
10358 return 0;
10359 }
10360
10361 exp = &im_expressions[i.imm_operands++];
10362 i.op[this_operand].imms = exp;
10363
10364 if (is_space_char (*imm_start))
10365 ++imm_start;
10366
10367 save_input_line_pointer = input_line_pointer;
10368 input_line_pointer = imm_start;
10369
10370 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10371 if (gotfree_input_line)
10372 input_line_pointer = gotfree_input_line;
10373
10374 exp_seg = expression (exp);
10375
10376 SKIP_WHITESPACE ();
10377
10378 /* Handle vector operations. */
10379 if (*input_line_pointer == '{')
10380 {
10381 input_line_pointer = check_VecOperations (input_line_pointer,
10382 NULL);
10383 if (input_line_pointer == NULL)
10384 return 0;
10385 }
10386
10387 if (*input_line_pointer)
10388 as_bad (_("junk `%s' after expression"), input_line_pointer);
10389
10390 input_line_pointer = save_input_line_pointer;
10391 if (gotfree_input_line)
10392 {
10393 free (gotfree_input_line);
10394
10395 if (exp->X_op == O_constant || exp->X_op == O_register)
10396 exp->X_op = O_illegal;
10397 }
10398
10399 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10400 }
10401
10402 static int
10403 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10404 i386_operand_type types, const char *imm_start)
10405 {
10406 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10407 {
10408 if (imm_start)
10409 as_bad (_("missing or invalid immediate expression `%s'"),
10410 imm_start);
10411 return 0;
10412 }
10413 else if (exp->X_op == O_constant)
10414 {
10415 /* Size it properly later. */
10416 i.types[this_operand].bitfield.imm64 = 1;
10417 /* If not 64bit, sign extend val. */
10418 if (flag_code != CODE_64BIT
10419 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10420 exp->X_add_number
10421 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10422 }
10423 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10424 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10425 && exp_seg != absolute_section
10426 && exp_seg != text_section
10427 && exp_seg != data_section
10428 && exp_seg != bss_section
10429 && exp_seg != undefined_section
10430 && !bfd_is_com_section (exp_seg))
10431 {
10432 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10433 return 0;
10434 }
10435 #endif
10436 else if (!intel_syntax && exp_seg == reg_section)
10437 {
10438 if (imm_start)
10439 as_bad (_("illegal immediate register operand %s"), imm_start);
10440 return 0;
10441 }
10442 else
10443 {
10444 /* This is an address. The size of the address will be
10445 determined later, depending on destination register,
10446 suffix, or the default for the section. */
10447 i.types[this_operand].bitfield.imm8 = 1;
10448 i.types[this_operand].bitfield.imm16 = 1;
10449 i.types[this_operand].bitfield.imm32 = 1;
10450 i.types[this_operand].bitfield.imm32s = 1;
10451 i.types[this_operand].bitfield.imm64 = 1;
10452 i.types[this_operand] = operand_type_and (i.types[this_operand],
10453 types);
10454 }
10455
10456 return 1;
10457 }
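
/* Editorial aside: the XOR/subtract idiom used above for 32-bit sign
   extension, in isolation (not GAS code).  */
#if 0 /* Illustration only.  */
#include <assert.h>

static unsigned long long
sext32 (unsigned long long x)
{
  x &= 0xffffffffULL;
  return (x ^ 0x80000000ULL) - 0x80000000ULL;
}

int
main (void)
{
  assert (sext32 (0x7fffffffULL) == 0x7fffffffULL);
  assert (sext32 (0x80000000ULL) == 0xffffffff80000000ULL);
  return 0;
}
#endif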
10458
10459 static char *
10460 i386_scale (char *scale)
10461 {
10462 offsetT val;
10463 char *save = input_line_pointer;
10464
10465 input_line_pointer = scale;
10466 val = get_absolute_expression ();
10467
10468 switch (val)
10469 {
10470 case 1:
10471 i.log2_scale_factor = 0;
10472 break;
10473 case 2:
10474 i.log2_scale_factor = 1;
10475 break;
10476 case 4:
10477 i.log2_scale_factor = 2;
10478 break;
10479 case 8:
10480 i.log2_scale_factor = 3;
10481 break;
10482 default:
10483 {
10484 char sep = *input_line_pointer;
10485
10486 *input_line_pointer = '\0';
10487 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10488 scale);
10489 *input_line_pointer = sep;
10490 input_line_pointer = save;
10491 return NULL;
10492 }
10493 }
10494 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10495 {
10496 as_warn (_("scale factor of %d without an index register"),
10497 1 << i.log2_scale_factor);
10498 i.log2_scale_factor = 0;
10499 }
10500 scale = input_line_pointer;
10501 input_line_pointer = save;
10502 return scale;
10503 }
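
/* Editorial aside (not GAS code): where log2_scale_factor eventually
   lands -- it becomes the two-bit "ss" field of an x86 SIB byte, next
   to the 3-bit index and base register numbers.  */
#if 0 /* Illustration only.  */
static unsigned char
make_sib (unsigned int log2_scale, unsigned int index, unsigned int base)
{
  return (unsigned char) (((log2_scale & 3) << 6)
			  | ((index & 7) << 3)
			  | (base & 7));
}
#endif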
10504
10505 static int
10506 i386_displacement (char *disp_start, char *disp_end)
10507 {
10508 expressionS *exp;
10509 segT exp_seg = 0;
10510 char *save_input_line_pointer;
10511 char *gotfree_input_line;
10512 int override;
10513 i386_operand_type bigdisp, types = anydisp;
10514 int ret;
10515
10516 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10517 {
10518 as_bad (_("at most %d displacement operands are allowed"),
10519 MAX_MEMORY_OPERANDS);
10520 return 0;
10521 }
10522
10523 operand_type_set (&bigdisp, 0);
10524 if (i.jumpabsolute
10525 || i.types[this_operand].bitfield.baseindex
10526 || (current_templates->start->opcode_modifier.jump != JUMP
10527 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10528 {
10529 i386_addressing_mode ();
10530 override = (i.prefix[ADDR_PREFIX] != 0);
10531 if (flag_code == CODE_64BIT)
10532 {
10533 if (!override)
10534 {
10535 bigdisp.bitfield.disp32s = 1;
10536 bigdisp.bitfield.disp64 = 1;
10537 }
10538 else
10539 bigdisp.bitfield.disp32 = 1;
10540 }
10541 else if ((flag_code == CODE_16BIT) ^ override)
10542 bigdisp.bitfield.disp16 = 1;
10543 else
10544 bigdisp.bitfield.disp32 = 1;
10545 }
10546 else
10547 {
10548 /* For PC-relative branches, the width of the displacement may be
10549 dependent upon data size, but is never dependent upon address size.
10550 Also make sure to not unintentionally match against a non-PC-relative
10551 branch template. */
10552 static templates aux_templates;
10553 const insn_template *t = current_templates->start;
10554 bfd_boolean has_intel64 = FALSE;
10555
10556 aux_templates.start = t;
10557 while (++t < current_templates->end)
10558 {
10559 if (t->opcode_modifier.jump
10560 != current_templates->start->opcode_modifier.jump)
10561 break;
10562 if ((t->opcode_modifier.isa64 >= INTEL64))
10563 has_intel64 = TRUE;
10564 }
10565 if (t < current_templates->end)
10566 {
10567 aux_templates.end = t;
10568 current_templates = &aux_templates;
10569 }
10570
10571 override = (i.prefix[DATA_PREFIX] != 0);
10572 if (flag_code == CODE_64BIT)
10573 {
10574 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10575 && (!intel64 || !has_intel64))
10576 bigdisp.bitfield.disp16 = 1;
10577 else
10578 bigdisp.bitfield.disp32s = 1;
10579 }
10580 else
10581 {
10582 if (!override)
10583 override = (i.suffix == (flag_code != CODE_16BIT
10584 ? WORD_MNEM_SUFFIX
10585 : LONG_MNEM_SUFFIX));
10586 bigdisp.bitfield.disp32 = 1;
10587 if ((flag_code == CODE_16BIT) ^ override)
10588 {
10589 bigdisp.bitfield.disp32 = 0;
10590 bigdisp.bitfield.disp16 = 1;
10591 }
10592 }
10593 }
10594 i.types[this_operand] = operand_type_or (i.types[this_operand],
10595 bigdisp);
10596
10597 exp = &disp_expressions[i.disp_operands];
10598 i.op[this_operand].disps = exp;
10599 i.disp_operands++;
10600 save_input_line_pointer = input_line_pointer;
10601 input_line_pointer = disp_start;
10602 END_STRING_AND_SAVE (disp_end);
10603
10604 #ifndef GCC_ASM_O_HACK
10605 #define GCC_ASM_O_HACK 0
10606 #endif
10607 #if GCC_ASM_O_HACK
10608 END_STRING_AND_SAVE (disp_end + 1);
10609   if (i.types[this_operand].bitfield.baseindex
10610       && disp_end[-1] == '+')
10611 {
10612 /* This hack is to avoid a warning when using the "o"
10613 constraint within gcc asm statements.
10614 For instance:
10615
10616 #define _set_tssldt_desc(n,addr,limit,type) \
10617 __asm__ __volatile__ ( \
10618 "movw %w2,%0\n\t" \
10619 "movw %w1,2+%0\n\t" \
10620 "rorl $16,%1\n\t" \
10621 "movb %b1,4+%0\n\t" \
10622 "movb %4,5+%0\n\t" \
10623 "movb $0,6+%0\n\t" \
10624 "movb %h1,7+%0\n\t" \
10625 "rorl $16,%1" \
10626 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10627
10628 This works great except that the output assembler ends
10629 up looking a bit weird if it turns out that there is
10630 no offset. You end up producing code that looks like:
10631
10632 #APP
10633 movw $235,(%eax)
10634 movw %dx,2+(%eax)
10635 rorl $16,%edx
10636 movb %dl,4+(%eax)
10637 movb $137,5+(%eax)
10638 movb $0,6+(%eax)
10639 movb %dh,7+(%eax)
10640 rorl $16,%edx
10641 #NO_APP
10642
10643 So here we provide the missing zero. */
10644
10645       *disp_end = '0';
10646 }
10647 #endif
10648 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10649 if (gotfree_input_line)
10650 input_line_pointer = gotfree_input_line;
10651
10652 exp_seg = expression (exp);
10653
10654 SKIP_WHITESPACE ();
10655 if (*input_line_pointer)
10656 as_bad (_("junk `%s' after expression"), input_line_pointer);
10657 #if GCC_ASM_O_HACK
10658 RESTORE_END_STRING (disp_end + 1);
10659 #endif
10660 input_line_pointer = save_input_line_pointer;
10661 if (gotfree_input_line)
10662 {
10663 free (gotfree_input_line);
10664
10665 if (exp->X_op == O_constant || exp->X_op == O_register)
10666 exp->X_op = O_illegal;
10667 }
10668
10669 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10670
10671 RESTORE_END_STRING (disp_end);
10672
10673 return ret;
10674 }
10675
10676 static int
10677 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10678 i386_operand_type types, const char *disp_start)
10679 {
10680 i386_operand_type bigdisp;
10681 int ret = 1;
10682
10683 /* We do this to make sure that the section symbol is in
10684 the symbol table. We will ultimately change the relocation
10685 to be relative to the beginning of the section. */
10686 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10687 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10688 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10689 {
10690 if (exp->X_op != O_symbol)
10691 goto inv_disp;
10692
10693 if (S_IS_LOCAL (exp->X_add_symbol)
10694 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10695 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10696 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10697 exp->X_op = O_subtract;
10698 exp->X_op_symbol = GOT_symbol;
10699 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10700 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10701 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10702 i.reloc[this_operand] = BFD_RELOC_64;
10703 else
10704 i.reloc[this_operand] = BFD_RELOC_32;
10705 }
10706
10707 else if (exp->X_op == O_absent
10708 || exp->X_op == O_illegal
10709 || exp->X_op == O_big)
10710 {
10711 inv_disp:
10712 as_bad (_("missing or invalid displacement expression `%s'"),
10713 disp_start);
10714 ret = 0;
10715 }
10716
10717 else if (flag_code == CODE_64BIT
10718 && !i.prefix[ADDR_PREFIX]
10719 && exp->X_op == O_constant)
10720 {
10721       /* Since the displacement is sign-extended to 64 bits, don't allow
10722	 disp32, and turn off disp32s if the value is out of range.  */
10723 i.types[this_operand].bitfield.disp32 = 0;
10724 if (!fits_in_signed_long (exp->X_add_number))
10725 {
10726 i.types[this_operand].bitfield.disp32s = 0;
10727 if (i.types[this_operand].bitfield.baseindex)
10728 {
10729	      as_bad (_("0x%lx out of range of signed 32bit displacement"),
10730 (long) exp->X_add_number);
10731 ret = 0;
10732 }
10733 }
10734 }
10735
10736 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10737 else if (exp->X_op != O_constant
10738 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10739 && exp_seg != absolute_section
10740 && exp_seg != text_section
10741 && exp_seg != data_section
10742 && exp_seg != bss_section
10743 && exp_seg != undefined_section
10744 && !bfd_is_com_section (exp_seg))
10745 {
10746 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10747 ret = 0;
10748 }
10749 #endif
10750
10751 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10752 /* Constants get taken care of by optimize_disp(). */
10753 && exp->X_op != O_constant)
10754 i.types[this_operand].bitfield.disp8 = 1;
10755
10756 /* Check if this is a displacement only operand. */
10757 bigdisp = i.types[this_operand];
10758 bigdisp.bitfield.disp8 = 0;
10759 bigdisp.bitfield.disp16 = 0;
10760 bigdisp.bitfield.disp32 = 0;
10761 bigdisp.bitfield.disp32s = 0;
10762 bigdisp.bitfield.disp64 = 0;
10763 if (operand_type_all_zero (&bigdisp))
10764 i.types[this_operand] = operand_type_and (i.types[this_operand],
10765 types);
10766
10767 return ret;
10768 }
10769
10770 /* Return the active addressing mode, taking address override and
10771 registers forming the address into consideration. Update the
10772 address override prefix if necessary. */
10773
10774 static enum flag_code
10775 i386_addressing_mode (void)
10776 {
10777 enum flag_code addr_mode;
10778
10779 if (i.prefix[ADDR_PREFIX])
10780 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10781 else if (flag_code == CODE_16BIT
10782 && current_templates->start->cpu_flags.bitfield.cpumpx
10783 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10784 from md_assemble() by "is not a valid base/index expression"
10785 when there is a base and/or index. */
10786 && !i.types[this_operand].bitfield.baseindex)
10787 {
10788 /* MPX insn memory operands with neither base nor index must be forced
10789 to use 32-bit addressing in 16-bit mode. */
10790 addr_mode = CODE_32BIT;
10791 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10792 ++i.prefixes;
10793 gas_assert (!i.types[this_operand].bitfield.disp16);
10794 gas_assert (!i.types[this_operand].bitfield.disp32);
10795 }
10796 else
10797 {
10798 addr_mode = flag_code;
10799
10800 #if INFER_ADDR_PREFIX
10801 if (i.mem_operands == 0)
10802 {
10803 /* Infer address prefix from the first memory operand. */
10804 const reg_entry *addr_reg = i.base_reg;
10805
10806 if (addr_reg == NULL)
10807 addr_reg = i.index_reg;
10808
10809 if (addr_reg)
10810 {
10811 if (addr_reg->reg_type.bitfield.dword)
10812 addr_mode = CODE_32BIT;
10813 else if (flag_code != CODE_64BIT
10814 && addr_reg->reg_type.bitfield.word)
10815 addr_mode = CODE_16BIT;
10816
10817 if (addr_mode != flag_code)
10818 {
10819 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10820 i.prefixes += 1;
10821 /* Change the size of any displacement too. At most one
10822 of Disp16 or Disp32 is set.
10823 FIXME. There doesn't seem to be any real need for
10824 separate Disp16 and Disp32 flags. The same goes for
10825 Imm16 and Imm32. Removing them would probably clean
10826 up the code quite a lot. */
10827 if (flag_code != CODE_64BIT
10828 && (i.types[this_operand].bitfield.disp16
10829 || i.types[this_operand].bitfield.disp32))
10830 i.types[this_operand]
10831 = operand_type_xor (i.types[this_operand], disp16_32);
10832 }
10833 }
10834 }
10835 #endif
10836 }
10837
10838 return addr_mode;
10839 }
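
/* Editorial aside: the inference rule above, reduced to a one-liner
   (not GAS code; 64-bit mode, where 16-bit addressing is unavailable,
   is left out).  In 32-bit code "mov (%si), %ax" needs the 0x67
   address-size prefix because its address registers are 16-bit; in
   16-bit code "mov (%esi), %ax" needs it for the opposite reason.  */
#if 0 /* Illustration only.  */
static int
needs_addr_prefix (int code_is_16bit, int addr_reg_is_16bit)
{
  return code_is_16bit != addr_reg_is_16bit;
}
#endif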
10840
10841 /* Make sure the memory operand we've been dealt is valid.
10842 Return 1 on success, 0 on a failure. */
10843
10844 static int
10845 i386_index_check (const char *operand_string)
10846 {
10847 const char *kind = "base/index";
10848 enum flag_code addr_mode = i386_addressing_mode ();
10849
10850 if (current_templates->start->opcode_modifier.isstring
10851 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10852 && (current_templates->end[-1].opcode_modifier.isstring
10853 || i.mem_operands))
10854 {
10855 /* Memory operands of string insns are special in that they only allow
10856 a single register (rDI, rSI, or rBX) as their memory address. */
10857 const reg_entry *expected_reg;
10858 static const char *di_si[][2] =
10859 {
10860 { "esi", "edi" },
10861 { "si", "di" },
10862 { "rsi", "rdi" }
10863 };
10864 static const char *bx[] = { "ebx", "bx", "rbx" };
10865
10866 kind = "string address";
10867
10868 if (current_templates->start->opcode_modifier.repprefixok)
10869 {
10870 int es_op = current_templates->end[-1].opcode_modifier.isstring
10871 - IS_STRING_ES_OP0;
10872 int op = 0;
10873
10874 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10875 || ((!i.mem_operands != !intel_syntax)
10876 && current_templates->end[-1].operand_types[1]
10877 .bitfield.baseindex))
10878 op = 1;
10879 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10880 }
10881 else
10882 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10883
10884 if (i.base_reg != expected_reg
10885 || i.index_reg
10886 || operand_type_check (i.types[this_operand], disp))
10887 {
10888 /* The second memory operand must have the same size as
10889 the first one. */
10890 if (i.mem_operands
10891 && i.base_reg
10892 && !((addr_mode == CODE_64BIT
10893 && i.base_reg->reg_type.bitfield.qword)
10894 || (addr_mode == CODE_32BIT
10895 ? i.base_reg->reg_type.bitfield.dword
10896 : i.base_reg->reg_type.bitfield.word)))
10897 goto bad_address;
10898
10899 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10900 operand_string,
10901 intel_syntax ? '[' : '(',
10902 register_prefix,
10903 expected_reg->reg_name,
10904 intel_syntax ? ']' : ')');
10905 return 1;
10906 }
10907 else
10908 return 1;
10909
10910 bad_address:
10911 as_bad (_("`%s' is not a valid %s expression"),
10912 operand_string, kind);
10913 return 0;
10914 }
10915 else
10916 {
10917 if (addr_mode != CODE_16BIT)
10918 {
10919 /* 32-bit/64-bit checks. */
10920 if ((i.base_reg
10921 && ((addr_mode == CODE_64BIT
10922 ? !i.base_reg->reg_type.bitfield.qword
10923 : !i.base_reg->reg_type.bitfield.dword)
10924 || (i.index_reg && i.base_reg->reg_num == RegIP)
10925 || i.base_reg->reg_num == RegIZ))
10926 || (i.index_reg
10927 && !i.index_reg->reg_type.bitfield.xmmword
10928 && !i.index_reg->reg_type.bitfield.ymmword
10929 && !i.index_reg->reg_type.bitfield.zmmword
10930 && ((addr_mode == CODE_64BIT
10931 ? !i.index_reg->reg_type.bitfield.qword
10932 : !i.index_reg->reg_type.bitfield.dword)
10933 || !i.index_reg->reg_type.bitfield.baseindex)))
10934 goto bad_address;
10935
10936 /* bndmk, bndldx, and bndstx have special restrictions. */
10937 if (current_templates->start->base_opcode == 0xf30f1b
10938 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10939 {
10940 /* They cannot use RIP-relative addressing. */
10941 if (i.base_reg && i.base_reg->reg_num == RegIP)
10942 {
10943 as_bad (_("`%s' cannot be used here"), operand_string);
10944 return 0;
10945 }
10946
10947 /* bndldx and bndstx ignore their scale factor. */
10948 if (current_templates->start->base_opcode != 0xf30f1b
10949 && i.log2_scale_factor)
10950 as_warn (_("register scaling is being ignored here"));
10951 }
10952 }
10953 else
10954 {
10955 /* 16-bit checks. */
10956 if ((i.base_reg
10957 && (!i.base_reg->reg_type.bitfield.word
10958 || !i.base_reg->reg_type.bitfield.baseindex))
10959 || (i.index_reg
10960 && (!i.index_reg->reg_type.bitfield.word
10961 || !i.index_reg->reg_type.bitfield.baseindex
10962 || !(i.base_reg
10963 && i.base_reg->reg_num < 6
10964 && i.index_reg->reg_num >= 6
10965 && i.log2_scale_factor == 0))))
10966 goto bad_address;
10967 }
10968 }
10969 return 1;
10970 }
10971
10972 /* Handle vector immediates. */
10973
10974 static int
10975 RC_SAE_immediate (const char *imm_start)
10976 {
10977 unsigned int match_found, j;
10978 const char *pstr = imm_start;
10979 expressionS *exp;
10980
10981 if (*pstr != '{')
10982 return 0;
10983
10984 pstr++;
10985 match_found = 0;
10986 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10987 {
10988 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10989 {
10990 if (!i.rounding)
10991 {
10992 rc_op.type = RC_NamesTable[j].type;
10993 rc_op.operand = this_operand;
10994 i.rounding = &rc_op;
10995 }
10996 else
10997 {
10998 as_bad (_("duplicated `%s'"), imm_start);
10999 return 0;
11000 }
11001 pstr += RC_NamesTable[j].len;
11002 match_found = 1;
11003 break;
11004 }
11005 }
11006 if (!match_found)
11007 return 0;
11008
11009 if (*pstr++ != '}')
11010 {
11011 as_bad (_("Missing '}': '%s'"), imm_start);
11012 return 0;
11013 }
11014   /* RC/SAE immediate string should contain nothing more.  */
11015 if (*pstr != 0)
11016 {
11017 as_bad (_("Junk after '}': '%s'"), imm_start);
11018 return 0;
11019 }
11020
11021 exp = &im_expressions[i.imm_operands++];
11022 i.op[this_operand].imms = exp;
11023
11024 exp->X_op = O_constant;
11025 exp->X_add_number = 0;
11026 exp->X_add_symbol = (symbolS *) 0;
11027 exp->X_op_symbol = (symbolS *) 0;
11028
11029 i.types[this_operand].bitfield.imm8 = 1;
11030 return 1;
11031 }
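
/* Editorial aside: a standalone matcher (not GAS code) for the
   rounding/SAE tokens handled above; the real table, RC_NamesTable,
   is defined earlier in this file.  Example input:
   "vaddps {rz-sae}, %zmm1, %zmm2, %zmm3".  */
#if 0 /* Illustration only.  */
#include <string.h>

static const char *
match_rc_sae (const char *op)
{
  static const char *const names[] =
    { "rn-sae", "rd-sae", "ru-sae", "rz-sae", "sae" };
  unsigned int j;

  if (*op++ != '{')
    return NULL;
  for (j = 0; j < sizeof names / sizeof names[0]; j++)
    {
      size_t len = strlen (names[j]);

      if (strncmp (op, names[j], len) == 0
	  && op[len] == '}' && op[len + 1] == '\0')
	return names[j];
    }
  return NULL;
}
#endif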
11032
11033 /* Only string instructions can have a second memory operand, so
11034 reduce current_templates to just those if it contains any. */
11035 static int
11036 maybe_adjust_templates (void)
11037 {
11038 const insn_template *t;
11039
11040 gas_assert (i.mem_operands == 1);
11041
11042 for (t = current_templates->start; t < current_templates->end; ++t)
11043 if (t->opcode_modifier.isstring)
11044 break;
11045
11046 if (t < current_templates->end)
11047 {
11048 static templates aux_templates;
11049 bfd_boolean recheck;
11050
11051 aux_templates.start = t;
11052 for (; t < current_templates->end; ++t)
11053 if (!t->opcode_modifier.isstring)
11054 break;
11055 aux_templates.end = t;
11056
11057 /* Determine whether to re-check the first memory operand. */
11058 recheck = (aux_templates.start != current_templates->start
11059 || t != current_templates->end);
11060
11061 current_templates = &aux_templates;
11062
11063 if (recheck)
11064 {
11065 i.mem_operands = 0;
11066 if (i.memop1_string != NULL
11067 && i386_index_check (i.memop1_string) == 0)
11068 return 0;
11069 i.mem_operands = 1;
11070 }
11071 }
11072
11073 return 1;
11074 }
11075
11076 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11077 on error. */
11078
11079 static int
11080 i386_att_operand (char *operand_string)
11081 {
11082 const reg_entry *r;
11083 char *end_op;
11084 char *op_string = operand_string;
11085
11086 if (is_space_char (*op_string))
11087 ++op_string;
11088
11089 /* We check for an absolute prefix (differentiating,
11090      for example, 'jmp pc_relative_label' from 'jmp *absolute_label').  */
11091 if (*op_string == ABSOLUTE_PREFIX)
11092 {
11093 ++op_string;
11094 if (is_space_char (*op_string))
11095 ++op_string;
11096 i.jumpabsolute = TRUE;
11097 }
11098
11099 /* Check if operand is a register. */
11100 if ((r = parse_register (op_string, &end_op)) != NULL)
11101 {
11102 i386_operand_type temp;
11103
11104 if (r == &bad_reg)
11105 return 0;
11106
11107 /* Check for a segment override by searching for ':' after a
11108 segment register. */
11109 op_string = end_op;
11110 if (is_space_char (*op_string))
11111 ++op_string;
11112 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11113 {
11114 switch (r->reg_num)
11115 {
11116 case 0:
11117 i.seg[i.mem_operands] = &es;
11118 break;
11119 case 1:
11120 i.seg[i.mem_operands] = &cs;
11121 break;
11122 case 2:
11123 i.seg[i.mem_operands] = &ss;
11124 break;
11125 case 3:
11126 i.seg[i.mem_operands] = &ds;
11127 break;
11128 case 4:
11129 i.seg[i.mem_operands] = &fs;
11130 break;
11131 case 5:
11132 i.seg[i.mem_operands] = &gs;
11133 break;
11134 }
11135
11136 /* Skip the ':' and whitespace. */
11137 ++op_string;
11138 if (is_space_char (*op_string))
11139 ++op_string;
11140
11141 if (!is_digit_char (*op_string)
11142 && !is_identifier_char (*op_string)
11143 && *op_string != '('
11144 && *op_string != ABSOLUTE_PREFIX)
11145 {
11146 as_bad (_("bad memory operand `%s'"), op_string);
11147 return 0;
11148 }
11149 /* Handle case of %es:*foo. */
11150 if (*op_string == ABSOLUTE_PREFIX)
11151 {
11152 ++op_string;
11153 if (is_space_char (*op_string))
11154 ++op_string;
11155 i.jumpabsolute = TRUE;
11156 }
11157 goto do_memory_reference;
11158 }
11159
11160 /* Handle vector operations. */
11161 if (*op_string == '{')
11162 {
11163 op_string = check_VecOperations (op_string, NULL);
11164 if (op_string == NULL)
11165 return 0;
11166 }
11167
11168 if (*op_string)
11169 {
11170 as_bad (_("junk `%s' after register"), op_string);
11171 return 0;
11172 }
11173 temp = r->reg_type;
11174 temp.bitfield.baseindex = 0;
11175 i.types[this_operand] = operand_type_or (i.types[this_operand],
11176 temp);
11177 i.types[this_operand].bitfield.unspecified = 0;
11178 i.op[this_operand].regs = r;
11179 i.reg_operands++;
11180 }
11181 else if (*op_string == REGISTER_PREFIX)
11182 {
11183 as_bad (_("bad register name `%s'"), op_string);
11184 return 0;
11185 }
11186 else if (*op_string == IMMEDIATE_PREFIX)
11187 {
11188 ++op_string;
11189 if (i.jumpabsolute)
11190 {
11191 as_bad (_("immediate operand illegal with absolute jump"));
11192 return 0;
11193 }
11194 if (!i386_immediate (op_string))
11195 return 0;
11196 }
11197 else if (RC_SAE_immediate (operand_string))
11198 {
11199 /* If it is a RC or SAE immediate, do nothing. */
11200 ;
11201 }
11202 else if (is_digit_char (*op_string)
11203 || is_identifier_char (*op_string)
11204 || *op_string == '"'
11205 || *op_string == '(')
11206 {
11207 /* This is a memory reference of some sort. */
11208 char *base_string;
11209
11210 /* Start and end of displacement string expression (if found). */
11211 char *displacement_string_start;
11212 char *displacement_string_end;
11213 char *vop_start;
11214
11215 do_memory_reference:
11216 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11217 return 0;
11218 if ((i.mem_operands == 1
11219 && !current_templates->start->opcode_modifier.isstring)
11220 || i.mem_operands == 2)
11221 {
11222 as_bad (_("too many memory references for `%s'"),
11223 current_templates->start->name);
11224 return 0;
11225 }
11226
11227 /* Check for base index form. We detect the base index form by
11228 looking for an ')' at the end of the operand, searching
11229 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11230 after the '('. */
11231 base_string = op_string + strlen (op_string);
11232
11233 /* Handle vector operations. */
11234 vop_start = strchr (op_string, '{');
11235 if (vop_start && vop_start < base_string)
11236 {
11237 if (check_VecOperations (vop_start, base_string) == NULL)
11238 return 0;
11239 base_string = vop_start;
11240 }
11241
11242 --base_string;
11243 if (is_space_char (*base_string))
11244 --base_string;
11245
11246      /* If we only have a displacement, set up for it to be parsed later.  */
11247 displacement_string_start = op_string;
11248 displacement_string_end = base_string + 1;
11249
11250 if (*base_string == ')')
11251 {
11252 char *temp_string;
11253 unsigned int parens_balanced = 1;
11254 /* We've already checked that the number of left & right ()'s are
11255 equal, so this loop will not be infinite. */
11256 do
11257 {
11258 base_string--;
11259 if (*base_string == ')')
11260 parens_balanced++;
11261 if (*base_string == '(')
11262 parens_balanced--;
11263 }
11264 while (parens_balanced);
11265
11266 temp_string = base_string;
11267
11268 /* Skip past '(' and whitespace. */
11269 ++base_string;
11270 if (is_space_char (*base_string))
11271 ++base_string;
11272
11273 if (*base_string == ','
11274 || ((i.base_reg = parse_register (base_string, &end_op))
11275 != NULL))
11276 {
11277 displacement_string_end = temp_string;
11278
11279 i.types[this_operand].bitfield.baseindex = 1;
11280
11281 if (i.base_reg)
11282 {
11283 if (i.base_reg == &bad_reg)
11284 return 0;
11285 base_string = end_op;
11286 if (is_space_char (*base_string))
11287 ++base_string;
11288 }
11289
11290 /* There may be an index reg or scale factor here. */
11291 if (*base_string == ',')
11292 {
11293 ++base_string;
11294 if (is_space_char (*base_string))
11295 ++base_string;
11296
11297 if ((i.index_reg = parse_register (base_string, &end_op))
11298 != NULL)
11299 {
11300 if (i.index_reg == &bad_reg)
11301 return 0;
11302 base_string = end_op;
11303 if (is_space_char (*base_string))
11304 ++base_string;
11305 if (*base_string == ',')
11306 {
11307 ++base_string;
11308 if (is_space_char (*base_string))
11309 ++base_string;
11310 }
11311 else if (*base_string != ')')
11312 {
11313 as_bad (_("expecting `,' or `)' "
11314 "after index register in `%s'"),
11315 operand_string);
11316 return 0;
11317 }
11318 }
11319 else if (*base_string == REGISTER_PREFIX)
11320 {
11321 end_op = strchr (base_string, ',');
11322 if (end_op)
11323 *end_op = '\0';
11324 as_bad (_("bad register name `%s'"), base_string);
11325 return 0;
11326 }
11327
11328 /* Check for scale factor. */
11329 if (*base_string != ')')
11330 {
11331 char *end_scale = i386_scale (base_string);
11332
11333 if (!end_scale)
11334 return 0;
11335
11336 base_string = end_scale;
11337 if (is_space_char (*base_string))
11338 ++base_string;
11339 if (*base_string != ')')
11340 {
11341 as_bad (_("expecting `)' "
11342 "after scale factor in `%s'"),
11343 operand_string);
11344 return 0;
11345 }
11346 }
11347 else if (!i.index_reg)
11348 {
11349 as_bad (_("expecting index register or scale factor "
11350 "after `,'; got '%c'"),
11351 *base_string);
11352 return 0;
11353 }
11354 }
11355 else if (*base_string != ')')
11356 {
11357 as_bad (_("expecting `,' or `)' "
11358 "after base register in `%s'"),
11359 operand_string);
11360 return 0;
11361 }
11362 }
11363 else if (*base_string == REGISTER_PREFIX)
11364 {
11365 end_op = strchr (base_string, ',');
11366 if (end_op)
11367 *end_op = '\0';
11368 as_bad (_("bad register name `%s'"), base_string);
11369 return 0;
11370 }
11371 }
11372
11373 /* If there's an expression beginning the operand, parse it,
11374 assuming displacement_string_start and
11375 displacement_string_end are meaningful. */
11376 if (displacement_string_start != displacement_string_end)
11377 {
11378 if (!i386_displacement (displacement_string_start,
11379 displacement_string_end))
11380 return 0;
11381 }
11382
11383 /* Special case for (%dx) while doing input/output op. */
11384 if (i.base_reg
11385 && i.base_reg->reg_type.bitfield.instance == RegD
11386 && i.base_reg->reg_type.bitfield.word
11387 && i.index_reg == 0
11388 && i.log2_scale_factor == 0
11389 && i.seg[i.mem_operands] == 0
11390 && !operand_type_check (i.types[this_operand], disp))
11391 {
11392 i.types[this_operand] = i.base_reg->reg_type;
11393 return 1;
11394 }
11395
11396 if (i386_index_check (operand_string) == 0)
11397 return 0;
11398 i.flags[this_operand] |= Operand_Mem;
11399 if (i.mem_operands == 0)
11400 i.memop1_string = xstrdup (operand_string);
11401 i.mem_operands++;
11402 }
11403 else
11404 {
11405 /* It's not a memory operand; argh! */
11406 as_bad (_("invalid char %s beginning operand %d `%s'"),
11407 output_invalid (*op_string),
11408 this_operand + 1,
11409 op_string);
11410 return 0;
11411 }
11412 return 1; /* Normal return. */
11413 }
11414 \f
11415 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11416 that an rs_machine_dependent frag may reach. */
11417
11418 unsigned int
11419 i386_frag_max_var (fragS *frag)
11420 {
11421 /* The only relaxable frags are for jumps.
11422 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11423 gas_assert (frag->fr_type == rs_machine_dependent);
11424 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11425 }
11426
11427 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11428 static int
11429 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11430 {
11431 /* STT_GNU_IFUNC symbol must go through PLT. */
11432 if ((symbol_get_bfdsym (fr_symbol)->flags
11433 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11434 return 0;
11435
11436 if (!S_IS_EXTERNAL (fr_symbol))
11437 /* Symbol may be weak or local. */
11438 return !S_IS_WEAK (fr_symbol);
11439
11440 /* Global symbols with non-default visibility can't be preempted. */
11441 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11442 return 1;
11443
11444 if (fr_var != NO_RELOC)
11445 switch ((enum bfd_reloc_code_real) fr_var)
11446 {
11447 case BFD_RELOC_386_PLT32:
11448 case BFD_RELOC_X86_64_PLT32:
11449 /* Symbol with PLT relocation may be preempted. */
11450 return 0;
11451 default:
11452 abort ();
11453 }
11454
11455 /* Global symbols with default visibility in a shared library may be
11456 preempted by another definition. */
11457 return !shared;
11458 }
11459 #endif
11460
11461 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11462    Note: this also works for Skylake and Cascadelake.
11463 ---------------------------------------------------------------------
11464 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11465 | ------ | ----------- | ------- | -------- |
11466 | Jo | N | N | Y |
11467 | Jno | N | N | Y |
11468 | Jc/Jb | Y | N | Y |
11469 | Jae/Jnb | Y | N | Y |
11470 | Je/Jz | Y | Y | Y |
11471 | Jne/Jnz | Y | Y | Y |
11472 | Jna/Jbe | Y | N | Y |
11473 | Ja/Jnbe | Y | N | Y |
11474 | Js | N | N | Y |
11475 | Jns | N | N | Y |
11476 | Jp/Jpe | N | N | Y |
11477 | Jnp/Jpo | N | N | Y |
11478 | Jl/Jnge | Y | Y | Y |
11479 | Jge/Jnl | Y | Y | Y |
11480 | Jle/Jng | Y | Y | Y |
11481 | Jg/Jnle | Y | Y | Y |
11482 --------------------------------------------------------------------- */
11483 static int
11484 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11485 {
11486 if (mf_cmp == mf_cmp_alu_cmp)
11487 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11488 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11489 if (mf_cmp == mf_cmp_incdec)
11490 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11491 || mf_jcc == mf_jcc_jle);
11492 if (mf_cmp == mf_cmp_test_and)
11493 return 1;
11494 return 0;
11495 }
11496
11497 /* Return the next non-empty frag. */
11498
11499 static fragS *
11500 i386_next_non_empty_frag (fragS *fragP)
11501 {
11502 /* There may be a frag with a ".fill 0" when there is no room in
11503 the current frag for frag_grow in output_insn. */
11504 for (fragP = fragP->fr_next;
11505 (fragP != NULL
11506 && fragP->fr_type == rs_fill
11507 && fragP->fr_fix == 0);
11508 fragP = fragP->fr_next)
11509 ;
11510 return fragP;
11511 }
11512
11513 /* Return the next jcc frag after BRANCH_PADDING. */
11514
11515 static fragS *
11516 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11517 {
11518 fragS *branch_fragP;
11519 if (!pad_fragP)
11520 return NULL;
11521
11522 if (pad_fragP->fr_type == rs_machine_dependent
11523 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11524 == BRANCH_PADDING))
11525 {
11526 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11527 if (branch_fragP->fr_type != rs_machine_dependent)
11528 return NULL;
11529 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11530 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11531 pad_fragP->tc_frag_data.mf_type))
11532 return branch_fragP;
11533 }
11534
11535 return NULL;
11536 }
11537
11538 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11539
11540 static void
11541 i386_classify_machine_dependent_frag (fragS *fragP)
11542 {
11543 fragS *cmp_fragP;
11544 fragS *pad_fragP;
11545 fragS *branch_fragP;
11546 fragS *next_fragP;
11547 unsigned int max_prefix_length;
11548
11549 if (fragP->tc_frag_data.classified)
11550 return;
11551
11552 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11553 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11554 for (next_fragP = fragP;
11555 next_fragP != NULL;
11556 next_fragP = next_fragP->fr_next)
11557 {
11558 next_fragP->tc_frag_data.classified = 1;
11559 if (next_fragP->fr_type == rs_machine_dependent)
11560 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11561 {
11562 case BRANCH_PADDING:
11563 /* The BRANCH_PADDING frag must be followed by a branch
11564 frag. */
11565 branch_fragP = i386_next_non_empty_frag (next_fragP);
11566 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11567 break;
11568 case FUSED_JCC_PADDING:
11569 /* Check if this is a fused jcc:
11570 FUSED_JCC_PADDING
11571 CMP like instruction
11572 BRANCH_PADDING
11573 COND_JUMP
11574 */
11575 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11576 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11577 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11578 if (branch_fragP)
11579 {
11580 /* The BRANCH_PADDING frag is merged with the
11581 FUSED_JCC_PADDING frag. */
11582 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11583 /* CMP like instruction size. */
11584 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11585 frag_wane (pad_fragP);
11586 /* Skip to branch_fragP. */
11587 next_fragP = branch_fragP;
11588 }
11589 else if (next_fragP->tc_frag_data.max_prefix_length)
11590 {
11591 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11592 a fused jcc. */
11593 next_fragP->fr_subtype
11594 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11595 next_fragP->tc_frag_data.max_bytes
11596 = next_fragP->tc_frag_data.max_prefix_length;
11597 /* This will be updated in the BRANCH_PREFIX scan. */
11598 next_fragP->tc_frag_data.max_prefix_length = 0;
11599 }
11600 else
11601 frag_wane (next_fragP);
11602 break;
11603 }
11604 }
11605
11606 /* Stop if there is no BRANCH_PREFIX. */
11607 if (!align_branch_prefix_size)
11608 return;
11609
11610 /* Scan for BRANCH_PREFIX. */
11611 for (; fragP != NULL; fragP = fragP->fr_next)
11612 {
11613 if (fragP->fr_type != rs_machine_dependent
11614 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11615 != BRANCH_PREFIX))
11616 continue;
11617
11618 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11619 FUSED_JCC_PADDING. */
11620 max_prefix_length = 0;
11621 for (next_fragP = fragP;
11622 next_fragP != NULL;
11623 next_fragP = next_fragP->fr_next)
11624 {
11625 if (next_fragP->fr_type == rs_fill)
11626 /* Skip rs_fill frags. */
11627 continue;
11628 else if (next_fragP->fr_type != rs_machine_dependent)
11629 /* Stop for all other frags. */
11630 break;
11631
11632 /* rs_machine_dependent frags. */
11633 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11634 == BRANCH_PREFIX)
11635 {
11636 /* Count BRANCH_PREFIX frags. */
11637 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11638 {
11639 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11640 frag_wane (next_fragP);
11641 }
11642 else
11643 max_prefix_length
11644 += next_fragP->tc_frag_data.max_bytes;
11645 }
11646 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11647 == BRANCH_PADDING)
11648 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11649 == FUSED_JCC_PADDING))
11650 {
11651 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11652 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11653 break;
11654 }
11655 else
11656 /* Stop for other rs_machine_dependent frags. */
11657 break;
11658 }
11659
11660 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11661
11662 /* Skip to the next frag. */
11663 fragP = next_fragP;
11664 }
11665 }
11666
11667 /* Compute padding size for
11668
11669 FUSED_JCC_PADDING
11670 CMP like instruction
11671 BRANCH_PADDING
11672 COND_JUMP/UNCOND_JUMP
11673
11674 or
11675
11676 BRANCH_PADDING
11677 COND_JUMP/UNCOND_JUMP
11678 */
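/* A worked example (illustrative): with align_branch_power == 5
   (a 32-byte boundary), a branch at offset 28 within the boundary
   with size 6 would end at offset 34 and cross the boundary, so
   padding_size is 32 - 28 == 4.  Note the ">=" below: a branch
   ending exactly at the last byte of the window is padded too.  */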
11679
11680 static int
11681 i386_branch_padding_size (fragS *fragP, offsetT address)
11682 {
11683 unsigned int offset, size, padding_size;
11684 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11685
11686 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11687 if (!address)
11688 address = fragP->fr_address;
11689 address += fragP->fr_fix;
11690
11691 /* CMP like instruction size. */
11692 size = fragP->tc_frag_data.cmp_size;
11693
11694 /* The base size of the branch frag. */
11695 size += branch_fragP->fr_fix;
11696
11697 /* Add opcode and displacement bytes for the rs_machine_dependent
11698 branch frag. */
11699 if (branch_fragP->fr_type == rs_machine_dependent)
11700 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11701
11702 /* Check if branch is within boundary and doesn't end at the last
11703 byte. */
11704 offset = address & ((1U << align_branch_power) - 1);
11705 if ((offset + size) >= (1U << align_branch_power))
11706 /* Padding needed to avoid crossing boundary. */
11707 padding_size = (1U << align_branch_power) - offset;
11708 else
11709 /* No padding needed. */
11710 padding_size = 0;
11711
11712 /* The return value may be saved in tc_frag_data.length which is
11713 an unsigned byte. */
11714 if (!fits_in_unsigned_byte (padding_size))
11715 abort ();
11716
11717 return padding_size;
11718 }
11719
11720 /* i386_generic_table_relax_frag()
11721
11722 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11723 grow/shrink padding to align branch frags. Hand others to
11724 relax_frag(). */
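/* Prefix distribution sketch (hypothetical sizes): if padding_size
   is 3 and the BRANCH_PREFIX frags in front of the padding frag
   allow max_bytes of 2 and 4, the first frag receives 2 prefix
   bytes and the second the remaining 1, via the loops below.  */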
11725
11726 long
11727 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11728 {
11729 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11730 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11731 {
11732 long padding_size = i386_branch_padding_size (fragP, 0);
11733 long grow = padding_size - fragP->tc_frag_data.length;
11734
11735 /* When the BRANCH_PREFIX frag is used, the computed address
11736 must match the actual address and there should be no padding. */
11737 if (fragP->tc_frag_data.padding_address
11738 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11739 || padding_size))
11740 abort ();
11741
11742 /* Update the padding size. */
11743 if (grow)
11744 fragP->tc_frag_data.length = padding_size;
11745
11746 return grow;
11747 }
11748 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11749 {
11750 fragS *padding_fragP, *next_fragP;
11751 long padding_size, left_size, last_size;
11752
11753 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11754 if (!padding_fragP)
11755 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11756 return (fragP->tc_frag_data.length
11757 - fragP->tc_frag_data.last_length);
11758
11759 /* Compute the relative address of the padding frag the very
11760 first time, when the BRANCH_PREFIX frag sizes are still zero. */
11761 if (!fragP->tc_frag_data.padding_address)
11762 fragP->tc_frag_data.padding_address
11763 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11764
11765 /* First update the last length from the previous iteration. */
11766 left_size = fragP->tc_frag_data.prefix_length;
11767 for (next_fragP = fragP;
11768 next_fragP != padding_fragP;
11769 next_fragP = next_fragP->fr_next)
11770 if (next_fragP->fr_type == rs_machine_dependent
11771 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11772 == BRANCH_PREFIX))
11773 {
11774 if (left_size)
11775 {
11776 int max = next_fragP->tc_frag_data.max_bytes;
11777 if (max)
11778 {
11779 int size;
11780 if (max > left_size)
11781 size = left_size;
11782 else
11783 size = max;
11784 left_size -= size;
11785 next_fragP->tc_frag_data.last_length = size;
11786 }
11787 }
11788 else
11789 next_fragP->tc_frag_data.last_length = 0;
11790 }
11791
11792 /* Check the padding size for the padding frag. */
11793 padding_size = i386_branch_padding_size
11794 (padding_fragP, (fragP->fr_address
11795 + fragP->tc_frag_data.padding_address));
11796
11797 last_size = fragP->tc_frag_data.prefix_length;
11798 /* Check if there is any change from the last iteration. */
11799 if (padding_size == last_size)
11800 {
11801 /* Update the expected address of the padding frag. */
11802 padding_fragP->tc_frag_data.padding_address
11803 = (fragP->fr_address + padding_size
11804 + fragP->tc_frag_data.padding_address);
11805 return 0;
11806 }
11807
11808 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11809 {
11810 /* No padding if there is insufficient room. Clear the
11811 expected address of the padding frag. */
11812 padding_fragP->tc_frag_data.padding_address = 0;
11813 padding_size = 0;
11814 }
11815 else
11816 /* Store the expected address of the padding frag. */
11817 padding_fragP->tc_frag_data.padding_address
11818 = (fragP->fr_address + padding_size
11819 + fragP->tc_frag_data.padding_address);
11820
11821 fragP->tc_frag_data.prefix_length = padding_size;
11822
11823 /* Update the length for the current iteration. */
11824 left_size = padding_size;
11825 for (next_fragP = fragP;
11826 next_fragP != padding_fragP;
11827 next_fragP = next_fragP->fr_next)
11828 if (next_fragP->fr_type == rs_machine_dependent
11829 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11830 == BRANCH_PREFIX))
11831 {
11832 if (left_size)
11833 {
11834 int max = next_fragP->tc_frag_data.max_bytes;
11835 if (max)
11836 {
11837 int size;
11838 if (max > left_size)
11839 size = left_size;
11840 else
11841 size = max;
11842 left_size -= size;
11843 next_fragP->tc_frag_data.length = size;
11844 }
11845 }
11846 else
11847 next_fragP->tc_frag_data.length = 0;
11848 }
11849
11850 return (fragP->tc_frag_data.length
11851 - fragP->tc_frag_data.last_length);
11852 }
11853 return relax_frag (segment, fragP, stretch);
11854 }
11855
11856 /* md_estimate_size_before_relax()
11857
11858 Called just before relax() for rs_machine_dependent frags. The x86
11859 assembler uses these frags to handle variable size jump
11860 instructions.
11861
11862 Any symbol that is now undefined will not become defined.
11863 Return the correct fr_subtype in the frag.
11864 Return the initial "guess for variable size of frag" to caller.
11865 The guess is actually the growth beyond the fixed part. Whatever
11866 we do to grow the fixed or variable part contributes to our
11867 returned value. */
11868
11869 int
11870 md_estimate_size_before_relax (fragS *fragP, segT segment)
11871 {
11872 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11873 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11874 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11875 {
11876 i386_classify_machine_dependent_frag (fragP);
11877 return fragP->tc_frag_data.length;
11878 }
11879
11880 /* We've already got fragP->fr_subtype right; all we have to do is
11881 check for un-relaxable symbols. On an ELF system, we can't relax
11882 an externally visible symbol, because it may be overridden by a
11883 shared library. */
11884 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11885 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11886 || (IS_ELF
11887 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11888 fragP->fr_var))
11889 #endif
11890 #if defined (OBJ_COFF) && defined (TE_PE)
11891 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11892 && S_IS_WEAK (fragP->fr_symbol))
11893 #endif
11894 )
11895 {
11896 /* Symbol is undefined in this segment, or we need to keep a
11897 reloc so that weak symbols can be overridden. */
11898 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11899 enum bfd_reloc_code_real reloc_type;
11900 unsigned char *opcode;
11901 int old_fr_fix;
11902
11903 if (fragP->fr_var != NO_RELOC)
11904 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11905 else if (size == 2)
11906 reloc_type = BFD_RELOC_16_PCREL;
11907 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11908 else if (need_plt32_p (fragP->fr_symbol))
11909 reloc_type = BFD_RELOC_X86_64_PLT32;
11910 #endif
11911 else
11912 reloc_type = BFD_RELOC_32_PCREL;
11913
11914 old_fr_fix = fragP->fr_fix;
11915 opcode = (unsigned char *) fragP->fr_opcode;
11916
11917 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11918 {
11919 case UNCOND_JUMP:
11920 /* Make jmp (0xeb) a (d)word displacement jump. */
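/* E.g. "jmp label" assembled as EB XX becomes E9 XX XX XX XX
   (E9 XX XX in 16-bit code) - illustrative encodings.  */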
11921 opcode[0] = 0xe9;
11922 fragP->fr_fix += size;
11923 fix_new (fragP, old_fr_fix, size,
11924 fragP->fr_symbol,
11925 fragP->fr_offset, 1,
11926 reloc_type);
11927 break;
11928
11929 case COND_JUMP86:
11930 if (size == 2
11931 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11932 {
11933 /* Negate the condition, and branch past an
11934 unconditional jump. */
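/* E.g. "je target" (74 XX) becomes "jne .+3" (75 03) followed
   by "jmp target" (E9 XX XX) - an illustrative 16-bit encoding
   of the rewrite below.  */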
11935 opcode[0] ^= 1;
11936 opcode[1] = 3;
11937 /* Insert an unconditional jump. */
11938 opcode[2] = 0xe9;
11939 /* We added two extra opcode bytes, and have a two byte
11940 offset. */
11941 fragP->fr_fix += 2 + 2;
11942 fix_new (fragP, old_fr_fix + 2, 2,
11943 fragP->fr_symbol,
11944 fragP->fr_offset, 1,
11945 reloc_type);
11946 break;
11947 }
11948 /* Fall through. */
11949
11950 case COND_JUMP:
11951 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11952 {
11953 fixS *fixP;
11954
11955 fragP->fr_fix += 1;
11956 fixP = fix_new (fragP, old_fr_fix, 1,
11957 fragP->fr_symbol,
11958 fragP->fr_offset, 1,
11959 BFD_RELOC_8_PCREL);
11960 fixP->fx_signed = 1;
11961 break;
11962 }
11963
11964 /* This changes the byte-displacement jump 0x7N
11965 to the (d)word-displacement jump 0x0f,0x8N. */
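/* E.g. "je" 74 XX becomes 0F 84 XX XX XX XX (illustrative).  */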
11966 opcode[1] = opcode[0] + 0x10;
11967 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11968 /* We've added an opcode byte. */
11969 fragP->fr_fix += 1 + size;
11970 fix_new (fragP, old_fr_fix + 1, size,
11971 fragP->fr_symbol,
11972 fragP->fr_offset, 1,
11973 reloc_type);
11974 break;
11975
11976 default:
11977 BAD_CASE (fragP->fr_subtype);
11978 break;
11979 }
11980 frag_wane (fragP);
11981 return fragP->fr_fix - old_fr_fix;
11982 }
11983
11984 /* Guess size depending on current relax state. Initially the relax
11985 state will correspond to a short jump and we return 1, because
11986 the variable part of the frag (the branch offset) is one byte
11987 long. However, we can relax a section more than once and in that
11988 case we must either set fr_subtype back to the unrelaxed state,
11989 or return the value for the appropriate branch. */
11990 return md_relax_table[fragP->fr_subtype].rlx_length;
11991 }
11992
11993 /* Called after relax() is finished.
11994
11995 In: Address of frag.
11996 fr_type == rs_machine_dependent.
11997 fr_subtype is what the address relaxed to.
11998
11999 Out: Any fixSs and constants are set up.
12000 Caller will turn frag into a ".space 0". */
12001
12002 void
12003 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12004 fragS *fragP)
12005 {
12006 unsigned char *opcode;
12007 unsigned char *where_to_put_displacement = NULL;
12008 offsetT target_address;
12009 offsetT opcode_address;
12010 unsigned int extension = 0;
12011 offsetT displacement_from_opcode_start;
12012
12013 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12014 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12015 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12016 {
12017 /* Generate nop padding. */
12018 unsigned int size = fragP->tc_frag_data.length;
12019 if (size)
12020 {
12021 if (size > fragP->tc_frag_data.max_bytes)
12022 abort ();
12023
12024 if (flag_debug)
12025 {
12026 const char *msg;
12027 const char *branch = "branch";
12028 const char *prefix = "";
12029 fragS *padding_fragP;
12030 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12031 == BRANCH_PREFIX)
12032 {
12033 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12034 switch (fragP->tc_frag_data.default_prefix)
12035 {
12036 default:
12037 abort ();
12038 break;
12039 case CS_PREFIX_OPCODE:
12040 prefix = " cs";
12041 break;
12042 case DS_PREFIX_OPCODE:
12043 prefix = " ds";
12044 break;
12045 case ES_PREFIX_OPCODE:
12046 prefix = " es";
12047 break;
12048 case FS_PREFIX_OPCODE:
12049 prefix = " fs";
12050 break;
12051 case GS_PREFIX_OPCODE:
12052 prefix = " gs";
12053 break;
12054 case SS_PREFIX_OPCODE:
12055 prefix = " ss";
12056 break;
12057 }
12058 if (padding_fragP)
12059 msg = _("%s:%u: add %d%s at 0x%llx to align "
12060 "%s within %d-byte boundary\n");
12061 else
12062 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12063 "align %s within %d-byte boundary\n");
12064 }
12065 else
12066 {
12067 padding_fragP = fragP;
12068 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12069 "%s within %d-byte boundary\n");
12070 }
12071
12072 if (padding_fragP)
12073 switch (padding_fragP->tc_frag_data.branch_type)
12074 {
12075 case align_branch_jcc:
12076 branch = "jcc";
12077 break;
12078 case align_branch_fused:
12079 branch = "fused jcc";
12080 break;
12081 case align_branch_jmp:
12082 branch = "jmp";
12083 break;
12084 case align_branch_call:
12085 branch = "call";
12086 break;
12087 case align_branch_indirect:
12088 branch = "indirect branch";
12089 break;
12090 case align_branch_ret:
12091 branch = "ret";
12092 break;
12093 default:
12094 break;
12095 }
12096
12097 fprintf (stdout, msg,
12098 fragP->fr_file, fragP->fr_line, size, prefix,
12099 (long long) fragP->fr_address, branch,
12100 1 << align_branch_power);
12101 }
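/* BRANCH_PREFIX padding is emitted as repeated segment prefixes,
   e.g. 2E 2E 2E for three bytes of CS prefix (illustrative);
   other padding becomes NOPs.  */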
12102 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12103 memset (fragP->fr_opcode,
12104 fragP->tc_frag_data.default_prefix, size);
12105 else
12106 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12107 size, 0);
12108 fragP->fr_fix += size;
12109 }
12110 return;
12111 }
12112
12113 opcode = (unsigned char *) fragP->fr_opcode;
12114
12115 /* Address we want to reach in file space. */
12116 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12117
12118 /* Address opcode resides at in file space. */
12119 opcode_address = fragP->fr_address + fragP->fr_fix;
12120
12121 /* Displacement from opcode start to fill into instruction. */
12122 displacement_from_opcode_start = target_address - opcode_address;
12123
12124 if ((fragP->fr_subtype & BIG) == 0)
12125 {
12126 /* Don't have to change opcode. */
12127 extension = 1; /* 1 opcode + 1 displacement */
12128 where_to_put_displacement = &opcode[1];
12129 }
12130 else
12131 {
12132 if (no_cond_jump_promotion
12133 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12134 as_warn_where (fragP->fr_file, fragP->fr_line,
12135 _("long jump required"));
12136
12137 switch (fragP->fr_subtype)
12138 {
12139 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12140 extension = 4; /* 1 opcode + 4 displacement */
12141 opcode[0] = 0xe9;
12142 where_to_put_displacement = &opcode[1];
12143 break;
12144
12145 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12146 extension = 2; /* 1 opcode + 2 displacement */
12147 opcode[0] = 0xe9;
12148 where_to_put_displacement = &opcode[1];
12149 break;
12150
12151 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12152 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12153 extension = 5; /* 2 opcode + 4 displacement */
12154 opcode[1] = opcode[0] + 0x10;
12155 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12156 where_to_put_displacement = &opcode[2];
12157 break;
12158
12159 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12160 extension = 3; /* 2 opcode + 2 displacement */
12161 opcode[1] = opcode[0] + 0x10;
12162 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12163 where_to_put_displacement = &opcode[2];
12164 break;
12165
12166 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12167 extension = 4;
12168 opcode[0] ^= 1;
12169 opcode[1] = 3;
12170 opcode[2] = 0xe9;
12171 where_to_put_displacement = &opcode[3];
12172 break;
12173
12174 default:
12175 BAD_CASE (fragP->fr_subtype);
12176 break;
12177 }
12178 }
12179
12180 /* If the size is less than four we are sure that the operand fits,
12181 but if it's 4, then it could be that the displacement is larger
12182 than +/- 2GB. */
12183 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12184 && object_64bit
12185 && ((addressT) (displacement_from_opcode_start - extension
12186 + ((addressT) 1 << 31))
12187 > (((addressT) 2 << 31) - 1)))
12188 {
12189 as_bad_where (fragP->fr_file, fragP->fr_line,
12190 _("jump target out of range"));
12191 /* Make us emit 0. */
12192 displacement_from_opcode_start = extension;
12193 }
12194 /* Now put displacement after opcode. */
12195 md_number_to_chars ((char *) where_to_put_displacement,
12196 (valueT) (displacement_from_opcode_start - extension),
12197 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12198 fragP->fr_fix += extension;
12199 }
12200 \f
12201 /* Apply a fixup (fixP) to segment data, once it has been determined
12202 by our caller that we have all the info we need to fix it up.
12203
12204 Parameter valP is the pointer to the value of the bits.
12205
12206 On the 386, immediates, displacements, and data pointers are all in
12207 the same (little-endian) format, so we don't need to care about which
12208 we are handling. */
12209
12210 void
12211 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12212 {
12213 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12214 valueT value = *valP;
12215
12216 #if !defined (TE_Mach)
12217 if (fixP->fx_pcrel)
12218 {
12219 switch (fixP->fx_r_type)
12220 {
12221 default:
12222 break;
12223
12224 case BFD_RELOC_64:
12225 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12226 break;
12227 case BFD_RELOC_32:
12228 case BFD_RELOC_X86_64_32S:
12229 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12230 break;
12231 case BFD_RELOC_16:
12232 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12233 break;
12234 case BFD_RELOC_8:
12235 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12236 break;
12237 }
12238 }
12239
12240 if (fixP->fx_addsy != NULL
12241 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12242 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12243 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12244 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12245 && !use_rela_relocations)
12246 {
12247 /* This is a hack. There should be a better way to handle this.
12248 This covers for the fact that bfd_install_relocation will
12249 subtract the current location (for partial_inplace, PC relative
12250 relocations); see more below. */
12251 #ifndef OBJ_AOUT
12252 if (IS_ELF
12253 #ifdef TE_PE
12254 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12255 #endif
12256 )
12257 value += fixP->fx_where + fixP->fx_frag->fr_address;
12258 #endif
12259 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12260 if (IS_ELF)
12261 {
12262 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12263
12264 if ((sym_seg == seg
12265 || (symbol_section_p (fixP->fx_addsy)
12266 && sym_seg != absolute_section))
12267 && !generic_force_reloc (fixP))
12268 {
12269 /* Yes, we add the values in twice. This is because
12270 bfd_install_relocation subtracts them out again. I think
12271 bfd_install_relocation is broken, but I don't dare change
12272 it. FIXME. */
12273 value += fixP->fx_where + fixP->fx_frag->fr_address;
12274 }
12275 }
12276 #endif
12277 #if defined (OBJ_COFF) && defined (TE_PE)
12278 /* For some reason, the PE format does not store a
12279 section address offset for a PC relative symbol. */
12280 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12281 || S_IS_WEAK (fixP->fx_addsy))
12282 value += md_pcrel_from (fixP);
12283 #endif
12284 }
12285 #if defined (OBJ_COFF) && defined (TE_PE)
12286 if (fixP->fx_addsy != NULL
12287 && S_IS_WEAK (fixP->fx_addsy)
12288 /* PR 16858: Do not modify weak function references. */
12289 && ! fixP->fx_pcrel)
12290 {
12291 #if !defined (TE_PEP)
12292 /* For x86 PE weak function symbols are neither PC-relative
12293 nor do they set S_IS_FUNCTION. So the only reliable way
12294 to detect them is to check the flags of their containing
12295 section. */
12296 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12297 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12298 ;
12299 else
12300 #endif
12301 value -= S_GET_VALUE (fixP->fx_addsy);
12302 }
12303 #endif
12304
12305 /* Fix a few things - the dynamic linker expects certain values here,
12306 and we must not disappoint it. */
12307 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12308 if (IS_ELF && fixP->fx_addsy)
12309 switch (fixP->fx_r_type)
12310 {
12311 case BFD_RELOC_386_PLT32:
12312 case BFD_RELOC_X86_64_PLT32:
12313 /* Make the jump instruction point to the address of the operand.
12314 At runtime we merely add the offset to the actual PLT entry.
12315 NB: Subtract the offset size only for jump instructions. */
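/* E.g. on x86-64 ELF, "call foo@PLT" is emitted as E8 00 00 00 00
   with an R_X86_64_PLT32 addend of -4 (illustrative), compensating
   for the PC pointing past the 4-byte displacement.  */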
12316 if (fixP->fx_pcrel)
12317 value = -4;
12318 break;
12319
12320 case BFD_RELOC_386_TLS_GD:
12321 case BFD_RELOC_386_TLS_LDM:
12322 case BFD_RELOC_386_TLS_IE_32:
12323 case BFD_RELOC_386_TLS_IE:
12324 case BFD_RELOC_386_TLS_GOTIE:
12325 case BFD_RELOC_386_TLS_GOTDESC:
12326 case BFD_RELOC_X86_64_TLSGD:
12327 case BFD_RELOC_X86_64_TLSLD:
12328 case BFD_RELOC_X86_64_GOTTPOFF:
12329 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12330 value = 0; /* Fully resolved at runtime. No addend. */
12331 /* Fallthrough */
12332 case BFD_RELOC_386_TLS_LE:
12333 case BFD_RELOC_386_TLS_LDO_32:
12334 case BFD_RELOC_386_TLS_LE_32:
12335 case BFD_RELOC_X86_64_DTPOFF32:
12336 case BFD_RELOC_X86_64_DTPOFF64:
12337 case BFD_RELOC_X86_64_TPOFF32:
12338 case BFD_RELOC_X86_64_TPOFF64:
12339 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12340 break;
12341
12342 case BFD_RELOC_386_TLS_DESC_CALL:
12343 case BFD_RELOC_X86_64_TLSDESC_CALL:
12344 value = 0; /* Fully resolved at runtime. No addend. */
12345 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12346 fixP->fx_done = 0;
12347 return;
12348
12349 case BFD_RELOC_VTABLE_INHERIT:
12350 case BFD_RELOC_VTABLE_ENTRY:
12351 fixP->fx_done = 0;
12352 return;
12353
12354 default:
12355 break;
12356 }
12357 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12358 *valP = value;
12359 #endif /* !defined (TE_Mach) */
12360
12361 /* Are we finished with this relocation now? */
12362 if (fixP->fx_addsy == NULL)
12363 fixP->fx_done = 1;
12364 #if defined (OBJ_COFF) && defined (TE_PE)
12365 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12366 {
12367 fixP->fx_done = 0;
12368 /* Remember value for tc_gen_reloc. */
12369 fixP->fx_addnumber = value;
12370 /* Clear out the frag for now. */
12371 value = 0;
12372 }
12373 #endif
12374 else if (use_rela_relocations)
12375 {
12376 fixP->fx_no_overflow = 1;
12377 /* Remember value for tc_gen_reloc. */
12378 fixP->fx_addnumber = value;
12379 value = 0;
12380 }
12381
12382 md_number_to_chars (p, value, fixP->fx_size);
12383 }
12384 \f
12385 const char *
12386 md_atof (int type, char *litP, int *sizeP)
12387 {
12388 /* This outputs the LITTLENUMs in REVERSE order;
12389 in accord with the little-endian 386. */
12390 return ieee_md_atof (type, litP, sizeP, FALSE);
12391 }
12392 \f
12393 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12394
12395 static char *
12396 output_invalid (int c)
12397 {
12398 if (ISPRINT (c))
12399 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12400 "'%c'", c);
12401 else
12402 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12403 "(0x%x)", (unsigned char) c);
12404 return output_invalid_buf;
12405 }
12406
12407 /* Verify that @r can be used in the current context. */
12408
12409 static bfd_boolean check_register (const reg_entry *r)
12410 {
12411 if (allow_pseudo_reg)
12412 return TRUE;
12413
12414 if (operand_type_all_zero (&r->reg_type))
12415 return FALSE;
12416
12417 if ((r->reg_type.bitfield.dword
12418 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12419 || r->reg_type.bitfield.class == RegCR
12420 || r->reg_type.bitfield.class == RegDR)
12421 && !cpu_arch_flags.bitfield.cpui386)
12422 return FALSE;
12423
12424 if (r->reg_type.bitfield.class == RegTR
12425 && (flag_code == CODE_64BIT
12426 || !cpu_arch_flags.bitfield.cpui386
12427 || cpu_arch_isa_flags.bitfield.cpui586
12428 || cpu_arch_isa_flags.bitfield.cpui686))
12429 return FALSE;
12430
12431 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12432 return FALSE;
12433
12434 if (!cpu_arch_flags.bitfield.cpuavx512f)
12435 {
12436 if (r->reg_type.bitfield.zmmword
12437 || r->reg_type.bitfield.class == RegMask)
12438 return FALSE;
12439
12440 if (!cpu_arch_flags.bitfield.cpuavx)
12441 {
12442 if (r->reg_type.bitfield.ymmword)
12443 return FALSE;
12444
12445 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12446 return FALSE;
12447 }
12448 }
12449
12450 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12451 return FALSE;
12452
12453 /* Don't allow the fake index register unless allow_index_reg is nonzero. */
12454 if (!allow_index_reg && r->reg_num == RegIZ)
12455 return FALSE;
12456
12457 /* Upper 16 vector registers are only available with VREX in 64bit
12458 mode, and require EVEX encoding. */
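/* E.g. "%xmm16" is only usable with AVX512F in 64-bit mode and
   forces EVEX encoding (illustrative).  */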
12459 if (r->reg_flags & RegVRex)
12460 {
12461 if (!cpu_arch_flags.bitfield.cpuavx512f
12462 || flag_code != CODE_64BIT)
12463 return FALSE;
12464
12465 if (i.vec_encoding == vex_encoding_default)
12466 i.vec_encoding = vex_encoding_evex;
12467 else if (i.vec_encoding != vex_encoding_evex)
12468 i.vec_encoding = vex_encoding_error;
12469 }
12470
12471 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12472 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12473 && flag_code != CODE_64BIT)
12474 return FALSE;
12475
12476 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12477 && !intel_syntax)
12478 return FALSE;
12479
12480 return TRUE;
12481 }
12482
12483 /* REG_STRING starts *before* REGISTER_PREFIX. */
12484
12485 static const reg_entry *
12486 parse_real_register (char *reg_string, char **end_op)
12487 {
12488 char *s = reg_string;
12489 char *p;
12490 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12491 const reg_entry *r;
12492
12493 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12494 if (*s == REGISTER_PREFIX)
12495 ++s;
12496
12497 if (is_space_char (*s))
12498 ++s;
12499
12500 p = reg_name_given;
12501 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12502 {
12503 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12504 return (const reg_entry *) NULL;
12505 s++;
12506 }
12507
12508 /* For naked regs, make sure that we are not dealing with an identifier.
12509 This prevents confusing an identifier like `eax_var' with register
12510 `eax'. */
12511 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12512 return (const reg_entry *) NULL;
12513
12514 *end_op = s;
12515
12516 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12517
12518 /* Handle floating point regs, allowing spaces in the (i) part. */
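/* E.g. both "%st(3)" and "%st ( 3 )" resolve to st(3)
   (illustrative).  */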
12519 if (r == i386_regtab /* %st is first entry of table */)
12520 {
12521 if (!cpu_arch_flags.bitfield.cpu8087
12522 && !cpu_arch_flags.bitfield.cpu287
12523 && !cpu_arch_flags.bitfield.cpu387
12524 && !allow_pseudo_reg)
12525 return (const reg_entry *) NULL;
12526
12527 if (is_space_char (*s))
12528 ++s;
12529 if (*s == '(')
12530 {
12531 ++s;
12532 if (is_space_char (*s))
12533 ++s;
12534 if (*s >= '0' && *s <= '7')
12535 {
12536 int fpr = *s - '0';
12537 ++s;
12538 if (is_space_char (*s))
12539 ++s;
12540 if (*s == ')')
12541 {
12542 *end_op = s + 1;
12543 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
12544 know (r);
12545 return r + fpr;
12546 }
12547 }
12548 /* We have "%st(" then garbage. */
12549 return (const reg_entry *) NULL;
12550 }
12551 }
12552
12553 return r && check_register (r) ? r : NULL;
12554 }
12555
12556 /* REG_STRING starts *before* REGISTER_PREFIX. */
12557
12558 static const reg_entry *
12559 parse_register (char *reg_string, char **end_op)
12560 {
12561 const reg_entry *r;
12562
12563 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12564 r = parse_real_register (reg_string, end_op);
12565 else
12566 r = NULL;
12567 if (!r)
12568 {
12569 char *save = input_line_pointer;
12570 char c;
12571 symbolS *symbolP;
12572
12573 input_line_pointer = reg_string;
12574 c = get_symbol_name (&reg_string);
12575 symbolP = symbol_find (reg_string);
12576 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12577 {
12578 const expressionS *e = symbol_get_value_expression (symbolP);
12579
12580 know (e->X_op == O_register);
12581 know (e->X_add_number >= 0
12582 && (valueT) e->X_add_number < i386_regtab_size);
12583 r = i386_regtab + e->X_add_number;
12584 if (!check_register (r))
12585 {
12586 as_bad (_("register '%s%s' cannot be used here"),
12587 register_prefix, r->reg_name);
12588 r = &bad_reg;
12589 }
12590 *end_op = input_line_pointer;
12591 }
12592 *input_line_pointer = c;
12593 input_line_pointer = save;
12594 }
12595 return r;
12596 }
12597
12598 int
12599 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12600 {
12601 const reg_entry *r;
12602 char *end = input_line_pointer;
12603
12604 *end = *nextcharP;
12605 r = parse_register (name, &input_line_pointer);
12606 if (r && end <= input_line_pointer)
12607 {
12608 *nextcharP = *input_line_pointer;
12609 *input_line_pointer = 0;
12610 if (r != &bad_reg)
12611 {
12612 e->X_op = O_register;
12613 e->X_add_number = r - i386_regtab;
12614 }
12615 else
12616 e->X_op = O_illegal;
12617 return 1;
12618 }
12619 input_line_pointer = end;
12620 *end = 0;
12621 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12622 }
12623
12624 void
12625 md_operand (expressionS *e)
12626 {
12627 char *end;
12628 const reg_entry *r;
12629
12630 switch (*input_line_pointer)
12631 {
12632 case REGISTER_PREFIX:
12633 r = parse_real_register (input_line_pointer, &end);
12634 if (r)
12635 {
12636 e->X_op = O_register;
12637 e->X_add_number = r - i386_regtab;
12638 input_line_pointer = end;
12639 }
12640 break;
12641
12642 case '[':
12643 gas_assert (intel_syntax);
12644 end = input_line_pointer++;
12645 expression (e);
12646 if (*input_line_pointer == ']')
12647 {
12648 ++input_line_pointer;
12649 e->X_op_symbol = make_expr_symbol (e);
12650 e->X_add_symbol = NULL;
12651 e->X_add_number = 0;
12652 e->X_op = O_index;
12653 }
12654 else
12655 {
12656 e->X_op = O_absent;
12657 input_line_pointer = end;
12658 }
12659 break;
12660 }
12661 }
12662
12663 \f
12664 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12665 const char *md_shortopts = "kVQ:sqnO::";
12666 #else
12667 const char *md_shortopts = "qnO::";
12668 #endif
12669
12670 #define OPTION_32 (OPTION_MD_BASE + 0)
12671 #define OPTION_64 (OPTION_MD_BASE + 1)
12672 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12673 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12674 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12675 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12676 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12677 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12678 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12679 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12680 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12681 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12682 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12683 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12684 #define OPTION_X32 (OPTION_MD_BASE + 14)
12685 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12686 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12687 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12688 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12689 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12690 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12691 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12692 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12693 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12694 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12695 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12696 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12697 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12698 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12699 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12700 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12701 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12702 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12703 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12704
12705 struct option md_longopts[] =
12706 {
12707 {"32", no_argument, NULL, OPTION_32},
12708 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12709 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12710 {"64", no_argument, NULL, OPTION_64},
12711 #endif
12712 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12713 {"x32", no_argument, NULL, OPTION_X32},
12714 {"mshared", no_argument, NULL, OPTION_MSHARED},
12715 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12716 #endif
12717 {"divide", no_argument, NULL, OPTION_DIVIDE},
12718 {"march", required_argument, NULL, OPTION_MARCH},
12719 {"mtune", required_argument, NULL, OPTION_MTUNE},
12720 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12721 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12722 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12723 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12724 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12725 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12726 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12727 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12728 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12729 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12730 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12731 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12732 # if defined (TE_PE) || defined (TE_PEP)
12733 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12734 #endif
12735 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12736 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12737 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12738 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12739 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12740 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12741 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12742 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12743 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12744 {"mlfence-before-indirect-branch", required_argument, NULL,
12745 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12746 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12747 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12748 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12749 {NULL, no_argument, NULL, 0}
12750 };
12751 size_t md_longopts_size = sizeof (md_longopts);
12752
12753 int
12754 md_parse_option (int c, const char *arg)
12755 {
12756 unsigned int j;
12757 char *arch, *next, *saved, *type;
12758
12759 switch (c)
12760 {
12761 case 'n':
12762 optimize_align_code = 0;
12763 break;
12764
12765 case 'q':
12766 quiet_warnings = 1;
12767 break;
12768
12769 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12770 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12771 should be emitted or not. FIXME: Not implemented. */
12772 case 'Q':
12773 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12774 return 0;
12775 break;
12776
12777 /* -V: SVR4 argument to print version ID. */
12778 case 'V':
12779 print_version_id ();
12780 break;
12781
12782 /* -k: Ignore for FreeBSD compatibility. */
12783 case 'k':
12784 break;
12785
12786 case 's':
12787 /* -s: On i386 Solaris, this tells the native assembler to use
12788 .stab instead of .stab.excl. We always use .stab anyhow. */
12789 break;
12790
12791 case OPTION_MSHARED:
12792 shared = 1;
12793 break;
12794
12795 case OPTION_X86_USED_NOTE:
12796 if (strcasecmp (arg, "yes") == 0)
12797 x86_used_note = 1;
12798 else if (strcasecmp (arg, "no") == 0)
12799 x86_used_note = 0;
12800 else
12801 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12802 break;
12803
12804
12805 #endif
12806 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12807 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12808 case OPTION_64:
12809 {
12810 const char **list, **l;
12811
12812 list = bfd_target_list ();
12813 for (l = list; *l != NULL; l++)
12814 if (CONST_STRNEQ (*l, "elf64-x86-64")
12815 || strcmp (*l, "coff-x86-64") == 0
12816 || strcmp (*l, "pe-x86-64") == 0
12817 || strcmp (*l, "pei-x86-64") == 0
12818 || strcmp (*l, "mach-o-x86-64") == 0)
12819 {
12820 default_arch = "x86_64";
12821 break;
12822 }
12823 if (*l == NULL)
12824 as_fatal (_("no compiled in support for x86_64"));
12825 free (list);
12826 }
12827 break;
12828 #endif
12829
12830 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12831 case OPTION_X32:
12832 if (IS_ELF)
12833 {
12834 const char **list, **l;
12835
12836 list = bfd_target_list ();
12837 for (l = list; *l != NULL; l++)
12838 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12839 {
12840 default_arch = "x86_64:32";
12841 break;
12842 }
12843 if (*l == NULL)
12844 as_fatal (_("no compiled in support for 32bit x86_64"));
12845 free (list);
12846 }
12847 else
12848 as_fatal (_("32bit x86_64 is only supported for ELF"));
12849 break;
12850 #endif
12851
12852 case OPTION_32:
12853 default_arch = "i386";
12854 break;
12855
12856 case OPTION_DIVIDE:
12857 #ifdef SVR4_COMMENT_CHARS
12858 {
12859 char *n, *t;
12860 const char *s;
12861
12862 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12863 t = n;
12864 for (s = i386_comment_chars; *s != '\0'; s++)
12865 if (*s != '/')
12866 *t++ = *s;
12867 *t = '\0';
12868 i386_comment_chars = n;
12869 }
12870 #endif
12871 break;
12872
12873 case OPTION_MARCH:
12874 saved = xstrdup (arg);
12875 arch = saved;
12876 /* Allow -march=+nosse. */
12877 if (*arch == '+')
12878 arch++;
12879 do
12880 {
12881 if (*arch == '.')
12882 as_fatal (_("invalid -march= option: `%s'"), arg);
12883 next = strchr (arch, '+');
12884 if (next)
12885 *next++ = '\0';
12886 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12887 {
12888 if (strcmp (arch, cpu_arch [j].name) == 0)
12889 {
12890 /* Processor. */
12891 if (! cpu_arch[j].flags.bitfield.cpui386)
12892 continue;
12893
12894 cpu_arch_name = cpu_arch[j].name;
12895 cpu_sub_arch_name = NULL;
12896 cpu_arch_flags = cpu_arch[j].flags;
12897 cpu_arch_isa = cpu_arch[j].type;
12898 cpu_arch_isa_flags = cpu_arch[j].flags;
12899 if (!cpu_arch_tune_set)
12900 {
12901 cpu_arch_tune = cpu_arch_isa;
12902 cpu_arch_tune_flags = cpu_arch_isa_flags;
12903 }
12904 break;
12905 }
12906 else if (*cpu_arch [j].name == '.'
12907 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12908 {
12909 /* ISA extension. */
12910 i386_cpu_flags flags;
12911
12912 flags = cpu_flags_or (cpu_arch_flags,
12913 cpu_arch[j].flags);
12914
12915 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12916 {
12917 if (cpu_sub_arch_name)
12918 {
12919 char *name = cpu_sub_arch_name;
12920 cpu_sub_arch_name = concat (name,
12921 cpu_arch[j].name,
12922 (const char *) NULL);
12923 free (name);
12924 }
12925 else
12926 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12927 cpu_arch_flags = flags;
12928 cpu_arch_isa_flags = flags;
12929 }
12930 else
12931 cpu_arch_isa_flags
12932 = cpu_flags_or (cpu_arch_isa_flags,
12933 cpu_arch[j].flags);
12934 break;
12935 }
12936 }
12937
12938 if (j >= ARRAY_SIZE (cpu_arch))
12939 {
12940 /* Disable an ISA extension. */
12941 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12942 if (strcmp (arch, cpu_noarch [j].name) == 0)
12943 {
12944 i386_cpu_flags flags;
12945
12946 flags = cpu_flags_and_not (cpu_arch_flags,
12947 cpu_noarch[j].flags);
12948 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12949 {
12950 if (cpu_sub_arch_name)
12951 {
12952 char *name = cpu_sub_arch_name;
12953 cpu_sub_arch_name = concat (arch,
12954 (const char *) NULL);
12955 free (name);
12956 }
12957 else
12958 cpu_sub_arch_name = xstrdup (arch);
12959 cpu_arch_flags = flags;
12960 cpu_arch_isa_flags = flags;
12961 }
12962 break;
12963 }
12964
12965 if (j >= ARRAY_SIZE (cpu_noarch))
12966 j = ARRAY_SIZE (cpu_arch);
12967 }
12968
12969 if (j >= ARRAY_SIZE (cpu_arch))
12970 as_fatal (_("invalid -march= option: `%s'"), arg);
12971
12972 arch = next;
12973 }
12974 while (next != NULL);
12975 free (saved);
12976 break;
12977
12978 case OPTION_MTUNE:
12979 if (*arg == '.')
12980 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12981 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12982 {
12983 if (strcmp (arg, cpu_arch [j].name) == 0)
12984 {
12985 cpu_arch_tune_set = 1;
12986 cpu_arch_tune = cpu_arch [j].type;
12987 cpu_arch_tune_flags = cpu_arch[j].flags;
12988 break;
12989 }
12990 }
12991 if (j >= ARRAY_SIZE (cpu_arch))
12992 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12993 break;
12994
12995 case OPTION_MMNEMONIC:
12996 if (strcasecmp (arg, "att") == 0)
12997 intel_mnemonic = 0;
12998 else if (strcasecmp (arg, "intel") == 0)
12999 intel_mnemonic = 1;
13000 else
13001 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13002 break;
13003
13004 case OPTION_MSYNTAX:
13005 if (strcasecmp (arg, "att") == 0)
13006 intel_syntax = 0;
13007 else if (strcasecmp (arg, "intel") == 0)
13008 intel_syntax = 1;
13009 else
13010 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13011 break;
13012
13013 case OPTION_MINDEX_REG:
13014 allow_index_reg = 1;
13015 break;
13016
13017 case OPTION_MNAKED_REG:
13018 allow_naked_reg = 1;
13019 break;
13020
13021 case OPTION_MSSE2AVX:
13022 sse2avx = 1;
13023 break;
13024
13025 case OPTION_MSSE_CHECK:
13026 if (strcasecmp (arg, "error") == 0)
13027 sse_check = check_error;
13028 else if (strcasecmp (arg, "warning") == 0)
13029 sse_check = check_warning;
13030 else if (strcasecmp (arg, "none") == 0)
13031 sse_check = check_none;
13032 else
13033 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13034 break;
13035
13036 case OPTION_MOPERAND_CHECK:
13037 if (strcasecmp (arg, "error") == 0)
13038 operand_check = check_error;
13039 else if (strcasecmp (arg, "warning") == 0)
13040 operand_check = check_warning;
13041 else if (strcasecmp (arg, "none") == 0)
13042 operand_check = check_none;
13043 else
13044 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13045 break;
13046
13047 case OPTION_MAVXSCALAR:
13048 if (strcasecmp (arg, "128") == 0)
13049 avxscalar = vex128;
13050 else if (strcasecmp (arg, "256") == 0)
13051 avxscalar = vex256;
13052 else
13053 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13054 break;
13055
13056 case OPTION_MVEXWIG:
13057 if (strcmp (arg, "0") == 0)
13058 vexwig = vexw0;
13059 else if (strcmp (arg, "1") == 0)
13060 vexwig = vexw1;
13061 else
13062 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13063 break;
13064
13065 case OPTION_MADD_BND_PREFIX:
13066 add_bnd_prefix = 1;
13067 break;
13068
13069 case OPTION_MEVEXLIG:
13070 if (strcmp (arg, "128") == 0)
13071 evexlig = evexl128;
13072 else if (strcmp (arg, "256") == 0)
13073 evexlig = evexl256;
13074 else if (strcmp (arg, "512") == 0)
13075 evexlig = evexl512;
13076 else
13077 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13078 break;
13079
13080 case OPTION_MEVEXRCIG:
13081 if (strcmp (arg, "rne") == 0)
13082 evexrcig = rne;
13083 else if (strcmp (arg, "rd") == 0)
13084 evexrcig = rd;
13085 else if (strcmp (arg, "ru") == 0)
13086 evexrcig = ru;
13087 else if (strcmp (arg, "rz") == 0)
13088 evexrcig = rz;
13089 else
13090 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13091 break;
13092
13093 case OPTION_MEVEXWIG:
13094 if (strcmp (arg, "0") == 0)
13095 evexwig = evexw0;
13096 else if (strcmp (arg, "1") == 0)
13097 evexwig = evexw1;
13098 else
13099 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13100 break;
13101
13102 # if defined (TE_PE) || defined (TE_PEP)
13103 case OPTION_MBIG_OBJ:
13104 use_big_obj = 1;
13105 break;
13106 #endif
13107
13108 case OPTION_MOMIT_LOCK_PREFIX:
13109 if (strcasecmp (arg, "yes") == 0)
13110 omit_lock_prefix = 1;
13111 else if (strcasecmp (arg, "no") == 0)
13112 omit_lock_prefix = 0;
13113 else
13114 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13115 break;
13116
13117 case OPTION_MFENCE_AS_LOCK_ADD:
13118 if (strcasecmp (arg, "yes") == 0)
13119 avoid_fence = 1;
13120 else if (strcasecmp (arg, "no") == 0)
13121 avoid_fence = 0;
13122 else
13123 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13124 break;
13125
13126 case OPTION_MLFENCE_AFTER_LOAD:
13127 if (strcasecmp (arg, "yes") == 0)
13128 lfence_after_load = 1;
13129 else if (strcasecmp (arg, "no") == 0)
13130 lfence_after_load = 0;
13131 else
13132 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13133 break;
13134
13135 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13136 if (strcasecmp (arg, "all") == 0)
13137 {
13138 lfence_before_indirect_branch = lfence_branch_all;
13139 if (lfence_before_ret == lfence_before_ret_none)
13140 lfence_before_ret = lfence_before_ret_shl;
13141 }
13142 else if (strcasecmp (arg, "memory") == 0)
13143 lfence_before_indirect_branch = lfence_branch_memory;
13144 else if (strcasecmp (arg, "register") == 0)
13145 lfence_before_indirect_branch = lfence_branch_register;
13146 else if (strcasecmp (arg, "none") == 0)
13147 lfence_before_indirect_branch = lfence_branch_none;
13148 else
13149 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13150 arg);
13151 break;
13152
13153 case OPTION_MLFENCE_BEFORE_RET:
13154 if (strcasecmp (arg, "or") == 0)
13155 lfence_before_ret = lfence_before_ret_or;
13156 else if (strcasecmp (arg, "not") == 0)
13157 lfence_before_ret = lfence_before_ret_not;
13158 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13159 lfence_before_ret = lfence_before_ret_shl;
13160 else if (strcasecmp (arg, "none") == 0)
13161 lfence_before_ret = lfence_before_ret_none;
13162 else
13163 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13164 arg);
13165 break;
13166
13167 case OPTION_MRELAX_RELOCATIONS:
13168 if (strcasecmp (arg, "yes") == 0)
13169 generate_relax_relocations = 1;
13170 else if (strcasecmp (arg, "no") == 0)
13171 generate_relax_relocations = 0;
13172 else
13173 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13174 break;
13175
13176 case OPTION_MALIGN_BRANCH_BOUNDARY:
13177 {
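/* E.g. -malign-branch-boundary=32 accepts the power of two 32
   and sets align_branch_power to 5 (illustrative).  */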
13178 char *end;
13179 long int align = strtoul (arg, &end, 0);
13180 if (*end == '\0')
13181 {
13182 if (align == 0)
13183 {
13184 align_branch_power = 0;
13185 break;
13186 }
13187 else if (align >= 16)
13188 {
13189 int align_power;
13190 for (align_power = 0;
13191 (align & 1) == 0;
13192 align >>= 1, align_power++)
13193 continue;
13194 /* Limit alignment power to 31. */
13195 if (align == 1 && align_power < 32)
13196 {
13197 align_branch_power = align_power;
13198 break;
13199 }
13200 }
13201 }
13202 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13203 }
13204 break;
13205
13206 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13207 {
13208 char *end;
13209 int align = strtoul (arg, &end, 0);
13210 /* Some processors only support 5 prefixes. */
13211 if (*end == '\0' && align >= 0 && align < 6)
13212 {
13213 align_branch_prefix_size = align;
13214 break;
13215 }
13216 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13217 arg);
13218 }
13219 break;
13220
13221 case OPTION_MALIGN_BRANCH:
13222 align_branch = 0;
13223 saved = xstrdup (arg);
13224 type = saved;
13225 do
13226 {
13227 next = strchr (type, '+');
13228 if (next)
13229 *next++ = '\0';
13230 if (strcasecmp (type, "jcc") == 0)
13231 align_branch |= align_branch_jcc_bit;
13232 else if (strcasecmp (type, "fused") == 0)
13233 align_branch |= align_branch_fused_bit;
13234 else if (strcasecmp (type, "jmp") == 0)
13235 align_branch |= align_branch_jmp_bit;
13236 else if (strcasecmp (type, "call") == 0)
13237 align_branch |= align_branch_call_bit;
13238 else if (strcasecmp (type, "ret") == 0)
13239 align_branch |= align_branch_ret_bit;
13240 else if (strcasecmp (type, "indirect") == 0)
13241 align_branch |= align_branch_indirect_bit;
13242 else
13243 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13244 type = next;
13245 }
13246 while (next != NULL);
13247 free (saved);
13248 break;
13249
13250 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13251 align_branch_power = 5;
13252 align_branch_prefix_size = 5;
13253 align_branch = (align_branch_jcc_bit
13254 | align_branch_fused_bit
13255 | align_branch_jmp_bit);
13256 break;
13257
13258 case OPTION_MAMD64:
13259 isa64 = amd64;
13260 break;
13261
13262 case OPTION_MINTEL64:
13263 isa64 = intel64;
13264 break;
13265
13266 case 'O':
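/* E.g. plain -O enables the default optimization, -O2 sets
   optimize to 2, and -Os optimizes for code size (illustrative).  */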
13267 if (arg == NULL)
13268 {
13269 optimize = 1;
13270 /* Turn off -Os. */
13271 optimize_for_space = 0;
13272 }
13273 else if (*arg == 's')
13274 {
13275 optimize_for_space = 1;
13276 /* Turn on all encoding optimizations. */
13277 optimize = INT_MAX;
13278 }
13279 else
13280 {
13281 optimize = atoi (arg);
13282 /* Turn off -Os. */
13283 optimize_for_space = 0;
13284 }
13285 break;
13286
13287 default:
13288 return 0;
13289 }
13290 return 1;
13291 }
13292
13293 #define MESSAGE_TEMPLATE \
13294 " "
13295
13296 static char *
13297 output_message (FILE *stream, char *p, char *message, char *start,
13298 int *left_p, const char *name, int len)
13299 {
13300 int size = sizeof (MESSAGE_TEMPLATE);
13301 int left = *left_p;
13302
13303 /* Reserve 2 spaces for ", " or ",\0" */
13304 left -= len + 2;
13305
13306 /* Check if there is any room. */
13307 if (left >= 0)
13308 {
13309 if (p != start)
13310 {
13311 *p++ = ',';
13312 *p++ = ' ';
13313 }
13314 p = mempcpy (p, name, len);
13315 }
13316 else
13317 {
13318 /* Output the current message now and start a new one. */
13319 *p++ = ',';
13320 *p = '\0';
13321 fprintf (stream, "%s\n", message);
13322 p = start;
13323 left = size - (start - message) - len - 2;
13324
13325 gas_assert (left >= 0);
13326
13327 p = mempcpy (p, name, len);
13328 }
13329
13330 *left_p = left;
13331 return p;
13332 }
13333
13334 static void
13335 show_arch (FILE *stream, int ext, int check)
13336 {
13337 static char message[] = MESSAGE_TEMPLATE;
13338 char *start = message + 27;
13339 char *p;
13340 int size = sizeof (MESSAGE_TEMPLATE);
13341 int left;
13342 const char *name;
13343 int len;
13344 unsigned int j;
13345
13346 p = start;
13347 left = size - (start - message);
13348 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13349 {
13350 /* Should it be skipped? */
13351 if (cpu_arch [j].skip)
13352 continue;
13353
13354 name = cpu_arch [j].name;
13355 len = cpu_arch [j].len;
13356 if (*name == '.')
13357 {
13358 /* It is an extension. Skip if we aren't asked to show it. */
13359 if (ext)
13360 {
13361 name++;
13362 len--;
13363 }
13364 else
13365 continue;
13366 }
13367 else if (ext)
13368 {
13369 /* It is a processor. Skip if we only show extensions. */
13370 continue;
13371 }
13372 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13373 {
13374 /* It is an impossible processor; skip it. */
13375 continue;
13376 }
13377
13378 p = output_message (stream, p, message, start, &left, name, len);
13379 }
13380
13381 /* Display disabled extensions. */
13382 if (ext)
13383 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13384 {
13385 name = cpu_noarch [j].name;
13386 len = cpu_noarch [j].len;
13387 p = output_message (stream, p, message, start, &left, name,
13388 len);
13389 }
13390
13391 *p = '\0';
13392 fprintf (stream, "%s\n", message);
13393 }
13394
13395 void
13396 md_show_usage (FILE *stream)
13397 {
13398 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13399 fprintf (stream, _("\
13400 -Qy, -Qn ignored\n\
13401 -V print assembler version number\n\
13402 -k ignored\n"));
13403 #endif
13404 fprintf (stream, _("\
13405 -n Do not optimize code alignment\n\
13406 -q quieten some warnings\n"));
13407 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13408 fprintf (stream, _("\
13409 -s ignored\n"));
13410 #endif
13411 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13412 || defined (TE_PE) || defined (TE_PEP))
13413 fprintf (stream, _("\
13414 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13415 #endif
13416 #ifdef SVR4_COMMENT_CHARS
13417 fprintf (stream, _("\
13418 --divide do not treat `/' as a comment character\n"));
13419 #else
13420 fprintf (stream, _("\
13421 --divide ignored\n"));
13422 #endif
13423 fprintf (stream, _("\
13424 -march=CPU[,+EXTENSION...]\n\
13425 generate code for CPU and EXTENSION, CPU is one of:\n"));
13426 show_arch (stream, 0, 1);
13427 fprintf (stream, _("\
13428 EXTENSION is combination of:\n"));
13429 show_arch (stream, 1, 0);
13430 fprintf (stream, _("\
13431 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13432 show_arch (stream, 0, 0);
13433 fprintf (stream, _("\
13434 -msse2avx encode SSE instructions with VEX prefix\n"));
13435 fprintf (stream, _("\
13436 -msse-check=[none|error|warning] (default: warning)\n\
13437 check SSE instructions\n"));
13438 fprintf (stream, _("\
13439 -moperand-check=[none|error|warning] (default: warning)\n\
13440 check operand combinations for validity\n"));
13441 fprintf (stream, _("\
13442 -mavxscalar=[128|256] (default: 128)\n\
13443 encode scalar AVX instructions with specific vector\n\
13444 length\n"));
13445 fprintf (stream, _("\
13446 -mvexwig=[0|1] (default: 0)\n\
13447 encode VEX instructions with specific VEX.W value\n\
13448 for VEX.W bit ignored instructions\n"));
13449 fprintf (stream, _("\
13450 -mevexlig=[128|256|512] (default: 128)\n\
13451 encode scalar EVEX instructions with specific vector\n\
13452 length\n"));
13453 fprintf (stream, _("\
13454 -mevexwig=[0|1] (default: 0)\n\
13455 encode EVEX instructions with specific EVEX.W value\n\
13456 for EVEX.W bit ignored instructions\n"));
13457 fprintf (stream, _("\
13458 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13459 encode EVEX instructions with specific EVEX.RC value\n\
13460 for SAE-only ignored instructions\n"));
13461 fprintf (stream, _("\
13462 -mmnemonic=[att|intel] "));
13463 if (SYSV386_COMPAT)
13464 fprintf (stream, _("(default: att)\n"));
13465 else
13466 fprintf (stream, _("(default: intel)\n"));
13467 fprintf (stream, _("\
13468 use AT&T/Intel mnemonic\n"));
13469 fprintf (stream, _("\
13470 -msyntax=[att|intel] (default: att)\n\
13471 use AT&T/Intel syntax\n"));
13472 fprintf (stream, _("\
13473 -mindex-reg support pseudo index registers\n"));
13474 fprintf (stream, _("\
13475 -mnaked-reg don't require `%%' prefix for registers\n"));
13476 fprintf (stream, _("\
13477 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13478 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13479 fprintf (stream, _("\
13480 -mshared disable branch optimization for shared code\n"));
13481 fprintf (stream, _("\
13482 -mx86-used-note=[no|yes] "));
13483 if (DEFAULT_X86_USED_NOTE)
13484 fprintf (stream, _("(default: yes)\n"));
13485 else
13486 fprintf (stream, _("(default: no)\n"));
13487 fprintf (stream, _("\
13488 generate x86 used ISA and feature properties\n"));
13489 #endif
13490 #if defined (TE_PE) || defined (TE_PEP)
13491 fprintf (stream, _("\
13492 -mbig-obj generate big object files\n"));
13493 #endif
13494 fprintf (stream, _("\
13495 -momit-lock-prefix=[no|yes] (default: no)\n\
13496 strip all lock prefixes\n"));
13497 fprintf (stream, _("\
13498 -mfence-as-lock-add=[no|yes] (default: no)\n\
13499 encode lfence, mfence and sfence as\n\
13500 lock addl $0x0, (%%{re}sp)\n"));
13501 fprintf (stream, _("\
13502 -mrelax-relocations=[no|yes] "));
13503 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13504 fprintf (stream, _("(default: yes)\n"));
13505 else
13506 fprintf (stream, _("(default: no)\n"));
13507 fprintf (stream, _("\
13508 generate relax relocations\n"));
13509 fprintf (stream, _("\
13510 -malign-branch-boundary=NUM (default: 0)\n\
13511 align branches within a NUM-byte boundary\n"));
13512 fprintf (stream, _("\
13513 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13514 TYPE is a combination of jcc, fused, jmp, call, ret,\
13515 indirect\n\
13516 specify types of branches to align\n"));
13517 fprintf (stream, _("\
13518 -malign-branch-prefix-size=NUM (default: 5)\n\
13519 align branches with NUM prefixes per instruction\n"));
13520 fprintf (stream, _("\
13521 -mbranches-within-32B-boundaries\n\
13522 align branches within a 32-byte boundary\n"));
13523 fprintf (stream, _("\
13524 -mlfence-after-load=[no|yes] (default: no)\n\
13525 generate lfence after load\n"));
13526 fprintf (stream, _("\
13527 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13528 generate lfence before indirect near branch\n"));
13529 fprintf (stream, _("\
13530 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13531 generate lfence before ret\n"));
13532 fprintf (stream, _("\
13533 -mamd64 accept only AMD64 ISA [default]\n"));
13534 fprintf (stream, _("\
13535 -mintel64 accept only Intel64 ISA\n"));
13536 }
13537
13538 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13539 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13540 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13541
13542 /* Pick the target format to use. */
13543
13544 const char *
13545 i386_target_format (void)
13546 {
13547 if (!strncmp (default_arch, "x86_64", 6))
13548 {
13549 update_code_flag (CODE_64BIT, 1);
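      /* Anything longer than the matched "x86_64" prefix (presumably the
	 spelling installed for --x32) selects the ILP32 variant of the
	 64-bit ABI below.  */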
13550 if (default_arch[6] == '\0')
13551 x86_elf_abi = X86_64_ABI;
13552 else
13553 x86_elf_abi = X86_64_X32_ABI;
13554 }
13555 else if (!strcmp (default_arch, "i386"))
13556 update_code_flag (CODE_32BIT, 1);
13557 else if (!strcmp (default_arch, "iamcu"))
13558 {
13559 update_code_flag (CODE_32BIT, 1);
13560 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13561 {
13562 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13563 cpu_arch_name = "iamcu";
13564 cpu_sub_arch_name = NULL;
13565 cpu_arch_flags = iamcu_flags;
13566 cpu_arch_isa = PROCESSOR_IAMCU;
13567 cpu_arch_isa_flags = iamcu_flags;
13568 if (!cpu_arch_tune_set)
13569 {
13570 cpu_arch_tune = cpu_arch_isa;
13571 cpu_arch_tune_flags = cpu_arch_isa_flags;
13572 }
13573 }
13574 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13575 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13576 cpu_arch_name);
13577 }
13578 else
13579 as_fatal (_("unknown architecture"));
13580
13581 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13582 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13583 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13584 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13585
13586 switch (OUTPUT_FLAVOR)
13587 {
13588 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13589 case bfd_target_aout_flavour:
13590 return AOUT_TARGET_FORMAT;
13591 #endif
13592 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13593 # if defined (TE_PE) || defined (TE_PEP)
13594 case bfd_target_coff_flavour:
13595 if (flag_code == CODE_64BIT)
13596 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13597 else
13598 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13599 # elif defined (TE_GO32)
13600 case bfd_target_coff_flavour:
13601 return "coff-go32";
13602 # else
13603 case bfd_target_coff_flavour:
13604 return "coff-i386";
13605 # endif
13606 #endif
13607 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13608 case bfd_target_elf_flavour:
13609 {
13610 const char *format;
13611
13612 switch (x86_elf_abi)
13613 {
13614 default:
13615 format = ELF_TARGET_FORMAT;
13616 #ifndef TE_SOLARIS
13617 tls_get_addr = "___tls_get_addr";
13618 #endif
13619 break;
13620 case X86_64_ABI:
13621 use_rela_relocations = 1;
13622 object_64bit = 1;
13623 #ifndef TE_SOLARIS
13624 tls_get_addr = "__tls_get_addr";
13625 #endif
13626 format = ELF_TARGET_FORMAT64;
13627 break;
13628 case X86_64_X32_ABI:
13629 use_rela_relocations = 1;
13630 object_64bit = 1;
13631 #ifndef TE_SOLARIS
13632 tls_get_addr = "__tls_get_addr";
13633 #endif
13634 disallow_64bit_reloc = 1;
13635 format = ELF_TARGET_FORMAT32;
13636 break;
13637 }
13638 if (cpu_arch_isa == PROCESSOR_L1OM)
13639 {
13640 if (x86_elf_abi != X86_64_ABI)
13641 as_fatal (_("Intel L1OM is 64bit only"));
13642 return ELF_TARGET_L1OM_FORMAT;
13643 }
13644 else if (cpu_arch_isa == PROCESSOR_K1OM)
13645 {
13646 if (x86_elf_abi != X86_64_ABI)
13647 as_fatal (_("Intel K1OM is 64bit only"));
13648 return ELF_TARGET_K1OM_FORMAT;
13649 }
13650 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13651 {
13652 if (x86_elf_abi != I386_ABI)
13653 as_fatal (_("Intel MCU is 32bit only"));
13654 return ELF_TARGET_IAMCU_FORMAT;
13655 }
13656 else
13657 return format;
13658 }
13659 #endif
13660 #if defined (OBJ_MACH_O)
13661 case bfd_target_mach_o_flavour:
13662 if (flag_code == CODE_64BIT)
13663 {
13664 use_rela_relocations = 1;
13665 object_64bit = 1;
13666 return "mach-o-x86-64";
13667 }
13668 else
13669 return "mach-o-i386";
13670 #endif
13671 default:
13672 abort ();
13673 return NULL;
13674 }
13675 }
13676
13677 #endif /* OBJ_MAYBE_ more than one */
13678 \f
13679 symbolS *
13680 md_undefined_symbol (char *name)
13681 {
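  /* Fast path: compare the first three characters by hand before paying
     for a full strcmp against GLOBAL_OFFSET_TABLE_NAME.  */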
13682 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13683 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13684 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13685 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13686 {
13687 if (!GOT_symbol)
13688 {
13689 if (symbol_find (name))
13690 as_bad (_("GOT already in symbol table"));
13691 GOT_symbol = symbol_new (name, undefined_section,
13692 (valueT) 0, &zero_address_frag);
13693 }
13694 return GOT_symbol;
13695 }
13696 return 0;
13697 }
13698
13699 /* Round up a section size to the appropriate boundary. */
13700
13701 valueT
13702 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13703 {
13704 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13705 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13706 {
13707 /* For a.out, force the section size to be aligned. If we don't do
13708 this, BFD will align it for us, but it will not write out the
13709 final bytes of the section. This may be a bug in BFD, but it is
13710 easier to fix it here since that is how the other a.out targets
13711 work. */
13712 int align;
13713
13714 align = bfd_section_alignment (segment);
13715 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
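      /* Illustrative example: with align == 4, i.e. a 16-byte boundary,
	 a size of 0x123 becomes (0x123 + 15) & ~15 == 0x130.  */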
13716 }
13717 #endif
13718
13719 return size;
13720 }
13721
13722 /* On the i386, PC-relative offsets are relative to the start of the
13723 next instruction. That is, the address of the offset, plus its
13724 size, since the offset is always the last part of the insn. */
13725
13726 long
13727 md_pcrel_from (fixS *fixP)
13728 {
13729 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13730 }
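/* Illustrative example (not from the original source): for a 5-byte
   "call rel32" (e8 xx xx xx xx) whose opcode byte starts the frag at
   0x1000, the rel32 field sits at fr_address + fx_where == 0x1001 and
   fx_size is 4, so md_pcrel_from returns 0x1005 -- the address of the
   next instruction, which is the base the CPU adds rel32 to.  */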
13731
13732 #ifndef I386COFF
13733
13734 static void
13735 s_bss (int ignore ATTRIBUTE_UNUSED)
13736 {
13737 int temp;
13738
13739 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13740 if (IS_ELF)
13741 obj_elf_section_change_hook ();
13742 #endif
13743 temp = get_absolute_expression ();
13744 subseg_set (bss_section, (subsegT) temp);
13745 demand_empty_rest_of_line ();
13746 }
13747
13748 #endif
13749
13750 /* Remember constant directive. */
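/* A constant directive in a code section is recorded in last_insn so the
   branch-alignment and lfence passes can see that the emitted bytes are
   data rather than an instruction; as the warnings below note, the
   -mlfence-before-ret and -mlfence-before-indirect-branch mitigations
   are not applied across such a directive.  */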
13751
13752 void
13753 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13754 {
13755 if (last_insn.kind != last_insn_directive
13756 && (bfd_section_flags (now_seg) & SEC_CODE))
13757 {
13758 last_insn.seg = now_seg;
13759 last_insn.kind = last_insn_directive;
13760 last_insn.name = "constant directive";
13761 last_insn.file = as_where (&last_insn.line);
13762 if (lfence_before_ret != lfence_before_ret_none)
13763 {
13764 if (lfence_before_indirect_branch != lfence_branch_none)
13765 as_warn (_("constant directive skips -mlfence-before-ret "
13766 "and -mlfence-before-indirect-branch"));
13767 else
13768 as_warn (_("constant directive skips -mlfence-before-ret"));
13769 }
13770 else if (lfence_before_indirect_branch != lfence_branch_none)
13771 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13772 }
13773 }
13774
13775 void
13776 i386_validate_fix (fixS *fixp)
13777 {
13778 if (fixp->fx_subsy)
13779 {
13780 if (fixp->fx_subsy == GOT_symbol)
13781 {
13782 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13783 {
13784 if (!object_64bit)
13785 abort ();
13786 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13787 if (fixp->fx_tcbit2)
13788 fixp->fx_r_type = (fixp->fx_tcbit
13789 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13790 : BFD_RELOC_X86_64_GOTPCRELX);
13791 else
13792 #endif
13793 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13794 }
13795 else
13796 {
13797 if (!object_64bit)
13798 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13799 else
13800 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13801 }
13802 fixp->fx_subsy = 0;
13803 }
13804 }
13805 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13806 else if (!object_64bit)
13807 {
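      /* Assumption (fx_tcbit2 is set elsewhere during encoding): it marks
	 GOT loads that the linker may relax, which GOT32X advertises.  */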
13808 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13809 && fixp->fx_tcbit2)
13810 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13811 }
13812 #endif
13813 }
13814
13815 arelent *
13816 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13817 {
13818 arelent *rel;
13819 bfd_reloc_code_real_type code;
13820
13821 switch (fixp->fx_r_type)
13822 {
13823 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13824 case BFD_RELOC_SIZE32:
13825 case BFD_RELOC_SIZE64:
13826 if (S_IS_DEFINED (fixp->fx_addsy)
13827 && !S_IS_EXTERNAL (fixp->fx_addsy))
13828 {
13829 /* Resolve size relocation against local symbol to size of
13830 the symbol plus addend. */
13831 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13832 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13833 && !fits_in_unsigned_long (value))
13834 as_bad_where (fixp->fx_file, fixp->fx_line,
13835 _("symbol size computation overflow"));
13836 fixp->fx_addsy = NULL;
13837 fixp->fx_subsy = NULL;
13838 md_apply_fix (fixp, (valueT *) &value, NULL);
13839 return NULL;
13840 }
13841 #endif
13842 /* Fall through. */
13843
13844 case BFD_RELOC_X86_64_PLT32:
13845 case BFD_RELOC_X86_64_GOT32:
13846 case BFD_RELOC_X86_64_GOTPCREL:
13847 case BFD_RELOC_X86_64_GOTPCRELX:
13848 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13849 case BFD_RELOC_386_PLT32:
13850 case BFD_RELOC_386_GOT32:
13851 case BFD_RELOC_386_GOT32X:
13852 case BFD_RELOC_386_GOTOFF:
13853 case BFD_RELOC_386_GOTPC:
13854 case BFD_RELOC_386_TLS_GD:
13855 case BFD_RELOC_386_TLS_LDM:
13856 case BFD_RELOC_386_TLS_LDO_32:
13857 case BFD_RELOC_386_TLS_IE_32:
13858 case BFD_RELOC_386_TLS_IE:
13859 case BFD_RELOC_386_TLS_GOTIE:
13860 case BFD_RELOC_386_TLS_LE_32:
13861 case BFD_RELOC_386_TLS_LE:
13862 case BFD_RELOC_386_TLS_GOTDESC:
13863 case BFD_RELOC_386_TLS_DESC_CALL:
13864 case BFD_RELOC_X86_64_TLSGD:
13865 case BFD_RELOC_X86_64_TLSLD:
13866 case BFD_RELOC_X86_64_DTPOFF32:
13867 case BFD_RELOC_X86_64_DTPOFF64:
13868 case BFD_RELOC_X86_64_GOTTPOFF:
13869 case BFD_RELOC_X86_64_TPOFF32:
13870 case BFD_RELOC_X86_64_TPOFF64:
13871 case BFD_RELOC_X86_64_GOTOFF64:
13872 case BFD_RELOC_X86_64_GOTPC32:
13873 case BFD_RELOC_X86_64_GOT64:
13874 case BFD_RELOC_X86_64_GOTPCREL64:
13875 case BFD_RELOC_X86_64_GOTPC64:
13876 case BFD_RELOC_X86_64_GOTPLT64:
13877 case BFD_RELOC_X86_64_PLTOFF64:
13878 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13879 case BFD_RELOC_X86_64_TLSDESC_CALL:
13880 case BFD_RELOC_RVA:
13881 case BFD_RELOC_VTABLE_ENTRY:
13882 case BFD_RELOC_VTABLE_INHERIT:
13883 #ifdef TE_PE
13884 case BFD_RELOC_32_SECREL:
13885 #endif
13886 code = fixp->fx_r_type;
13887 break;
13888 case BFD_RELOC_X86_64_32S:
13889 if (!fixp->fx_pcrel)
13890 {
13891 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13892 code = fixp->fx_r_type;
13893 break;
13894 }
13895 /* Fall through. */
13896 default:
13897 if (fixp->fx_pcrel)
13898 {
13899 switch (fixp->fx_size)
13900 {
13901 default:
13902 as_bad_where (fixp->fx_file, fixp->fx_line,
13903 _("can not do %d byte pc-relative relocation"),
13904 fixp->fx_size);
13905 code = BFD_RELOC_32_PCREL;
13906 break;
13907 case 1: code = BFD_RELOC_8_PCREL; break;
13908 case 2: code = BFD_RELOC_16_PCREL; break;
13909 case 4: code = BFD_RELOC_32_PCREL; break;
13910 #ifdef BFD64
13911 case 8: code = BFD_RELOC_64_PCREL; break;
13912 #endif
13913 }
13914 }
13915 else
13916 {
13917 switch (fixp->fx_size)
13918 {
13919 default:
13920 as_bad_where (fixp->fx_file, fixp->fx_line,
13921 _("can not do %d byte relocation"),
13922 fixp->fx_size);
13923 code = BFD_RELOC_32;
13924 break;
13925 case 1: code = BFD_RELOC_8; break;
13926 case 2: code = BFD_RELOC_16; break;
13927 case 4: code = BFD_RELOC_32; break;
13928 #ifdef BFD64
13929 case 8: code = BFD_RELOC_64; break;
13930 #endif
13931 }
13932 }
13933 break;
13934 }
13935
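  /* A plain 32- or 64-bit reference to _GLOBAL_OFFSET_TABLE_ itself is
     really a request for the displacement of the GOT, so rewrite it as
     the matching GOTPC relocation.  */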
13936 if ((code == BFD_RELOC_32
13937 || code == BFD_RELOC_32_PCREL
13938 || code == BFD_RELOC_X86_64_32S)
13939 && GOT_symbol
13940 && fixp->fx_addsy == GOT_symbol)
13941 {
13942 if (!object_64bit)
13943 code = BFD_RELOC_386_GOTPC;
13944 else
13945 code = BFD_RELOC_X86_64_GOTPC32;
13946 }
13947 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13948 && GOT_symbol
13949 && fixp->fx_addsy == GOT_symbol)
13950 {
13951 code = BFD_RELOC_X86_64_GOTPC64;
13952 }
13953
13954 rel = XNEW (arelent);
13955 rel->sym_ptr_ptr = XNEW (asymbol *);
13956 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13957
13958 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13959
13960 if (!use_rela_relocations)
13961 {
13962 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13963 vtable entry to be used in the relocation's section offset. */
13964 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13965 rel->address = fixp->fx_offset;
13966 #if defined (OBJ_COFF) && defined (TE_PE)
13967 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13968 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13969 else
13970 #endif
13971 rel->addend = 0;
13972 }
13973 /* Use the rela in 64bit mode. */
13974 else
13975 {
13976 if (disallow_64bit_reloc)
13977 switch (code)
13978 {
13979 case BFD_RELOC_X86_64_DTPOFF64:
13980 case BFD_RELOC_X86_64_TPOFF64:
13981 case BFD_RELOC_64_PCREL:
13982 case BFD_RELOC_X86_64_GOTOFF64:
13983 case BFD_RELOC_X86_64_GOT64:
13984 case BFD_RELOC_X86_64_GOTPCREL64:
13985 case BFD_RELOC_X86_64_GOTPC64:
13986 case BFD_RELOC_X86_64_GOTPLT64:
13987 case BFD_RELOC_X86_64_PLTOFF64:
13988 as_bad_where (fixp->fx_file, fixp->fx_line,
13989 _("cannot represent relocation type %s in x32 mode"),
13990 bfd_get_reloc_code_name (code));
13991 break;
13992 default:
13993 break;
13994 }
13995
13996 if (!fixp->fx_pcrel)
13997 rel->addend = fixp->fx_offset;
13998 else
13999 switch (code)
14000 {
14001 case BFD_RELOC_X86_64_PLT32:
14002 case BFD_RELOC_X86_64_GOT32:
14003 case BFD_RELOC_X86_64_GOTPCREL:
14004 case BFD_RELOC_X86_64_GOTPCRELX:
14005 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14006 case BFD_RELOC_X86_64_TLSGD:
14007 case BFD_RELOC_X86_64_TLSLD:
14008 case BFD_RELOC_X86_64_GOTTPOFF:
14009 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14010 case BFD_RELOC_X86_64_TLSDESC_CALL:
14011 rel->addend = fixp->fx_offset - fixp->fx_size;
14012 break;
14013 default:
14014 rel->addend = (section->vma
14015 - fixp->fx_size
14016 + fixp->fx_addnumber
14017 + md_pcrel_from (fixp));
14018 break;
14019 }
14020 }
14021
14022 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14023 if (rel->howto == NULL)
14024 {
14025 as_bad_where (fixp->fx_file, fixp->fx_line,
14026 _("cannot represent relocation type %s"),
14027 bfd_get_reloc_code_name (code));
14028 /* Set howto to a garbage value so that we can keep going. */
14029 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14030 gas_assert (rel->howto != NULL);
14031 }
14032
14033 return rel;
14034 }
14035
14036 #include "tc-i386-intel.c"
14037
14038 void
14039 tc_x86_parse_to_dw2regnum (expressionS *exp)
14040 {
14041 int saved_naked_reg;
14042 char saved_register_dot;
14043
14044 saved_naked_reg = allow_naked_reg;
14045 allow_naked_reg = 1;
14046 saved_register_dot = register_chars['.'];
14047 register_chars['.'] = '.';
14048 allow_pseudo_reg = 1;
14049 expression_and_evaluate (exp);
14050 allow_pseudo_reg = 0;
14051 register_chars['.'] = saved_register_dot;
14052 allow_naked_reg = saved_naked_reg;
14053
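  /* dw2_regnum is indexed by flag_code >> 1; assuming the flag_code enum
     order used earlier in this file (CODE_32BIT, CODE_16BIT, CODE_64BIT),
     16- and 32-bit code share slot 0 and 64-bit code uses slot 1.  */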
14054 if (exp->X_op == O_register && exp->X_add_number >= 0)
14055 {
14056 if ((addressT) exp->X_add_number < i386_regtab_size)
14057 {
14058 exp->X_op = O_constant;
14059 exp->X_add_number = i386_regtab[exp->X_add_number]
14060 .dw2_regnum[flag_code >> 1];
14061 }
14062 else
14063 exp->X_op = O_illegal;
14064 }
14065 }
14066
14067 void
14068 tc_x86_frame_initial_instructions (void)
14069 {
14070 static unsigned int sp_regno[2];
14071
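  /* Determine the DWARF register number of the stack pointer once per
     code model by running the literal register name through the
     dw2regnum parser above.  */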
14072 if (!sp_regno[flag_code >> 1])
14073 {
14074 char *saved_input = input_line_pointer;
14075 char sp[][4] = {"esp", "rsp"};
14076 expressionS exp;
14077
14078 input_line_pointer = sp[flag_code >> 1];
14079 tc_x86_parse_to_dw2regnum (&exp);
14080 gas_assert (exp.X_op == O_constant);
14081 sp_regno[flag_code >> 1] = exp.X_add_number;
14082 input_line_pointer = saved_input;
14083 }
14084
14085 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14086 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14087 }
14088
14089 int
14090 x86_dwarf2_addr_size (void)
14091 {
14092 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14093 if (x86_elf_abi == X86_64_X32_ABI)
14094 return 4;
14095 #endif
14096 return bfd_arch_bits_per_address (stdoutput) / 8;
14097 }
14098
14099 int
14100 i386_elf_section_type (const char *str, size_t len)
14101 {
14102 if (flag_code == CODE_64BIT
14103 && len == sizeof ("unwind") - 1
14104 && strncmp (str, "unwind", 6) == 0)
14105 return SHT_X86_64_UNWIND;
14106
14107 return -1;
14108 }
14109
14110 #ifdef TE_SOLARIS
14111 void
14112 i386_solaris_fix_up_eh_frame (segT sec)
14113 {
14114 if (flag_code == CODE_64BIT)
14115 elf_section_type (sec) = SHT_X86_64_UNWIND;
14116 }
14117 #endif
14118
14119 #ifdef TE_PE
14120 void
14121 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14122 {
14123 expressionS exp;
14124
14125 exp.X_op = O_secrel;
14126 exp.X_add_symbol = symbol;
14127 exp.X_add_number = 0;
14128 emit_expr (&exp, size);
14129 }
14130 #endif
14131
14132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14133 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14134
14135 bfd_vma
14136 x86_64_section_letter (int letter, const char **ptr_msg)
14137 {
14138 if (flag_code == CODE_64BIT)
14139 {
14140 if (letter == 'l')
14141 return SHF_X86_64_LARGE;
14142
14143 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14144 }
14145 else
14146 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14147 return -1;
14148 }
14149
14150 bfd_vma
14151 x86_64_section_word (char *str, size_t len)
14152 {
14153 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14154 return SHF_X86_64_LARGE;
14155
14156 return -1;
14157 }
14158
14159 static void
14160 handle_large_common (int small ATTRIBUTE_UNUSED)
14161 {
14162 if (flag_code != CODE_64BIT)
14163 {
14164 s_comm_internal (0, elf_common_parse);
14165 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14166 }
14167 else
14168 {
14169 static segT lbss_section;
14170 asection *saved_com_section_ptr = elf_com_section_ptr;
14171 asection *saved_bss_section = bss_section;
14172
14173 if (lbss_section == NULL)
14174 {
14175 flagword applicable;
14176 segT seg = now_seg;
14177 subsegT subseg = now_subseg;
14178
14179 /* The .lbss section is for local .largecomm symbols. */
14180 lbss_section = subseg_new (".lbss", 0);
14181 applicable = bfd_applicable_section_flags (stdoutput);
14182 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14183 seg_info (lbss_section)->bss = 1;
14184
14185 subseg_set (seg, subseg);
14186 }
14187
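      /* Temporarily swap in the ELF large-common section and .lbss so
	 that s_comm_internal parses .largecomm exactly like .comm while
	 placing symbols in the large-model sections instead.  */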
14188 elf_com_section_ptr = &_bfd_elf_large_com_section;
14189 bss_section = lbss_section;
14190
14191 s_comm_internal (0, elf_common_parse);
14192
14193 elf_com_section_ptr = saved_com_section_ptr;
14194 bss_section = saved_bss_section;
14195 }
14196 }
14197 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */