gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2020 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef INFER_ADDR_PREFIX
  48 #define INFER_ADDR_PREFIX 1
  49 #endif
  50
  51 #ifndef DEFAULT_ARCH
  52 #define DEFAULT_ARCH "i386"
  53 #endif
  54
  55 #ifndef INLINE
  56 #if __GNUC__ >= 2
  57 #define INLINE __inline__
  58 #else
  59 #define INLINE
  60 #endif
  61 #endif
  62
  63 /* Prefixes will be emitted in the order defined below.
  64    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  65    instruction, and so must come before any prefixes.
  66    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  67    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  68 #define WAIT_PREFIX     0
  69 #define SEG_PREFIX      1
  70 #define ADDR_PREFIX     2
  71 #define DATA_PREFIX     3
  72 #define REP_PREFIX      4
  73 #define HLE_PREFIX      REP_PREFIX
  74 #define BND_PREFIX      REP_PREFIX
  75 #define LOCK_PREFIX     5
  76 #define REX_PREFIX      6       /* must come last.  */
  77 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  78
  79 /* we define the syntax here (modulo base,index,scale syntax) */
  80 #define REGISTER_PREFIX '%'
  81 #define IMMEDIATE_PREFIX '$'
  82 #define ABSOLUTE_PREFIX '*'
  83
  84 /* these are the instruction mnemonic suffixes in AT&T syntax or
  85    memory operand size in Intel syntax.  */
  86 #define WORD_MNEM_SUFFIX  'w'
  87 #define BYTE_MNEM_SUFFIX  'b'
  88 #define SHORT_MNEM_SUFFIX 's'
  89 #define LONG_MNEM_SUFFIX  'l'
  90 #define QWORD_MNEM_SUFFIX  'q'
  91 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  92    in instructions.  */
  93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  94
  95 #define END_OF_INSN '\0'
  96
  97 /* This matches the C -> StaticRounding alias in the opcode table.  */
  98 #define commutative staticrounding
  99
 100 /*
 101   'templates' is for grouping together 'template' structures for opcodes
 102   of the same name.  This is only used for storing the insns in the grand
 103   ole hash table of insns.
 104   The templates themselves start at START and range up to (but not including)
 105   END.
 106   */
 107 typedef struct
 108 {
 109   const insn_template *start;
 110   const insn_template *end;
 111 }
 112 templates;
 113
 114 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 115 typedef struct
 116 {
 117   unsigned int regmem;  /* codes register or memory operand */
 118   unsigned int reg;     /* codes register operand (or extended opcode) */
 119   unsigned int mode;    /* how to interpret regmem & reg */
 120 }
 121 modrm_byte;
 122
 123 /* x86-64 extension prefix.  */
 124 typedef int rex_byte;
 125
 126 /* 386 opcode byte to code indirect addressing.  */
 127 typedef struct
 128 {
 129   unsigned base;
 130   unsigned index;
 131   unsigned scale;
 132 }
 133 sib_byte;
 134
 135 /* x86 arch names, types and features */
 136 typedef struct
 137 {
 138   const char *name;             /* arch name */
 139   unsigned int len;             /* arch string length */
 140   enum processor_type type;     /* arch type */
 141   i386_cpu_flags flags;         /* cpu feature flags */
 142   unsigned int skip;            /* show_arch should skip this. */
 143 }
 144 arch_entry;
 145
 146 /* Used to turn off indicated flags.  */
 147 typedef struct
 148 {
 149   const char *name;             /* arch name */
 150   unsigned int len;             /* arch string length */
 151   i386_cpu_flags flags;         /* cpu feature flags */
 152 }
 153 noarch_entry;
 154
 155 static void update_code_flag (int, int);
 156 static void set_code_flag (int);
 157 static void set_16bit_gcc_code_flag (int);
 158 static void set_intel_syntax (int);
 159 static void set_intel_mnemonic (int);
 160 static void set_allow_index_reg (int);
 161 static void set_check (int);
 162 static void set_cpu_arch (int);
 163 #ifdef TE_PE
 164 static void pe_directive_secrel (int);
 165 #endif
 166 static void signed_cons (int);
 167 static char *output_invalid (int c);
 168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 169                                     const char *);
 170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 171                                        const char *);
 172 static int i386_att_operand (char *);
 173 static int i386_intel_operand (char *, int);
 174 static int i386_intel_simplify (expressionS *);
 175 static int i386_intel_parse_name (const char *, expressionS *);
 176 static const reg_entry *parse_register (char *, char **);
 177 static char *parse_insn (char *, char *);
 178 static char *parse_operands (char *, const char *);
 179 static void swap_operands (void);
 180 static void swap_2_operands (int, int);
 181 static enum flag_code i386_addressing_mode (void);
 182 static void optimize_imm (void);
 183 static void optimize_disp (void);
 184 static const insn_template *match_template (char);
 185 static int check_string (void);
 186 static int process_suffix (void);
 187 static int check_byte_reg (void);
 188 static int check_long_reg (void);
 189 static int check_qword_reg (void);
 190 static int check_word_reg (void);
 191 static int finalize_imm (void);
 192 static int process_operands (void);
 193 static const seg_entry *build_modrm_byte (void);
 194 static void output_insn (void);
 195 static void output_imm (fragS *, offsetT);
 196 static void output_disp (fragS *, offsetT);
 197 #ifndef I386COFF
 198 static void s_bss (int);
 199 #endif
 200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 202
 203 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 204 static unsigned int x86_isa_1_used;
 205 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 206 static unsigned int x86_feature_2_used;
 207 /* Generate x86 used ISA and feature properties.  */
 208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 209 #endif
 210
 211 static const char *default_arch = DEFAULT_ARCH;
 212
 213 /* parse_register() returns this when a register alias cannot be used.  */
 214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
 215                                    { Dw2Inval, Dw2Inval } };
 216
 217 /* This struct describes rounding control and SAE in the instruction.  */
 218 struct RC_Operation
 219 {
 220   enum rc_type
 221     {
 222       rne = 0,
 223       rd,
 224       ru,
 225       rz,
 226       saeonly
 227     } type;
 228   int operand;
 229 };
 230
 231 static struct RC_Operation rc_op;
 232
 233 /* The struct describes masking, applied to OPERAND in the instruction.
 234    MASK is a pointer to the corresponding mask register.  ZEROING tells
 235    whether merging or zeroing mask is used.  */
 236 struct Mask_Operation
 237 {
 238   const reg_entry *mask;
 239   unsigned int zeroing;
 240   /* The operand where this operation is associated.  */
 241   int operand;
 242 };
 243
 244 static struct Mask_Operation mask_op;
 245
 246 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 247    broadcast factor.  */
 248 struct Broadcast_Operation
 249 {
 250   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 251   int type;
 252
 253   /* Index of broadcasted operand.  */
 254   int operand;
 255
 256   /* Number of bytes to broadcast.  */
 257   int bytes;
 258 };
 259
 260 static struct Broadcast_Operation broadcast_op;
 261
 262 /* VEX prefix.  */
 263 typedef struct
 264 {
 265   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 266   unsigned char bytes[4];
 267   unsigned int length;
 268   /* Destination or source register specifier.  */
 269   const reg_entry *register_specifier;
 270 } vex_prefix;
 271
 272 /* 'md_assemble ()' gathers together information and puts it into a
 273    i386_insn.  */
 274
 275 union i386_op
 276   {
 277     expressionS *disps;
 278     expressionS *imms;
 279     const reg_entry *regs;
 280   };
 281
 282 enum i386_error
 283   {
 284     operand_size_mismatch,
 285     operand_type_mismatch,
 286     register_type_mismatch,
 287     number_of_operands_mismatch,
 288     invalid_instruction_suffix,
 289     bad_imm4,
 290     unsupported_with_intel_mnemonic,
 291     unsupported_syntax,
 292     unsupported,
 293     invalid_vsib_address,
 294     invalid_vector_register_set,
 295     unsupported_vector_index_register,
 296     unsupported_broadcast,
 297     broadcast_needed,
 298     unsupported_masking,
 299     mask_not_on_destination,
 300     no_default_mask,
 301     unsupported_rc_sae,
 302     rc_sae_operand_not_last_imm,
 303     invalid_register_operand,
 304   };
 305
 306 struct _i386_insn
 307   {
 308     /* TM holds the template for the insn were currently assembling.  */
 309     insn_template tm;
 310
 311     /* SUFFIX holds the instruction size suffix for byte, word, dword
 312        or qword, if given.  */
 313     char suffix;
 314
 315     /* OPERANDS gives the number of given operands.  */
 316     unsigned int operands;
 317
 318     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 319        of given register, displacement, memory operands and immediate
 320        operands.  */
 321     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 322
 323     /* TYPES [i] is the type (see above #defines) which tells us how to
 324        use OP[i] for the corresponding operand.  */
 325     i386_operand_type types[MAX_OPERANDS];
 326
 327     /* Displacement expression, immediate expression, or register for each
 328        operand.  */
 329     union i386_op op[MAX_OPERANDS];
 330
 331     /* Flags for operands.  */
 332     unsigned int flags[MAX_OPERANDS];
 333 #define Operand_PCrel 1
 334 #define Operand_Mem   2
 335
 336     /* Relocation type for operand */
 337     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 338
 339     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 340        the base index byte below.  */
 341     const reg_entry *base_reg;
 342     const reg_entry *index_reg;
 343     unsigned int log2_scale_factor;
 344
 345     /* SEG gives the seg_entries of this insn.  They are zero unless
 346        explicit segment overrides are given.  */
 347     const seg_entry *seg[2];
 348
 349     /* Copied first memory operand string, for re-checking.  */
 350     char *memop1_string;
 351
 352     /* PREFIX holds all the given prefix opcodes (usually null).
 353        PREFIXES is the number of prefix opcodes.  */
 354     unsigned int prefixes;
 355     unsigned char prefix[MAX_PREFIXES];
 356
 357     /* Register is in low 3 bits of opcode.  */
 358     bfd_boolean short_form;
 359
 360     /* The operand to a branch insn indicates an absolute branch.  */
 361     bfd_boolean jumpabsolute;
 362
 363     /* Has MMX register operands.  */
 364     bfd_boolean has_regmmx;
 365
 366     /* Has XMM register operands.  */
 367     bfd_boolean has_regxmm;
 368
 369     /* Has YMM register operands.  */
 370     bfd_boolean has_regymm;
 371
 372     /* Has ZMM register operands.  */
 373     bfd_boolean has_regzmm;
 374
 375     /* Has GOTPC or TLS relocation.  */
 376     bfd_boolean has_gotpc_tls_reloc;
 377
 378     /* RM and SIB are the modrm byte and the sib byte where the
 379        addressing modes of this insn are encoded.  */
 380     modrm_byte rm;
 381     rex_byte rex;
 382     rex_byte vrex;
 383     sib_byte sib;
 384     vex_prefix vex;
 385
 386     /* Masking attributes.  */
 387     struct Mask_Operation *mask;
 388
 389     /* Rounding control and SAE attributes.  */
 390     struct RC_Operation *rounding;
 391
 392     /* Broadcasting attributes.  */
 393     struct Broadcast_Operation *broadcast;
 394
 395     /* Compressed disp8*N attribute.  */
 396     unsigned int memshift;
 397
 398     /* Prefer load or store in encoding.  */
 399     enum
 400       {
 401         dir_encoding_default = 0,
 402         dir_encoding_load,
 403         dir_encoding_store,
 404         dir_encoding_swap
 405       } dir_encoding;
 406
 407     /* Prefer 8bit or 32bit displacement in encoding.  */
 408     enum
 409       {
 410         disp_encoding_default = 0,
 411         disp_encoding_8bit,
 412         disp_encoding_32bit
 413       } disp_encoding;
 414
 415     /* Prefer the REX byte in encoding.  */
 416     bfd_boolean rex_encoding;
 417
 418     /* Disable instruction size optimization.  */
 419     bfd_boolean no_optimize;
 420
 421     /* How to encode vector instructions.  */
 422     enum
 423       {
 424         vex_encoding_default = 0,
 425         vex_encoding_vex,
 426         vex_encoding_vex3,
 427         vex_encoding_evex,
 428         vex_encoding_error
 429       } vec_encoding;
 430
 431     /* REP prefix.  */
 432     const char *rep_prefix;
 433
 434     /* HLE prefix.  */
 435     const char *hle_prefix;
 436
 437     /* Have BND prefix.  */
 438     const char *bnd_prefix;
 439
 440     /* Have NOTRACK prefix.  */
 441     const char *notrack_prefix;
 442
 443     /* Error message.  */
 444     enum i386_error error;
 445   };
 446
 447 typedef struct _i386_insn i386_insn;
 448
 449 /* Link RC type with corresponding string, that'll be looked for in
 450    asm.  */
 451 struct RC_name
 452 {
 453   enum rc_type type;
 454   const char *name;
 455   unsigned int len;
 456 };
 457
 458 static const struct RC_name RC_NamesTable[] =
 459 {
 460   {  rne, STRING_COMMA_LEN ("rn-sae") },
 461   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 462   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 463   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 464   {  saeonly,  STRING_COMMA_LEN ("sae") },
 465 };
 466
 467 /* List of chars besides those in app.c:symbol_chars that can start an
 468    operand.  Used to prevent the scrubber eating vital white-space.  */
 469 const char extra_symbol_chars[] = "*%-([{}"
 470 #ifdef LEX_AT
 471         "@"
 472 #endif
 473 #ifdef LEX_QM
 474         "?"
 475 #endif
 476         ;
 477
 478 #if (defined (TE_I386AIX)                               \
 479      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 480          && !defined (TE_GNU)                           \
 481          && !defined (TE_LINUX)                         \
 482          && !defined (TE_NACL)                          \
 483          && !defined (TE_FreeBSD)                       \
 484          && !defined (TE_DragonFly)                     \
 485          && !defined (TE_NetBSD)))
 486 /* This array holds the chars that always start a comment.  If the
 487    pre-processor is disabled, these aren't very useful.  The option
 488    --divide will remove '/' from this list.  */
 489 const char *i386_comment_chars = "#/";
 490 #define SVR4_COMMENT_CHARS 1
 491 #define PREFIX_SEPARATOR '\\'
 492
 493 #else
 494 const char *i386_comment_chars = "#";
 495 #define PREFIX_SEPARATOR '/'
 496 #endif
 497
 498 /* This array holds the chars that only start a comment at the beginning of
 499    a line.  If the line seems to have the form '# 123 filename'
 500    .line and .file directives will appear in the pre-processed output.
 501    Note that input_file.c hand checks for '#' at the beginning of the
 502    first line of the input file.  This is because the compiler outputs
 503    #NO_APP at the beginning of its output.
 504    Also note that comments started like this one will always work if
 505    '/' isn't otherwise defined.  */
 506 const char line_comment_chars[] = "#/";
 507
 508 const char line_separator_chars[] = ";";
 509
 510 /* Chars that can be used to separate mant from exp in floating point
 511    nums.  */
 512 const char EXP_CHARS[] = "eE";
 513
 514 /* Chars that mean this number is a floating point constant
 515    As in 0f12.456
 516    or    0d1.2345e12.  */
 517 const char FLT_CHARS[] = "fFdDxX";
 518
 519 /* Tables for lexical analysis.  */
 520 static char mnemonic_chars[256];
 521 static char register_chars[256];
 522 static char operand_chars[256];
 523 static char identifier_chars[256];
 524 static char digit_chars[256];
 525
 526 /* Lexical macros.  */
 527 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 528 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 529 #define is_register_char(x) (register_chars[(unsigned char) x])
 530 #define is_space_char(x) ((x) == ' ')
 531 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 532 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 533
 534 /* All non-digit non-letter characters that may occur in an operand.  */
 535 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 536
 537 /* md_assemble() always leaves the strings it's passed unaltered.  To
 538    effect this we maintain a stack of saved characters that we've smashed
 539    with '\0's (indicating end of strings for various sub-fields of the
 540    assembler instruction).  */
 541 static char save_stack[32];
 542 static char *save_stack_p;
 543 #define END_STRING_AND_SAVE(s) \
 544         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 545 #define RESTORE_END_STRING(s) \
 546         do { *(s) = *--save_stack_p; } while (0)
 547
 548 /* The instruction we're assembling.  */
 549 static i386_insn i;
 550
 551 /* Possible templates for current insn.  */
 552 static const templates *current_templates;
 553
 554 /* Per instruction expressionS buffers: max displacements & immediates.  */
 555 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 556 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 557
 558 /* Current operand we are working on.  */
 559 static int this_operand = -1;
 560
 561 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 562    these.  */
 563
 564 enum flag_code {
 565         CODE_32BIT,
 566         CODE_16BIT,
 567         CODE_64BIT };
 568
 569 static enum flag_code flag_code;
 570 static unsigned int object_64bit;
 571 static unsigned int disallow_64bit_reloc;
 572 static int use_rela_relocations = 0;
 573 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 574 static const char *tls_get_addr;
 575
 576 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 577      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 578      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 579
 580 /* The ELF ABI to use.  */
 581 enum x86_elf_abi
 582 {
 583   I386_ABI,
 584   X86_64_ABI,
 585   X86_64_X32_ABI
 586 };
 587
 588 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 589 #endif
 590
 591 #if defined (TE_PE) || defined (TE_PEP)
 592 /* Use big object file format.  */
 593 static int use_big_obj = 0;
 594 #endif
 595
 596 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 597 /* 1 if generating code for a shared library.  */
 598 static int shared = 0;
 599 #endif
 600
 601 /* 1 for intel syntax,
 602    0 if att syntax.  */
 603 static int intel_syntax = 0;
 604
 605 static enum x86_64_isa
 606 {
 607   amd64 = 1,    /* AMD64 ISA.  */
 608   intel64       /* Intel64 ISA.  */
 609 } isa64;
 610
 611 /* 1 for intel mnemonic,
 612    0 if att mnemonic.  */
 613 static int intel_mnemonic = !SYSV386_COMPAT;
 614
 615 /* 1 if pseudo registers are permitted.  */
 616 static int allow_pseudo_reg = 0;
 617
 618 /* 1 if register prefix % not required.  */
 619 static int allow_naked_reg = 0;
 620
 621 /* 1 if the assembler should add BND prefix for all control-transferring
 622    instructions supporting it, even if this prefix wasn't specified
 623    explicitly.  */
 624 static int add_bnd_prefix = 0;
 625
 626 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 627 static int allow_index_reg = 0;
 628
 629 /* 1 if the assembler should ignore LOCK prefix, even if it was
 630    specified explicitly.  */
 631 static int omit_lock_prefix = 0;
 632
 633 /* 1 if the assembler should encode lfence, mfence, and sfence as
 634    "lock addl $0, (%{re}sp)".  */
 635 static int avoid_fence = 0;
 636
 637 /* 1 if lfence should be inserted after every load.  */
 638 static int lfence_after_load = 0;
 639
 640 /* Non-zero if lfence should be inserted before indirect branch.  */
 641 static enum lfence_before_indirect_branch_kind
 642   {
 643     lfence_branch_none = 0,
 644     lfence_branch_register,
 645     lfence_branch_memory,
 646     lfence_branch_all
 647   }
 648 lfence_before_indirect_branch;
 649
 650 /* Non-zero if lfence should be inserted before ret.  */
 651 static enum lfence_before_ret_kind
 652   {
 653     lfence_before_ret_none = 0,
 654     lfence_before_ret_not,
 655     lfence_before_ret_or,
 656     lfence_before_ret_shl
 657   }
 658 lfence_before_ret;
 659
 660 /* Types of previous instruction is .byte or prefix.  */
 661 static struct
 662   {
 663     segT seg;
 664     const char *file;
 665     const char *name;
 666     unsigned int line;
 667     enum last_insn_kind
 668       {
 669         last_insn_other = 0,
 670         last_insn_directive,
 671         last_insn_prefix
 672       } kind;
 673   } last_insn;
 674
 675 /* 1 if the assembler should generate relax relocations.  */
 676
 677 static int generate_relax_relocations
 678   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 679
 680 static enum check_kind
 681   {
 682     check_none = 0,
 683     check_warning,
 684     check_error
 685   }
 686 sse_check, operand_check = check_warning;
 687
 688 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 689 static int align_branch_power = 0;
 690
 691 /* Types of branches to align.  */
 692 enum align_branch_kind
 693   {
 694     align_branch_none = 0,
 695     align_branch_jcc = 1,
 696     align_branch_fused = 2,
 697     align_branch_jmp = 3,
 698     align_branch_call = 4,
 699     align_branch_indirect = 5,
 700     align_branch_ret = 6
 701   };
 702
 703 /* Type bits of branches to align.  */
 704 enum align_branch_bit
 705   {
 706     align_branch_jcc_bit = 1 << align_branch_jcc,
 707     align_branch_fused_bit = 1 << align_branch_fused,
 708     align_branch_jmp_bit = 1 << align_branch_jmp,
 709     align_branch_call_bit = 1 << align_branch_call,
 710     align_branch_indirect_bit = 1 << align_branch_indirect,
 711     align_branch_ret_bit = 1 << align_branch_ret
 712   };
 713
 714 static unsigned int align_branch = (align_branch_jcc_bit
 715                                     | align_branch_fused_bit
 716                                     | align_branch_jmp_bit);
 717
 718 /* Types of condition jump used by macro-fusion.  */
 719 enum mf_jcc_kind
 720   {
 721     mf_jcc_jo = 0,  /* base opcode 0x70  */
 722     mf_jcc_jc,      /* base opcode 0x72  */
 723     mf_jcc_je,      /* base opcode 0x74  */
 724     mf_jcc_jna,     /* base opcode 0x76  */
 725     mf_jcc_js,      /* base opcode 0x78  */
 726     mf_jcc_jp,      /* base opcode 0x7a  */
 727     mf_jcc_jl,      /* base opcode 0x7c  */
 728     mf_jcc_jle,     /* base opcode 0x7e  */
 729   };
 730
 731 /* Types of compare flag-modifying insntructions used by macro-fusion.  */
 732 enum mf_cmp_kind
 733   {
 734     mf_cmp_test_and,  /* test/cmp */
 735     mf_cmp_alu_cmp,  /* add/sub/cmp */
 736     mf_cmp_incdec  /* inc/dec */
 737   };
 738
 739 /* The maximum padding size for fused jcc.  CMP like instruction can
 740    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 741    prefixes.   */
 742 #define MAX_FUSED_JCC_PADDING_SIZE 20
 743
 744 /* The maximum number of prefixes added for an instruction.  */
 745 static unsigned int align_branch_prefix_size = 5;
 746
 747 /* Optimization:
 748    1. Clear the REX_W bit with register operand if possible.
 749    2. Above plus use 128bit vector instruction to clear the full vector
 750       register.
 751  */
 752 static int optimize = 0;
 753
 754 /* Optimization:
 755    1. Clear the REX_W bit with register operand if possible.
 756    2. Above plus use 128bit vector instruction to clear the full vector
 757       register.
 758    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 759       "testb $imm7,%r8".
 760  */
 761 static int optimize_for_space = 0;
 762
 763 /* Register prefix used for error message.  */
 764 static const char *register_prefix = "%";
 765
 766 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 767    leave, push, and pop instructions so that gcc has the same stack
 768    frame as in 32 bit mode.  */
 769 static char stackop_size = '\0';
 770
 771 /* Non-zero to optimize code alignment.  */
 772 int optimize_align_code = 1;
 773
 774 /* Non-zero to quieten some warnings.  */
 775 static int quiet_warnings = 0;
 776
 777 /* CPU name.  */
 778 static const char *cpu_arch_name = NULL;
 779 static char *cpu_sub_arch_name = NULL;
 780
 781 /* CPU feature flags.  */
 782 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 783
 784 /* If we have selected a cpu we are generating instructions for.  */
 785 static int cpu_arch_tune_set = 0;
 786
 787 /* Cpu we are generating instructions for.  */
 788 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 789
 790 /* CPU feature flags of cpu we are generating instructions for.  */
 791 static i386_cpu_flags cpu_arch_tune_flags;
 792
 793 /* CPU instruction set architecture used.  */
 794 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 795
 796 /* CPU feature flags of instruction set architecture used.  */
 797 i386_cpu_flags cpu_arch_isa_flags;
 798
 799 /* If set, conditional jumps are not automatically promoted to handle
 800    larger than a byte offset.  */
 801 static unsigned int no_cond_jump_promotion = 0;
 802
 803 /* Encode SSE instructions with VEX prefix.  */
 804 static unsigned int sse2avx;
 805
 806 /* Encode scalar AVX instructions with specific vector length.  */
 807 static enum
 808   {
 809     vex128 = 0,
 810     vex256
 811   } avxscalar;
 812
 813 /* Encode VEX WIG instructions with specific vex.w.  */
 814 static enum
 815   {
 816     vexw0 = 0,
 817     vexw1
 818   } vexwig;
 819
 820 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 821 static enum
 822   {
 823     evexl128 = 0,
 824     evexl256,
 825     evexl512
 826   } evexlig;
 827
 828 /* Encode EVEX WIG instructions with specific evex.w.  */
 829 static enum
 830   {
 831     evexw0 = 0,
 832     evexw1
 833   } evexwig;
 834
 835 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 836 static enum rc_type evexrcig = rne;
 837
 838 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 839 static symbolS *GOT_symbol;
 840
 841 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 842 unsigned int x86_dwarf2_return_column;
 843
 844 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 845 int x86_cie_data_alignment;
 846
 847 /* Interface to relax_segment.
 848    There are 3 major relax states for 386 jump insns because the
 849    different types of jumps add different sizes to frags when we're
 850    figuring out what sort of jump to choose to reach a given label.
 851
 852    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 853    branches which are handled by md_estimate_size_before_relax() and
 854    i386_generic_table_relax_frag().  */
 855
 856 /* Types.  */
 857 #define UNCOND_JUMP 0
 858 #define COND_JUMP 1
 859 #define COND_JUMP86 2
 860 #define BRANCH_PADDING 3
 861 #define BRANCH_PREFIX 4
 862 #define FUSED_JCC_PADDING 5
 863
 864 /* Sizes.  */
 865 #define CODE16  1
 866 #define SMALL   0
 867 #define SMALL16 (SMALL | CODE16)
 868 #define BIG     2
 869 #define BIG16   (BIG | CODE16)
 870
 871 #ifndef INLINE
 872 #ifdef __GNUC__
 873 #define INLINE __inline__
 874 #else
 875 #define INLINE
 876 #endif
 877 #endif
 878
 879 #define ENCODE_RELAX_STATE(type, size) \
 880   ((relax_substateT) (((type) << 2) | (size)))
 881 #define TYPE_FROM_RELAX_STATE(s) \
 882   ((s) >> 2)
 883 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 884     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 885
 886 /* This table is used by relax_frag to promote short jumps to long
 887    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 888    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 889    don't allow a short jump in a 32 bit code segment to be promoted to
 890    a 16 bit offset jump because it's slower (requires data size
 891    prefix), and doesn't work, unless the destination is in the bottom
 892    64k of the code segment (The top 16 bits of eip are zeroed).  */
 893
 894 const relax_typeS md_relax_table[] =
 895 {
 896   /* The fields are:
 897      1) most positive reach of this state,
 898      2) most negative reach of this state,
 899      3) how many bytes this mode will have in the variable part of the frag
 900      4) which index into the table to try if we can't fit into this one.  */
 901
 902   /* UNCOND_JUMP states.  */
 903   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 904   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 905   /* dword jmp adds 4 bytes to frag:
 906      0 extra opcode bytes, 4 displacement bytes.  */
 907   {0, 0, 4, 0},
 908   /* word jmp adds 2 byte2 to frag:
 909      0 extra opcode bytes, 2 displacement bytes.  */
 910   {0, 0, 2, 0},
 911
 912   /* COND_JUMP states.  */
 913   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 914   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 915   /* dword conditionals adds 5 bytes to frag:
 916      1 extra opcode byte, 4 displacement bytes.  */
 917   {0, 0, 5, 0},
 918   /* word conditionals add 3 bytes to frag:
 919      1 extra opcode byte, 2 displacement bytes.  */
 920   {0, 0, 3, 0},
 921
 922   /* COND_JUMP86 states.  */
 923   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 924   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 925   /* dword conditionals adds 5 bytes to frag:
 926      1 extra opcode byte, 4 displacement bytes.  */
 927   {0, 0, 5, 0},
 928   /* word conditionals add 4 bytes to frag:
 929      1 displacement byte and a 3 byte long branch insn.  */
 930   {0, 0, 4, 0}
 931 };
 932
 933 static const arch_entry cpu_arch[] =
 934 {
 935   /* Do not replace the first two entries - i386_target_format()
 936      relies on them being there in this order.  */
 937   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 938     CPU_GENERIC32_FLAGS, 0 },
 939   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 940     CPU_GENERIC64_FLAGS, 0 },
 941   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 942     CPU_NONE_FLAGS, 0 },
 943   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 944     CPU_I186_FLAGS, 0 },
 945   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 946     CPU_I286_FLAGS, 0 },
 947   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 948     CPU_I386_FLAGS, 0 },
 949   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 950     CPU_I486_FLAGS, 0 },
 951   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 952     CPU_I586_FLAGS, 0 },
 953   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 954     CPU_I686_FLAGS, 0 },
 955   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 956     CPU_I586_FLAGS, 0 },
 957   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 958     CPU_PENTIUMPRO_FLAGS, 0 },
 959   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 960     CPU_P2_FLAGS, 0 },
 961   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 962     CPU_P3_FLAGS, 0 },
 963   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 964     CPU_P4_FLAGS, 0 },
 965   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 966     CPU_CORE_FLAGS, 0 },
 967   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 968     CPU_NOCONA_FLAGS, 0 },
 969   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 970     CPU_CORE_FLAGS, 1 },
 971   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 972     CPU_CORE_FLAGS, 0 },
 973   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 974     CPU_CORE2_FLAGS, 1 },
 975   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 976     CPU_CORE2_FLAGS, 0 },
 977   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 978     CPU_COREI7_FLAGS, 0 },
 979   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 980     CPU_L1OM_FLAGS, 0 },
 981   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 982     CPU_K1OM_FLAGS, 0 },
 983   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 984     CPU_IAMCU_FLAGS, 0 },
 985   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 986     CPU_K6_FLAGS, 0 },
 987   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 988     CPU_K6_2_FLAGS, 0 },
 989   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 990     CPU_ATHLON_FLAGS, 0 },
 991   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 992     CPU_K8_FLAGS, 1 },
 993   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 994     CPU_K8_FLAGS, 0 },
 995   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 996     CPU_K8_FLAGS, 0 },
 997   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 998     CPU_AMDFAM10_FLAGS, 0 },
 999   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1000     CPU_BDVER1_FLAGS, 0 },
1001   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1002     CPU_BDVER2_FLAGS, 0 },
1003   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1004     CPU_BDVER3_FLAGS, 0 },
1005   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1006     CPU_BDVER4_FLAGS, 0 },
1007   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1008     CPU_ZNVER1_FLAGS, 0 },
1009   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1010     CPU_ZNVER2_FLAGS, 0 },
1011   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1012     CPU_BTVER1_FLAGS, 0 },
1013   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1014     CPU_BTVER2_FLAGS, 0 },
1015   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1016     CPU_8087_FLAGS, 0 },
1017   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1018     CPU_287_FLAGS, 0 },
1019   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1020     CPU_387_FLAGS, 0 },
1021   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1022     CPU_687_FLAGS, 0 },
1023   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1024     CPU_CMOV_FLAGS, 0 },
1025   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1026     CPU_FXSR_FLAGS, 0 },
1027   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1028     CPU_MMX_FLAGS, 0 },
1029   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1030     CPU_SSE_FLAGS, 0 },
1031   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1032     CPU_SSE2_FLAGS, 0 },
1033   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1034     CPU_SSE3_FLAGS, 0 },
1035   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1036     CPU_SSE4A_FLAGS, 0 },
1037   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1038     CPU_SSSE3_FLAGS, 0 },
1039   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1040     CPU_SSE4_1_FLAGS, 0 },
1041   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1042     CPU_SSE4_2_FLAGS, 0 },
1043   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1044     CPU_SSE4_2_FLAGS, 0 },
1045   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1046     CPU_AVX_FLAGS, 0 },
1047   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1048     CPU_AVX2_FLAGS, 0 },
1049   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1050     CPU_AVX512F_FLAGS, 0 },
1051   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1052     CPU_AVX512CD_FLAGS, 0 },
1053   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1054     CPU_AVX512ER_FLAGS, 0 },
1055   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1056     CPU_AVX512PF_FLAGS, 0 },
1057   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1058     CPU_AVX512DQ_FLAGS, 0 },
1059   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1060     CPU_AVX512BW_FLAGS, 0 },
1061   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1062     CPU_AVX512VL_FLAGS, 0 },
1063   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1064     CPU_VMX_FLAGS, 0 },
1065   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1066     CPU_VMFUNC_FLAGS, 0 },
1067   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1068     CPU_SMX_FLAGS, 0 },
1069   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1070     CPU_XSAVE_FLAGS, 0 },
1071   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1072     CPU_XSAVEOPT_FLAGS, 0 },
1073   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1074     CPU_XSAVEC_FLAGS, 0 },
1075   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1076     CPU_XSAVES_FLAGS, 0 },
1077   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1078     CPU_AES_FLAGS, 0 },
1079   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1080     CPU_PCLMUL_FLAGS, 0 },
1081   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1082     CPU_PCLMUL_FLAGS, 1 },
1083   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1084     CPU_FSGSBASE_FLAGS, 0 },
1085   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1086     CPU_RDRND_FLAGS, 0 },
1087   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1088     CPU_F16C_FLAGS, 0 },
1089   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1090     CPU_BMI2_FLAGS, 0 },
1091   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1092     CPU_FMA_FLAGS, 0 },
1093   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1094     CPU_FMA4_FLAGS, 0 },
1095   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1096     CPU_XOP_FLAGS, 0 },
1097   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1098     CPU_LWP_FLAGS, 0 },
1099   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1100     CPU_MOVBE_FLAGS, 0 },
1101   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1102     CPU_CX16_FLAGS, 0 },
1103   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1104     CPU_EPT_FLAGS, 0 },
1105   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1106     CPU_LZCNT_FLAGS, 0 },
1107   { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1108     CPU_POPCNT_FLAGS, 0 },
1109   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1110     CPU_HLE_FLAGS, 0 },
1111   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1112     CPU_RTM_FLAGS, 0 },
1113   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1114     CPU_INVPCID_FLAGS, 0 },
1115   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1116     CPU_CLFLUSH_FLAGS, 0 },
1117   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1118     CPU_NOP_FLAGS, 0 },
1119   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1120     CPU_SYSCALL_FLAGS, 0 },
1121   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1122     CPU_RDTSCP_FLAGS, 0 },
1123   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1124     CPU_3DNOW_FLAGS, 0 },
1125   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1126     CPU_3DNOWA_FLAGS, 0 },
1127   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1128     CPU_PADLOCK_FLAGS, 0 },
1129   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1130     CPU_SVME_FLAGS, 1 },
1131   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1132     CPU_SVME_FLAGS, 0 },
1133   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1134     CPU_SSE4A_FLAGS, 0 },
1135   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1136     CPU_ABM_FLAGS, 0 },
1137   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1138     CPU_BMI_FLAGS, 0 },
1139   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1140     CPU_TBM_FLAGS, 0 },
1141   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1142     CPU_ADX_FLAGS, 0 },
1143   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1144     CPU_RDSEED_FLAGS, 0 },
1145   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1146     CPU_PRFCHW_FLAGS, 0 },
1147   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1148     CPU_SMAP_FLAGS, 0 },
1149   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1150     CPU_MPX_FLAGS, 0 },
1151   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1152     CPU_SHA_FLAGS, 0 },
1153   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1154     CPU_CLFLUSHOPT_FLAGS, 0 },
1155   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1156     CPU_PREFETCHWT1_FLAGS, 0 },
1157   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1158     CPU_SE1_FLAGS, 0 },
1159   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1160     CPU_CLWB_FLAGS, 0 },
1161   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1162     CPU_AVX512IFMA_FLAGS, 0 },
1163   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1164     CPU_AVX512VBMI_FLAGS, 0 },
1165   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1166     CPU_AVX512_4FMAPS_FLAGS, 0 },
1167   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1168     CPU_AVX512_4VNNIW_FLAGS, 0 },
1169   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1170     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1171   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1172     CPU_AVX512_VBMI2_FLAGS, 0 },
1173   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1174     CPU_AVX512_VNNI_FLAGS, 0 },
1175   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1176     CPU_AVX512_BITALG_FLAGS, 0 },
1177   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1178     CPU_CLZERO_FLAGS, 0 },
1179   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1180     CPU_MWAITX_FLAGS, 0 },
1181   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1182     CPU_OSPKE_FLAGS, 0 },
1183   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1184     CPU_RDPID_FLAGS, 0 },
1185   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1186     CPU_PTWRITE_FLAGS, 0 },
1187   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1188     CPU_IBT_FLAGS, 0 },
1189   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1190     CPU_SHSTK_FLAGS, 0 },
1191   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1192     CPU_GFNI_FLAGS, 0 },
1193   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1194     CPU_VAES_FLAGS, 0 },
1195   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1196     CPU_VPCLMULQDQ_FLAGS, 0 },
1197   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1198     CPU_WBNOINVD_FLAGS, 0 },
1199   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1200     CPU_PCONFIG_FLAGS, 0 },
1201   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1202     CPU_WAITPKG_FLAGS, 0 },
1203   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1204     CPU_CLDEMOTE_FLAGS, 0 },
1205   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1206     CPU_MOVDIRI_FLAGS, 0 },
1207   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1208     CPU_MOVDIR64B_FLAGS, 0 },
1209   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1210     CPU_AVX512_BF16_FLAGS, 0 },
1211   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1212     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1213   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1214     CPU_ENQCMD_FLAGS, 0 },
1215   { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1216     CPU_SERIALIZE_FLAGS, 0 },
1217   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1218     CPU_RDPRU_FLAGS, 0 },
1219   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1220     CPU_MCOMMIT_FLAGS, 0 },
1221   { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1222     CPU_SEV_ES_FLAGS, 0 },
1223   { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1224     CPU_TSXLDTRK_FLAGS, 0 },
1225 };
1226
1227 static const noarch_entry cpu_noarch[] =
1228 {
1229   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1230   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1231   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1232   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1233   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1234   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1235   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1236   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1237   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1238   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1239   { STRING_COMMA_LEN ("nosse4a"),  CPU_ANY_SSE4A_FLAGS },
1240   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1241   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1242   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1243   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1244   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1245   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1246   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1247   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1248   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1249   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1250   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1251   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1252   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1253   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1254   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1255   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1256   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1257   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1258   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1259   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1260   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1261   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1262   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1263   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1264   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1265   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1266   { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1267     CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1268   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1269   { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1270   { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1271 };
1272
1273 #ifdef I386COFF
1274 /* Like s_lcomm_internal in gas/read.c but the alignment string
1275    is allowed to be optional.  */
1276
1277 static symbolS *
1278 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1279 {
1280   addressT align = 0;
1281
1282   SKIP_WHITESPACE ();
1283
1284   if (needs_align
1285       && *input_line_pointer == ',')
1286     {
1287       align = parse_align (needs_align - 1);
1288
1289       if (align == (addressT) -1)
1290         return NULL;
1291     }
1292   else
1293     {
1294       if (size >= 8)
1295         align = 3;
1296       else if (size >= 4)
1297         align = 2;
1298       else if (size >= 2)
1299         align = 1;
1300       else
1301         align = 0;
1302     }
1303
1304   bss_alloc (symbolP, size, align);
1305   return symbolP;
1306 }
1307
1308 static void
1309 pe_lcomm (int needs_align)
1310 {
1311   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1312 }
1313 #endif
1314
1315 const pseudo_typeS md_pseudo_table[] =
1316 {
1317 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1318   {"align", s_align_bytes, 0},
1319 #else
1320   {"align", s_align_ptwo, 0},
1321 #endif
1322   {"arch", set_cpu_arch, 0},
1323 #ifndef I386COFF
1324   {"bss", s_bss, 0},
1325 #else
1326   {"lcomm", pe_lcomm, 1},
1327 #endif
1328   {"ffloat", float_cons, 'f'},
1329   {"dfloat", float_cons, 'd'},
1330   {"tfloat", float_cons, 'x'},
1331   {"value", cons, 2},
1332   {"slong", signed_cons, 4},
1333   {"noopt", s_ignore, 0},
1334   {"optim", s_ignore, 0},
1335   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1336   {"code16", set_code_flag, CODE_16BIT},
1337   {"code32", set_code_flag, CODE_32BIT},
1338 #ifdef BFD64
1339   {"code64", set_code_flag, CODE_64BIT},
1340 #endif
1341   {"intel_syntax", set_intel_syntax, 1},
1342   {"att_syntax", set_intel_syntax, 0},
1343   {"intel_mnemonic", set_intel_mnemonic, 1},
1344   {"att_mnemonic", set_intel_mnemonic, 0},
1345   {"allow_index_reg", set_allow_index_reg, 1},
1346   {"disallow_index_reg", set_allow_index_reg, 0},
1347   {"sse_check", set_check, 0},
1348   {"operand_check", set_check, 1},
1349 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1350   {"largecomm", handle_large_common, 0},
1351 #else
1352   {"file", dwarf2_directive_file, 0},
1353   {"loc", dwarf2_directive_loc, 0},
1354   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1355 #endif
1356 #ifdef TE_PE
1357   {"secrel32", pe_directive_secrel, 0},
1358 #endif
1359   {0, 0, 0}
1360 };
1361
1362 /* For interface with expression ().  */
1363 extern char *input_line_pointer;
1364
1365 /* Hash table for instruction mnemonic lookup.  */
1366 static struct hash_control *op_hash;
1367
1368 /* Hash table for register lookup.  */
1369 static struct hash_control *reg_hash;
1370 \f
1371   /* Various efficient no-op patterns for aligning code labels.
1372      Note: Don't try to assemble the instructions in the comments.
1373      0L and 0w are not legal.  */
1374 static const unsigned char f32_1[] =
1375   {0x90};                               /* nop                  */
1376 static const unsigned char f32_2[] =
1377   {0x66,0x90};                          /* xchg %ax,%ax         */
1378 static const unsigned char f32_3[] =
1379   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1380 static const unsigned char f32_4[] =
1381   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1382 static const unsigned char f32_6[] =
1383   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1384 static const unsigned char f32_7[] =
1385   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1386 static const unsigned char f16_3[] =
1387   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1388 static const unsigned char f16_4[] =
1389   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1390 static const unsigned char jump_disp8[] =
1391   {0xeb};                               /* jmp disp8           */
1392 static const unsigned char jump32_disp32[] =
1393   {0xe9};                               /* jmp disp32          */
1394 static const unsigned char jump16_disp32[] =
1395   {0x66,0xe9};                          /* jmp disp32          */
1396 /* 32-bit NOPs patterns.  */
1397 static const unsigned char *const f32_patt[] = {
1398   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1399 };
1400 /* 16-bit NOPs patterns.  */
1401 static const unsigned char *const f16_patt[] = {
1402   f32_1, f32_2, f16_3, f16_4
1403 };
1404 /* nopl (%[re]ax) */
1405 static const unsigned char alt_3[] =
1406   {0x0f,0x1f,0x00};
1407 /* nopl 0(%[re]ax) */
1408 static const unsigned char alt_4[] =
1409   {0x0f,0x1f,0x40,0x00};
1410 /* nopl 0(%[re]ax,%[re]ax,1) */
1411 static const unsigned char alt_5[] =
1412   {0x0f,0x1f,0x44,0x00,0x00};
1413 /* nopw 0(%[re]ax,%[re]ax,1) */
1414 static const unsigned char alt_6[] =
1415   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1416 /* nopl 0L(%[re]ax) */
1417 static const unsigned char alt_7[] =
1418   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1419 /* nopl 0L(%[re]ax,%[re]ax,1) */
1420 static const unsigned char alt_8[] =
1421   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1422 /* nopw 0L(%[re]ax,%[re]ax,1) */
1423 static const unsigned char alt_9[] =
1424   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1425 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1426 static const unsigned char alt_10[] =
1427   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1428 /* data16 nopw %cs:0L(%eax,%eax,1) */
1429 static const unsigned char alt_11[] =
1430   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1431 /* 32-bit and 64-bit NOPs patterns.  */
1432 static const unsigned char *const alt_patt[] = {
1433   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1434   alt_9, alt_10, alt_11
1435 };
1436
1437 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1438    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1439
1440 static void
1441 i386_output_nops (char *where, const unsigned char *const *patt,
1442                   int count, int max_single_nop_size)
1443
1444 {
1445   /* Place the longer NOP first.  */
1446   int last;
1447   int offset;
1448   const unsigned char *nops;
1449
1450   if (max_single_nop_size < 1)
1451     {
1452       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1453                 max_single_nop_size);
1454       return;
1455     }
1456
1457   nops = patt[max_single_nop_size - 1];
1458
1459   /* Use the smaller one if the requsted one isn't available.  */
1460   if (nops == NULL)
1461     {
1462       max_single_nop_size--;
1463       nops = patt[max_single_nop_size - 1];
1464     }
1465
1466   last = count % max_single_nop_size;
1467
1468   count -= last;
1469   for (offset = 0; offset < count; offset += max_single_nop_size)
1470     memcpy (where + offset, nops, max_single_nop_size);
1471
1472   if (last)
1473     {
1474       nops = patt[last - 1];
1475       if (nops == NULL)
1476         {
1477           /* Use the smaller one plus one-byte NOP if the needed one
1478              isn't available.  */
1479           last--;
1480           nops = patt[last - 1];
1481           memcpy (where + offset, nops, last);
1482           where[offset + last] = *patt[0];
1483         }
1484       else
1485         memcpy (where + offset, nops, last);
1486     }
1487 }
1488
1489 static INLINE int
1490 fits_in_imm7 (offsetT num)
1491 {
1492   return (num & 0x7f) == num;
1493 }
1494
1495 static INLINE int
1496 fits_in_imm31 (offsetT num)
1497 {
1498   return (num & 0x7fffffff) == num;
1499 }
1500
1501 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1502    single NOP instruction LIMIT.  */
1503
1504 void
1505 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1506 {
1507   const unsigned char *const *patt = NULL;
1508   int max_single_nop_size;
1509   /* Maximum number of NOPs before switching to jump over NOPs.  */
1510   int max_number_of_nops;
1511
1512   switch (fragP->fr_type)
1513     {
1514     case rs_fill_nop:
1515     case rs_align_code:
1516       break;
1517     case rs_machine_dependent:
1518       /* Allow NOP padding for jumps and calls.  */
1519       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1520           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1521         break;
1522       /* Fall through.  */
1523     default:
1524       return;
1525     }
1526
1527   /* We need to decide which NOP sequence to use for 32bit and
1528      64bit. When -mtune= is used:
1529
1530      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1531      PROCESSOR_GENERIC32, f32_patt will be used.
1532      2. For the rest, alt_patt will be used.
1533
1534      When -mtune= isn't used, alt_patt will be used if
1535      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1536      be used.
1537
1538      When -march= or .arch is used, we can't use anything beyond
1539      cpu_arch_isa_flags.   */
1540
1541   if (flag_code == CODE_16BIT)
1542     {
1543       patt = f16_patt;
1544       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1545       /* Limit number of NOPs to 2 in 16-bit mode.  */
1546       max_number_of_nops = 2;
1547     }
1548   else
1549     {
1550       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1551         {
1552           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1553           switch (cpu_arch_tune)
1554             {
1555             case PROCESSOR_UNKNOWN:
1556               /* We use cpu_arch_isa_flags to check if we SHOULD
1557                  optimize with nops.  */
1558               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1559                 patt = alt_patt;
1560               else
1561                 patt = f32_patt;
1562               break;
1563             case PROCESSOR_PENTIUM4:
1564             case PROCESSOR_NOCONA:
1565             case PROCESSOR_CORE:
1566             case PROCESSOR_CORE2:
1567             case PROCESSOR_COREI7:
1568             case PROCESSOR_L1OM:
1569             case PROCESSOR_K1OM:
1570             case PROCESSOR_GENERIC64:
1571             case PROCESSOR_K6:
1572             case PROCESSOR_ATHLON:
1573             case PROCESSOR_K8:
1574             case PROCESSOR_AMDFAM10:
1575             case PROCESSOR_BD:
1576             case PROCESSOR_ZNVER:
1577             case PROCESSOR_BT:
1578               patt = alt_patt;
1579               break;
1580             case PROCESSOR_I386:
1581             case PROCESSOR_I486:
1582             case PROCESSOR_PENTIUM:
1583             case PROCESSOR_PENTIUMPRO:
1584             case PROCESSOR_IAMCU:
1585             case PROCESSOR_GENERIC32:
1586               patt = f32_patt;
1587               break;
1588             }
1589         }
1590       else
1591         {
1592           switch (fragP->tc_frag_data.tune)
1593             {
1594             case PROCESSOR_UNKNOWN:
1595               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1596                  PROCESSOR_UNKNOWN.  */
1597               abort ();
1598               break;
1599
1600             case PROCESSOR_I386:
1601             case PROCESSOR_I486:
1602             case PROCESSOR_PENTIUM:
1603             case PROCESSOR_IAMCU:
1604             case PROCESSOR_K6:
1605             case PROCESSOR_ATHLON:
1606             case PROCESSOR_K8:
1607             case PROCESSOR_AMDFAM10:
1608             case PROCESSOR_BD:
1609             case PROCESSOR_ZNVER:
1610             case PROCESSOR_BT:
1611             case PROCESSOR_GENERIC32:
1612               /* We use cpu_arch_isa_flags to check if we CAN optimize
1613                  with nops.  */
1614               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1615                 patt = alt_patt;
1616               else
1617                 patt = f32_patt;
1618               break;
1619             case PROCESSOR_PENTIUMPRO:
1620             case PROCESSOR_PENTIUM4:
1621             case PROCESSOR_NOCONA:
1622             case PROCESSOR_CORE:
1623             case PROCESSOR_CORE2:
1624             case PROCESSOR_COREI7:
1625             case PROCESSOR_L1OM:
1626             case PROCESSOR_K1OM:
1627               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1628                 patt = alt_patt;
1629               else
1630                 patt = f32_patt;
1631               break;
1632             case PROCESSOR_GENERIC64:
1633               patt = alt_patt;
1634               break;
1635             }
1636         }
1637
1638       if (patt == f32_patt)
1639         {
1640           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1641           /* Limit number of NOPs to 2 for older processors.  */
1642           max_number_of_nops = 2;
1643         }
1644       else
1645         {
1646           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1647           /* Limit number of NOPs to 7 for newer processors.  */
1648           max_number_of_nops = 7;
1649         }
1650     }
1651
1652   if (limit == 0)
1653     limit = max_single_nop_size;
1654
1655   if (fragP->fr_type == rs_fill_nop)
1656     {
1657       /* Output NOPs for .nop directive.  */
1658       if (limit > max_single_nop_size)
1659         {
1660           as_bad_where (fragP->fr_file, fragP->fr_line,
1661                         _("invalid single nop size: %d "
1662                           "(expect within [0, %d])"),
1663                         limit, max_single_nop_size);
1664           return;
1665         }
1666     }
1667   else if (fragP->fr_type != rs_machine_dependent)
1668     fragP->fr_var = count;
1669
1670   if ((count / max_single_nop_size) > max_number_of_nops)
1671     {
1672       /* Generate jump over NOPs.  */
1673       offsetT disp = count - 2;
1674       if (fits_in_imm7 (disp))
1675         {
1676           /* Use "jmp disp8" if possible.  */
1677           count = disp;
1678           where[0] = jump_disp8[0];
1679           where[1] = count;
1680           where += 2;
1681         }
1682       else
1683         {
1684           unsigned int size_of_jump;
1685
1686           if (flag_code == CODE_16BIT)
1687             {
1688               where[0] = jump16_disp32[0];
1689               where[1] = jump16_disp32[1];
1690               size_of_jump = 2;
1691             }
1692           else
1693             {
1694               where[0] = jump32_disp32[0];
1695               size_of_jump = 1;
1696             }
1697
1698           count -= size_of_jump + 4;
1699           if (!fits_in_imm31 (count))
1700             {
1701               as_bad_where (fragP->fr_file, fragP->fr_line,
1702                             _("jump over nop padding out of range"));
1703               return;
1704             }
1705
1706           md_number_to_chars (where + size_of_jump, count, 4);
1707           where += size_of_jump + 4;
1708         }
1709     }
1710
1711   /* Generate multiple NOPs.  */
1712   i386_output_nops (where, patt, count, limit);
1713 }
1714
1715 static INLINE int
1716 operand_type_all_zero (const union i386_operand_type *x)
1717 {
1718   switch (ARRAY_SIZE(x->array))
1719     {
1720     case 3:
1721       if (x->array[2])
1722         return 0;
1723       /* Fall through.  */
1724     case 2:
1725       if (x->array[1])
1726         return 0;
1727       /* Fall through.  */
1728     case 1:
1729       return !x->array[0];
1730     default:
1731       abort ();
1732     }
1733 }
1734
1735 static INLINE void
1736 operand_type_set (union i386_operand_type *x, unsigned int v)
1737 {
1738   switch (ARRAY_SIZE(x->array))
1739     {
1740     case 3:
1741       x->array[2] = v;
1742       /* Fall through.  */
1743     case 2:
1744       x->array[1] = v;
1745       /* Fall through.  */
1746     case 1:
1747       x->array[0] = v;
1748       /* Fall through.  */
1749       break;
1750     default:
1751       abort ();
1752     }
1753
1754   x->bitfield.class = ClassNone;
1755   x->bitfield.instance = InstanceNone;
1756 }
1757
1758 static INLINE int
1759 operand_type_equal (const union i386_operand_type *x,
1760                     const union i386_operand_type *y)
1761 {
1762   switch (ARRAY_SIZE(x->array))
1763     {
1764     case 3:
1765       if (x->array[2] != y->array[2])
1766         return 0;
1767       /* Fall through.  */
1768     case 2:
1769       if (x->array[1] != y->array[1])
1770         return 0;
1771       /* Fall through.  */
1772     case 1:
1773       return x->array[0] == y->array[0];
1774       break;
1775     default:
1776       abort ();
1777     }
1778 }
1779
1780 static INLINE int
1781 cpu_flags_all_zero (const union i386_cpu_flags *x)
1782 {
1783   switch (ARRAY_SIZE(x->array))
1784     {
1785     case 4:
1786       if (x->array[3])
1787         return 0;
1788       /* Fall through.  */
1789     case 3:
1790       if (x->array[2])
1791         return 0;
1792       /* Fall through.  */
1793     case 2:
1794       if (x->array[1])
1795         return 0;
1796       /* Fall through.  */
1797     case 1:
1798       return !x->array[0];
1799     default:
1800       abort ();
1801     }
1802 }
1803
1804 static INLINE int
1805 cpu_flags_equal (const union i386_cpu_flags *x,
1806                  const union i386_cpu_flags *y)
1807 {
1808   switch (ARRAY_SIZE(x->array))
1809     {
1810     case 4:
1811       if (x->array[3] != y->array[3])
1812         return 0;
1813       /* Fall through.  */
1814     case 3:
1815       if (x->array[2] != y->array[2])
1816         return 0;
1817       /* Fall through.  */
1818     case 2:
1819       if (x->array[1] != y->array[1])
1820         return 0;
1821       /* Fall through.  */
1822     case 1:
1823       return x->array[0] == y->array[0];
1824       break;
1825     default:
1826       abort ();
1827     }
1828 }
1829
1830 static INLINE int
1831 cpu_flags_check_cpu64 (i386_cpu_flags f)
1832 {
1833   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1834            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1835 }
1836
1837 static INLINE i386_cpu_flags
1838 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1839 {
1840   switch (ARRAY_SIZE (x.array))
1841     {
1842     case 4:
1843       x.array [3] &= y.array [3];
1844       /* Fall through.  */
1845     case 3:
1846       x.array [2] &= y.array [2];
1847       /* Fall through.  */
1848     case 2:
1849       x.array [1] &= y.array [1];
1850       /* Fall through.  */
1851     case 1:
1852       x.array [0] &= y.array [0];
1853       break;
1854     default:
1855       abort ();
1856     }
1857   return x;
1858 }
1859
1860 static INLINE i386_cpu_flags
1861 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1862 {
1863   switch (ARRAY_SIZE (x.array))
1864     {
1865     case 4:
1866       x.array [3] |= y.array [3];
1867       /* Fall through.  */
1868     case 3:
1869       x.array [2] |= y.array [2];
1870       /* Fall through.  */
1871     case 2:
1872       x.array [1] |= y.array [1];
1873       /* Fall through.  */
1874     case 1:
1875       x.array [0] |= y.array [0];
1876       break;
1877     default:
1878       abort ();
1879     }
1880   return x;
1881 }
1882
1883 static INLINE i386_cpu_flags
1884 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1885 {
1886   switch (ARRAY_SIZE (x.array))
1887     {
1888     case 4:
1889       x.array [3] &= ~y.array [3];
1890       /* Fall through.  */
1891     case 3:
1892       x.array [2] &= ~y.array [2];
1893       /* Fall through.  */
1894     case 2:
1895       x.array [1] &= ~y.array [1];
1896       /* Fall through.  */
1897     case 1:
1898       x.array [0] &= ~y.array [0];
1899       break;
1900     default:
1901       abort ();
1902     }
1903   return x;
1904 }
1905
1906 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1907
1908 #define CPU_FLAGS_ARCH_MATCH            0x1
1909 #define CPU_FLAGS_64BIT_MATCH           0x2
1910
1911 #define CPU_FLAGS_PERFECT_MATCH \
1912   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1913
1914 /* Return CPU flags match bits. */
1915
1916 static int
1917 cpu_flags_match (const insn_template *t)
1918 {
1919   i386_cpu_flags x = t->cpu_flags;
1920   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1921
1922   x.bitfield.cpu64 = 0;
1923   x.bitfield.cpuno64 = 0;
1924
1925   if (cpu_flags_all_zero (&x))
1926     {
1927       /* This instruction is available on all archs.  */
1928       match |= CPU_FLAGS_ARCH_MATCH;
1929     }
1930   else
1931     {
1932       /* This instruction is available only on some archs.  */
1933       i386_cpu_flags cpu = cpu_arch_flags;
1934
1935       /* AVX512VL is no standalone feature - match it and then strip it.  */
1936       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1937         return match;
1938       x.bitfield.cpuavx512vl = 0;
1939
1940       cpu = cpu_flags_and (x, cpu);
1941       if (!cpu_flags_all_zero (&cpu))
1942         {
1943           if (x.bitfield.cpuavx)
1944             {
1945               /* We need to check a few extra flags with AVX.  */
1946               if (cpu.bitfield.cpuavx
1947                   && (!t->opcode_modifier.sse2avx
1948                       || (sse2avx && !i.prefix[DATA_PREFIX]))
1949                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1950                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1951                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1952                 match |= CPU_FLAGS_ARCH_MATCH;
1953             }
1954           else if (x.bitfield.cpuavx512f)
1955             {
1956               /* We need to check a few extra flags with AVX512F.  */
1957               if (cpu.bitfield.cpuavx512f
1958                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1959                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1960                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1961                 match |= CPU_FLAGS_ARCH_MATCH;
1962             }
1963           else
1964             match |= CPU_FLAGS_ARCH_MATCH;
1965         }
1966     }
1967   return match;
1968 }
1969
1970 static INLINE i386_operand_type
1971 operand_type_and (i386_operand_type x, i386_operand_type y)
1972 {
1973   if (x.bitfield.class != y.bitfield.class)
1974     x.bitfield.class = ClassNone;
1975   if (x.bitfield.instance != y.bitfield.instance)
1976     x.bitfield.instance = InstanceNone;
1977
1978   switch (ARRAY_SIZE (x.array))
1979     {
1980     case 3:
1981       x.array [2] &= y.array [2];
1982       /* Fall through.  */
1983     case 2:
1984       x.array [1] &= y.array [1];
1985       /* Fall through.  */
1986     case 1:
1987       x.array [0] &= y.array [0];
1988       break;
1989     default:
1990       abort ();
1991     }
1992   return x;
1993 }
1994
1995 static INLINE i386_operand_type
1996 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1997 {
1998   gas_assert (y.bitfield.class == ClassNone);
1999   gas_assert (y.bitfield.instance == InstanceNone);
2000
2001   switch (ARRAY_SIZE (x.array))
2002     {
2003     case 3:
2004       x.array [2] &= ~y.array [2];
2005       /* Fall through.  */
2006     case 2:
2007       x.array [1] &= ~y.array [1];
2008       /* Fall through.  */
2009     case 1:
2010       x.array [0] &= ~y.array [0];
2011       break;
2012     default:
2013       abort ();
2014     }
2015   return x;
2016 }
2017
2018 static INLINE i386_operand_type
2019 operand_type_or (i386_operand_type x, i386_operand_type y)
2020 {
2021   gas_assert (x.bitfield.class == ClassNone ||
2022               y.bitfield.class == ClassNone ||
2023               x.bitfield.class == y.bitfield.class);
2024   gas_assert (x.bitfield.instance == InstanceNone ||
2025               y.bitfield.instance == InstanceNone ||
2026               x.bitfield.instance == y.bitfield.instance);
2027
2028   switch (ARRAY_SIZE (x.array))
2029     {
2030     case 3:
2031       x.array [2] |= y.array [2];
2032       /* Fall through.  */
2033     case 2:
2034       x.array [1] |= y.array [1];
2035       /* Fall through.  */
2036     case 1:
2037       x.array [0] |= y.array [0];
2038       break;
2039     default:
2040       abort ();
2041     }
2042   return x;
2043 }
2044
2045 static INLINE i386_operand_type
2046 operand_type_xor (i386_operand_type x, i386_operand_type y)
2047 {
2048   gas_assert (y.bitfield.class == ClassNone);
2049   gas_assert (y.bitfield.instance == InstanceNone);
2050
2051   switch (ARRAY_SIZE (x.array))
2052     {
2053     case 3:
2054       x.array [2] ^= y.array [2];
2055       /* Fall through.  */
2056     case 2:
2057       x.array [1] ^= y.array [1];
2058       /* Fall through.  */
2059     case 1:
2060       x.array [0] ^= y.array [0];
2061       break;
2062     default:
2063       abort ();
2064     }
2065   return x;
2066 }
2067
2068 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2069 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2070 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2071 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2072 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2073 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2074 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2075 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2076 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2077 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2078 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2079 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2080 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2081 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2082 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2083 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2084 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2085
2086 enum operand_type
2087 {
2088   reg,
2089   imm,
2090   disp,
2091   anymem
2092 };
2093
2094 static INLINE int
2095 operand_type_check (i386_operand_type t, enum operand_type c)
2096 {
2097   switch (c)
2098     {
2099     case reg:
2100       return t.bitfield.class == Reg;
2101
2102     case imm:
2103       return (t.bitfield.imm8
2104               || t.bitfield.imm8s
2105               || t.bitfield.imm16
2106               || t.bitfield.imm32
2107               || t.bitfield.imm32s
2108               || t.bitfield.imm64);
2109
2110     case disp:
2111       return (t.bitfield.disp8
2112               || t.bitfield.disp16
2113               || t.bitfield.disp32
2114               || t.bitfield.disp32s
2115               || t.bitfield.disp64);
2116
2117     case anymem:
2118       return (t.bitfield.disp8
2119               || t.bitfield.disp16
2120               || t.bitfield.disp32
2121               || t.bitfield.disp32s
2122               || t.bitfield.disp64
2123               || t.bitfield.baseindex);
2124
2125     default:
2126       abort ();
2127     }
2128
2129   return 0;
2130 }
2131
2132 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133    between operand GIVEN and opeand WANTED for instruction template T.  */
2134
2135 static INLINE int
2136 match_operand_size (const insn_template *t, unsigned int wanted,
2137                     unsigned int given)
2138 {
2139   return !((i.types[given].bitfield.byte
2140             && !t->operand_types[wanted].bitfield.byte)
2141            || (i.types[given].bitfield.word
2142                && !t->operand_types[wanted].bitfield.word)
2143            || (i.types[given].bitfield.dword
2144                && !t->operand_types[wanted].bitfield.dword)
2145            || (i.types[given].bitfield.qword
2146                && !t->operand_types[wanted].bitfield.qword)
2147            || (i.types[given].bitfield.tbyte
2148                && !t->operand_types[wanted].bitfield.tbyte));
2149 }
2150
2151 /* Return 1 if there is no conflict in SIMD register between operand
2152    GIVEN and opeand WANTED for instruction template T.  */
2153
2154 static INLINE int
2155 match_simd_size (const insn_template *t, unsigned int wanted,
2156                  unsigned int given)
2157 {
2158   return !((i.types[given].bitfield.xmmword
2159             && !t->operand_types[wanted].bitfield.xmmword)
2160            || (i.types[given].bitfield.ymmword
2161                && !t->operand_types[wanted].bitfield.ymmword)
2162            || (i.types[given].bitfield.zmmword
2163                && !t->operand_types[wanted].bitfield.zmmword));
2164 }
2165
2166 /* Return 1 if there is no conflict in any size between operand GIVEN
2167    and opeand WANTED for instruction template T.  */
2168
2169 static INLINE int
2170 match_mem_size (const insn_template *t, unsigned int wanted,
2171                 unsigned int given)
2172 {
2173   return (match_operand_size (t, wanted, given)
2174           && !((i.types[given].bitfield.unspecified
2175                 && !i.broadcast
2176                 && !t->operand_types[wanted].bitfield.unspecified)
2177                || (i.types[given].bitfield.fword
2178                    && !t->operand_types[wanted].bitfield.fword)
2179                /* For scalar opcode templates to allow register and memory
2180                   operands at the same time, some special casing is needed
2181                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2182                   down-conversion vpmov*.  */
2183                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2184                     && t->operand_types[wanted].bitfield.byte
2185                        + t->operand_types[wanted].bitfield.word
2186                        + t->operand_types[wanted].bitfield.dword
2187                        + t->operand_types[wanted].bitfield.qword
2188                        > !!t->opcode_modifier.broadcast)
2189                    ? (i.types[given].bitfield.xmmword
2190                       || i.types[given].bitfield.ymmword
2191                       || i.types[given].bitfield.zmmword)
2192                    : !match_simd_size(t, wanted, given))));
2193 }
2194
2195 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2196    operands for instruction template T, and it has MATCH_REVERSE set if there
2197    is no size conflict on any operands for the template with operands reversed
2198    (and the template allows for reversing in the first place).  */
2199
2200 #define MATCH_STRAIGHT 1
2201 #define MATCH_REVERSE  2
2202
2203 static INLINE unsigned int
2204 operand_size_match (const insn_template *t)
2205 {
2206   unsigned int j, match = MATCH_STRAIGHT;
2207
2208   /* Don't check non-absolute jump instructions.  */
2209   if (t->opcode_modifier.jump
2210       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2211     return match;
2212
2213   /* Check memory and accumulator operand size.  */
2214   for (j = 0; j < i.operands; j++)
2215     {
2216       if (i.types[j].bitfield.class != Reg
2217           && i.types[j].bitfield.class != RegSIMD
2218           && t->opcode_modifier.anysize)
2219         continue;
2220
2221       if (t->operand_types[j].bitfield.class == Reg
2222           && !match_operand_size (t, j, j))
2223         {
2224           match = 0;
2225           break;
2226         }
2227
2228       if (t->operand_types[j].bitfield.class == RegSIMD
2229           && !match_simd_size (t, j, j))
2230         {
2231           match = 0;
2232           break;
2233         }
2234
2235       if (t->operand_types[j].bitfield.instance == Accum
2236           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2237         {
2238           match = 0;
2239           break;
2240         }
2241
2242       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2243         {
2244           match = 0;
2245           break;
2246         }
2247     }
2248
2249   if (!t->opcode_modifier.d)
2250     {
2251     mismatch:
2252       if (!match)
2253         i.error = operand_size_mismatch;
2254       return match;
2255     }
2256
2257   /* Check reverse.  */
2258   gas_assert (i.operands >= 2 && i.operands <= 3);
2259
2260   for (j = 0; j < i.operands; j++)
2261     {
2262       unsigned int given = i.operands - j - 1;
2263
2264       if (t->operand_types[j].bitfield.class == Reg
2265           && !match_operand_size (t, j, given))
2266         goto mismatch;
2267
2268       if (t->operand_types[j].bitfield.class == RegSIMD
2269           && !match_simd_size (t, j, given))
2270         goto mismatch;
2271
2272       if (t->operand_types[j].bitfield.instance == Accum
2273           && (!match_operand_size (t, j, given)
2274               || !match_simd_size (t, j, given)))
2275         goto mismatch;
2276
2277       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2278         goto mismatch;
2279     }
2280
2281   return match | MATCH_REVERSE;
2282 }
2283
2284 static INLINE int
2285 operand_type_match (i386_operand_type overlap,
2286                     i386_operand_type given)
2287 {
2288   i386_operand_type temp = overlap;
2289
2290   temp.bitfield.unspecified = 0;
2291   temp.bitfield.byte = 0;
2292   temp.bitfield.word = 0;
2293   temp.bitfield.dword = 0;
2294   temp.bitfield.fword = 0;
2295   temp.bitfield.qword = 0;
2296   temp.bitfield.tbyte = 0;
2297   temp.bitfield.xmmword = 0;
2298   temp.bitfield.ymmword = 0;
2299   temp.bitfield.zmmword = 0;
2300   if (operand_type_all_zero (&temp))
2301     goto mismatch;
2302
2303   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2304     return 1;
2305
2306  mismatch:
2307   i.error = operand_type_mismatch;
2308   return 0;
2309 }
2310
2311 /* If given types g0 and g1 are registers they must be of the same type
2312    unless the expected operand type register overlap is null.
2313    Some Intel syntax memory operand size checking also happens here.  */
2314
2315 static INLINE int
2316 operand_type_register_match (i386_operand_type g0,
2317                              i386_operand_type t0,
2318                              i386_operand_type g1,
2319                              i386_operand_type t1)
2320 {
2321   if (g0.bitfield.class != Reg
2322       && g0.bitfield.class != RegSIMD
2323       && (!operand_type_check (g0, anymem)
2324           || g0.bitfield.unspecified
2325           || (t0.bitfield.class != Reg
2326               && t0.bitfield.class != RegSIMD)))
2327     return 1;
2328
2329   if (g1.bitfield.class != Reg
2330       && g1.bitfield.class != RegSIMD
2331       && (!operand_type_check (g1, anymem)
2332           || g1.bitfield.unspecified
2333           || (t1.bitfield.class != Reg
2334               && t1.bitfield.class != RegSIMD)))
2335     return 1;
2336
2337   if (g0.bitfield.byte == g1.bitfield.byte
2338       && g0.bitfield.word == g1.bitfield.word
2339       && g0.bitfield.dword == g1.bitfield.dword
2340       && g0.bitfield.qword == g1.bitfield.qword
2341       && g0.bitfield.xmmword == g1.bitfield.xmmword
2342       && g0.bitfield.ymmword == g1.bitfield.ymmword
2343       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2344     return 1;
2345
2346   if (!(t0.bitfield.byte & t1.bitfield.byte)
2347       && !(t0.bitfield.word & t1.bitfield.word)
2348       && !(t0.bitfield.dword & t1.bitfield.dword)
2349       && !(t0.bitfield.qword & t1.bitfield.qword)
2350       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2351       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2352       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2353     return 1;
2354
2355   i.error = register_type_mismatch;
2356
2357   return 0;
2358 }
2359
2360 static INLINE unsigned int
2361 register_number (const reg_entry *r)
2362 {
2363   unsigned int nr = r->reg_num;
2364
2365   if (r->reg_flags & RegRex)
2366     nr += 8;
2367
2368   if (r->reg_flags & RegVRex)
2369     nr += 16;
2370
2371   return nr;
2372 }
2373
2374 static INLINE unsigned int
2375 mode_from_disp_size (i386_operand_type t)
2376 {
2377   if (t.bitfield.disp8)
2378     return 1;
2379   else if (t.bitfield.disp16
2380            || t.bitfield.disp32
2381            || t.bitfield.disp32s)
2382     return 2;
2383   else
2384     return 0;
2385 }
2386
2387 static INLINE int
2388 fits_in_signed_byte (addressT num)
2389 {
2390   return num + 0x80 <= 0xff;
2391 }
2392
2393 static INLINE int
2394 fits_in_unsigned_byte (addressT num)
2395 {
2396   return num <= 0xff;
2397 }
2398
2399 static INLINE int
2400 fits_in_unsigned_word (addressT num)
2401 {
2402   return num <= 0xffff;
2403 }
2404
2405 static INLINE int
2406 fits_in_signed_word (addressT num)
2407 {
2408   return num + 0x8000 <= 0xffff;
2409 }
2410
2411 static INLINE int
2412 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2413 {
2414 #ifndef BFD64
2415   return 1;
2416 #else
2417   return num + 0x80000000 <= 0xffffffff;
2418 #endif
2419 }                               /* fits_in_signed_long() */
2420
2421 static INLINE int
2422 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2423 {
2424 #ifndef BFD64
2425   return 1;
2426 #else
2427   return num <= 0xffffffff;
2428 #endif
2429 }                               /* fits_in_unsigned_long() */
2430
2431 static INLINE int
2432 fits_in_disp8 (offsetT num)
2433 {
2434   int shift = i.memshift;
2435   unsigned int mask;
2436
2437   if (shift == -1)
2438     abort ();
2439
2440   mask = (1 << shift) - 1;
2441
2442   /* Return 0 if NUM isn't properly aligned.  */
2443   if ((num & mask))
2444     return 0;
2445
2446   /* Check if NUM will fit in 8bit after shift.  */
2447   return fits_in_signed_byte (num >> shift);
2448 }
2449
2450 static INLINE int
2451 fits_in_imm4 (offsetT num)
2452 {
2453   return (num & 0xf) == num;
2454 }
2455
2456 static i386_operand_type
2457 smallest_imm_type (offsetT num)
2458 {
2459   i386_operand_type t;
2460
2461   operand_type_set (&t, 0);
2462   t.bitfield.imm64 = 1;
2463
2464   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2465     {
2466       /* This code is disabled on the 486 because all the Imm1 forms
2467          in the opcode table are slower on the i486.  They're the
2468          versions with the implicitly specified single-position
2469          displacement, which has another syntax if you really want to
2470          use that form.  */
2471       t.bitfield.imm1 = 1;
2472       t.bitfield.imm8 = 1;
2473       t.bitfield.imm8s = 1;
2474       t.bitfield.imm16 = 1;
2475       t.bitfield.imm32 = 1;
2476       t.bitfield.imm32s = 1;
2477     }
2478   else if (fits_in_signed_byte (num))
2479     {
2480       t.bitfield.imm8 = 1;
2481       t.bitfield.imm8s = 1;
2482       t.bitfield.imm16 = 1;
2483       t.bitfield.imm32 = 1;
2484       t.bitfield.imm32s = 1;
2485     }
2486   else if (fits_in_unsigned_byte (num))
2487     {
2488       t.bitfield.imm8 = 1;
2489       t.bitfield.imm16 = 1;
2490       t.bitfield.imm32 = 1;
2491       t.bitfield.imm32s = 1;
2492     }
2493   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2494     {
2495       t.bitfield.imm16 = 1;
2496       t.bitfield.imm32 = 1;
2497       t.bitfield.imm32s = 1;
2498     }
2499   else if (fits_in_signed_long (num))
2500     {
2501       t.bitfield.imm32 = 1;
2502       t.bitfield.imm32s = 1;
2503     }
2504   else if (fits_in_unsigned_long (num))
2505     t.bitfield.imm32 = 1;
2506
2507   return t;
2508 }
2509
2510 static offsetT
2511 offset_in_range (offsetT val, int size)
2512 {
2513   addressT mask;
2514
2515   switch (size)
2516     {
2517     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2518     case 2: mask = ((addressT) 1 << 16) - 1; break;
2519     case 4: mask = ((addressT) 2 << 31) - 1; break;
2520 #ifdef BFD64
2521     case 8: mask = ((addressT) 2 << 63) - 1; break;
2522 #endif
2523     default: abort ();
2524     }
2525
2526 #ifdef BFD64
2527   /* If BFD64, sign extend val for 32bit address mode.  */
2528   if (flag_code != CODE_64BIT
2529       || i.prefix[ADDR_PREFIX])
2530     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2531       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2532 #endif
2533
2534   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2535     {
2536       char buf1[40], buf2[40];
2537
2538       sprint_value (buf1, val);
2539       sprint_value (buf2, val & mask);
2540       as_warn (_("%s shortened to %s"), buf1, buf2);
2541     }
2542   return val & mask;
2543 }
2544
2545 enum PREFIX_GROUP
2546 {
2547   PREFIX_EXIST = 0,
2548   PREFIX_LOCK,
2549   PREFIX_REP,
2550   PREFIX_DS,
2551   PREFIX_OTHER
2552 };
2553
2554 /* Returns
2555    a. PREFIX_EXIST if attempting to add a prefix where one from the
2556    same class already exists.
2557    b. PREFIX_LOCK if lock prefix is added.
2558    c. PREFIX_REP if rep/repne prefix is added.
2559    d. PREFIX_DS if ds prefix is added.
2560    e. PREFIX_OTHER if other prefix is added.
2561  */
2562
2563 static enum PREFIX_GROUP
2564 add_prefix (unsigned int prefix)
2565 {
2566   enum PREFIX_GROUP ret = PREFIX_OTHER;
2567   unsigned int q;
2568
2569   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2570       && flag_code == CODE_64BIT)
2571     {
2572       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2573           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2574           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2575           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2576         ret = PREFIX_EXIST;
2577       q = REX_PREFIX;
2578     }
2579   else
2580     {
2581       switch (prefix)
2582         {
2583         default:
2584           abort ();
2585
2586         case DS_PREFIX_OPCODE:
2587           ret = PREFIX_DS;
2588           /* Fall through.  */
2589         case CS_PREFIX_OPCODE:
2590         case ES_PREFIX_OPCODE:
2591         case FS_PREFIX_OPCODE:
2592         case GS_PREFIX_OPCODE:
2593         case SS_PREFIX_OPCODE:
2594           q = SEG_PREFIX;
2595           break;
2596
2597         case REPNE_PREFIX_OPCODE:
2598         case REPE_PREFIX_OPCODE:
2599           q = REP_PREFIX;
2600           ret = PREFIX_REP;
2601           break;
2602
2603         case LOCK_PREFIX_OPCODE:
2604           q = LOCK_PREFIX;
2605           ret = PREFIX_LOCK;
2606           break;
2607
2608         case FWAIT_OPCODE:
2609           q = WAIT_PREFIX;
2610           break;
2611
2612         case ADDR_PREFIX_OPCODE:
2613           q = ADDR_PREFIX;
2614           break;
2615
2616         case DATA_PREFIX_OPCODE:
2617           q = DATA_PREFIX;
2618           break;
2619         }
2620       if (i.prefix[q] != 0)
2621         ret = PREFIX_EXIST;
2622     }
2623
2624   if (ret)
2625     {
2626       if (!i.prefix[q])
2627         ++i.prefixes;
2628       i.prefix[q] |= prefix;
2629     }
2630   else
2631     as_bad (_("same type of prefix used twice"));
2632
2633   return ret;
2634 }
2635
2636 static void
2637 update_code_flag (int value, int check)
2638 {
2639   PRINTF_LIKE ((*as_error));
2640
2641   flag_code = (enum flag_code) value;
2642   if (flag_code == CODE_64BIT)
2643     {
2644       cpu_arch_flags.bitfield.cpu64 = 1;
2645       cpu_arch_flags.bitfield.cpuno64 = 0;
2646     }
2647   else
2648     {
2649       cpu_arch_flags.bitfield.cpu64 = 0;
2650       cpu_arch_flags.bitfield.cpuno64 = 1;
2651     }
2652   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2653     {
2654       if (check)
2655         as_error = as_fatal;
2656       else
2657         as_error = as_bad;
2658       (*as_error) (_("64bit mode not supported on `%s'."),
2659                    cpu_arch_name ? cpu_arch_name : default_arch);
2660     }
2661   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2662     {
2663       if (check)
2664         as_error = as_fatal;
2665       else
2666         as_error = as_bad;
2667       (*as_error) (_("32bit mode not supported on `%s'."),
2668                    cpu_arch_name ? cpu_arch_name : default_arch);
2669     }
2670   stackop_size = '\0';
2671 }
2672
2673 static void
2674 set_code_flag (int value)
2675 {
2676   update_code_flag (value, 0);
2677 }
2678
2679 static void
2680 set_16bit_gcc_code_flag (int new_code_flag)
2681 {
2682   flag_code = (enum flag_code) new_code_flag;
2683   if (flag_code != CODE_16BIT)
2684     abort ();
2685   cpu_arch_flags.bitfield.cpu64 = 0;
2686   cpu_arch_flags.bitfield.cpuno64 = 1;
2687   stackop_size = LONG_MNEM_SUFFIX;
2688 }
2689
2690 static void
2691 set_intel_syntax (int syntax_flag)
2692 {
2693   /* Find out if register prefixing is specified.  */
2694   int ask_naked_reg = 0;
2695
2696   SKIP_WHITESPACE ();
2697   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2698     {
2699       char *string;
2700       int e = get_symbol_name (&string);
2701
2702       if (strcmp (string, "prefix") == 0)
2703         ask_naked_reg = 1;
2704       else if (strcmp (string, "noprefix") == 0)
2705         ask_naked_reg = -1;
2706       else
2707         as_bad (_("bad argument to syntax directive."));
2708       (void) restore_line_pointer (e);
2709     }
2710   demand_empty_rest_of_line ();
2711
2712   intel_syntax = syntax_flag;
2713
2714   if (ask_naked_reg == 0)
2715     allow_naked_reg = (intel_syntax
2716                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2717   else
2718     allow_naked_reg = (ask_naked_reg < 0);
2719
2720   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2721
2722   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2723   identifier_chars['$'] = intel_syntax ? '$' : 0;
2724   register_prefix = allow_naked_reg ? "" : "%";
2725 }
2726
2727 static void
2728 set_intel_mnemonic (int mnemonic_flag)
2729 {
2730   intel_mnemonic = mnemonic_flag;
2731 }
2732
2733 static void
2734 set_allow_index_reg (int flag)
2735 {
2736   allow_index_reg = flag;
2737 }
2738
2739 static void
2740 set_check (int what)
2741 {
2742   enum check_kind *kind;
2743   const char *str;
2744
2745   if (what)
2746     {
2747       kind = &operand_check;
2748       str = "operand";
2749     }
2750   else
2751     {
2752       kind = &sse_check;
2753       str = "sse";
2754     }
2755
2756   SKIP_WHITESPACE ();
2757
2758   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759     {
2760       char *string;
2761       int e = get_symbol_name (&string);
2762
2763       if (strcmp (string, "none") == 0)
2764         *kind = check_none;
2765       else if (strcmp (string, "warning") == 0)
2766         *kind = check_warning;
2767       else if (strcmp (string, "error") == 0)
2768         *kind = check_error;
2769       else
2770         as_bad (_("bad argument to %s_check directive."), str);
2771       (void) restore_line_pointer (e);
2772     }
2773   else
2774     as_bad (_("missing argument for %s_check directive"), str);
2775
2776   demand_empty_rest_of_line ();
2777 }
2778
2779 static void
2780 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2781                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2782 {
2783 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784   static const char *arch;
2785
2786   /* Intel LIOM is only supported on ELF.  */
2787   if (!IS_ELF)
2788     return;
2789
2790   if (!arch)
2791     {
2792       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2793          use default_arch.  */
2794       arch = cpu_arch_name;
2795       if (!arch)
2796         arch = default_arch;
2797     }
2798
2799   /* If we are targeting Intel MCU, we must enable it.  */
2800   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2801       || new_flag.bitfield.cpuiamcu)
2802     return;
2803
2804   /* If we are targeting Intel L1OM, we must enable it.  */
2805   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2806       || new_flag.bitfield.cpul1om)
2807     return;
2808
2809   /* If we are targeting Intel K1OM, we must enable it.  */
2810   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2811       || new_flag.bitfield.cpuk1om)
2812     return;
2813
2814   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2815 #endif
2816 }
2817
2818 static void
2819 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2820 {
2821   SKIP_WHITESPACE ();
2822
2823   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2824     {
2825       char *string;
2826       int e = get_symbol_name (&string);
2827       unsigned int j;
2828       i386_cpu_flags flags;
2829
2830       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2831         {
2832           if (strcmp (string, cpu_arch[j].name) == 0)
2833             {
2834               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2835
2836               if (*string != '.')
2837                 {
2838                   cpu_arch_name = cpu_arch[j].name;
2839                   cpu_sub_arch_name = NULL;
2840                   cpu_arch_flags = cpu_arch[j].flags;
2841                   if (flag_code == CODE_64BIT)
2842                     {
2843                       cpu_arch_flags.bitfield.cpu64 = 1;
2844                       cpu_arch_flags.bitfield.cpuno64 = 0;
2845                     }
2846                   else
2847                     {
2848                       cpu_arch_flags.bitfield.cpu64 = 0;
2849                       cpu_arch_flags.bitfield.cpuno64 = 1;
2850                     }
2851                   cpu_arch_isa = cpu_arch[j].type;
2852                   cpu_arch_isa_flags = cpu_arch[j].flags;
2853                   if (!cpu_arch_tune_set)
2854                     {
2855                       cpu_arch_tune = cpu_arch_isa;
2856                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2857                     }
2858                   break;
2859                 }
2860
2861               flags = cpu_flags_or (cpu_arch_flags,
2862                                     cpu_arch[j].flags);
2863
2864               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2865                 {
2866                   if (cpu_sub_arch_name)
2867                     {
2868                       char *name = cpu_sub_arch_name;
2869                       cpu_sub_arch_name = concat (name,
2870                                                   cpu_arch[j].name,
2871                                                   (const char *) NULL);
2872                       free (name);
2873                     }
2874                   else
2875                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2876                   cpu_arch_flags = flags;
2877                   cpu_arch_isa_flags = flags;
2878                 }
2879               else
2880                 cpu_arch_isa_flags
2881                   = cpu_flags_or (cpu_arch_isa_flags,
2882                                   cpu_arch[j].flags);
2883               (void) restore_line_pointer (e);
2884               demand_empty_rest_of_line ();
2885               return;
2886             }
2887         }
2888
2889       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2890         {
2891           /* Disable an ISA extension.  */
2892           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2893             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2894               {
2895                 flags = cpu_flags_and_not (cpu_arch_flags,
2896                                            cpu_noarch[j].flags);
2897                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898                   {
2899                     if (cpu_sub_arch_name)
2900                       {
2901                         char *name = cpu_sub_arch_name;
2902                         cpu_sub_arch_name = concat (name, string,
2903                                                     (const char *) NULL);
2904                         free (name);
2905                       }
2906                     else
2907                       cpu_sub_arch_name = xstrdup (string);
2908                     cpu_arch_flags = flags;
2909                     cpu_arch_isa_flags = flags;
2910                   }
2911                 (void) restore_line_pointer (e);
2912                 demand_empty_rest_of_line ();
2913                 return;
2914               }
2915
2916           j = ARRAY_SIZE (cpu_arch);
2917         }
2918
2919       if (j >= ARRAY_SIZE (cpu_arch))
2920         as_bad (_("no such architecture: `%s'"), string);
2921
2922       *input_line_pointer = e;
2923     }
2924   else
2925     as_bad (_("missing cpu architecture"));
2926
2927   no_cond_jump_promotion = 0;
2928   if (*input_line_pointer == ','
2929       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2930     {
2931       char *string;
2932       char e;
2933
2934       ++input_line_pointer;
2935       e = get_symbol_name (&string);
2936
2937       if (strcmp (string, "nojumps") == 0)
2938         no_cond_jump_promotion = 1;
2939       else if (strcmp (string, "jumps") == 0)
2940         ;
2941       else
2942         as_bad (_("no such architecture modifier: `%s'"), string);
2943
2944       (void) restore_line_pointer (e);
2945     }
2946
2947   demand_empty_rest_of_line ();
2948 }
2949
2950 enum bfd_architecture
2951 i386_arch (void)
2952 {
2953   if (cpu_arch_isa == PROCESSOR_L1OM)
2954     {
2955       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2956           || flag_code != CODE_64BIT)
2957         as_fatal (_("Intel L1OM is 64bit ELF only"));
2958       return bfd_arch_l1om;
2959     }
2960   else if (cpu_arch_isa == PROCESSOR_K1OM)
2961     {
2962       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2963           || flag_code != CODE_64BIT)
2964         as_fatal (_("Intel K1OM is 64bit ELF only"));
2965       return bfd_arch_k1om;
2966     }
2967   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2968     {
2969       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2970           || flag_code == CODE_64BIT)
2971         as_fatal (_("Intel MCU is 32bit ELF only"));
2972       return bfd_arch_iamcu;
2973     }
2974   else
2975     return bfd_arch_i386;
2976 }
2977
2978 unsigned long
2979 i386_mach (void)
2980 {
2981   if (!strncmp (default_arch, "x86_64", 6))
2982     {
2983       if (cpu_arch_isa == PROCESSOR_L1OM)
2984         {
2985           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986               || default_arch[6] != '\0')
2987             as_fatal (_("Intel L1OM is 64bit ELF only"));
2988           return bfd_mach_l1om;
2989         }
2990       else if (cpu_arch_isa == PROCESSOR_K1OM)
2991         {
2992           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993               || default_arch[6] != '\0')
2994             as_fatal (_("Intel K1OM is 64bit ELF only"));
2995           return bfd_mach_k1om;
2996         }
2997       else if (default_arch[6] == '\0')
2998         return bfd_mach_x86_64;
2999       else
3000         return bfd_mach_x64_32;
3001     }
3002   else if (!strcmp (default_arch, "i386")
3003            || !strcmp (default_arch, "iamcu"))
3004     {
3005       if (cpu_arch_isa == PROCESSOR_IAMCU)
3006         {
3007           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3008             as_fatal (_("Intel MCU is 32bit ELF only"));
3009           return bfd_mach_i386_iamcu;
3010         }
3011       else
3012         return bfd_mach_i386_i386;
3013     }
3014   else
3015     as_fatal (_("unknown architecture"));
3016 }
3017 \f
3018 void
3019 md_begin (void)
3020 {
3021   const char *hash_err;
3022
3023   /* Support pseudo prefixes like {disp32}.  */
3024   lex_type ['{'] = LEX_BEGIN_NAME;
3025
3026   /* Initialize op_hash hash table.  */
3027   op_hash = hash_new ();
3028
3029   {
3030     const insn_template *optab;
3031     templates *core_optab;
3032
3033     /* Setup for loop.  */
3034     optab = i386_optab;
3035     core_optab = XNEW (templates);
3036     core_optab->start = optab;
3037
3038     while (1)
3039       {
3040         ++optab;
3041         if (optab->name == NULL
3042             || strcmp (optab->name, (optab - 1)->name) != 0)
3043           {
3044             /* different name --> ship out current template list;
3045                add to hash table; & begin anew.  */
3046             core_optab->end = optab;
3047             hash_err = hash_insert (op_hash,
3048                                     (optab - 1)->name,
3049                                     (void *) core_optab);
3050             if (hash_err)
3051               {
3052                 as_fatal (_("can't hash %s: %s"),
3053                           (optab - 1)->name,
3054                           hash_err);
3055               }
3056             if (optab->name == NULL)
3057               break;
3058             core_optab = XNEW (templates);
3059             core_optab->start = optab;
3060           }
3061       }
3062   }
3063
3064   /* Initialize reg_hash hash table.  */
3065   reg_hash = hash_new ();
3066   {
3067     const reg_entry *regtab;
3068     unsigned int regtab_size = i386_regtab_size;
3069
3070     for (regtab = i386_regtab; regtab_size--; regtab++)
3071       {
3072         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3073         if (hash_err)
3074           as_fatal (_("can't hash %s: %s"),
3075                     regtab->reg_name,
3076                     hash_err);
3077       }
3078   }
3079
3080   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3081   {
3082     int c;
3083     char *p;
3084
3085     for (c = 0; c < 256; c++)
3086       {
3087         if (ISDIGIT (c))
3088           {
3089             digit_chars[c] = c;
3090             mnemonic_chars[c] = c;
3091             register_chars[c] = c;
3092             operand_chars[c] = c;
3093           }
3094         else if (ISLOWER (c))
3095           {
3096             mnemonic_chars[c] = c;
3097             register_chars[c] = c;
3098             operand_chars[c] = c;
3099           }
3100         else if (ISUPPER (c))
3101           {
3102             mnemonic_chars[c] = TOLOWER (c);
3103             register_chars[c] = mnemonic_chars[c];
3104             operand_chars[c] = c;
3105           }
3106         else if (c == '{' || c == '}')
3107           {
3108             mnemonic_chars[c] = c;
3109             operand_chars[c] = c;
3110           }
3111
3112         if (ISALPHA (c) || ISDIGIT (c))
3113           identifier_chars[c] = c;
3114         else if (c >= 128)
3115           {
3116             identifier_chars[c] = c;
3117             operand_chars[c] = c;
3118           }
3119       }
3120
3121 #ifdef LEX_AT
3122     identifier_chars['@'] = '@';
3123 #endif
3124 #ifdef LEX_QM
3125     identifier_chars['?'] = '?';
3126     operand_chars['?'] = '?';
3127 #endif
3128     digit_chars['-'] = '-';
3129     mnemonic_chars['_'] = '_';
3130     mnemonic_chars['-'] = '-';
3131     mnemonic_chars['.'] = '.';
3132     identifier_chars['_'] = '_';
3133     identifier_chars['.'] = '.';
3134
3135     for (p = operand_special_chars; *p != '\0'; p++)
3136       operand_chars[(unsigned char) *p] = *p;
3137   }
3138
3139   if (flag_code == CODE_64BIT)
3140     {
3141 #if defined (OBJ_COFF) && defined (TE_PE)
3142       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3143                                   ? 32 : 16);
3144 #else
3145       x86_dwarf2_return_column = 16;
3146 #endif
3147       x86_cie_data_alignment = -8;
3148     }
3149   else
3150     {
3151       x86_dwarf2_return_column = 8;
3152       x86_cie_data_alignment = -4;
3153     }
3154
3155   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3156      can be turned into BRANCH_PREFIX frag.  */
3157   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3158     abort ();
3159 }
3160
3161 void
3162 i386_print_statistics (FILE *file)
3163 {
3164   hash_print_statistics (file, "i386 opcode", op_hash);
3165   hash_print_statistics (file, "i386 register", reg_hash);
3166 }
3167 \f
3168 #ifdef DEBUG386
3169
3170 /* Debugging routines for md_assemble.  */
3171 static void pte (insn_template *);
3172 static void pt (i386_operand_type);
3173 static void pe (expressionS *);
3174 static void ps (symbolS *);
3175
3176 static void
3177 pi (const char *line, i386_insn *x)
3178 {
3179   unsigned int j;
3180
3181   fprintf (stdout, "%s: template ", line);
3182   pte (&x->tm);
3183   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3184            x->base_reg ? x->base_reg->reg_name : "none",
3185            x->index_reg ? x->index_reg->reg_name : "none",
3186            x->log2_scale_factor);
3187   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3188            x->rm.mode, x->rm.reg, x->rm.regmem);
3189   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3190            x->sib.base, x->sib.index, x->sib.scale);
3191   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3192            (x->rex & REX_W) != 0,
3193            (x->rex & REX_R) != 0,
3194            (x->rex & REX_X) != 0,
3195            (x->rex & REX_B) != 0);
3196   for (j = 0; j < x->operands; j++)
3197     {
3198       fprintf (stdout, "    #%d:  ", j + 1);
3199       pt (x->types[j]);
3200       fprintf (stdout, "\n");
3201       if (x->types[j].bitfield.class == Reg
3202           || x->types[j].bitfield.class == RegMMX
3203           || x->types[j].bitfield.class == RegSIMD
3204           || x->types[j].bitfield.class == RegMask
3205           || x->types[j].bitfield.class == SReg
3206           || x->types[j].bitfield.class == RegCR
3207           || x->types[j].bitfield.class == RegDR
3208           || x->types[j].bitfield.class == RegTR
3209           || x->types[j].bitfield.class == RegBND)
3210         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3211       if (operand_type_check (x->types[j], imm))
3212         pe (x->op[j].imms);
3213       if (operand_type_check (x->types[j], disp))
3214         pe (x->op[j].disps);
3215     }
3216 }
3217
3218 static void
3219 pte (insn_template *t)
3220 {
3221   unsigned int j;
3222   fprintf (stdout, " %d operands ", t->operands);
3223   fprintf (stdout, "opcode %x ", t->base_opcode);
3224   if (t->extension_opcode != None)
3225     fprintf (stdout, "ext %x ", t->extension_opcode);
3226   if (t->opcode_modifier.d)
3227     fprintf (stdout, "D");
3228   if (t->opcode_modifier.w)
3229     fprintf (stdout, "W");
3230   fprintf (stdout, "\n");
3231   for (j = 0; j < t->operands; j++)
3232     {
3233       fprintf (stdout, "    #%d type ", j + 1);
3234       pt (t->operand_types[j]);
3235       fprintf (stdout, "\n");
3236     }
3237 }
3238
3239 static void
3240 pe (expressionS *e)
3241 {
3242   fprintf (stdout, "    operation     %d\n", e->X_op);
3243   fprintf (stdout, "    add_number    %ld (%lx)\n",
3244            (long) e->X_add_number, (long) e->X_add_number);
3245   if (e->X_add_symbol)
3246     {
3247       fprintf (stdout, "    add_symbol    ");
3248       ps (e->X_add_symbol);
3249       fprintf (stdout, "\n");
3250     }
3251   if (e->X_op_symbol)
3252     {
3253       fprintf (stdout, "    op_symbol    ");
3254       ps (e->X_op_symbol);
3255       fprintf (stdout, "\n");
3256     }
3257 }
3258
3259 static void
3260 ps (symbolS *s)
3261 {
3262   fprintf (stdout, "%s type %s%s",
3263            S_GET_NAME (s),
3264            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3265            segment_name (S_GET_SEGMENT (s)));
3266 }
3267
3268 static struct type_name
3269   {
3270     i386_operand_type mask;
3271     const char *name;
3272   }
3273 const type_names[] =
3274 {
3275   { OPERAND_TYPE_REG8, "r8" },
3276   { OPERAND_TYPE_REG16, "r16" },
3277   { OPERAND_TYPE_REG32, "r32" },
3278   { OPERAND_TYPE_REG64, "r64" },
3279   { OPERAND_TYPE_ACC8, "acc8" },
3280   { OPERAND_TYPE_ACC16, "acc16" },
3281   { OPERAND_TYPE_ACC32, "acc32" },
3282   { OPERAND_TYPE_ACC64, "acc64" },
3283   { OPERAND_TYPE_IMM8, "i8" },
3284   { OPERAND_TYPE_IMM8, "i8s" },
3285   { OPERAND_TYPE_IMM16, "i16" },
3286   { OPERAND_TYPE_IMM32, "i32" },
3287   { OPERAND_TYPE_IMM32S, "i32s" },
3288   { OPERAND_TYPE_IMM64, "i64" },
3289   { OPERAND_TYPE_IMM1, "i1" },
3290   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3291   { OPERAND_TYPE_DISP8, "d8" },
3292   { OPERAND_TYPE_DISP16, "d16" },
3293   { OPERAND_TYPE_DISP32, "d32" },
3294   { OPERAND_TYPE_DISP32S, "d32s" },
3295   { OPERAND_TYPE_DISP64, "d64" },
3296   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3297   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3298   { OPERAND_TYPE_CONTROL, "control reg" },
3299   { OPERAND_TYPE_TEST, "test reg" },
3300   { OPERAND_TYPE_DEBUG, "debug reg" },
3301   { OPERAND_TYPE_FLOATREG, "FReg" },
3302   { OPERAND_TYPE_FLOATACC, "FAcc" },
3303   { OPERAND_TYPE_SREG, "SReg" },
3304   { OPERAND_TYPE_REGMMX, "rMMX" },
3305   { OPERAND_TYPE_REGXMM, "rXMM" },
3306   { OPERAND_TYPE_REGYMM, "rYMM" },
3307   { OPERAND_TYPE_REGZMM, "rZMM" },
3308   { OPERAND_TYPE_REGMASK, "Mask reg" },
3309 };
3310
3311 static void
3312 pt (i386_operand_type t)
3313 {
3314   unsigned int j;
3315   i386_operand_type a;
3316
3317   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3318     {
3319       a = operand_type_and (t, type_names[j].mask);
3320       if (operand_type_equal (&a, &type_names[j].mask))
3321         fprintf (stdout, "%s, ",  type_names[j].name);
3322     }
3323   fflush (stdout);
3324 }
3325
3326 #endif /* DEBUG386 */
3327 \f
3328 static bfd_reloc_code_real_type
3329 reloc (unsigned int size,
3330        int pcrel,
3331        int sign,
3332        bfd_reloc_code_real_type other)
3333 {
3334   if (other != NO_RELOC)
3335     {
3336       reloc_howto_type *rel;
3337
3338       if (size == 8)
3339         switch (other)
3340           {
3341           case BFD_RELOC_X86_64_GOT32:
3342             return BFD_RELOC_X86_64_GOT64;
3343             break;
3344           case BFD_RELOC_X86_64_GOTPLT64:
3345             return BFD_RELOC_X86_64_GOTPLT64;
3346             break;
3347           case BFD_RELOC_X86_64_PLTOFF64:
3348             return BFD_RELOC_X86_64_PLTOFF64;
3349             break;
3350           case BFD_RELOC_X86_64_GOTPC32:
3351             other = BFD_RELOC_X86_64_GOTPC64;
3352             break;
3353           case BFD_RELOC_X86_64_GOTPCREL:
3354             other = BFD_RELOC_X86_64_GOTPCREL64;
3355             break;
3356           case BFD_RELOC_X86_64_TPOFF32:
3357             other = BFD_RELOC_X86_64_TPOFF64;
3358             break;
3359           case BFD_RELOC_X86_64_DTPOFF32:
3360             other = BFD_RELOC_X86_64_DTPOFF64;
3361             break;
3362           default:
3363             break;
3364           }
3365
3366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3367       if (other == BFD_RELOC_SIZE32)
3368         {
3369           if (size == 8)
3370             other = BFD_RELOC_SIZE64;
3371           if (pcrel)
3372             {
3373               as_bad (_("there are no pc-relative size relocations"));
3374               return NO_RELOC;
3375             }
3376         }
3377 #endif
3378
3379       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3380       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3381         sign = -1;
3382
3383       rel = bfd_reloc_type_lookup (stdoutput, other);
3384       if (!rel)
3385         as_bad (_("unknown relocation (%u)"), other);
3386       else if (size != bfd_get_reloc_size (rel))
3387         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3388                 bfd_get_reloc_size (rel),
3389                 size);
3390       else if (pcrel && !rel->pc_relative)
3391         as_bad (_("non-pc-relative relocation for pc-relative field"));
3392       else if ((rel->complain_on_overflow == complain_overflow_signed
3393                 && !sign)
3394                || (rel->complain_on_overflow == complain_overflow_unsigned
3395                    && sign > 0))
3396         as_bad (_("relocated field and relocation type differ in signedness"));
3397       else
3398         return other;
3399       return NO_RELOC;
3400     }
3401
3402   if (pcrel)
3403     {
3404       if (!sign)
3405         as_bad (_("there are no unsigned pc-relative relocations"));
3406       switch (size)
3407         {
3408         case 1: return BFD_RELOC_8_PCREL;
3409         case 2: return BFD_RELOC_16_PCREL;
3410         case 4: return BFD_RELOC_32_PCREL;
3411         case 8: return BFD_RELOC_64_PCREL;
3412         }
3413       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3414     }
3415   else
3416     {
3417       if (sign > 0)
3418         switch (size)
3419           {
3420           case 4: return BFD_RELOC_X86_64_32S;
3421           }
3422       else
3423         switch (size)
3424           {
3425           case 1: return BFD_RELOC_8;
3426           case 2: return BFD_RELOC_16;
3427           case 4: return BFD_RELOC_32;
3428           case 8: return BFD_RELOC_64;
3429           }
3430       as_bad (_("cannot do %s %u byte relocation"),
3431               sign > 0 ? "signed" : "unsigned", size);
3432     }
3433
3434   return NO_RELOC;
3435 }
3436
3437 /* Here we decide which fixups can be adjusted to make them relative to
3438    the beginning of the section instead of the symbol.  Basically we need
3439    to make sure that the dynamic relocations are done correctly, so in
3440    some cases we force the original symbol to be used.  */
3441
3442 int
3443 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3444 {
3445 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3446   if (!IS_ELF)
3447     return 1;
3448
3449   /* Don't adjust pc-relative references to merge sections in 64-bit
3450      mode.  */
3451   if (use_rela_relocations
3452       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453       && fixP->fx_pcrel)
3454     return 0;
3455
3456   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3457      and changed later by validate_fix.  */
3458   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460     return 0;
3461
3462   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3463      for size relocations.  */
3464   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465       || fixP->fx_r_type == BFD_RELOC_SIZE64
3466       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3467       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3468       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3469       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3473       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3475       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3477       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3479       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3480       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3481       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3483       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3486       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3487       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3489       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3491       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3493       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495     return 0;
3496 #endif
3497   return 1;
3498 }
3499
3500 static int
3501 intel_float_operand (const char *mnemonic)
3502 {
3503   /* Note that the value returned is meaningful only for opcodes with (memory)
3504      operands, hence the code here is free to improperly handle opcodes that
3505      have no operands (for better performance and smaller code). */
3506
3507   if (mnemonic[0] != 'f')
3508     return 0; /* non-math */
3509
3510   switch (mnemonic[1])
3511     {
3512     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513        the fs segment override prefix not currently handled because no
3514        call path can make opcodes without operands get here */
3515     case 'i':
3516       return 2 /* integer op */;
3517     case 'l':
3518       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519         return 3; /* fldcw/fldenv */
3520       break;
3521     case 'n':
3522       if (mnemonic[2] != 'o' /* fnop */)
3523         return 3; /* non-waiting control op */
3524       break;
3525     case 'r':
3526       if (mnemonic[2] == 's')
3527         return 3; /* frstor/frstpm */
3528       break;
3529     case 's':
3530       if (mnemonic[2] == 'a')
3531         return 3; /* fsave */
3532       if (mnemonic[2] == 't')
3533         {
3534           switch (mnemonic[3])
3535             {
3536             case 'c': /* fstcw */
3537             case 'd': /* fstdw */
3538             case 'e': /* fstenv */
3539             case 's': /* fsts[gw] */
3540               return 3;
3541             }
3542         }
3543       break;
3544     case 'x':
3545       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546         return 0; /* fxsave/fxrstor are not really math ops */
3547       break;
3548     }
3549
3550   return 1;
3551 }
3552
3553 /* Build the VEX prefix.  */
3554
3555 static void
3556 build_vex_prefix (const insn_template *t)
3557 {
3558   unsigned int register_specifier;
3559   unsigned int implied_prefix;
3560   unsigned int vector_length;
3561   unsigned int w;
3562
3563   /* Check register specifier.  */
3564   if (i.vex.register_specifier)
3565     {
3566       register_specifier =
3567         ~register_number (i.vex.register_specifier) & 0xf;
3568       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569     }
3570   else
3571     register_specifier = 0xf;
3572
3573   /* Use 2-byte VEX prefix by swapping destination and source operand
3574      if there are more than 1 register operand.  */
3575   if (i.reg_operands > 1
3576       && i.vec_encoding != vex_encoding_vex3
3577       && i.dir_encoding == dir_encoding_default
3578       && i.operands == i.reg_operands
3579       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3580       && i.tm.opcode_modifier.vexopcode == VEX0F
3581       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3582       && i.rex == REX_B)
3583     {
3584       unsigned int xchg = i.operands - 1;
3585       union i386_op temp_op;
3586       i386_operand_type temp_type;
3587
3588       temp_type = i.types[xchg];
3589       i.types[xchg] = i.types[0];
3590       i.types[0] = temp_type;
3591       temp_op = i.op[xchg];
3592       i.op[xchg] = i.op[0];
3593       i.op[0] = temp_op;
3594
3595       gas_assert (i.rm.mode == 3);
3596
3597       i.rex = REX_R;
3598       xchg = i.rm.regmem;
3599       i.rm.regmem = i.rm.reg;
3600       i.rm.reg = xchg;
3601
3602       if (i.tm.opcode_modifier.d)
3603         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605       else /* Use the next insn.  */
3606         i.tm = t[1];
3607     }
3608
3609   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610      are no memory operands and at least 3 register ones.  */
3611   if (i.reg_operands >= 3
3612       && i.vec_encoding != vex_encoding_vex3
3613       && i.reg_operands == i.operands - i.imm_operands
3614       && i.tm.opcode_modifier.vex
3615       && i.tm.opcode_modifier.commutative
3616       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617       && i.rex == REX_B
3618       && i.vex.register_specifier
3619       && !(i.vex.register_specifier->reg_flags & RegRex))
3620     {
3621       unsigned int xchg = i.operands - i.reg_operands;
3622       union i386_op temp_op;
3623       i386_operand_type temp_type;
3624
3625       gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626       gas_assert (!i.tm.opcode_modifier.sae);
3627       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628                                       &i.types[i.operands - 3]));
3629       gas_assert (i.rm.mode == 3);
3630
3631       temp_type = i.types[xchg];
3632       i.types[xchg] = i.types[xchg + 1];
3633       i.types[xchg + 1] = temp_type;
3634       temp_op = i.op[xchg];
3635       i.op[xchg] = i.op[xchg + 1];
3636       i.op[xchg + 1] = temp_op;
3637
3638       i.rex = 0;
3639       xchg = i.rm.regmem | 8;
3640       i.rm.regmem = ~register_specifier & 0xf;
3641       gas_assert (!(i.rm.regmem & 8));
3642       i.vex.register_specifier += xchg - i.rm.regmem;
3643       register_specifier = ~xchg & 0xf;
3644     }
3645
3646   if (i.tm.opcode_modifier.vex == VEXScalar)
3647     vector_length = avxscalar;
3648   else if (i.tm.opcode_modifier.vex == VEX256)
3649     vector_length = 1;
3650   else
3651     {
3652       unsigned int op;
3653
3654       /* Determine vector length from the last multi-length vector
3655          operand.  */
3656       vector_length = 0;
3657       for (op = t->operands; op--;)
3658         if (t->operand_types[op].bitfield.xmmword
3659             && t->operand_types[op].bitfield.ymmword
3660             && i.types[op].bitfield.ymmword)
3661           {
3662             vector_length = 1;
3663             break;
3664           }
3665     }
3666
3667   switch ((i.tm.base_opcode >> 8) & 0xff)
3668     {
3669     case 0:
3670       implied_prefix = 0;
3671       break;
3672     case DATA_PREFIX_OPCODE:
3673       implied_prefix = 1;
3674       break;
3675     case REPE_PREFIX_OPCODE:
3676       implied_prefix = 2;
3677       break;
3678     case REPNE_PREFIX_OPCODE:
3679       implied_prefix = 3;
3680       break;
3681     default:
3682       abort ();
3683     }
3684
3685   /* Check the REX.W bit and VEXW.  */
3686   if (i.tm.opcode_modifier.vexw == VEXWIG)
3687     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688   else if (i.tm.opcode_modifier.vexw)
3689     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690   else
3691     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3692
3693   /* Use 2-byte VEX prefix if possible.  */
3694   if (w == 0
3695       && i.vec_encoding != vex_encoding_vex3
3696       && i.tm.opcode_modifier.vexopcode == VEX0F
3697       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698     {
3699       /* 2-byte VEX prefix.  */
3700       unsigned int r;
3701
3702       i.vex.length = 2;
3703       i.vex.bytes[0] = 0xc5;
3704
3705       /* Check the REX.R bit.  */
3706       r = (i.rex & REX_R) ? 0 : 1;
3707       i.vex.bytes[1] = (r << 7
3708                         | register_specifier << 3
3709                         | vector_length << 2
3710                         | implied_prefix);
3711     }
3712   else
3713     {
3714       /* 3-byte VEX prefix.  */
3715       unsigned int m;
3716
3717       i.vex.length = 3;
3718
3719       switch (i.tm.opcode_modifier.vexopcode)
3720         {
3721         case VEX0F:
3722           m = 0x1;
3723           i.vex.bytes[0] = 0xc4;
3724           break;
3725         case VEX0F38:
3726           m = 0x2;
3727           i.vex.bytes[0] = 0xc4;
3728           break;
3729         case VEX0F3A:
3730           m = 0x3;
3731           i.vex.bytes[0] = 0xc4;
3732           break;
3733         case XOP08:
3734           m = 0x8;
3735           i.vex.bytes[0] = 0x8f;
3736           break;
3737         case XOP09:
3738           m = 0x9;
3739           i.vex.bytes[0] = 0x8f;
3740           break;
3741         case XOP0A:
3742           m = 0xa;
3743           i.vex.bytes[0] = 0x8f;
3744           break;
3745         default:
3746           abort ();
3747         }
3748
3749       /* The high 3 bits of the second VEX byte are 1's compliment
3750          of RXB bits from REX.  */
3751       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
3753       i.vex.bytes[2] = (w << 7
3754                         | register_specifier << 3
3755                         | vector_length << 2
3756                         | implied_prefix);
3757     }
3758 }
3759
3760 static INLINE bfd_boolean
3761 is_evex_encoding (const insn_template *t)
3762 {
3763   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3764          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3765          || t->opcode_modifier.sae;
3766 }
3767
3768 static INLINE bfd_boolean
3769 is_any_vex_encoding (const insn_template *t)
3770 {
3771   return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772          || is_evex_encoding (t);
3773 }
3774
3775 /* Build the EVEX prefix.  */
3776
3777 static void
3778 build_evex_prefix (void)
3779 {
3780   unsigned int register_specifier;
3781   unsigned int implied_prefix;
3782   unsigned int m, w;
3783   rex_byte vrex_used = 0;
3784
3785   /* Check register specifier.  */
3786   if (i.vex.register_specifier)
3787     {
3788       gas_assert ((i.vrex & REX_X) == 0);
3789
3790       register_specifier = i.vex.register_specifier->reg_num;
3791       if ((i.vex.register_specifier->reg_flags & RegRex))
3792         register_specifier += 8;
3793       /* The upper 16 registers are encoded in the fourth byte of the
3794          EVEX prefix.  */
3795       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796         i.vex.bytes[3] = 0x8;
3797       register_specifier = ~register_specifier & 0xf;
3798     }
3799   else
3800     {
3801       register_specifier = 0xf;
3802
3803       /* Encode upper 16 vector index register in the fourth byte of
3804          the EVEX prefix.  */
3805       if (!(i.vrex & REX_X))
3806         i.vex.bytes[3] = 0x8;
3807       else
3808         vrex_used |= REX_X;
3809     }
3810
3811   switch ((i.tm.base_opcode >> 8) & 0xff)
3812     {
3813     case 0:
3814       implied_prefix = 0;
3815       break;
3816     case DATA_PREFIX_OPCODE:
3817       implied_prefix = 1;
3818       break;
3819     case REPE_PREFIX_OPCODE:
3820       implied_prefix = 2;
3821       break;
3822     case REPNE_PREFIX_OPCODE:
3823       implied_prefix = 3;
3824       break;
3825     default:
3826       abort ();
3827     }
3828
3829   /* 4 byte EVEX prefix.  */
3830   i.vex.length = 4;
3831   i.vex.bytes[0] = 0x62;
3832
3833   /* mmmm bits.  */
3834   switch (i.tm.opcode_modifier.vexopcode)
3835     {
3836     case VEX0F:
3837       m = 1;
3838       break;
3839     case VEX0F38:
3840       m = 2;
3841       break;
3842     case VEX0F3A:
3843       m = 3;
3844       break;
3845     default:
3846       abort ();
3847       break;
3848     }
3849
3850   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3851      bits from REX.  */
3852   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854   /* The fifth bit of the second EVEX byte is 1's compliment of the
3855      REX_R bit in VREX.  */
3856   if (!(i.vrex & REX_R))
3857     i.vex.bytes[1] |= 0x10;
3858   else
3859     vrex_used |= REX_R;
3860
3861   if ((i.reg_operands + i.imm_operands) == i.operands)
3862     {
3863       /* When all operands are registers, the REX_X bit in REX is not
3864          used.  We reuse it to encode the upper 16 registers, which is
3865          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3866          as 1's compliment.  */
3867       if ((i.vrex & REX_B))
3868         {
3869           vrex_used |= REX_B;
3870           i.vex.bytes[1] &= ~0x40;
3871         }
3872     }
3873
3874   /* EVEX instructions shouldn't need the REX prefix.  */
3875   i.vrex &= ~vrex_used;
3876   gas_assert (i.vrex == 0);
3877
3878   /* Check the REX.W bit and VEXW.  */
3879   if (i.tm.opcode_modifier.vexw == VEXWIG)
3880     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881   else if (i.tm.opcode_modifier.vexw)
3882     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883   else
3884     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3885
3886   /* Encode the U bit.  */
3887   implied_prefix |= 0x4;
3888
3889   /* The third byte of the EVEX prefix.  */
3890   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892   /* The fourth byte of the EVEX prefix.  */
3893   /* The zeroing-masking bit.  */
3894   if (i.mask && i.mask->zeroing)
3895     i.vex.bytes[3] |= 0x80;
3896
3897   /* Don't always set the broadcast bit if there is no RC.  */
3898   if (!i.rounding)
3899     {
3900       /* Encode the vector length.  */
3901       unsigned int vec_length;
3902
3903       if (!i.tm.opcode_modifier.evex
3904           || i.tm.opcode_modifier.evex == EVEXDYN)
3905         {
3906           unsigned int op;
3907
3908           /* Determine vector length from the last multi-length vector
3909              operand.  */
3910           for (op = i.operands; op--;)
3911             if (i.tm.operand_types[op].bitfield.xmmword
3912                 + i.tm.operand_types[op].bitfield.ymmword
3913                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914               {
3915                 if (i.types[op].bitfield.zmmword)
3916                   {
3917                     i.tm.opcode_modifier.evex = EVEX512;
3918                     break;
3919                   }
3920                 else if (i.types[op].bitfield.ymmword)
3921                   {
3922                     i.tm.opcode_modifier.evex = EVEX256;
3923                     break;
3924                   }
3925                 else if (i.types[op].bitfield.xmmword)
3926                   {
3927                     i.tm.opcode_modifier.evex = EVEX128;
3928                     break;
3929                   }
3930                 else if (i.broadcast && (int) op == i.broadcast->operand)
3931                   {
3932                     switch (i.broadcast->bytes)
3933                       {
3934                         case 64:
3935                           i.tm.opcode_modifier.evex = EVEX512;
3936                           break;
3937                         case 32:
3938                           i.tm.opcode_modifier.evex = EVEX256;
3939                           break;
3940                         case 16:
3941                           i.tm.opcode_modifier.evex = EVEX128;
3942                           break;
3943                         default:
3944                           abort ();
3945                       }
3946                     break;
3947                   }
3948               }
3949
3950           if (op >= MAX_OPERANDS)
3951             abort ();
3952         }
3953
3954       switch (i.tm.opcode_modifier.evex)
3955         {
3956         case EVEXLIG: /* LL' is ignored */
3957           vec_length = evexlig << 5;
3958           break;
3959         case EVEX128:
3960           vec_length = 0 << 5;
3961           break;
3962         case EVEX256:
3963           vec_length = 1 << 5;
3964           break;
3965         case EVEX512:
3966           vec_length = 2 << 5;
3967           break;
3968         default:
3969           abort ();
3970           break;
3971         }
3972       i.vex.bytes[3] |= vec_length;
3973       /* Encode the broadcast bit.  */
3974       if (i.broadcast)
3975         i.vex.bytes[3] |= 0x10;
3976     }
3977   else
3978     {
3979       if (i.rounding->type != saeonly)
3980         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981       else
3982         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3983     }
3984
3985   if (i.mask && i.mask->mask)
3986     i.vex.bytes[3] |= i.mask->mask->reg_num;
3987 }
3988
3989 static void
3990 process_immext (void)
3991 {
3992   expressionS *exp;
3993
3994   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3995      which is coded in the same place as an 8-bit immediate field
3996      would be.  Here we fake an 8-bit immediate operand from the
3997      opcode suffix stored in tm.extension_opcode.
3998
3999      AVX instructions also use this encoding, for some of
4000      3 argument instructions.  */
4001
4002   gas_assert (i.imm_operands <= 1
4003               && (i.operands <= 2
4004                   || (is_any_vex_encoding (&i.tm)
4005                       && i.operands <= 4)));
4006
4007   exp = &im_expressions[i.imm_operands++];
4008   i.op[i.operands].imms = exp;
4009   i.types[i.operands] = imm8;
4010   i.operands++;
4011   exp->X_op = O_constant;
4012   exp->X_add_number = i.tm.extension_opcode;
4013   i.tm.extension_opcode = None;
4014 }
4015
4016
4017 static int
4018 check_hle (void)
4019 {
4020   switch (i.tm.opcode_modifier.hleprefixok)
4021     {
4022     default:
4023       abort ();
4024     case HLEPrefixNone:
4025       as_bad (_("invalid instruction `%s' after `%s'"),
4026               i.tm.name, i.hle_prefix);
4027       return 0;
4028     case HLEPrefixLock:
4029       if (i.prefix[LOCK_PREFIX])
4030         return 1;
4031       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4032       return 0;
4033     case HLEPrefixAny:
4034       return 1;
4035     case HLEPrefixRelease:
4036       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037         {
4038           as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039                   i.tm.name);
4040           return 0;
4041         }
4042       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4043         {
4044           as_bad (_("memory destination needed for instruction `%s'"
4045                     " after `xrelease'"), i.tm.name);
4046           return 0;
4047         }
4048       return 1;
4049     }
4050 }
4051
4052 /* Try the shortest encoding by shortening operand size.  */
4053
4054 static void
4055 optimize_encoding (void)
4056 {
4057   unsigned int j;
4058
4059   if (optimize_for_space
4060       && !is_any_vex_encoding (&i.tm)
4061       && i.reg_operands == 1
4062       && i.imm_operands == 1
4063       && !i.types[1].bitfield.byte
4064       && i.op[0].imms->X_op == O_constant
4065       && fits_in_imm7 (i.op[0].imms->X_add_number)
4066       && (i.tm.base_opcode == 0xa8
4067           || (i.tm.base_opcode == 0xf6
4068               && i.tm.extension_opcode == 0x0)))
4069     {
4070       /* Optimize: -Os:
4071            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4072        */
4073       unsigned int base_regnum = i.op[1].regs->reg_num;
4074       if (flag_code == CODE_64BIT || base_regnum < 4)
4075         {
4076           i.types[1].bitfield.byte = 1;
4077           /* Ignore the suffix.  */
4078           i.suffix = 0;
4079           /* Convert to byte registers.  */
4080           if (i.types[1].bitfield.word)
4081             j = 16;
4082           else if (i.types[1].bitfield.dword)
4083             j = 32;
4084           else
4085             j = 48;
4086           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087             j += 8;
4088           i.op[1].regs -= j;
4089         }
4090     }
4091   else if (flag_code == CODE_64BIT
4092            && !is_any_vex_encoding (&i.tm)
4093            && ((i.types[1].bitfield.qword
4094                 && i.reg_operands == 1
4095                 && i.imm_operands == 1
4096                 && i.op[0].imms->X_op == O_constant
4097                 && ((i.tm.base_opcode == 0xb8
4098                      && i.tm.extension_opcode == None
4099                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4101                         && ((i.tm.base_opcode == 0x24
4102                              || i.tm.base_opcode == 0xa8)
4103                             || (i.tm.base_opcode == 0x80
4104                                 && i.tm.extension_opcode == 0x4)
4105                             || ((i.tm.base_opcode == 0xf6
4106                                  || (i.tm.base_opcode | 1) == 0xc7)
4107                                 && i.tm.extension_opcode == 0x0)))
4108                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109                         && i.tm.base_opcode == 0x83
4110                         && i.tm.extension_opcode == 0x4)))
4111                || (i.types[0].bitfield.qword
4112                    && ((i.reg_operands == 2
4113                         && i.op[0].regs == i.op[1].regs
4114                         && (i.tm.base_opcode == 0x30
4115                             || i.tm.base_opcode == 0x28))
4116                        || (i.reg_operands == 1
4117                            && i.operands == 1
4118                            && i.tm.base_opcode == 0x30)))))
4119     {
4120       /* Optimize: -O:
4121            andq $imm31, %r64   -> andl $imm31, %r32
4122            andq $imm7, %r64    -> andl $imm7, %r32
4123            testq $imm31, %r64  -> testl $imm31, %r32
4124            xorq %r64, %r64     -> xorl %r32, %r32
4125            subq %r64, %r64     -> subl %r32, %r32
4126            movq $imm31, %r64   -> movl $imm31, %r32
4127            movq $imm32, %r64   -> movl $imm32, %r32
4128         */
4129       i.tm.opcode_modifier.norex64 = 1;
4130       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4131         {
4132           /* Handle
4133                movq $imm31, %r64   -> movl $imm31, %r32
4134                movq $imm32, %r64   -> movl $imm32, %r32
4135            */
4136           i.tm.operand_types[0].bitfield.imm32 = 1;
4137           i.tm.operand_types[0].bitfield.imm32s = 0;
4138           i.tm.operand_types[0].bitfield.imm64 = 0;
4139           i.types[0].bitfield.imm32 = 1;
4140           i.types[0].bitfield.imm32s = 0;
4141           i.types[0].bitfield.imm64 = 0;
4142           i.types[1].bitfield.dword = 1;
4143           i.types[1].bitfield.qword = 0;
4144           if ((i.tm.base_opcode | 1) == 0xc7)
4145             {
4146               /* Handle
4147                    movq $imm31, %r64   -> movl $imm31, %r32
4148                */
4149               i.tm.base_opcode = 0xb8;
4150               i.tm.extension_opcode = None;
4151               i.tm.opcode_modifier.w = 0;
4152               i.tm.opcode_modifier.modrm = 0;
4153             }
4154         }
4155     }
4156   else if (optimize > 1
4157            && !optimize_for_space
4158            && !is_any_vex_encoding (&i.tm)
4159            && i.reg_operands == 2
4160            && i.op[0].regs == i.op[1].regs
4161            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164     {
4165       /* Optimize: -O2:
4166            andb %rN, %rN  -> testb %rN, %rN
4167            andw %rN, %rN  -> testw %rN, %rN
4168            andq %rN, %rN  -> testq %rN, %rN
4169            orb %rN, %rN   -> testb %rN, %rN
4170            orw %rN, %rN   -> testw %rN, %rN
4171            orq %rN, %rN   -> testq %rN, %rN
4172
4173            and outside of 64-bit mode
4174
4175            andl %rN, %rN  -> testl %rN, %rN
4176            orl %rN, %rN   -> testl %rN, %rN
4177        */
4178       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179     }
4180   else if (i.reg_operands == 3
4181            && i.op[0].regs == i.op[1].regs
4182            && !i.types[2].bitfield.xmmword
4183            && (i.tm.opcode_modifier.vex
4184                || ((!i.mask || i.mask->zeroing)
4185                    && !i.rounding
4186                    && is_evex_encoding (&i.tm)
4187                    && (i.vec_encoding != vex_encoding_evex
4188                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4189                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4190                        || (i.tm.operand_types[2].bitfield.zmmword
4191                            && i.types[2].bitfield.ymmword))))
4192            && ((i.tm.base_opcode == 0x55
4193                 || i.tm.base_opcode == 0x6655
4194                 || i.tm.base_opcode == 0x66df
4195                 || i.tm.base_opcode == 0x57
4196                 || i.tm.base_opcode == 0x6657
4197                 || i.tm.base_opcode == 0x66ef
4198                 || i.tm.base_opcode == 0x66f8
4199                 || i.tm.base_opcode == 0x66f9
4200                 || i.tm.base_opcode == 0x66fa
4201                 || i.tm.base_opcode == 0x66fb
4202                 || i.tm.base_opcode == 0x42
4203                 || i.tm.base_opcode == 0x6642
4204                 || i.tm.base_opcode == 0x47
4205                 || i.tm.base_opcode == 0x6647)
4206                && i.tm.extension_opcode == None))
4207     {
4208       /* Optimize: -O1:
4209            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210            vpsubq and vpsubw:
4211              EVEX VOP %zmmM, %zmmM, %zmmN
4212                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4213                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4214              EVEX VOP %ymmM, %ymmM, %ymmN
4215                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4216                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4217              VEX VOP %ymmM, %ymmM, %ymmN
4218                -> VEX VOP %xmmM, %xmmM, %xmmN
4219            VOP, one of vpandn and vpxor:
4220              VEX VOP %ymmM, %ymmM, %ymmN
4221                -> VEX VOP %xmmM, %xmmM, %xmmN
4222            VOP, one of vpandnd and vpandnq:
4223              EVEX VOP %zmmM, %zmmM, %zmmN
4224                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4225                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4226              EVEX VOP %ymmM, %ymmM, %ymmN
4227                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4228                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229            VOP, one of vpxord and vpxorq:
4230              EVEX VOP %zmmM, %zmmM, %zmmN
4231                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4232                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4233              EVEX VOP %ymmM, %ymmM, %ymmN
4234                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4235                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4236            VOP, one of kxord and kxorq:
4237              VEX VOP %kM, %kM, %kN
4238                -> VEX kxorw %kM, %kM, %kN
4239            VOP, one of kandnd and kandnq:
4240              VEX VOP %kM, %kM, %kN
4241                -> VEX kandnw %kM, %kM, %kN
4242        */
4243       if (is_evex_encoding (&i.tm))
4244         {
4245           if (i.vec_encoding != vex_encoding_evex)
4246             {
4247               i.tm.opcode_modifier.vex = VEX128;
4248               i.tm.opcode_modifier.vexw = VEXW0;
4249               i.tm.opcode_modifier.evex = 0;
4250             }
4251           else if (optimize > 1)
4252             i.tm.opcode_modifier.evex = EVEX128;
4253           else
4254             return;
4255         }
4256       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4257         {
4258           i.tm.base_opcode &= 0xff;
4259           i.tm.opcode_modifier.vexw = VEXW0;
4260         }
4261       else
4262         i.tm.opcode_modifier.vex = VEX128;
4263
4264       if (i.tm.opcode_modifier.vex)
4265         for (j = 0; j < 3; j++)
4266           {
4267             i.types[j].bitfield.xmmword = 1;
4268             i.types[j].bitfield.ymmword = 0;
4269           }
4270     }
4271   else if (i.vec_encoding != vex_encoding_evex
4272            && !i.types[0].bitfield.zmmword
4273            && !i.types[1].bitfield.zmmword
4274            && !i.mask
4275            && !i.broadcast
4276            && is_evex_encoding (&i.tm)
4277            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4279                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280                || (i.tm.base_opcode & ~4) == 0x66db
4281                || (i.tm.base_opcode & ~4) == 0x66eb)
4282            && i.tm.extension_opcode == None)
4283     {
4284       /* Optimize: -O1:
4285            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286            vmovdqu32 and vmovdqu64:
4287              EVEX VOP %xmmM, %xmmN
4288                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289              EVEX VOP %ymmM, %ymmN
4290                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291              EVEX VOP %xmmM, mem
4292                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293              EVEX VOP %ymmM, mem
4294                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295              EVEX VOP mem, %xmmN
4296                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4297              EVEX VOP mem, %ymmN
4298                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4299            VOP, one of vpand, vpandn, vpor, vpxor:
4300              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304              EVEX VOP{d,q} mem, %xmmM, %xmmN
4305                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306              EVEX VOP{d,q} mem, %ymmM, %ymmN
4307                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4308        */
4309       for (j = 0; j < i.operands; j++)
4310         if (operand_type_check (i.types[j], disp)
4311             && i.op[j].disps->X_op == O_constant)
4312           {
4313             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4316             int evex_disp8, vex_disp8;
4317             unsigned int memshift = i.memshift;
4318             offsetT n = i.op[j].disps->X_add_number;
4319
4320             evex_disp8 = fits_in_disp8 (n);
4321             i.memshift = 0;
4322             vex_disp8 = fits_in_disp8 (n);
4323             if (evex_disp8 != vex_disp8)
4324               {
4325                 i.memshift = memshift;
4326                 return;
4327               }
4328
4329             i.types[j].bitfield.disp8 = vex_disp8;
4330             break;
4331           }
4332       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4334       i.tm.opcode_modifier.vex
4335         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336       i.tm.opcode_modifier.vexw = VEXW0;
4337       /* VPAND, VPOR, and VPXOR are commutative.  */
4338       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339         i.tm.opcode_modifier.commutative = 1;
4340       i.tm.opcode_modifier.evex = 0;
4341       i.tm.opcode_modifier.masking = 0;
4342       i.tm.opcode_modifier.broadcast = 0;
4343       i.tm.opcode_modifier.disp8memshift = 0;
4344       i.memshift = 0;
4345       if (j < i.operands)
4346         i.types[j].bitfield.disp8
4347           = fits_in_disp8 (i.op[j].disps->X_add_number);
4348     }
4349 }
4350
4351 /* Return non-zero for load instruction.  */
4352
4353 static int
4354 load_insn_p (void)
4355 {
4356   unsigned int dest;
4357   int any_vex_p = is_any_vex_encoding (&i.tm);
4358   unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360   if (!any_vex_p)
4361     {
4362       /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363          prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4364          bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote.  */
4365       if (i.tm.opcode_modifier.anysize)
4366         return 0;
4367
4368       /* pop, popf, popa.   */
4369       if (strcmp (i.tm.name, "pop") == 0
4370           || i.tm.base_opcode == 0x9d
4371           || i.tm.base_opcode == 0x61)
4372         return 1;
4373
4374       /* movs, cmps, lods, scas.  */
4375       if ((i.tm.base_opcode | 0xb) == 0xaf)
4376         return 1;
4377
4378       /* outs, xlatb.  */
4379       if (base_opcode == 0x6f
4380           || i.tm.base_opcode == 0xd7)
4381         return 1;
4382       /* NB: For AMD-specific insns with implicit memory operands,
4383          they're intentionally not covered.  */
4384     }
4385
4386   /* No memory operand.  */
4387   if (!i.mem_operands)
4388     return 0;
4389
4390   if (any_vex_p)
4391     {
4392       /* vldmxcsr.  */
4393       if (i.tm.base_opcode == 0xae
4394           && i.tm.opcode_modifier.vex
4395           && i.tm.opcode_modifier.vexopcode == VEX0F
4396           && i.tm.extension_opcode == 2)
4397         return 1;
4398     }
4399   else
4400     {
4401       /* test, not, neg, mul, imul, div, idiv.  */
4402       if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403           && i.tm.extension_opcode != 1)
4404         return 1;
4405
4406       /* inc, dec.  */
4407       if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408         return 1;
4409
4410       /* add, or, adc, sbb, and, sub, xor, cmp.  */
4411       if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412         return 1;
4413
4414       /* bt, bts, btr, btc.  */
4415       if (i.tm.base_opcode == 0xfba
4416           && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417         return 1;
4418
4419       /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420       if ((base_opcode == 0xc1
4421            || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422           && i.tm.extension_opcode != 6)
4423         return 1;
4424
4425       /* cmpxchg8b, cmpxchg16b, xrstors.  */
4426       if (i.tm.base_opcode == 0xfc7
4427           && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428         return 1;
4429
4430       /* fxrstor, ldmxcsr, xrstor.  */
4431       if (i.tm.base_opcode == 0xfae
4432           && (i.tm.extension_opcode == 1
4433               || i.tm.extension_opcode == 2
4434               || i.tm.extension_opcode == 5))
4435         return 1;
4436
4437       /* lgdt, lidt, lmsw.  */
4438       if (i.tm.base_opcode == 0xf01
4439           && (i.tm.extension_opcode == 2
4440               || i.tm.extension_opcode == 3
4441               || i.tm.extension_opcode == 6))
4442         return 1;
4443
4444       /* vmptrld */
4445       if (i.tm.base_opcode == 0xfc7
4446           && i.tm.extension_opcode == 6)
4447         return 1;
4448
4449       /* Check for x87 instructions.  */
4450       if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451         {
4452           /* Skip fst, fstp, fstenv, fstcw.  */
4453           if (i.tm.base_opcode == 0xd9
4454               && (i.tm.extension_opcode == 2
4455                   || i.tm.extension_opcode == 3
4456                   || i.tm.extension_opcode == 6
4457                   || i.tm.extension_opcode == 7))
4458             return 0;
4459
4460           /* Skip fisttp, fist, fistp, fstp.  */
4461           if (i.tm.base_opcode == 0xdb
4462               && (i.tm.extension_opcode == 1
4463                   || i.tm.extension_opcode == 2
4464                   || i.tm.extension_opcode == 3
4465                   || i.tm.extension_opcode == 7))
4466             return 0;
4467
4468           /* Skip fisttp, fst, fstp, fsave, fstsw.  */
4469           if (i.tm.base_opcode == 0xdd
4470               && (i.tm.extension_opcode == 1
4471                   || i.tm.extension_opcode == 2
4472                   || i.tm.extension_opcode == 3
4473                   || i.tm.extension_opcode == 6
4474                   || i.tm.extension_opcode == 7))
4475             return 0;
4476
4477           /* Skip fisttp, fist, fistp, fbstp, fistp.  */
4478           if (i.tm.base_opcode == 0xdf
4479               && (i.tm.extension_opcode == 1
4480                   || i.tm.extension_opcode == 2
4481                   || i.tm.extension_opcode == 3
4482                   || i.tm.extension_opcode == 6
4483                   || i.tm.extension_opcode == 7))
4484             return 0;
4485
4486           return 1;
4487         }
4488     }
4489
4490   dest = i.operands - 1;
4491
4492   /* Check fake imm8 operand and 3 source operands.  */
4493   if ((i.tm.opcode_modifier.immext
4494        || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495       && i.types[dest].bitfield.imm8)
4496     dest--;
4497
4498   /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd  */
4499   if (!any_vex_p
4500       && (base_opcode == 0x1
4501           || base_opcode == 0x9
4502           || base_opcode == 0x11
4503           || base_opcode == 0x19
4504           || base_opcode == 0x21
4505           || base_opcode == 0x29
4506           || base_opcode == 0x31
4507           || base_opcode == 0x39
4508           || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509           || base_opcode == 0xfc1))
4510     return 1;
4511
4512   /* Check for load instruction.  */
4513   return (i.types[dest].bitfield.class != ClassNone
4514           || i.types[dest].bitfield.instance == Accum);
4515 }
4516
4517 /* Output lfence, 0xfaee8, after instruction.  */
4518
4519 static void
4520 insert_lfence_after (void)
4521 {
4522   if (lfence_after_load && load_insn_p ())
4523     {
4524       /* There are also two REP string instructions that require
4525          special treatment. Specifically, the compare string (CMPS)
4526          and scan string (SCAS) instructions set EFLAGS in a manner
4527          that depends on the data being compared/scanned. When used
4528          with a REP prefix, the number of iterations may therefore
4529          vary depending on this data. If the data is a program secret
4530          chosen by the adversary using an LVI method,
4531          then this data-dependent behavior may leak some aspect
4532          of the secret.  */
4533       if (((i.tm.base_opcode | 0x1) == 0xa7
4534            || (i.tm.base_opcode | 0x1) == 0xaf)
4535           && i.prefix[REP_PREFIX])
4536         {
4537             as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538                      i.tm.name);
4539         }
4540       char *p = frag_more (3);
4541       *p++ = 0xf;
4542       *p++ = 0xae;
4543       *p = 0xe8;
4544     }
4545 }
4546
4547 /* Output lfence, 0xfaee8, before instruction.  */
4548
4549 static void
4550 insert_lfence_before (void)
4551 {
4552   char *p;
4553
4554   if (is_any_vex_encoding (&i.tm))
4555     return;
4556
4557   if (i.tm.base_opcode == 0xff
4558       && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559     {
4560       /* Insert lfence before indirect branch if needed.  */
4561
4562       if (lfence_before_indirect_branch == lfence_branch_none)
4563         return;
4564
4565       if (i.operands != 1)
4566         abort ();
4567
4568       if (i.reg_operands == 1)
4569         {
4570           /* Indirect branch via register.  Don't insert lfence with
4571              -mlfence-after-load=yes.  */
4572           if (lfence_after_load
4573               || lfence_before_indirect_branch == lfence_branch_memory)
4574             return;
4575         }
4576       else if (i.mem_operands == 1
4577                && lfence_before_indirect_branch != lfence_branch_register)
4578         {
4579           as_warn (_("indirect `%s` with memory operand should be avoided"),
4580                    i.tm.name);
4581           return;
4582         }
4583       else
4584         return;
4585
4586       if (last_insn.kind != last_insn_other
4587           && last_insn.seg == now_seg)
4588         {
4589           as_warn_where (last_insn.file, last_insn.line,
4590                          _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591                          last_insn.name, i.tm.name);
4592           return;
4593         }
4594
4595       p = frag_more (3);
4596       *p++ = 0xf;
4597       *p++ = 0xae;
4598       *p = 0xe8;
4599       return;
4600     }
4601
4602   /* Output or/not/shl and lfence before near ret.  */
4603   if (lfence_before_ret != lfence_before_ret_none
4604       && (i.tm.base_opcode == 0xc2
4605           || i.tm.base_opcode == 0xc3))
4606     {
4607       if (last_insn.kind != last_insn_other
4608           && last_insn.seg == now_seg)
4609         {
4610           as_warn_where (last_insn.file, last_insn.line,
4611                          _("`%s` skips -mlfence-before-ret on `%s`"),
4612                          last_insn.name, i.tm.name);
4613           return;
4614         }
4615
4616       /* Near ret ingore operand size override under CPU64.  */
4617       char prefix = flag_code == CODE_64BIT
4618                     ? 0x48
4619                     : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4620
4621       if (lfence_before_ret == lfence_before_ret_not)
4622         {
4623           /* not: 0xf71424, may add prefix
4624              for operand size override or 64-bit code.  */
4625           p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626           if (prefix)
4627             *p++ = prefix;
4628           *p++ = 0xf7;
4629           *p++ = 0x14;
4630           *p++ = 0x24;
4631           if (prefix)
4632             *p++ = prefix;
4633           *p++ = 0xf7;
4634           *p++ = 0x14;
4635           *p++ = 0x24;
4636         }
4637       else
4638         {
4639           p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640           if (prefix)
4641             *p++ = prefix;
4642           if (lfence_before_ret == lfence_before_ret_or)
4643             {
4644               /* or: 0x830c2400, may add prefix
4645                  for operand size override or 64-bit code.  */
4646               *p++ = 0x83;
4647               *p++ = 0x0c;
4648             }
4649           else
4650             {
4651               /* shl: 0xc1242400, may add prefix
4652                  for operand size override or 64-bit code.  */
4653               *p++ = 0xc1;
4654               *p++ = 0x24;
4655             }
4656
4657           *p++ = 0x24;
4658           *p++ = 0x0;
4659         }
4660
4661       *p++ = 0xf;
4662       *p++ = 0xae;
4663       *p = 0xe8;
4664     }
4665 }
4666
4667 /* This is the guts of the machine-dependent assembler.  LINE points to a
4668    machine dependent instruction.  This function is supposed to emit
4669    the frags/bytes it assembles to.  */
4670
4671 void
4672 md_assemble (char *line)
4673 {
4674   unsigned int j;
4675   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4676   const insn_template *t;
4677
4678   /* Initialize globals.  */
4679   memset (&i, '\0', sizeof (i));
4680   for (j = 0; j < MAX_OPERANDS; j++)
4681     i.reloc[j] = NO_RELOC;
4682   memset (disp_expressions, '\0', sizeof (disp_expressions));
4683   memset (im_expressions, '\0', sizeof (im_expressions));
4684   save_stack_p = save_stack;
4685
4686   /* First parse an instruction mnemonic & call i386_operand for the operands.
4687      We assume that the scrubber has arranged it so that line[0] is the valid
4688      start of a (possibly prefixed) mnemonic.  */
4689
4690   line = parse_insn (line, mnemonic);
4691   if (line == NULL)
4692     return;
4693   mnem_suffix = i.suffix;
4694
4695   line = parse_operands (line, mnemonic);
4696   this_operand = -1;
4697   xfree (i.memop1_string);
4698   i.memop1_string = NULL;
4699   if (line == NULL)
4700     return;
4701
4702   /* Now we've parsed the mnemonic into a set of templates, and have the
4703      operands at hand.  */
4704
4705   /* All Intel opcodes have reversed operands except for "bound", "enter",
4706      "monitor*", "mwait*", "tpause", and "umwait".  We also don't reverse
4707      intersegment "jmp" and "call" instructions with 2 immediate operands so
4708      that the immediate segment precedes the offset, as it does when in AT&T
4709      mode.  */
4710   if (intel_syntax
4711       && i.operands > 1
4712       && (strcmp (mnemonic, "bound") != 0)
4713       && (strcmp (mnemonic, "invlpga") != 0)
4714       && (strncmp (mnemonic, "monitor", 7) != 0)
4715       && (strncmp (mnemonic, "mwait", 5) != 0)
4716       && (strcmp (mnemonic, "tpause") != 0)
4717       && (strcmp (mnemonic, "umwait") != 0)
4718       && !(operand_type_check (i.types[0], imm)
4719            && operand_type_check (i.types[1], imm)))
4720     swap_operands ();
4721
4722   /* The order of the immediates should be reversed
4723      for 2 immediates extrq and insertq instructions */
4724   if (i.imm_operands == 2
4725       && (strcmp (mnemonic, "extrq") == 0
4726           || strcmp (mnemonic, "insertq") == 0))
4727       swap_2_operands (0, 1);
4728
4729   if (i.imm_operands)
4730     optimize_imm ();
4731
4732   /* Don't optimize displacement for movabs since it only takes 64bit
4733      displacement.  */
4734   if (i.disp_operands
4735       && i.disp_encoding != disp_encoding_32bit
4736       && (flag_code != CODE_64BIT
4737           || strcmp (mnemonic, "movabs") != 0))
4738     optimize_disp ();
4739
4740   /* Next, we find a template that matches the given insn,
4741      making sure the overlap of the given operands types is consistent
4742      with the template operand types.  */
4743
4744   if (!(t = match_template (mnem_suffix)))
4745     return;
4746
4747   if (sse_check != check_none
4748       && !i.tm.opcode_modifier.noavx
4749       && !i.tm.cpu_flags.bitfield.cpuavx
4750       && !i.tm.cpu_flags.bitfield.cpuavx512f
4751       && (i.tm.cpu_flags.bitfield.cpusse
4752           || i.tm.cpu_flags.bitfield.cpusse2
4753           || i.tm.cpu_flags.bitfield.cpusse3
4754           || i.tm.cpu_flags.bitfield.cpussse3
4755           || i.tm.cpu_flags.bitfield.cpusse4_1
4756           || i.tm.cpu_flags.bitfield.cpusse4_2
4757           || i.tm.cpu_flags.bitfield.cpupclmul
4758           || i.tm.cpu_flags.bitfield.cpuaes
4759           || i.tm.cpu_flags.bitfield.cpusha
4760           || i.tm.cpu_flags.bitfield.cpugfni))
4761     {
4762       (sse_check == check_warning
4763        ? as_warn
4764        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765     }
4766
4767   if (i.tm.opcode_modifier.fwait)
4768     if (!add_prefix (FWAIT_OPCODE))
4769       return;
4770
4771   /* Check if REP prefix is OK.  */
4772   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773     {
4774       as_bad (_("invalid instruction `%s' after `%s'"),
4775                 i.tm.name, i.rep_prefix);
4776       return;
4777     }
4778
4779   /* Check for lock without a lockable instruction.  Destination operand
4780      must be memory unless it is xchg (0x86).  */
4781   if (i.prefix[LOCK_PREFIX]
4782       && (!i.tm.opcode_modifier.islockable
4783           || i.mem_operands == 0
4784           || (i.tm.base_opcode != 0x86
4785               && !(i.flags[i.operands - 1] & Operand_Mem))))
4786     {
4787       as_bad (_("expecting lockable instruction after `lock'"));
4788       return;
4789     }
4790
4791   /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns.  */
4792   if (i.prefix[DATA_PREFIX]
4793       && (is_any_vex_encoding (&i.tm)
4794           || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795           || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4796     {
4797       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798       return;
4799     }
4800
4801   /* Check if HLE prefix is OK.  */
4802   if (i.hle_prefix && !check_hle ())
4803     return;
4804
4805   /* Check BND prefix.  */
4806   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807     as_bad (_("expecting valid branch instruction after `bnd'"));
4808
4809   /* Check NOTRACK prefix.  */
4810   if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811     as_bad (_("expecting indirect branch instruction after `notrack'"));
4812
4813   if (i.tm.cpu_flags.bitfield.cpumpx)
4814     {
4815       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817       else if (flag_code != CODE_16BIT
4818                ? i.prefix[ADDR_PREFIX]
4819                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821     }
4822
4823   /* Insert BND prefix.  */
4824   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825     {
4826       if (!i.prefix[BND_PREFIX])
4827         add_prefix (BND_PREFIX_OPCODE);
4828       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829         {
4830           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832         }
4833     }
4834
4835   /* Check string instruction segment overrides.  */
4836   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4837     {
4838       gas_assert (i.mem_operands);
4839       if (!check_string ())
4840         return;
4841       i.disp_operands = 0;
4842     }
4843
4844   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845     optimize_encoding ();
4846
4847   if (!process_suffix ())
4848     return;
4849
4850   /* Update operand types.  */
4851   for (j = 0; j < i.operands; j++)
4852     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853
4854   /* Make still unresolved immediate matches conform to size of immediate
4855      given in i.suffix.  */
4856   if (!finalize_imm ())
4857     return;
4858
4859   if (i.types[0].bitfield.imm1)
4860     i.imm_operands = 0; /* kludge for shift insns.  */
4861
4862   /* We only need to check those implicit registers for instructions
4863      with 3 operands or less.  */
4864   if (i.operands <= 3)
4865     for (j = 0; j < i.operands; j++)
4866       if (i.types[j].bitfield.instance != InstanceNone
4867           && !i.types[j].bitfield.xmmword)
4868         i.reg_operands--;
4869
4870   /* ImmExt should be processed after SSE2AVX.  */
4871   if (!i.tm.opcode_modifier.sse2avx
4872       && i.tm.opcode_modifier.immext)
4873     process_immext ();
4874
4875   /* For insns with operands there are more diddles to do to the opcode.  */
4876   if (i.operands)
4877     {
4878       if (!process_operands ())
4879         return;
4880     }
4881   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4882     {
4883       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4884       as_warn (_("translating to `%sp'"), i.tm.name);
4885     }
4886
4887   if (is_any_vex_encoding (&i.tm))
4888     {
4889       if (!cpu_arch_flags.bitfield.cpui286)
4890         {
4891           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4892                   i.tm.name);
4893           return;
4894         }
4895
4896       /* Check for explicit REX prefix.  */
4897       if (i.prefix[REX_PREFIX] || i.rex_encoding)
4898         {
4899           as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4900           return;
4901         }
4902
4903       if (i.tm.opcode_modifier.vex)
4904         build_vex_prefix (t);
4905       else
4906         build_evex_prefix ();
4907
4908       /* The individual REX.RXBW bits got consumed.  */
4909       i.rex &= REX_OPCODE;
4910     }
4911
4912   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4913      instructions may define INT_OPCODE as well, so avoid this corner
4914      case for those instructions that use MODRM.  */
4915   if (i.tm.base_opcode == INT_OPCODE
4916       && !i.tm.opcode_modifier.modrm
4917       && i.op[0].imms->X_add_number == 3)
4918     {
4919       i.tm.base_opcode = INT3_OPCODE;
4920       i.imm_operands = 0;
4921     }
4922
4923   if ((i.tm.opcode_modifier.jump == JUMP
4924        || i.tm.opcode_modifier.jump == JUMP_BYTE
4925        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4926       && i.op[0].disps->X_op == O_constant)
4927     {
4928       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4929          the absolute address given by the constant.  Since ix86 jumps and
4930          calls are pc relative, we need to generate a reloc.  */
4931       i.op[0].disps->X_add_symbol = &abs_symbol;
4932       i.op[0].disps->X_op = O_symbol;
4933     }
4934
4935   /* For 8 bit registers we need an empty rex prefix.  Also if the
4936      instruction already has a prefix, we need to convert old
4937      registers to new ones.  */
4938
4939   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4940        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4941       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4942           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4943       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4944            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4945           && i.rex != 0))
4946     {
4947       int x;
4948
4949       i.rex |= REX_OPCODE;
4950       for (x = 0; x < 2; x++)
4951         {
4952           /* Look for 8 bit operand that uses old registers.  */
4953           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4954               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4955             {
4956               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4957               /* In case it is "hi" register, give up.  */
4958               if (i.op[x].regs->reg_num > 3)
4959                 as_bad (_("can't encode register '%s%s' in an "
4960                           "instruction requiring REX prefix."),
4961                         register_prefix, i.op[x].regs->reg_name);
4962
4963               /* Otherwise it is equivalent to the extended register.
4964                  Since the encoding doesn't change this is merely
4965                  cosmetic cleanup for debug output.  */
4966
4967               i.op[x].regs = i.op[x].regs + 8;
4968             }
4969         }
4970     }
4971
4972   if (i.rex == 0 && i.rex_encoding)
4973     {
4974       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4975          that uses legacy register.  If it is "hi" register, don't add
4976          the REX_OPCODE byte.  */
4977       int x;
4978       for (x = 0; x < 2; x++)
4979         if (i.types[x].bitfield.class == Reg
4980             && i.types[x].bitfield.byte
4981             && (i.op[x].regs->reg_flags & RegRex64) == 0
4982             && i.op[x].regs->reg_num > 3)
4983           {
4984             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4985             i.rex_encoding = FALSE;
4986             break;
4987           }
4988
4989       if (i.rex_encoding)
4990         i.rex = REX_OPCODE;
4991     }
4992
4993   if (i.rex != 0)
4994     add_prefix (REX_OPCODE | i.rex);
4995
4996   insert_lfence_before ();
4997
4998   /* We are ready to output the insn.  */
4999   output_insn ();
5000
5001   insert_lfence_after ();
5002
5003   last_insn.seg = now_seg;
5004
5005   if (i.tm.opcode_modifier.isprefix)
5006     {
5007       last_insn.kind = last_insn_prefix;
5008       last_insn.name = i.tm.name;
5009       last_insn.file = as_where (&last_insn.line);
5010     }
5011   else
5012     last_insn.kind = last_insn_other;
5013 }
5014
5015 static char *
5016 parse_insn (char *line, char *mnemonic)
5017 {
5018   char *l = line;
5019   char *token_start = l;
5020   char *mnem_p;
5021   int supported;
5022   const insn_template *t;
5023   char *dot_p = NULL;
5024
5025   while (1)
5026     {
5027       mnem_p = mnemonic;
5028       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5029         {
5030           if (*mnem_p == '.')
5031             dot_p = mnem_p;
5032           mnem_p++;
5033           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5034             {
5035               as_bad (_("no such instruction: `%s'"), token_start);
5036               return NULL;
5037             }
5038           l++;
5039         }
5040       if (!is_space_char (*l)
5041           && *l != END_OF_INSN
5042           && (intel_syntax
5043               || (*l != PREFIX_SEPARATOR
5044                   && *l != ',')))
5045         {
5046           as_bad (_("invalid character %s in mnemonic"),
5047                   output_invalid (*l));
5048           return NULL;
5049         }
5050       if (token_start == l)
5051         {
5052           if (!intel_syntax && *l == PREFIX_SEPARATOR)
5053             as_bad (_("expecting prefix; got nothing"));
5054           else
5055             as_bad (_("expecting mnemonic; got nothing"));
5056           return NULL;
5057         }
5058
5059       /* Look up instruction (or prefix) via hash table.  */
5060       current_templates = (const templates *) hash_find (op_hash, mnemonic);
5061
5062       if (*l != END_OF_INSN
5063           && (!is_space_char (*l) || l[1] != END_OF_INSN)
5064           && current_templates
5065           && current_templates->start->opcode_modifier.isprefix)
5066         {
5067           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5068             {
5069               as_bad ((flag_code != CODE_64BIT
5070                        ? _("`%s' is only supported in 64-bit mode")
5071                        : _("`%s' is not supported in 64-bit mode")),
5072                       current_templates->start->name);
5073               return NULL;
5074             }
5075           /* If we are in 16-bit mode, do not allow addr16 or data16.
5076              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
5077           if ((current_templates->start->opcode_modifier.size == SIZE16
5078                || current_templates->start->opcode_modifier.size == SIZE32)
5079               && flag_code != CODE_64BIT
5080               && ((current_templates->start->opcode_modifier.size == SIZE32)
5081                   ^ (flag_code == CODE_16BIT)))
5082             {
5083               as_bad (_("redundant %s prefix"),
5084                       current_templates->start->name);
5085               return NULL;
5086             }
5087           if (current_templates->start->opcode_length == 0)
5088             {
5089               /* Handle pseudo prefixes.  */
5090               switch (current_templates->start->base_opcode)
5091                 {
5092                 case 0x0:
5093                   /* {disp8} */
5094                   i.disp_encoding = disp_encoding_8bit;
5095                   break;
5096                 case 0x1:
5097                   /* {disp32} */
5098                   i.disp_encoding = disp_encoding_32bit;
5099                   break;
5100                 case 0x2:
5101                   /* {load} */
5102                   i.dir_encoding = dir_encoding_load;
5103                   break;
5104                 case 0x3:
5105                   /* {store} */
5106                   i.dir_encoding = dir_encoding_store;
5107                   break;
5108                 case 0x4:
5109                   /* {vex} */
5110                   i.vec_encoding = vex_encoding_vex;
5111                   break;
5112                 case 0x5:
5113                   /* {vex3} */
5114                   i.vec_encoding = vex_encoding_vex3;
5115                   break;
5116                 case 0x6:
5117                   /* {evex} */
5118                   i.vec_encoding = vex_encoding_evex;
5119                   break;
5120                 case 0x7:
5121                   /* {rex} */
5122                   i.rex_encoding = TRUE;
5123                   break;
5124                 case 0x8:
5125                   /* {nooptimize} */
5126                   i.no_optimize = TRUE;
5127                   break;
5128                 default:
5129                   abort ();
5130                 }
5131             }
5132           else
5133             {
5134               /* Add prefix, checking for repeated prefixes.  */
5135               switch (add_prefix (current_templates->start->base_opcode))
5136                 {
5137                 case PREFIX_EXIST:
5138                   return NULL;
5139                 case PREFIX_DS:
5140                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
5141                     i.notrack_prefix = current_templates->start->name;
5142                   break;
5143                 case PREFIX_REP:
5144                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
5145                     i.hle_prefix = current_templates->start->name;
5146                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5147                     i.bnd_prefix = current_templates->start->name;
5148                   else
5149                     i.rep_prefix = current_templates->start->name;
5150                   break;
5151                 default:
5152                   break;
5153                 }
5154             }
5155           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
5156           token_start = ++l;
5157         }
5158       else
5159         break;
5160     }
5161
5162   if (!current_templates)
5163     {
5164       /* Deprecated functionality (new code should use pseudo-prefixes instead):
5165          Check if we should swap operand or force 32bit displacement in
5166          encoding.  */
5167       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5168         i.dir_encoding = dir_encoding_swap;
5169       else if (mnem_p - 3 == dot_p
5170                && dot_p[1] == 'd'
5171                && dot_p[2] == '8')
5172         i.disp_encoding = disp_encoding_8bit;
5173       else if (mnem_p - 4 == dot_p
5174                && dot_p[1] == 'd'
5175                && dot_p[2] == '3'
5176                && dot_p[3] == '2')
5177         i.disp_encoding = disp_encoding_32bit;
5178       else
5179         goto check_suffix;
5180       mnem_p = dot_p;
5181       *dot_p = '\0';
5182       current_templates = (const templates *) hash_find (op_hash, mnemonic);
5183     }
5184
5185   if (!current_templates)
5186     {
5187     check_suffix:
5188       if (mnem_p > mnemonic)
5189         {
5190           /* See if we can get a match by trimming off a suffix.  */
5191           switch (mnem_p[-1])
5192             {
5193             case WORD_MNEM_SUFFIX:
5194               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5195                 i.suffix = SHORT_MNEM_SUFFIX;
5196               else
5197                 /* Fall through.  */
5198               case BYTE_MNEM_SUFFIX:
5199               case QWORD_MNEM_SUFFIX:
5200                 i.suffix = mnem_p[-1];
5201               mnem_p[-1] = '\0';
5202               current_templates = (const templates *) hash_find (op_hash,
5203                                                                  mnemonic);
5204               break;
5205             case SHORT_MNEM_SUFFIX:
5206             case LONG_MNEM_SUFFIX:
5207               if (!intel_syntax)
5208                 {
5209                   i.suffix = mnem_p[-1];
5210                   mnem_p[-1] = '\0';
5211                   current_templates = (const templates *) hash_find (op_hash,
5212                                                                      mnemonic);
5213                 }
5214               break;
5215
5216               /* Intel Syntax.  */
5217             case 'd':
5218               if (intel_syntax)
5219                 {
5220                   if (intel_float_operand (mnemonic) == 1)
5221                     i.suffix = SHORT_MNEM_SUFFIX;
5222                   else
5223                     i.suffix = LONG_MNEM_SUFFIX;
5224                   mnem_p[-1] = '\0';
5225                   current_templates = (const templates *) hash_find (op_hash,
5226                                                                      mnemonic);
5227                 }
5228               break;
5229             }
5230         }
5231
5232       if (!current_templates)
5233         {
5234           as_bad (_("no such instruction: `%s'"), token_start);
5235           return NULL;
5236         }
5237     }
5238
5239   if (current_templates->start->opcode_modifier.jump == JUMP
5240       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5241     {
5242       /* Check for a branch hint.  We allow ",pt" and ",pn" for
5243          predict taken and predict not taken respectively.
5244          I'm not sure that branch hints actually do anything on loop
5245          and jcxz insns (JumpByte) for current Pentium4 chips.  They
5246          may work in the future and it doesn't hurt to accept them
5247          now.  */
5248       if (l[0] == ',' && l[1] == 'p')
5249         {
5250           if (l[2] == 't')
5251             {
5252               if (!add_prefix (DS_PREFIX_OPCODE))
5253                 return NULL;
5254               l += 3;
5255             }
5256           else if (l[2] == 'n')
5257             {
5258               if (!add_prefix (CS_PREFIX_OPCODE))
5259                 return NULL;
5260               l += 3;
5261             }
5262         }
5263     }
5264   /* Any other comma loses.  */
5265   if (*l == ',')
5266     {
5267       as_bad (_("invalid character %s in mnemonic"),
5268               output_invalid (*l));
5269       return NULL;
5270     }
5271
5272   /* Check if instruction is supported on specified architecture.  */
5273   supported = 0;
5274   for (t = current_templates->start; t < current_templates->end; ++t)
5275     {
5276       supported |= cpu_flags_match (t);
5277       if (supported == CPU_FLAGS_PERFECT_MATCH)
5278         {
5279           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5280             as_warn (_("use .code16 to ensure correct addressing mode"));
5281
5282           return l;
5283         }
5284     }
5285
5286   if (!(supported & CPU_FLAGS_64BIT_MATCH))
5287     as_bad (flag_code == CODE_64BIT
5288             ? _("`%s' is not supported in 64-bit mode")
5289             : _("`%s' is only supported in 64-bit mode"),
5290             current_templates->start->name);
5291   else
5292     as_bad (_("`%s' is not supported on `%s%s'"),
5293             current_templates->start->name,
5294             cpu_arch_name ? cpu_arch_name : default_arch,
5295             cpu_sub_arch_name ? cpu_sub_arch_name : "");
5296
5297   return NULL;
5298 }
5299
5300 static char *
5301 parse_operands (char *l, const char *mnemonic)
5302 {
5303   char *token_start;
5304
5305   /* 1 if operand is pending after ','.  */
5306   unsigned int expecting_operand = 0;
5307
5308   /* Non-zero if operand parens not balanced.  */
5309   unsigned int paren_not_balanced;
5310
5311   while (*l != END_OF_INSN)
5312     {
5313       /* Skip optional white space before operand.  */
5314       if (is_space_char (*l))
5315         ++l;
5316       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5317         {
5318           as_bad (_("invalid character %s before operand %d"),
5319                   output_invalid (*l),
5320                   i.operands + 1);
5321           return NULL;
5322         }
5323       token_start = l;  /* After white space.  */
5324       paren_not_balanced = 0;
5325       while (paren_not_balanced || *l != ',')
5326         {
5327           if (*l == END_OF_INSN)
5328             {
5329               if (paren_not_balanced)
5330                 {
5331                   if (!intel_syntax)
5332                     as_bad (_("unbalanced parenthesis in operand %d."),
5333                             i.operands + 1);
5334                   else
5335                     as_bad (_("unbalanced brackets in operand %d."),
5336                             i.operands + 1);
5337                   return NULL;
5338                 }
5339               else
5340                 break;  /* we are done */
5341             }
5342           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5343             {
5344               as_bad (_("invalid character %s in operand %d"),
5345                       output_invalid (*l),
5346                       i.operands + 1);
5347               return NULL;
5348             }
5349           if (!intel_syntax)
5350             {
5351               if (*l == '(')
5352                 ++paren_not_balanced;
5353               if (*l == ')')
5354                 --paren_not_balanced;
5355             }
5356           else
5357             {
5358               if (*l == '[')
5359                 ++paren_not_balanced;
5360               if (*l == ']')
5361                 --paren_not_balanced;
5362             }
5363           l++;
5364         }
5365       if (l != token_start)
5366         {                       /* Yes, we've read in another operand.  */
5367           unsigned int operand_ok;
5368           this_operand = i.operands++;
5369           if (i.operands > MAX_OPERANDS)
5370             {
5371               as_bad (_("spurious operands; (%d operands/instruction max)"),
5372                       MAX_OPERANDS);
5373               return NULL;
5374             }
5375           i.types[this_operand].bitfield.unspecified = 1;
5376           /* Now parse operand adding info to 'i' as we go along.  */
5377           END_STRING_AND_SAVE (l);
5378
5379           if (i.mem_operands > 1)
5380             {
5381               as_bad (_("too many memory references for `%s'"),
5382                       mnemonic);
5383               return 0;
5384             }
5385
5386           if (intel_syntax)
5387             operand_ok =
5388               i386_intel_operand (token_start,
5389                                   intel_float_operand (mnemonic));
5390           else
5391             operand_ok = i386_att_operand (token_start);
5392
5393           RESTORE_END_STRING (l);
5394           if (!operand_ok)
5395             return NULL;
5396         }
5397       else
5398         {
5399           if (expecting_operand)
5400             {
5401             expecting_operand_after_comma:
5402               as_bad (_("expecting operand after ','; got nothing"));
5403               return NULL;
5404             }
5405           if (*l == ',')
5406             {
5407               as_bad (_("expecting operand before ','; got nothing"));
5408               return NULL;
5409             }
5410         }
5411
5412       /* Now *l must be either ',' or END_OF_INSN.  */
5413       if (*l == ',')
5414         {
5415           if (*++l == END_OF_INSN)
5416             {
5417               /* Just skip it, if it's \n complain.  */
5418               goto expecting_operand_after_comma;
5419             }
5420           expecting_operand = 1;
5421         }
5422     }
5423   return l;
5424 }
5425
5426 static void
5427 swap_2_operands (int xchg1, int xchg2)
5428 {
5429   union i386_op temp_op;
5430   i386_operand_type temp_type;
5431   unsigned int temp_flags;
5432   enum bfd_reloc_code_real temp_reloc;
5433
5434   temp_type = i.types[xchg2];
5435   i.types[xchg2] = i.types[xchg1];
5436   i.types[xchg1] = temp_type;
5437
5438   temp_flags = i.flags[xchg2];
5439   i.flags[xchg2] = i.flags[xchg1];
5440   i.flags[xchg1] = temp_flags;
5441
5442   temp_op = i.op[xchg2];
5443   i.op[xchg2] = i.op[xchg1];
5444   i.op[xchg1] = temp_op;
5445
5446   temp_reloc = i.reloc[xchg2];
5447   i.reloc[xchg2] = i.reloc[xchg1];
5448   i.reloc[xchg1] = temp_reloc;
5449
5450   if (i.mask)
5451     {
5452       if (i.mask->operand == xchg1)
5453         i.mask->operand = xchg2;
5454       else if (i.mask->operand == xchg2)
5455         i.mask->operand = xchg1;
5456     }
5457   if (i.broadcast)
5458     {
5459       if (i.broadcast->operand == xchg1)
5460         i.broadcast->operand = xchg2;
5461       else if (i.broadcast->operand == xchg2)
5462         i.broadcast->operand = xchg1;
5463     }
5464   if (i.rounding)
5465     {
5466       if (i.rounding->operand == xchg1)
5467         i.rounding->operand = xchg2;
5468       else if (i.rounding->operand == xchg2)
5469         i.rounding->operand = xchg1;
5470     }
5471 }
5472
5473 static void
5474 swap_operands (void)
5475 {
5476   switch (i.operands)
5477     {
5478     case 5:
5479     case 4:
5480       swap_2_operands (1, i.operands - 2);
5481       /* Fall through.  */
5482     case 3:
5483     case 2:
5484       swap_2_operands (0, i.operands - 1);
5485       break;
5486     default:
5487       abort ();
5488     }
5489
5490   if (i.mem_operands == 2)
5491     {
5492       const seg_entry *temp_seg;
5493       temp_seg = i.seg[0];
5494       i.seg[0] = i.seg[1];
5495       i.seg[1] = temp_seg;
5496     }
5497 }
5498
5499 /* Try to ensure constant immediates are represented in the smallest
5500    opcode possible.  */
5501 static void
5502 optimize_imm (void)
5503 {
5504   char guess_suffix = 0;
5505   int op;
5506
5507   if (i.suffix)
5508     guess_suffix = i.suffix;
5509   else if (i.reg_operands)
5510     {
5511       /* Figure out a suffix from the last register operand specified.
5512          We can't do this properly yet, i.e. excluding special register
5513          instances, but the following works for instructions with
5514          immediates.  In any case, we can't set i.suffix yet.  */
5515       for (op = i.operands; --op >= 0;)
5516         if (i.types[op].bitfield.class != Reg)
5517           continue;
5518         else if (i.types[op].bitfield.byte)
5519           {
5520             guess_suffix = BYTE_MNEM_SUFFIX;
5521             break;
5522           }
5523         else if (i.types[op].bitfield.word)
5524           {
5525             guess_suffix = WORD_MNEM_SUFFIX;
5526             break;
5527           }
5528         else if (i.types[op].bitfield.dword)
5529           {
5530             guess_suffix = LONG_MNEM_SUFFIX;
5531             break;
5532           }
5533         else if (i.types[op].bitfield.qword)
5534           {
5535             guess_suffix = QWORD_MNEM_SUFFIX;
5536             break;
5537           }
5538     }
5539   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5540     guess_suffix = WORD_MNEM_SUFFIX;
5541
5542   for (op = i.operands; --op >= 0;)
5543     if (operand_type_check (i.types[op], imm))
5544       {
5545         switch (i.op[op].imms->X_op)
5546           {
5547           case O_constant:
5548             /* If a suffix is given, this operand may be shortened.  */
5549             switch (guess_suffix)
5550               {
5551               case LONG_MNEM_SUFFIX:
5552                 i.types[op].bitfield.imm32 = 1;
5553                 i.types[op].bitfield.imm64 = 1;
5554                 break;
5555               case WORD_MNEM_SUFFIX:
5556                 i.types[op].bitfield.imm16 = 1;
5557                 i.types[op].bitfield.imm32 = 1;
5558                 i.types[op].bitfield.imm32s = 1;
5559                 i.types[op].bitfield.imm64 = 1;
5560                 break;
5561               case BYTE_MNEM_SUFFIX:
5562                 i.types[op].bitfield.imm8 = 1;
5563                 i.types[op].bitfield.imm8s = 1;
5564                 i.types[op].bitfield.imm16 = 1;
5565                 i.types[op].bitfield.imm32 = 1;
5566                 i.types[op].bitfield.imm32s = 1;
5567                 i.types[op].bitfield.imm64 = 1;
5568                 break;
5569               }
5570
5571             /* If this operand is at most 16 bits, convert it
5572                to a signed 16 bit number before trying to see
5573                whether it will fit in an even smaller size.
5574                This allows a 16-bit operand such as $0xffe0 to
5575                be recognised as within Imm8S range.  */
5576             if ((i.types[op].bitfield.imm16)
5577                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5578               {
5579                 i.op[op].imms->X_add_number =
5580                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5581               }
5582 #ifdef BFD64
5583             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5584             if ((i.types[op].bitfield.imm32)
5585                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5586                     == 0))
5587               {
5588                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5589                                                 ^ ((offsetT) 1 << 31))
5590                                                - ((offsetT) 1 << 31));
5591               }
5592 #endif
5593             i.types[op]
5594               = operand_type_or (i.types[op],
5595                                  smallest_imm_type (i.op[op].imms->X_add_number));
5596
5597             /* We must avoid matching of Imm32 templates when 64bit
5598                only immediate is available.  */
5599             if (guess_suffix == QWORD_MNEM_SUFFIX)
5600               i.types[op].bitfield.imm32 = 0;
5601             break;
5602
5603           case O_absent:
5604           case O_register:
5605             abort ();
5606
5607             /* Symbols and expressions.  */
5608           default:
5609             /* Convert symbolic operand to proper sizes for matching, but don't
5610                prevent matching a set of insns that only supports sizes other
5611                than those matching the insn suffix.  */
5612             {
5613               i386_operand_type mask, allowed;
5614               const insn_template *t;
5615
5616               operand_type_set (&mask, 0);
5617               operand_type_set (&allowed, 0);
5618
5619               for (t = current_templates->start;
5620                    t < current_templates->end;
5621                    ++t)
5622                 {
5623                   allowed = operand_type_or (allowed, t->operand_types[op]);
5624                   allowed = operand_type_and (allowed, anyimm);
5625                 }
5626               switch (guess_suffix)
5627                 {
5628                 case QWORD_MNEM_SUFFIX:
5629                   mask.bitfield.imm64 = 1;
5630                   mask.bitfield.imm32s = 1;
5631                   break;
5632                 case LONG_MNEM_SUFFIX:
5633                   mask.bitfield.imm32 = 1;
5634                   break;
5635                 case WORD_MNEM_SUFFIX:
5636                   mask.bitfield.imm16 = 1;
5637                   break;
5638                 case BYTE_MNEM_SUFFIX:
5639                   mask.bitfield.imm8 = 1;
5640                   break;
5641                 default:
5642                   break;
5643                 }
5644               allowed = operand_type_and (mask, allowed);
5645               if (!operand_type_all_zero (&allowed))
5646                 i.types[op] = operand_type_and (i.types[op], mask);
5647             }
5648             break;
5649           }
5650       }
5651 }
5652
5653 /* Try to use the smallest displacement type too.  */
5654 static void
5655 optimize_disp (void)
5656 {
5657   int op;
5658
5659   for (op = i.operands; --op >= 0;)
5660     if (operand_type_check (i.types[op], disp))
5661       {
5662         if (i.op[op].disps->X_op == O_constant)
5663           {
5664             offsetT op_disp = i.op[op].disps->X_add_number;
5665
5666             if (i.types[op].bitfield.disp16
5667                 && (op_disp & ~(offsetT) 0xffff) == 0)
5668               {
5669                 /* If this operand is at most 16 bits, convert
5670                    to a signed 16 bit number and don't use 64bit
5671                    displacement.  */
5672                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5673                 i.types[op].bitfield.disp64 = 0;
5674               }
5675 #ifdef BFD64
5676             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5677             if (i.types[op].bitfield.disp32
5678                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5679               {
5680                 /* If this operand is at most 32 bits, convert
5681                    to a signed 32 bit number and don't use 64bit
5682                    displacement.  */
5683                 op_disp &= (((offsetT) 2 << 31) - 1);
5684                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5685                 i.types[op].bitfield.disp64 = 0;
5686               }
5687 #endif
5688             if (!op_disp && i.types[op].bitfield.baseindex)
5689               {
5690                 i.types[op].bitfield.disp8 = 0;
5691                 i.types[op].bitfield.disp16 = 0;
5692                 i.types[op].bitfield.disp32 = 0;
5693                 i.types[op].bitfield.disp32s = 0;
5694                 i.types[op].bitfield.disp64 = 0;
5695                 i.op[op].disps = 0;
5696                 i.disp_operands--;
5697               }
5698             else if (flag_code == CODE_64BIT)
5699               {
5700                 if (fits_in_signed_long (op_disp))
5701                   {
5702                     i.types[op].bitfield.disp64 = 0;
5703                     i.types[op].bitfield.disp32s = 1;
5704                   }
5705                 if (i.prefix[ADDR_PREFIX]
5706                     && fits_in_unsigned_long (op_disp))
5707                   i.types[op].bitfield.disp32 = 1;
5708               }
5709             if ((i.types[op].bitfield.disp32
5710                  || i.types[op].bitfield.disp32s
5711                  || i.types[op].bitfield.disp16)
5712                 && fits_in_disp8 (op_disp))
5713               i.types[op].bitfield.disp8 = 1;
5714           }
5715         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5716                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5717           {
5718             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5719                          i.op[op].disps, 0, i.reloc[op]);
5720             i.types[op].bitfield.disp8 = 0;
5721             i.types[op].bitfield.disp16 = 0;
5722             i.types[op].bitfield.disp32 = 0;
5723             i.types[op].bitfield.disp32s = 0;
5724             i.types[op].bitfield.disp64 = 0;
5725           }
5726         else
5727           /* We only support 64bit displacement on constants.  */
5728           i.types[op].bitfield.disp64 = 0;
5729       }
5730 }
5731
5732 /* Return 1 if there is a match in broadcast bytes between operand
5733    GIVEN and instruction template T.   */
5734
5735 static INLINE int
5736 match_broadcast_size (const insn_template *t, unsigned int given)
5737 {
5738   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5739            && i.types[given].bitfield.byte)
5740           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5741               && i.types[given].bitfield.word)
5742           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5743               && i.types[given].bitfield.dword)
5744           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5745               && i.types[given].bitfield.qword));
5746 }
5747
5748 /* Check if operands are valid for the instruction.  */
5749
5750 static int
5751 check_VecOperands (const insn_template *t)
5752 {
5753   unsigned int op;
5754   i386_cpu_flags cpu;
5755
5756   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5757      any one operand are implicity requiring AVX512VL support if the actual
5758      operand size is YMMword or XMMword.  Since this function runs after
5759      template matching, there's no need to check for YMMword/XMMword in
5760      the template.  */
5761   cpu = cpu_flags_and (t->cpu_flags, avx512);
5762   if (!cpu_flags_all_zero (&cpu)
5763       && !t->cpu_flags.bitfield.cpuavx512vl
5764       && !cpu_arch_flags.bitfield.cpuavx512vl)
5765     {
5766       for (op = 0; op < t->operands; ++op)
5767         {
5768           if (t->operand_types[op].bitfield.zmmword
5769               && (i.types[op].bitfield.ymmword
5770                   || i.types[op].bitfield.xmmword))
5771             {
5772               i.error = unsupported;
5773               return 1;
5774             }
5775         }
5776     }
5777
5778   /* Without VSIB byte, we can't have a vector register for index.  */
5779   if (!t->opcode_modifier.vecsib
5780       && i.index_reg
5781       && (i.index_reg->reg_type.bitfield.xmmword
5782           || i.index_reg->reg_type.bitfield.ymmword
5783           || i.index_reg->reg_type.bitfield.zmmword))
5784     {
5785       i.error = unsupported_vector_index_register;
5786       return 1;
5787     }
5788
5789   /* Check if default mask is allowed.  */
5790   if (t->opcode_modifier.nodefmask
5791       && (!i.mask || i.mask->mask->reg_num == 0))
5792     {
5793       i.error = no_default_mask;
5794       return 1;
5795     }
5796
5797   /* For VSIB byte, we need a vector register for index, and all vector
5798      registers must be distinct.  */
5799   if (t->opcode_modifier.vecsib)
5800     {
5801       if (!i.index_reg
5802           || !((t->opcode_modifier.vecsib == VecSIB128
5803                 && i.index_reg->reg_type.bitfield.xmmword)
5804                || (t->opcode_modifier.vecsib == VecSIB256
5805                    && i.index_reg->reg_type.bitfield.ymmword)
5806                || (t->opcode_modifier.vecsib == VecSIB512
5807                    && i.index_reg->reg_type.bitfield.zmmword)))
5808       {
5809         i.error = invalid_vsib_address;
5810         return 1;
5811       }
5812
5813       gas_assert (i.reg_operands == 2 || i.mask);
5814       if (i.reg_operands == 2 && !i.mask)
5815         {
5816           gas_assert (i.types[0].bitfield.class == RegSIMD);
5817           gas_assert (i.types[0].bitfield.xmmword
5818                       || i.types[0].bitfield.ymmword);
5819           gas_assert (i.types[2].bitfield.class == RegSIMD);
5820           gas_assert (i.types[2].bitfield.xmmword
5821                       || i.types[2].bitfield.ymmword);
5822           if (operand_check == check_none)
5823             return 0;
5824           if (register_number (i.op[0].regs)
5825               != register_number (i.index_reg)
5826               && register_number (i.op[2].regs)
5827                  != register_number (i.index_reg)
5828               && register_number (i.op[0].regs)
5829                  != register_number (i.op[2].regs))
5830             return 0;
5831           if (operand_check == check_error)
5832             {
5833               i.error = invalid_vector_register_set;
5834               return 1;
5835             }
5836           as_warn (_("mask, index, and destination registers should be distinct"));
5837         }
5838       else if (i.reg_operands == 1 && i.mask)
5839         {
5840           if (i.types[1].bitfield.class == RegSIMD
5841               && (i.types[1].bitfield.xmmword
5842                   || i.types[1].bitfield.ymmword
5843                   || i.types[1].bitfield.zmmword)
5844               && (register_number (i.op[1].regs)
5845                   == register_number (i.index_reg)))
5846             {
5847               if (operand_check == check_error)
5848                 {
5849                   i.error = invalid_vector_register_set;
5850                   return 1;
5851                 }
5852               if (operand_check != check_none)
5853                 as_warn (_("index and destination registers should be distinct"));
5854             }
5855         }
5856     }
5857
5858   /* Check if broadcast is supported by the instruction and is applied
5859      to the memory operand.  */
5860   if (i.broadcast)
5861     {
5862       i386_operand_type type, overlap;
5863
5864       /* Check if specified broadcast is supported in this instruction,
5865          and its broadcast bytes match the memory operand.  */
5866       op = i.broadcast->operand;
5867       if (!t->opcode_modifier.broadcast
5868           || !(i.flags[op] & Operand_Mem)
5869           || (!i.types[op].bitfield.unspecified
5870               && !match_broadcast_size (t, op)))
5871         {
5872         bad_broadcast:
5873           i.error = unsupported_broadcast;
5874           return 1;
5875         }
5876
5877       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5878                             * i.broadcast->type);
5879       operand_type_set (&type, 0);
5880       switch (i.broadcast->bytes)
5881         {
5882         case 2:
5883           type.bitfield.word = 1;
5884           break;
5885         case 4:
5886           type.bitfield.dword = 1;
5887           break;
5888         case 8:
5889           type.bitfield.qword = 1;
5890           break;
5891         case 16:
5892           type.bitfield.xmmword = 1;
5893           break;
5894         case 32:
5895           type.bitfield.ymmword = 1;
5896           break;
5897         case 64:
5898           type.bitfield.zmmword = 1;
5899           break;
5900         default:
5901           goto bad_broadcast;
5902         }
5903
5904       overlap = operand_type_and (type, t->operand_types[op]);
5905       if (t->operand_types[op].bitfield.class == RegSIMD
5906           && t->operand_types[op].bitfield.byte
5907              + t->operand_types[op].bitfield.word
5908              + t->operand_types[op].bitfield.dword
5909              + t->operand_types[op].bitfield.qword > 1)
5910         {
5911           overlap.bitfield.xmmword = 0;
5912           overlap.bitfield.ymmword = 0;
5913           overlap.bitfield.zmmword = 0;
5914         }
5915       if (operand_type_all_zero (&overlap))
5916           goto bad_broadcast;
5917
5918       if (t->opcode_modifier.checkregsize)
5919         {
5920           unsigned int j;
5921
5922           type.bitfield.baseindex = 1;
5923           for (j = 0; j < i.operands; ++j)
5924             {
5925               if (j != op
5926                   && !operand_type_register_match(i.types[j],
5927                                                   t->operand_types[j],
5928                                                   type,
5929                                                   t->operand_types[op]))
5930                 goto bad_broadcast;
5931             }
5932         }
5933     }
5934   /* If broadcast is supported in this instruction, we need to check if
5935      operand of one-element size isn't specified without broadcast.  */
5936   else if (t->opcode_modifier.broadcast && i.mem_operands)
5937     {
5938       /* Find memory operand.  */
5939       for (op = 0; op < i.operands; op++)
5940         if (i.flags[op] & Operand_Mem)
5941           break;
5942       gas_assert (op < i.operands);
5943       /* Check size of the memory operand.  */
5944       if (match_broadcast_size (t, op))
5945         {
5946           i.error = broadcast_needed;
5947           return 1;
5948         }
5949     }
5950   else
5951     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5952
5953   /* Check if requested masking is supported.  */
5954   if (i.mask)
5955     {
5956       switch (t->opcode_modifier.masking)
5957         {
5958         case BOTH_MASKING:
5959           break;
5960         case MERGING_MASKING:
5961           if (i.mask->zeroing)
5962             {
5963         case 0:
5964               i.error = unsupported_masking;
5965               return 1;
5966             }
5967           break;
5968         case DYNAMIC_MASKING:
5969           /* Memory destinations allow only merging masking.  */
5970           if (i.mask->zeroing && i.mem_operands)
5971             {
5972               /* Find memory operand.  */
5973               for (op = 0; op < i.operands; op++)
5974                 if (i.flags[op] & Operand_Mem)
5975                   break;
5976               gas_assert (op < i.operands);
5977               if (op == i.operands - 1)
5978                 {
5979                   i.error = unsupported_masking;
5980                   return 1;
5981                 }
5982             }
5983           break;
5984         default:
5985           abort ();
5986         }
5987     }
5988
5989   /* Check if masking is applied to dest operand.  */
5990   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5991     {
5992       i.error = mask_not_on_destination;
5993       return 1;
5994     }
5995
5996   /* Check RC/SAE.  */
5997   if (i.rounding)
5998     {
5999       if (!t->opcode_modifier.sae
6000           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6001         {
6002           i.error = unsupported_rc_sae;
6003           return 1;
6004         }
6005       /* If the instruction has several immediate operands and one of
6006          them is rounding, the rounding operand should be the last
6007          immediate operand.  */
6008       if (i.imm_operands > 1
6009           && i.rounding->operand != (int) (i.imm_operands - 1))
6010         {
6011           i.error = rc_sae_operand_not_last_imm;
6012           return 1;
6013         }
6014     }
6015
6016   /* Check the special Imm4 cases; must be the first operand.  */
6017   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6018     {
6019       if (i.op[0].imms->X_op != O_constant
6020           || !fits_in_imm4 (i.op[0].imms->X_add_number))
6021         {
6022           i.error = bad_imm4;
6023           return 1;
6024         }
6025
6026       /* Turn off Imm<N> so that update_imm won't complain.  */
6027       operand_type_set (&i.types[0], 0);
6028     }
6029
6030   /* Check vector Disp8 operand.  */
6031   if (t->opcode_modifier.disp8memshift
6032       && i.disp_encoding != disp_encoding_32bit)
6033     {
6034       if (i.broadcast)
6035         i.memshift = t->opcode_modifier.broadcast - 1;
6036       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6037         i.memshift = t->opcode_modifier.disp8memshift;
6038       else
6039         {
6040           const i386_operand_type *type = NULL;
6041
6042           i.memshift = 0;
6043           for (op = 0; op < i.operands; op++)
6044             if (i.flags[op] & Operand_Mem)
6045               {
6046                 if (t->opcode_modifier.evex == EVEXLIG)
6047                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6048                 else if (t->operand_types[op].bitfield.xmmword
6049                          + t->operand_types[op].bitfield.ymmword
6050                          + t->operand_types[op].bitfield.zmmword <= 1)
6051                   type = &t->operand_types[op];
6052                 else if (!i.types[op].bitfield.unspecified)
6053                   type = &i.types[op];
6054               }
6055             else if (i.types[op].bitfield.class == RegSIMD
6056                      && t->opcode_modifier.evex != EVEXLIG)
6057               {
6058                 if (i.types[op].bitfield.zmmword)
6059                   i.memshift = 6;
6060                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6061                   i.memshift = 5;
6062                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6063                   i.memshift = 4;
6064               }
6065
6066           if (type)
6067             {
6068               if (type->bitfield.zmmword)
6069                 i.memshift = 6;
6070               else if (type->bitfield.ymmword)
6071                 i.memshift = 5;
6072               else if (type->bitfield.xmmword)
6073                 i.memshift = 4;
6074             }
6075
6076           /* For the check in fits_in_disp8().  */
6077           if (i.memshift == 0)
6078             i.memshift = -1;
6079         }
6080
6081       for (op = 0; op < i.operands; op++)
6082         if (operand_type_check (i.types[op], disp)
6083             && i.op[op].disps->X_op == O_constant)
6084           {
6085             if (fits_in_disp8 (i.op[op].disps->X_add_number))
6086               {
6087                 i.types[op].bitfield.disp8 = 1;
6088                 return 0;
6089               }
6090             i.types[op].bitfield.disp8 = 0;
6091           }
6092     }
6093
6094   i.memshift = 0;
6095
6096   return 0;
6097 }
6098
6099 /* Check if encoding requirements are met by the instruction.  */
6100
6101 static int
6102 VEX_check_encoding (const insn_template *t)
6103 {
6104   if (i.vec_encoding == vex_encoding_error)
6105     {
6106       i.error = unsupported;
6107       return 1;
6108     }
6109
6110   if (i.vec_encoding == vex_encoding_evex)
6111     {
6112       /* This instruction must be encoded with EVEX prefix.  */
6113       if (!is_evex_encoding (t))
6114         {
6115           i.error = unsupported;
6116           return 1;
6117         }
6118       return 0;
6119     }
6120
6121   if (!t->opcode_modifier.vex)
6122     {
6123       /* This instruction template doesn't have VEX prefix.  */
6124       if (i.vec_encoding != vex_encoding_default)
6125         {
6126           i.error = unsupported;
6127           return 1;
6128         }
6129       return 0;
6130     }
6131
6132   return 0;
6133 }
6134
6135 static const insn_template *
6136 match_template (char mnem_suffix)
6137 {
6138   /* Points to template once we've found it.  */
6139   const insn_template *t;
6140   i386_operand_type overlap0, overlap1, overlap2, overlap3;
6141   i386_operand_type overlap4;
6142   unsigned int found_reverse_match;
6143   i386_opcode_modifier suffix_check;
6144   i386_operand_type operand_types [MAX_OPERANDS];
6145   int addr_prefix_disp;
6146   unsigned int j, size_match, check_register;
6147   enum i386_error specific_error = 0;
6148
6149 #if MAX_OPERANDS != 5
6150 # error "MAX_OPERANDS must be 5."
6151 #endif
6152
6153   found_reverse_match = 0;
6154   addr_prefix_disp = -1;
6155
6156   /* Prepare for mnemonic suffix check.  */
6157   memset (&suffix_check, 0, sizeof (suffix_check));
6158   switch (mnem_suffix)
6159     {
6160     case BYTE_MNEM_SUFFIX:
6161       suffix_check.no_bsuf = 1;
6162       break;
6163     case WORD_MNEM_SUFFIX:
6164       suffix_check.no_wsuf = 1;
6165       break;
6166     case SHORT_MNEM_SUFFIX:
6167       suffix_check.no_ssuf = 1;
6168       break;
6169     case LONG_MNEM_SUFFIX:
6170       suffix_check.no_lsuf = 1;
6171       break;
6172     case QWORD_MNEM_SUFFIX:
6173       suffix_check.no_qsuf = 1;
6174       break;
6175     default:
6176       /* NB: In Intel syntax, normally we can check for memory operand
6177          size when there is no mnemonic suffix.  But jmp and call have
6178          2 different encodings with Dword memory operand size, one with
6179          No_ldSuf and the other without.  i.suffix is set to
6180          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
6181       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6182         suffix_check.no_ldsuf = 1;
6183     }
6184
6185   /* Must have right number of operands.  */
6186   i.error = number_of_operands_mismatch;
6187
6188   for (t = current_templates->start; t < current_templates->end; t++)
6189     {
6190       addr_prefix_disp = -1;
6191       found_reverse_match = 0;
6192
6193       if (i.operands != t->operands)
6194         continue;
6195
6196       /* Check processor support.  */
6197       i.error = unsupported;
6198       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6199         continue;
6200
6201       /* Check AT&T mnemonic.   */
6202       i.error = unsupported_with_intel_mnemonic;
6203       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6204         continue;
6205
6206       /* Check AT&T/Intel syntax.  */
6207       i.error = unsupported_syntax;
6208       if ((intel_syntax && t->opcode_modifier.attsyntax)
6209           || (!intel_syntax && t->opcode_modifier.intelsyntax))
6210         continue;
6211
6212       /* Check Intel64/AMD64 ISA.   */
6213       switch (isa64)
6214         {
6215         default:
6216           /* Default: Don't accept Intel64.  */
6217           if (t->opcode_modifier.isa64 == INTEL64)
6218             continue;
6219           break;
6220         case amd64:
6221           /* -mamd64: Don't accept Intel64 and Intel64 only.  */
6222           if (t->opcode_modifier.isa64 >= INTEL64)
6223             continue;
6224           break;
6225         case intel64:
6226           /* -mintel64: Don't accept AMD64.  */
6227           if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6228             continue;
6229           break;
6230         }
6231
6232       /* Check the suffix.  */
6233       i.error = invalid_instruction_suffix;
6234       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6235           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6236           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6237           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6238           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6239           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6240         continue;
6241
6242       size_match = operand_size_match (t);
6243       if (!size_match)
6244         continue;
6245
6246       /* This is intentionally not
6247
6248          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6249
6250          as the case of a missing * on the operand is accepted (perhaps with
6251          a warning, issued further down).  */
6252       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6253         {
6254           i.error = operand_type_mismatch;
6255           continue;
6256         }
6257
6258       for (j = 0; j < MAX_OPERANDS; j++)
6259         operand_types[j] = t->operand_types[j];
6260
6261       /* In general, don't allow
6262          - 64-bit operands outside of 64-bit mode,
6263          - 32-bit operands on pre-386.  */
6264       j = i.imm_operands + (t->operands > i.imm_operands + 1);
6265       if (((i.suffix == QWORD_MNEM_SUFFIX
6266             && flag_code != CODE_64BIT
6267             && (t->base_opcode != 0x0fc7
6268                 || t->extension_opcode != 1 /* cmpxchg8b */))
6269            || (i.suffix == LONG_MNEM_SUFFIX
6270                && !cpu_arch_flags.bitfield.cpui386))
6271           && (intel_syntax
6272               ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6273                  && !intel_float_operand (t->name))
6274               : intel_float_operand (t->name) != 2)
6275           && (t->operands == i.imm_operands
6276               || (operand_types[i.imm_operands].bitfield.class != RegMMX
6277                && operand_types[i.imm_operands].bitfield.class != RegSIMD
6278                && operand_types[i.imm_operands].bitfield.class != RegMask)
6279               || (operand_types[j].bitfield.class != RegMMX
6280                   && operand_types[j].bitfield.class != RegSIMD
6281                   && operand_types[j].bitfield.class != RegMask))
6282           && !t->opcode_modifier.vecsib)
6283         continue;
6284
6285       /* Do not verify operands when there are none.  */
6286       if (!t->operands)
6287         {
6288           if (VEX_check_encoding (t))
6289             {
6290               specific_error = i.error;
6291               continue;
6292             }
6293
6294           /* We've found a match; break out of loop.  */
6295           break;
6296         }
6297
6298       if (!t->opcode_modifier.jump
6299           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6300         {
6301           /* There should be only one Disp operand.  */
6302           for (j = 0; j < MAX_OPERANDS; j++)
6303             if (operand_type_check (operand_types[j], disp))
6304               break;
6305           if (j < MAX_OPERANDS)
6306             {
6307               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6308
6309               addr_prefix_disp = j;
6310
6311               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6312                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
6313               switch (flag_code)
6314                 {
6315                 case CODE_16BIT:
6316                   override = !override;
6317                   /* Fall through.  */
6318                 case CODE_32BIT:
6319                   if (operand_types[j].bitfield.disp32
6320                       && operand_types[j].bitfield.disp16)
6321                     {
6322                       operand_types[j].bitfield.disp16 = override;
6323                       operand_types[j].bitfield.disp32 = !override;
6324                     }
6325                   operand_types[j].bitfield.disp32s = 0;
6326                   operand_types[j].bitfield.disp64 = 0;
6327                   break;
6328
6329                 case CODE_64BIT:
6330                   if (operand_types[j].bitfield.disp32s
6331                       || operand_types[j].bitfield.disp64)
6332                     {
6333                       operand_types[j].bitfield.disp64 &= !override;
6334                       operand_types[j].bitfield.disp32s &= !override;
6335                       operand_types[j].bitfield.disp32 = override;
6336                     }
6337                   operand_types[j].bitfield.disp16 = 0;
6338                   break;
6339                 }
6340             }
6341         }
6342
6343       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
6344       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6345         continue;
6346
6347       /* We check register size if needed.  */
6348       if (t->opcode_modifier.checkregsize)
6349         {
6350           check_register = (1 << t->operands) - 1;
6351           if (i.broadcast)
6352             check_register &= ~(1 << i.broadcast->operand);
6353         }
6354       else
6355         check_register = 0;
6356
6357       overlap0 = operand_type_and (i.types[0], operand_types[0]);
6358       switch (t->operands)
6359         {
6360         case 1:
6361           if (!operand_type_match (overlap0, i.types[0]))
6362             continue;
6363           break;
6364         case 2:
6365           /* xchg %eax, %eax is a special case. It is an alias for nop
6366              only in 32bit mode and we can use opcode 0x90.  In 64bit
6367              mode, we can't use 0x90 for xchg %eax, %eax since it should
6368              zero-extend %eax to %rax.  */
6369           if (flag_code == CODE_64BIT
6370               && t->base_opcode == 0x90
6371               && i.types[0].bitfield.instance == Accum
6372               && i.types[0].bitfield.dword
6373               && i.types[1].bitfield.instance == Accum
6374               && i.types[1].bitfield.dword)
6375             continue;
6376           /* xrelease mov %eax, <disp> is another special case. It must not
6377              match the accumulator-only encoding of mov.  */
6378           if (flag_code != CODE_64BIT
6379               && i.hle_prefix
6380               && t->base_opcode == 0xa0
6381               && i.types[0].bitfield.instance == Accum
6382               && (i.flags[1] & Operand_Mem))
6383             continue;
6384           /* Fall through.  */
6385
6386         case 3:
6387           if (!(size_match & MATCH_STRAIGHT))
6388             goto check_reverse;
6389           /* Reverse direction of operands if swapping is possible in the first
6390              place (operands need to be symmetric) and
6391              - the load form is requested, and the template is a store form,
6392              - the store form is requested, and the template is a load form,
6393              - the non-default (swapped) form is requested.  */
6394           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6395           if (t->opcode_modifier.d && i.reg_operands == i.operands
6396               && !operand_type_all_zero (&overlap1))
6397             switch (i.dir_encoding)
6398               {
6399               case dir_encoding_load:
6400                 if (operand_type_check (operand_types[i.operands - 1], anymem)
6401                     || t->opcode_modifier.regmem)
6402                   goto check_reverse;
6403                 break;
6404
6405               case dir_encoding_store:
6406                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6407                     && !t->opcode_modifier.regmem)
6408                   goto check_reverse;
6409                 break;
6410
6411               case dir_encoding_swap:
6412                 goto check_reverse;
6413
6414               case dir_encoding_default:
6415                 break;
6416               }
6417           /* If we want store form, we skip the current load.  */
6418           if ((i.dir_encoding == dir_encoding_store
6419                || i.dir_encoding == dir_encoding_swap)
6420               && i.mem_operands == 0
6421               && t->opcode_modifier.load)
6422             continue;
6423           /* Fall through.  */
6424         case 4:
6425         case 5:
6426           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6427           if (!operand_type_match (overlap0, i.types[0])
6428               || !operand_type_match (overlap1, i.types[1])
6429               || ((check_register & 3) == 3
6430                   && !operand_type_register_match (i.types[0],
6431                                                    operand_types[0],
6432                                                    i.types[1],
6433                                                    operand_types[1])))
6434             {
6435               /* Check if other direction is valid ...  */
6436               if (!t->opcode_modifier.d)
6437                 continue;
6438
6439             check_reverse:
6440               if (!(size_match & MATCH_REVERSE))
6441                 continue;
6442               /* Try reversing direction of operands.  */
6443               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6444               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6445               if (!operand_type_match (overlap0, i.types[0])
6446                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6447                   || (check_register
6448                       && !operand_type_register_match (i.types[0],
6449                                                        operand_types[i.operands - 1],
6450                                                        i.types[i.operands - 1],
6451                                                        operand_types[0])))
6452                 {
6453                   /* Does not match either direction.  */
6454                   continue;
6455                 }
6456               /* found_reverse_match holds which of D or FloatR
6457                  we've found.  */
6458               if (!t->opcode_modifier.d)
6459                 found_reverse_match = 0;
6460               else if (operand_types[0].bitfield.tbyte)
6461                 found_reverse_match = Opcode_FloatD;
6462               else if (operand_types[0].bitfield.xmmword
6463                        || operand_types[i.operands - 1].bitfield.xmmword
6464                        || operand_types[0].bitfield.class == RegMMX
6465                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6466                        || is_any_vex_encoding(t))
6467                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6468                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6469               else
6470                 found_reverse_match = Opcode_D;
6471               if (t->opcode_modifier.floatr)
6472                 found_reverse_match |= Opcode_FloatR;
6473             }
6474           else
6475             {
6476               /* Found a forward 2 operand match here.  */
6477               switch (t->operands)
6478                 {
6479                 case 5:
6480                   overlap4 = operand_type_and (i.types[4],
6481                                                operand_types[4]);
6482                   /* Fall through.  */
6483                 case 4:
6484                   overlap3 = operand_type_and (i.types[3],
6485                                                operand_types[3]);
6486                   /* Fall through.  */
6487                 case 3:
6488                   overlap2 = operand_type_and (i.types[2],
6489                                                operand_types[2]);
6490                   break;
6491                 }
6492
6493               switch (t->operands)
6494                 {
6495                 case 5:
6496                   if (!operand_type_match (overlap4, i.types[4])
6497                       || !operand_type_register_match (i.types[3],
6498                                                        operand_types[3],
6499                                                        i.types[4],
6500                                                        operand_types[4]))
6501                     continue;
6502                   /* Fall through.  */
6503                 case 4:
6504                   if (!operand_type_match (overlap3, i.types[3])
6505                       || ((check_register & 0xa) == 0xa
6506                           && !operand_type_register_match (i.types[1],
6507                                                             operand_types[1],
6508                                                             i.types[3],
6509                                                             operand_types[3]))
6510                       || ((check_register & 0xc) == 0xc
6511                           && !operand_type_register_match (i.types[2],
6512                                                             operand_types[2],
6513                                                             i.types[3],
6514                                                             operand_types[3])))
6515                     continue;
6516                   /* Fall through.  */
6517                 case 3:
6518                   /* Here we make use of the fact that there are no
6519                      reverse match 3 operand instructions.  */
6520                   if (!operand_type_match (overlap2, i.types[2])
6521                       || ((check_register & 5) == 5
6522                           && !operand_type_register_match (i.types[0],
6523                                                             operand_types[0],
6524                                                             i.types[2],
6525                                                             operand_types[2]))
6526                       || ((check_register & 6) == 6
6527                           && !operand_type_register_match (i.types[1],
6528                                                             operand_types[1],
6529                                                             i.types[2],
6530                                                             operand_types[2])))
6531                     continue;
6532                   break;
6533                 }
6534             }
6535           /* Found either forward/reverse 2, 3 or 4 operand match here:
6536              slip through to break.  */
6537         }
6538
6539       /* Check if vector operands are valid.  */
6540       if (check_VecOperands (t))
6541         {
6542           specific_error = i.error;
6543           continue;
6544         }
6545
6546       /* Check if VEX/EVEX encoding requirements can be satisfied.  */
6547       if (VEX_check_encoding (t))
6548         {
6549           specific_error = i.error;
6550           continue;
6551         }
6552
6553       /* We've found a match; break out of loop.  */
6554       break;
6555     }
6556
6557   if (t == current_templates->end)
6558     {
6559       /* We found no match.  */
6560       const char *err_msg;
6561       switch (specific_error ? specific_error : i.error)
6562         {
6563         default:
6564           abort ();
6565         case operand_size_mismatch:
6566           err_msg = _("operand size mismatch");
6567           break;
6568         case operand_type_mismatch:
6569           err_msg = _("operand type mismatch");
6570           break;
6571         case register_type_mismatch:
6572           err_msg = _("register type mismatch");
6573           break;
6574         case number_of_operands_mismatch:
6575           err_msg = _("number of operands mismatch");
6576           break;
6577         case invalid_instruction_suffix:
6578           err_msg = _("invalid instruction suffix");
6579           break;
6580         case bad_imm4:
6581           err_msg = _("constant doesn't fit in 4 bits");
6582           break;
6583         case unsupported_with_intel_mnemonic:
6584           err_msg = _("unsupported with Intel mnemonic");
6585           break;
6586         case unsupported_syntax:
6587           err_msg = _("unsupported syntax");
6588           break;
6589         case unsupported:
6590           as_bad (_("unsupported instruction `%s'"),
6591                   current_templates->start->name);
6592           return NULL;
6593         case invalid_vsib_address:
6594           err_msg = _("invalid VSIB address");
6595           break;
6596         case invalid_vector_register_set:
6597           err_msg = _("mask, index, and destination registers must be distinct");
6598           break;
6599         case unsupported_vector_index_register:
6600           err_msg = _("unsupported vector index register");
6601           break;
6602         case unsupported_broadcast:
6603           err_msg = _("unsupported broadcast");
6604           break;
6605         case broadcast_needed:
6606           err_msg = _("broadcast is needed for operand of such type");
6607           break;
6608         case unsupported_masking:
6609           err_msg = _("unsupported masking");
6610           break;
6611         case mask_not_on_destination:
6612           err_msg = _("mask not on destination operand");
6613           break;
6614         case no_default_mask:
6615           err_msg = _("default mask isn't allowed");
6616           break;
6617         case unsupported_rc_sae:
6618           err_msg = _("unsupported static rounding/sae");
6619           break;
6620         case rc_sae_operand_not_last_imm:
6621           if (intel_syntax)
6622             err_msg = _("RC/SAE operand must precede immediate operands");
6623           else
6624             err_msg = _("RC/SAE operand must follow immediate operands");
6625           break;
6626         case invalid_register_operand:
6627           err_msg = _("invalid register operand");
6628           break;
6629         }
6630       as_bad (_("%s for `%s'"), err_msg,
6631               current_templates->start->name);
6632       return NULL;
6633     }
6634
6635   if (!quiet_warnings)
6636     {
6637       if (!intel_syntax
6638           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6639         as_warn (_("indirect %s without `*'"), t->name);
6640
6641       if (t->opcode_modifier.isprefix
6642           && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6643         {
6644           /* Warn them that a data or address size prefix doesn't
6645              affect assembly of the next line of code.  */
6646           as_warn (_("stand-alone `%s' prefix"), t->name);
6647         }
6648     }
6649
6650   /* Copy the template we found.  */
6651   i.tm = *t;
6652
6653   if (addr_prefix_disp != -1)
6654     i.tm.operand_types[addr_prefix_disp]
6655       = operand_types[addr_prefix_disp];
6656
6657   if (found_reverse_match)
6658     {
6659       /* If we found a reverse match we must alter the opcode direction
6660          bit and clear/flip the regmem modifier one.  found_reverse_match
6661          holds bits to change (different for int & float insns).  */
6662
6663       i.tm.base_opcode ^= found_reverse_match;
6664
6665       i.tm.operand_types[0] = operand_types[i.operands - 1];
6666       i.tm.operand_types[i.operands - 1] = operand_types[0];
6667
6668       /* Certain SIMD insns have their load forms specified in the opcode
6669          table, and hence we need to _set_ RegMem instead of clearing it.
6670          We need to avoid setting the bit though on insns like KMOVW.  */
6671       i.tm.opcode_modifier.regmem
6672         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6673           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6674           && !i.tm.opcode_modifier.regmem;
6675     }
6676
6677   return t;
6678 }
6679
6680 static int
6681 check_string (void)
6682 {
6683   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6684   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6685
6686   if (i.seg[op] != NULL && i.seg[op] != &es)
6687     {
6688       as_bad (_("`%s' operand %u must use `%ses' segment"),
6689               i.tm.name,
6690               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6691               register_prefix);
6692       return 0;
6693     }
6694
6695   /* There's only ever one segment override allowed per instruction.
6696      This instruction possibly has a legal segment override on the
6697      second operand, so copy the segment to where non-string
6698      instructions store it, allowing common code.  */
6699   i.seg[op] = i.seg[1];
6700
6701   return 1;
6702 }
6703
6704 static int
6705 process_suffix (void)
6706 {
6707   /* If matched instruction specifies an explicit instruction mnemonic
6708      suffix, use it.  */
6709   if (i.tm.opcode_modifier.size == SIZE16)
6710     i.suffix = WORD_MNEM_SUFFIX;
6711   else if (i.tm.opcode_modifier.size == SIZE32)
6712     i.suffix = LONG_MNEM_SUFFIX;
6713   else if (i.tm.opcode_modifier.size == SIZE64)
6714     i.suffix = QWORD_MNEM_SUFFIX;
6715   else if (i.reg_operands
6716            && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6717            && !i.tm.opcode_modifier.addrprefixopreg)
6718     {
6719       unsigned int numop = i.operands;
6720
6721       /* movsx/movzx want only their source operand considered here, for the
6722          ambiguity checking below.  The suffix will be replaced afterwards
6723          to represent the destination (register).  */
6724       if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6725           || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6726         --i.operands;
6727
6728       /* crc32 needs REX.W set regardless of suffix / source operand size.  */
6729       if (i.tm.base_opcode == 0xf20f38f0
6730           && i.tm.operand_types[1].bitfield.qword)
6731         i.rex |= REX_W;
6732
6733       /* If there's no instruction mnemonic suffix we try to invent one
6734          based on GPR operands.  */
6735       if (!i.suffix)
6736         {
6737           /* We take i.suffix from the last register operand specified,
6738              Destination register type is more significant than source
6739              register type.  crc32 in SSE4.2 prefers source register
6740              type. */
6741           unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6742
6743           while (op--)
6744             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6745                 || i.tm.operand_types[op].bitfield.instance == Accum)
6746               {
6747                 if (i.types[op].bitfield.class != Reg)
6748                   continue;
6749                 if (i.types[op].bitfield.byte)
6750                   i.suffix = BYTE_MNEM_SUFFIX;
6751                 else if (i.types[op].bitfield.word)
6752                   i.suffix = WORD_MNEM_SUFFIX;
6753                 else if (i.types[op].bitfield.dword)
6754                   i.suffix = LONG_MNEM_SUFFIX;
6755                 else if (i.types[op].bitfield.qword)
6756                   i.suffix = QWORD_MNEM_SUFFIX;
6757                 else
6758                   continue;
6759                 break;
6760               }
6761
6762           /* As an exception, movsx/movzx silently default to a byte source
6763              in AT&T mode.  */
6764           if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6765               && !i.suffix && !intel_syntax)
6766             i.suffix = BYTE_MNEM_SUFFIX;
6767         }
6768       else if (i.suffix == BYTE_MNEM_SUFFIX)
6769         {
6770           if (intel_syntax
6771               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6772               && i.tm.opcode_modifier.no_bsuf)
6773             i.suffix = 0;
6774           else if (!check_byte_reg ())
6775             return 0;
6776         }
6777       else if (i.suffix == LONG_MNEM_SUFFIX)
6778         {
6779           if (intel_syntax
6780               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6781               && i.tm.opcode_modifier.no_lsuf
6782               && !i.tm.opcode_modifier.todword
6783               && !i.tm.opcode_modifier.toqword)
6784             i.suffix = 0;
6785           else if (!check_long_reg ())
6786             return 0;
6787         }
6788       else if (i.suffix == QWORD_MNEM_SUFFIX)
6789         {
6790           if (intel_syntax
6791               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6792               && i.tm.opcode_modifier.no_qsuf
6793               && !i.tm.opcode_modifier.todword
6794               && !i.tm.opcode_modifier.toqword)
6795             i.suffix = 0;
6796           else if (!check_qword_reg ())
6797             return 0;
6798         }
6799       else if (i.suffix == WORD_MNEM_SUFFIX)
6800         {
6801           if (intel_syntax
6802               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6803               && i.tm.opcode_modifier.no_wsuf)
6804             i.suffix = 0;
6805           else if (!check_word_reg ())
6806             return 0;
6807         }
6808       else if (intel_syntax
6809                && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6810         /* Do nothing if the instruction is going to ignore the prefix.  */
6811         ;
6812       else
6813         abort ();
6814
6815       /* Undo the movsx/movzx change done above.  */
6816       i.operands = numop;
6817     }
6818   else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6819            && !i.suffix)
6820     {
6821       i.suffix = stackop_size;
6822       if (stackop_size == LONG_MNEM_SUFFIX)
6823         {
6824           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6825              .code16gcc directive to support 16-bit mode with
6826              32-bit address.  For IRET without a suffix, generate
6827              16-bit IRET (opcode 0xcf) to return from an interrupt
6828              handler.  */
6829           if (i.tm.base_opcode == 0xcf)
6830             {
6831               i.suffix = WORD_MNEM_SUFFIX;
6832               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6833             }
6834           /* Warn about changed behavior for segment register push/pop.  */
6835           else if ((i.tm.base_opcode | 1) == 0x07)
6836             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6837                      i.tm.name);
6838         }
6839     }
6840   else if (!i.suffix
6841            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6842                || i.tm.opcode_modifier.jump == JUMP_BYTE
6843                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6844                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6845                    && i.tm.extension_opcode <= 3)))
6846     {
6847       switch (flag_code)
6848         {
6849         case CODE_64BIT:
6850           if (!i.tm.opcode_modifier.no_qsuf)
6851             {
6852               if (i.tm.opcode_modifier.jump == JUMP_BYTE
6853                   || i.tm.opcode_modifier.no_lsuf)
6854                 i.suffix = QWORD_MNEM_SUFFIX;
6855               break;
6856             }
6857           /* Fall through.  */
6858         case CODE_32BIT:
6859           if (!i.tm.opcode_modifier.no_lsuf)
6860             i.suffix = LONG_MNEM_SUFFIX;
6861           break;
6862         case CODE_16BIT:
6863           if (!i.tm.opcode_modifier.no_wsuf)
6864             i.suffix = WORD_MNEM_SUFFIX;
6865           break;
6866         }
6867     }
6868
6869   if (!i.suffix
6870       && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6871           /* Also cover lret/retf/iret in 64-bit mode.  */
6872           || (flag_code == CODE_64BIT
6873               && !i.tm.opcode_modifier.no_lsuf
6874               && !i.tm.opcode_modifier.no_qsuf))
6875       && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6876       /* Explicit sizing prefixes are assumed to disambiguate insns.  */
6877       && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6878       /* Accept FLDENV et al without suffix.  */
6879       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6880     {
6881       unsigned int suffixes, evex = 0;
6882
6883       suffixes = !i.tm.opcode_modifier.no_bsuf;
6884       if (!i.tm.opcode_modifier.no_wsuf)
6885         suffixes |= 1 << 1;
6886       if (!i.tm.opcode_modifier.no_lsuf)
6887         suffixes |= 1 << 2;
6888       if (!i.tm.opcode_modifier.no_ldsuf)
6889         suffixes |= 1 << 3;
6890       if (!i.tm.opcode_modifier.no_ssuf)
6891         suffixes |= 1 << 4;
6892       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6893         suffixes |= 1 << 5;
6894
6895       /* For [XYZ]MMWORD operands inspect operand sizes.  While generally
6896          also suitable for AT&T syntax mode, it was requested that this be
6897          restricted to just Intel syntax.  */
6898       if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6899         {
6900           unsigned int op;
6901
6902           for (op = 0; op < i.tm.operands; ++op)
6903             {
6904               if (is_evex_encoding (&i.tm)
6905                   && !cpu_arch_flags.bitfield.cpuavx512vl)
6906                 {
6907                   if (i.tm.operand_types[op].bitfield.ymmword)
6908                     i.tm.operand_types[op].bitfield.xmmword = 0;
6909                   if (i.tm.operand_types[op].bitfield.zmmword)
6910                     i.tm.operand_types[op].bitfield.ymmword = 0;
6911                   if (!i.tm.opcode_modifier.evex
6912                       || i.tm.opcode_modifier.evex == EVEXDYN)
6913                     i.tm.opcode_modifier.evex = EVEX512;
6914                 }
6915
6916               if (i.tm.operand_types[op].bitfield.xmmword
6917                   + i.tm.operand_types[op].bitfield.ymmword
6918                   + i.tm.operand_types[op].bitfield.zmmword < 2)
6919                 continue;
6920
6921               /* Any properly sized operand disambiguates the insn.  */
6922               if (i.types[op].bitfield.xmmword
6923                   || i.types[op].bitfield.ymmword
6924                   || i.types[op].bitfield.zmmword)
6925                 {
6926                   suffixes &= ~(7 << 6);
6927                   evex = 0;
6928                   break;
6929                 }
6930
6931               if ((i.flags[op] & Operand_Mem)
6932                   && i.tm.operand_types[op].bitfield.unspecified)
6933                 {
6934                   if (i.tm.operand_types[op].bitfield.xmmword)
6935                     suffixes |= 1 << 6;
6936                   if (i.tm.operand_types[op].bitfield.ymmword)
6937                     suffixes |= 1 << 7;
6938                   if (i.tm.operand_types[op].bitfield.zmmword)
6939                     suffixes |= 1 << 8;
6940                   if (is_evex_encoding (&i.tm))
6941                     evex = EVEX512;
6942                 }
6943             }
6944         }
6945
6946       /* Are multiple suffixes / operand sizes allowed?  */
6947       if (suffixes & (suffixes - 1))
6948         {
6949           if (intel_syntax
6950               && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6951                   || operand_check == check_error))
6952             {
6953               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6954               return 0;
6955             }
6956           if (operand_check == check_error)
6957             {
6958               as_bad (_("no instruction mnemonic suffix given and "
6959                         "no register operands; can't size `%s'"), i.tm.name);
6960               return 0;
6961             }
6962           if (operand_check == check_warning)
6963             as_warn (_("%s; using default for `%s'"),
6964                        intel_syntax
6965                        ? _("ambiguous operand size")
6966                        : _("no instruction mnemonic suffix given and "
6967                            "no register operands"),
6968                        i.tm.name);
6969
6970           if (i.tm.opcode_modifier.floatmf)
6971             i.suffix = SHORT_MNEM_SUFFIX;
6972           else if ((i.tm.base_opcode | 8) == 0xfbe
6973                    || (i.tm.base_opcode == 0x63
6974                        && i.tm.cpu_flags.bitfield.cpu64))
6975             /* handled below */;
6976           else if (evex)
6977             i.tm.opcode_modifier.evex = evex;
6978           else if (flag_code == CODE_16BIT)
6979             i.suffix = WORD_MNEM_SUFFIX;
6980           else if (!i.tm.opcode_modifier.no_lsuf)
6981             i.suffix = LONG_MNEM_SUFFIX;
6982           else
6983             i.suffix = QWORD_MNEM_SUFFIX;
6984         }
6985     }
6986
6987   if ((i.tm.base_opcode | 8) == 0xfbe
6988       || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6989     {
6990       /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6991          In AT&T syntax, if there is no suffix (warned about above), the default
6992          will be byte extension.  */
6993       if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6994         i.tm.base_opcode |= 1;
6995
6996       /* For further processing, the suffix should represent the destination
6997          (register).  This is already the case when one was used with
6998          mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6999          no suffix to begin with.  */
7000       if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7001         {
7002           if (i.types[1].bitfield.word)
7003             i.suffix = WORD_MNEM_SUFFIX;
7004           else if (i.types[1].bitfield.qword)
7005             i.suffix = QWORD_MNEM_SUFFIX;
7006           else
7007             i.suffix = LONG_MNEM_SUFFIX;
7008
7009           i.tm.opcode_modifier.w = 0;
7010         }
7011     }
7012
7013   if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7014     i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7015                    != (i.tm.operand_types[1].bitfield.class == Reg);
7016
7017   /* Change the opcode based on the operand size given by i.suffix.  */
7018   switch (i.suffix)
7019     {
7020     /* Size floating point instruction.  */
7021     case LONG_MNEM_SUFFIX:
7022       if (i.tm.opcode_modifier.floatmf)
7023         {
7024           i.tm.base_opcode ^= 4;
7025           break;
7026         }
7027     /* fall through */
7028     case WORD_MNEM_SUFFIX:
7029     case QWORD_MNEM_SUFFIX:
7030       /* It's not a byte, select word/dword operation.  */
7031       if (i.tm.opcode_modifier.w)
7032         {
7033           if (i.short_form)
7034             i.tm.base_opcode |= 8;
7035           else
7036             i.tm.base_opcode |= 1;
7037         }
7038     /* fall through */
7039     case SHORT_MNEM_SUFFIX:
7040       /* Now select between word & dword operations via the operand
7041          size prefix, except for instructions that will ignore this
7042          prefix anyway.  */
7043       if (i.suffix != QWORD_MNEM_SUFFIX
7044           && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7045           && !i.tm.opcode_modifier.floatmf
7046           && !is_any_vex_encoding (&i.tm)
7047           && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7048               || (flag_code == CODE_64BIT
7049                   && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7050         {
7051           unsigned int prefix = DATA_PREFIX_OPCODE;
7052
7053           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7054             prefix = ADDR_PREFIX_OPCODE;
7055
7056           if (!add_prefix (prefix))
7057             return 0;
7058         }
7059
7060       /* Set mode64 for an operand.  */
7061       if (i.suffix == QWORD_MNEM_SUFFIX
7062           && flag_code == CODE_64BIT
7063           && !i.tm.opcode_modifier.norex64
7064           && !i.tm.opcode_modifier.vexw
7065           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
7066              need rex64. */
7067           && ! (i.operands == 2
7068                 && i.tm.base_opcode == 0x90
7069                 && i.tm.extension_opcode == None
7070                 && i.types[0].bitfield.instance == Accum
7071                 && i.types[0].bitfield.qword
7072                 && i.types[1].bitfield.instance == Accum
7073                 && i.types[1].bitfield.qword))
7074         i.rex |= REX_W;
7075
7076       break;
7077
7078     case 0:
7079       /* Select word/dword/qword operation with explict data sizing prefix
7080          when there are no suitable register operands.  */
7081       if (i.tm.opcode_modifier.w
7082           && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7083           && (!i.reg_operands
7084               || (i.reg_operands == 1
7085                       /* ShiftCount */
7086                   && (i.tm.operand_types[0].bitfield.instance == RegC
7087                       /* InOutPortReg */
7088                       || i.tm.operand_types[0].bitfield.instance == RegD
7089                       || i.tm.operand_types[1].bitfield.instance == RegD
7090                       /* CRC32 */
7091                       || i.tm.base_opcode == 0xf20f38f0))))
7092         i.tm.base_opcode |= 1;
7093       break;
7094     }
7095
7096   if (i.tm.opcode_modifier.addrprefixopreg)
7097     {
7098       gas_assert (!i.suffix);
7099       gas_assert (i.reg_operands);
7100
7101       if (i.tm.operand_types[0].bitfield.instance == Accum
7102           || i.operands == 1)
7103         {
7104           /* The address size override prefix changes the size of the
7105              first operand.  */
7106           if (flag_code == CODE_64BIT
7107               && i.op[0].regs->reg_type.bitfield.word)
7108             {
7109               as_bad (_("16-bit addressing unavailable for `%s'"),
7110                       i.tm.name);
7111               return 0;
7112             }
7113
7114           if ((flag_code == CODE_32BIT
7115                ? i.op[0].regs->reg_type.bitfield.word
7116                : i.op[0].regs->reg_type.bitfield.dword)
7117               && !add_prefix (ADDR_PREFIX_OPCODE))
7118             return 0;
7119         }
7120       else
7121         {
7122           /* Check invalid register operand when the address size override
7123              prefix changes the size of register operands.  */
7124           unsigned int op;
7125           enum { need_word, need_dword, need_qword } need;
7126
7127           if (flag_code == CODE_32BIT)
7128             need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7129           else if (i.prefix[ADDR_PREFIX])
7130             need = need_dword;
7131           else
7132             need = flag_code == CODE_64BIT ? need_qword : need_word;
7133
7134           for (op = 0; op < i.operands; op++)
7135             {
7136               if (i.types[op].bitfield.class != Reg)
7137                 continue;
7138
7139               switch (need)
7140                 {
7141                 case need_word:
7142                   if (i.op[op].regs->reg_type.bitfield.word)
7143                     continue;
7144                   break;
7145                 case need_dword:
7146                   if (i.op[op].regs->reg_type.bitfield.dword)
7147                     continue;
7148                   break;
7149                 case need_qword:
7150                   if (i.op[op].regs->reg_type.bitfield.qword)
7151                     continue;
7152                   break;
7153                 }
7154
7155               as_bad (_("invalid register operand size for `%s'"),
7156                       i.tm.name);
7157               return 0;
7158             }
7159         }
7160     }
7161
7162   return 1;
7163 }
7164
7165 static int
7166 check_byte_reg (void)
7167 {
7168   int op;
7169
7170   for (op = i.operands; --op >= 0;)
7171     {
7172       /* Skip non-register operands. */
7173       if (i.types[op].bitfield.class != Reg)
7174         continue;
7175
7176       /* If this is an eight bit register, it's OK.  If it's the 16 or
7177          32 bit version of an eight bit register, we will just use the
7178          low portion, and that's OK too.  */
7179       if (i.types[op].bitfield.byte)
7180         continue;
7181
7182       /* I/O port address operands are OK too.  */
7183       if (i.tm.operand_types[op].bitfield.instance == RegD
7184           && i.tm.operand_types[op].bitfield.word)
7185         continue;
7186
7187       /* crc32 only wants its source operand checked here.  */
7188       if (i.tm.base_opcode == 0xf20f38f0 && op)
7189         continue;
7190
7191       /* Any other register is bad.  */
7192       as_bad (_("`%s%s' not allowed with `%s%c'"),
7193               register_prefix, i.op[op].regs->reg_name,
7194               i.tm.name, i.suffix);
7195       return 0;
7196     }
7197   return 1;
7198 }
7199
7200 static int
7201 check_long_reg (void)
7202 {
7203   int op;
7204
7205   for (op = i.operands; --op >= 0;)
7206     /* Skip non-register operands. */
7207     if (i.types[op].bitfield.class != Reg)
7208       continue;
7209     /* Reject eight bit registers, except where the template requires
7210        them. (eg. movzb)  */
7211     else if (i.types[op].bitfield.byte
7212              && (i.tm.operand_types[op].bitfield.class == Reg
7213                  || i.tm.operand_types[op].bitfield.instance == Accum)
7214              && (i.tm.operand_types[op].bitfield.word
7215                  || i.tm.operand_types[op].bitfield.dword))
7216       {
7217         as_bad (_("`%s%s' not allowed with `%s%c'"),
7218                 register_prefix,
7219                 i.op[op].regs->reg_name,
7220                 i.tm.name,
7221                 i.suffix);
7222         return 0;
7223       }
7224     /* Error if the e prefix on a general reg is missing.  */
7225     else if (i.types[op].bitfield.word
7226              && (i.tm.operand_types[op].bitfield.class == Reg
7227                  || i.tm.operand_types[op].bitfield.instance == Accum)
7228              && i.tm.operand_types[op].bitfield.dword)
7229       {
7230         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7231                 register_prefix, i.op[op].regs->reg_name,
7232                 i.suffix);
7233         return 0;
7234       }
7235     /* Warn if the r prefix on a general reg is present.  */
7236     else if (i.types[op].bitfield.qword
7237              && (i.tm.operand_types[op].bitfield.class == Reg
7238                  || i.tm.operand_types[op].bitfield.instance == Accum)
7239              && i.tm.operand_types[op].bitfield.dword)
7240       {
7241         if (intel_syntax
7242             && i.tm.opcode_modifier.toqword
7243             && i.types[0].bitfield.class != RegSIMD)
7244           {
7245             /* Convert to QWORD.  We want REX byte. */
7246             i.suffix = QWORD_MNEM_SUFFIX;
7247           }
7248         else
7249           {
7250             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7251                     register_prefix, i.op[op].regs->reg_name,
7252                     i.suffix);
7253             return 0;
7254           }
7255       }
7256   return 1;
7257 }
7258
7259 static int
7260 check_qword_reg (void)
7261 {
7262   int op;
7263
7264   for (op = i.operands; --op >= 0; )
7265     /* Skip non-register operands. */
7266     if (i.types[op].bitfield.class != Reg)
7267       continue;
7268     /* Reject eight bit registers, except where the template requires
7269        them. (eg. movzb)  */
7270     else if (i.types[op].bitfield.byte
7271              && (i.tm.operand_types[op].bitfield.class == Reg
7272                  || i.tm.operand_types[op].bitfield.instance == Accum)
7273              && (i.tm.operand_types[op].bitfield.word
7274                  || i.tm.operand_types[op].bitfield.dword))
7275       {
7276         as_bad (_("`%s%s' not allowed with `%s%c'"),
7277                 register_prefix,
7278                 i.op[op].regs->reg_name,
7279                 i.tm.name,
7280                 i.suffix);
7281         return 0;
7282       }
7283     /* Warn if the r prefix on a general reg is missing.  */
7284     else if ((i.types[op].bitfield.word
7285               || i.types[op].bitfield.dword)
7286              && (i.tm.operand_types[op].bitfield.class == Reg
7287                  || i.tm.operand_types[op].bitfield.instance == Accum)
7288              && i.tm.operand_types[op].bitfield.qword)
7289       {
7290         /* Prohibit these changes in the 64bit mode, since the
7291            lowering is more complicated.  */
7292         if (intel_syntax
7293             && i.tm.opcode_modifier.todword
7294             && i.types[0].bitfield.class != RegSIMD)
7295           {
7296             /* Convert to DWORD.  We don't want REX byte. */
7297             i.suffix = LONG_MNEM_SUFFIX;
7298           }
7299         else
7300           {
7301             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7302                     register_prefix, i.op[op].regs->reg_name,
7303                     i.suffix);
7304             return 0;
7305           }
7306       }
7307   return 1;
7308 }
7309
7310 static int
7311 check_word_reg (void)
7312 {
7313   int op;
7314   for (op = i.operands; --op >= 0;)
7315     /* Skip non-register operands. */
7316     if (i.types[op].bitfield.class != Reg)
7317       continue;
7318     /* Reject eight bit registers, except where the template requires
7319        them. (eg. movzb)  */
7320     else if (i.types[op].bitfield.byte
7321              && (i.tm.operand_types[op].bitfield.class == Reg
7322                  || i.tm.operand_types[op].bitfield.instance == Accum)
7323              && (i.tm.operand_types[op].bitfield.word
7324                  || i.tm.operand_types[op].bitfield.dword))
7325       {
7326         as_bad (_("`%s%s' not allowed with `%s%c'"),
7327                 register_prefix,
7328                 i.op[op].regs->reg_name,
7329                 i.tm.name,
7330                 i.suffix);
7331         return 0;
7332       }
7333     /* Error if the e or r prefix on a general reg is present.  */
7334     else if ((i.types[op].bitfield.dword
7335                  || i.types[op].bitfield.qword)
7336              && (i.tm.operand_types[op].bitfield.class == Reg
7337                  || i.tm.operand_types[op].bitfield.instance == Accum)
7338              && i.tm.operand_types[op].bitfield.word)
7339       {
7340         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7341                 register_prefix, i.op[op].regs->reg_name,
7342                 i.suffix);
7343         return 0;
7344       }
7345   return 1;
7346 }
7347
7348 static int
7349 update_imm (unsigned int j)
7350 {
7351   i386_operand_type overlap = i.types[j];
7352   if ((overlap.bitfield.imm8
7353        || overlap.bitfield.imm8s
7354        || overlap.bitfield.imm16
7355        || overlap.bitfield.imm32
7356        || overlap.bitfield.imm32s
7357        || overlap.bitfield.imm64)
7358       && !operand_type_equal (&overlap, &imm8)
7359       && !operand_type_equal (&overlap, &imm8s)
7360       && !operand_type_equal (&overlap, &imm16)
7361       && !operand_type_equal (&overlap, &imm32)
7362       && !operand_type_equal (&overlap, &imm32s)
7363       && !operand_type_equal (&overlap, &imm64))
7364     {
7365       if (i.suffix)
7366         {
7367           i386_operand_type temp;
7368
7369           operand_type_set (&temp, 0);
7370           if (i.suffix == BYTE_MNEM_SUFFIX)
7371             {
7372               temp.bitfield.imm8 = overlap.bitfield.imm8;
7373               temp.bitfield.imm8s = overlap.bitfield.imm8s;
7374             }
7375           else if (i.suffix == WORD_MNEM_SUFFIX)
7376             temp.bitfield.imm16 = overlap.bitfield.imm16;
7377           else if (i.suffix == QWORD_MNEM_SUFFIX)
7378             {
7379               temp.bitfield.imm64 = overlap.bitfield.imm64;
7380               temp.bitfield.imm32s = overlap.bitfield.imm32s;
7381             }
7382           else
7383             temp.bitfield.imm32 = overlap.bitfield.imm32;
7384           overlap = temp;
7385         }
7386       else if (operand_type_equal (&overlap, &imm16_32_32s)
7387                || operand_type_equal (&overlap, &imm16_32)
7388                || operand_type_equal (&overlap, &imm16_32s))
7389         {
7390           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7391             overlap = imm16;
7392           else
7393             overlap = imm32s;
7394         }
7395       else if (i.prefix[REX_PREFIX] & REX_W)
7396         overlap = operand_type_and (overlap, imm32s);
7397       else if (i.prefix[DATA_PREFIX])
7398         overlap = operand_type_and (overlap,
7399                                     flag_code != CODE_16BIT ? imm16 : imm32);
7400       if (!operand_type_equal (&overlap, &imm8)
7401           && !operand_type_equal (&overlap, &imm8s)
7402           && !operand_type_equal (&overlap, &imm16)
7403           && !operand_type_equal (&overlap, &imm32)
7404           && !operand_type_equal (&overlap, &imm32s)
7405           && !operand_type_equal (&overlap, &imm64))
7406         {
7407           as_bad (_("no instruction mnemonic suffix given; "
7408                     "can't determine immediate size"));
7409           return 0;
7410         }
7411     }
7412   i.types[j] = overlap;
7413
7414   return 1;
7415 }
7416
7417 static int
7418 finalize_imm (void)
7419 {
7420   unsigned int j, n;
7421
7422   /* Update the first 2 immediate operands.  */
7423   n = i.operands > 2 ? 2 : i.operands;
7424   if (n)
7425     {
7426       for (j = 0; j < n; j++)
7427         if (update_imm (j) == 0)
7428           return 0;
7429
7430       /* The 3rd operand can't be immediate operand.  */
7431       gas_assert (operand_type_check (i.types[2], imm) == 0);
7432     }
7433
7434   return 1;
7435 }
7436
7437 static int
7438 process_operands (void)
7439 {
7440   /* Default segment register this instruction will use for memory
7441      accesses.  0 means unknown.  This is only for optimizing out
7442      unnecessary segment overrides.  */
7443   const seg_entry *default_seg = 0;
7444
7445   if (i.tm.opcode_modifier.sse2avx)
7446     {
7447       /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7448          need converting.  */
7449       i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7450       i.prefix[REX_PREFIX] = 0;
7451       i.rex_encoding = 0;
7452     }
7453
7454   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7455     {
7456       unsigned int dupl = i.operands;
7457       unsigned int dest = dupl - 1;
7458       unsigned int j;
7459
7460       /* The destination must be an xmm register.  */
7461       gas_assert (i.reg_operands
7462                   && MAX_OPERANDS > dupl
7463                   && operand_type_equal (&i.types[dest], &regxmm));
7464
7465       if (i.tm.operand_types[0].bitfield.instance == Accum
7466           && i.tm.operand_types[0].bitfield.xmmword)
7467         {
7468           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7469             {
7470               /* Keep xmm0 for instructions with VEX prefix and 3
7471                  sources.  */
7472               i.tm.operand_types[0].bitfield.instance = InstanceNone;
7473               i.tm.operand_types[0].bitfield.class = RegSIMD;
7474               goto duplicate;
7475             }
7476           else
7477             {
7478               /* We remove the first xmm0 and keep the number of
7479                  operands unchanged, which in fact duplicates the
7480                  destination.  */
7481               for (j = 1; j < i.operands; j++)
7482                 {
7483                   i.op[j - 1] = i.op[j];
7484                   i.types[j - 1] = i.types[j];
7485                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7486                   i.flags[j - 1] = i.flags[j];
7487                 }
7488             }
7489         }
7490       else if (i.tm.opcode_modifier.implicit1stxmm0)
7491         {
7492           gas_assert ((MAX_OPERANDS - 1) > dupl
7493                       && (i.tm.opcode_modifier.vexsources
7494                           == VEX3SOURCES));
7495
7496           /* Add the implicit xmm0 for instructions with VEX prefix
7497              and 3 sources.  */
7498           for (j = i.operands; j > 0; j--)
7499             {
7500               i.op[j] = i.op[j - 1];
7501               i.types[j] = i.types[j - 1];
7502               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7503               i.flags[j] = i.flags[j - 1];
7504             }
7505           i.op[0].regs
7506             = (const reg_entry *) hash_find (reg_hash, "xmm0");
7507           i.types[0] = regxmm;
7508           i.tm.operand_types[0] = regxmm;
7509
7510           i.operands += 2;
7511           i.reg_operands += 2;
7512           i.tm.operands += 2;
7513
7514           dupl++;
7515           dest++;
7516           i.op[dupl] = i.op[dest];
7517           i.types[dupl] = i.types[dest];
7518           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7519           i.flags[dupl] = i.flags[dest];
7520         }
7521       else
7522         {
7523         duplicate:
7524           i.operands++;
7525           i.reg_operands++;
7526           i.tm.operands++;
7527
7528           i.op[dupl] = i.op[dest];
7529           i.types[dupl] = i.types[dest];
7530           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7531           i.flags[dupl] = i.flags[dest];
7532         }
7533
7534        if (i.tm.opcode_modifier.immext)
7535          process_immext ();
7536     }
7537   else if (i.tm.operand_types[0].bitfield.instance == Accum
7538            && i.tm.operand_types[0].bitfield.xmmword)
7539     {
7540       unsigned int j;
7541
7542       for (j = 1; j < i.operands; j++)
7543         {
7544           i.op[j - 1] = i.op[j];
7545           i.types[j - 1] = i.types[j];
7546
7547           /* We need to adjust fields in i.tm since they are used by
7548              build_modrm_byte.  */
7549           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7550
7551           i.flags[j - 1] = i.flags[j];
7552         }
7553
7554       i.operands--;
7555       i.reg_operands--;
7556       i.tm.operands--;
7557     }
7558   else if (i.tm.opcode_modifier.implicitquadgroup)
7559     {
7560       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7561
7562       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7563       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7564       regnum = register_number (i.op[1].regs);
7565       first_reg_in_group = regnum & ~3;
7566       last_reg_in_group = first_reg_in_group + 3;
7567       if (regnum != first_reg_in_group)
7568         as_warn (_("source register `%s%s' implicitly denotes"
7569                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7570                  register_prefix, i.op[1].regs->reg_name,
7571                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7572                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7573                  i.tm.name);
7574     }
7575   else if (i.tm.opcode_modifier.regkludge)
7576     {
7577       /* The imul $imm, %reg instruction is converted into
7578          imul $imm, %reg, %reg, and the clr %reg instruction
7579          is converted into xor %reg, %reg.  */
7580
7581       unsigned int first_reg_op;
7582
7583       if (operand_type_check (i.types[0], reg))
7584         first_reg_op = 0;
7585       else
7586         first_reg_op = 1;
7587       /* Pretend we saw the extra register operand.  */
7588       gas_assert (i.reg_operands == 1
7589                   && i.op[first_reg_op + 1].regs == 0);
7590       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7591       i.types[first_reg_op + 1] = i.types[first_reg_op];
7592       i.operands++;
7593       i.reg_operands++;
7594     }
7595
7596   if (i.tm.opcode_modifier.modrm)
7597     {
7598       /* The opcode is completed (modulo i.tm.extension_opcode which
7599          must be put into the modrm byte).  Now, we make the modrm and
7600          index base bytes based on all the info we've collected.  */
7601
7602       default_seg = build_modrm_byte ();
7603     }
7604   else if (i.types[0].bitfield.class == SReg)
7605     {
7606       if (flag_code != CODE_64BIT
7607           ? i.tm.base_opcode == POP_SEG_SHORT
7608             && i.op[0].regs->reg_num == 1
7609           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7610             && i.op[0].regs->reg_num < 4)
7611         {
7612           as_bad (_("you can't `%s %s%s'"),
7613                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7614           return 0;
7615         }
7616       if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7617         {
7618           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7619           i.tm.opcode_length = 2;
7620         }
7621       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7622     }
7623   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7624     {
7625       default_seg = &ds;
7626     }
7627   else if (i.tm.opcode_modifier.isstring)
7628     {
7629       /* For the string instructions that allow a segment override
7630          on one of their operands, the default segment is ds.  */
7631       default_seg = &ds;
7632     }
7633   else if (i.short_form)
7634     {
7635       /* The register or float register operand is in operand
7636          0 or 1.  */
7637       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7638
7639       /* Register goes in low 3 bits of opcode.  */
7640       i.tm.base_opcode |= i.op[op].regs->reg_num;
7641       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7642         i.rex |= REX_B;
7643       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7644         {
7645           /* Warn about some common errors, but press on regardless.
7646              The first case can be generated by gcc (<= 2.8.1).  */
7647           if (i.operands == 2)
7648             {
7649               /* Reversed arguments on faddp, fsubp, etc.  */
7650               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7651                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7652                        register_prefix, i.op[intel_syntax].regs->reg_name);
7653             }
7654           else
7655             {
7656               /* Extraneous `l' suffix on fp insn.  */
7657               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7658                        register_prefix, i.op[0].regs->reg_name);
7659             }
7660         }
7661     }
7662
7663   if ((i.seg[0] || i.prefix[SEG_PREFIX])
7664       && i.tm.base_opcode == 0x8d /* lea */
7665       && !is_any_vex_encoding(&i.tm))
7666     {
7667       if (!quiet_warnings)
7668         as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7669       if (optimize)
7670         {
7671           i.seg[0] = NULL;
7672           i.prefix[SEG_PREFIX] = 0;
7673         }
7674     }
7675
7676   /* If a segment was explicitly specified, and the specified segment
7677      is neither the default nor the one already recorded from a prefix,
7678      use an opcode prefix to select it.  If we never figured out what
7679      the default segment is, then default_seg will be zero at this
7680      point, and the specified segment prefix will always be used.  */
7681   if (i.seg[0]
7682       && i.seg[0] != default_seg
7683       && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7684     {
7685       if (!add_prefix (i.seg[0]->seg_prefix))
7686         return 0;
7687     }
7688   return 1;
7689 }
7690
7691 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7692                                  bfd_boolean do_sse2avx)
7693 {
7694   if (r->reg_flags & RegRex)
7695     {
7696       if (i.rex & rex_bit)
7697         as_bad (_("same type of prefix used twice"));
7698       i.rex |= rex_bit;
7699     }
7700   else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7701     {
7702       gas_assert (i.vex.register_specifier == r);
7703       i.vex.register_specifier += 8;
7704     }
7705
7706   if (r->reg_flags & RegVRex)
7707     i.vrex |= rex_bit;
7708 }
7709
7710 static const seg_entry *
7711 build_modrm_byte (void)
7712 {
7713   const seg_entry *default_seg = 0;
7714   unsigned int source, dest;
7715   int vex_3_sources;
7716
7717   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7718   if (vex_3_sources)
7719     {
7720       unsigned int nds, reg_slot;
7721       expressionS *exp;
7722
7723       dest = i.operands - 1;
7724       nds = dest - 1;
7725
7726       /* There are 2 kinds of instructions:
7727          1. 5 operands: 4 register operands or 3 register operands
7728          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7729          VexW0 or VexW1.  The destination must be either XMM, YMM or
7730          ZMM register.
7731          2. 4 operands: 4 register operands or 3 register operands
7732          plus 1 memory operand, with VexXDS.  */
7733       gas_assert ((i.reg_operands == 4
7734                    || (i.reg_operands == 3 && i.mem_operands == 1))
7735                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7736                   && i.tm.opcode_modifier.vexw
7737                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7738
7739       /* If VexW1 is set, the first non-immediate operand is the source and
7740          the second non-immediate one is encoded in the immediate operand.  */
7741       if (i.tm.opcode_modifier.vexw == VEXW1)
7742         {
7743           source = i.imm_operands;
7744           reg_slot = i.imm_operands + 1;
7745         }
7746       else
7747         {
7748           source = i.imm_operands + 1;
7749           reg_slot = i.imm_operands;
7750         }
7751
7752       if (i.imm_operands == 0)
7753         {
7754           /* When there is no immediate operand, generate an 8bit
7755              immediate operand to encode the first operand.  */
7756           exp = &im_expressions[i.imm_operands++];
7757           i.op[i.operands].imms = exp;
7758           i.types[i.operands] = imm8;
7759           i.operands++;
7760
7761           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7762           exp->X_op = O_constant;
7763           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7764           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7765         }
7766       else
7767         {
7768           gas_assert (i.imm_operands == 1);
7769           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7770           gas_assert (!i.tm.opcode_modifier.immext);
7771
7772           /* Turn on Imm8 again so that output_imm will generate it.  */
7773           i.types[0].bitfield.imm8 = 1;
7774
7775           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7776           i.op[0].imms->X_add_number
7777               |= register_number (i.op[reg_slot].regs) << 4;
7778           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7779         }
7780
7781       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7782       i.vex.register_specifier = i.op[nds].regs;
7783     }
7784   else
7785     source = dest = 0;
7786
7787   /* i.reg_operands MUST be the number of real register operands;
7788      implicit registers do not count.  If there are 3 register
7789      operands, it must be a instruction with VexNDS.  For a
7790      instruction with VexNDD, the destination register is encoded
7791      in VEX prefix.  If there are 4 register operands, it must be
7792      a instruction with VEX prefix and 3 sources.  */
7793   if (i.mem_operands == 0
7794       && ((i.reg_operands == 2
7795            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7796           || (i.reg_operands == 3
7797               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7798           || (i.reg_operands == 4 && vex_3_sources)))
7799     {
7800       switch (i.operands)
7801         {
7802         case 2:
7803           source = 0;
7804           break;
7805         case 3:
7806           /* When there are 3 operands, one of them may be immediate,
7807              which may be the first or the last operand.  Otherwise,
7808              the first operand must be shift count register (cl) or it
7809              is an instruction with VexNDS. */
7810           gas_assert (i.imm_operands == 1
7811                       || (i.imm_operands == 0
7812                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7813                               || (i.types[0].bitfield.instance == RegC
7814                                   && i.types[0].bitfield.byte))));
7815           if (operand_type_check (i.types[0], imm)
7816               || (i.types[0].bitfield.instance == RegC
7817                   && i.types[0].bitfield.byte))
7818             source = 1;
7819           else
7820             source = 0;
7821           break;
7822         case 4:
7823           /* When there are 4 operands, the first two must be 8bit
7824              immediate operands. The source operand will be the 3rd
7825              one.
7826
7827              For instructions with VexNDS, if the first operand
7828              an imm8, the source operand is the 2nd one.  If the last
7829              operand is imm8, the source operand is the first one.  */
7830           gas_assert ((i.imm_operands == 2
7831                        && i.types[0].bitfield.imm8
7832                        && i.types[1].bitfield.imm8)
7833                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7834                           && i.imm_operands == 1
7835                           && (i.types[0].bitfield.imm8
7836                               || i.types[i.operands - 1].bitfield.imm8
7837                               || i.rounding)));
7838           if (i.imm_operands == 2)
7839             source = 2;
7840           else
7841             {
7842               if (i.types[0].bitfield.imm8)
7843                 source = 1;
7844               else
7845                 source = 0;
7846             }
7847           break;
7848         case 5:
7849           if (is_evex_encoding (&i.tm))
7850             {
7851               /* For EVEX instructions, when there are 5 operands, the
7852                  first one must be immediate operand.  If the second one
7853                  is immediate operand, the source operand is the 3th
7854                  one.  If the last one is immediate operand, the source
7855                  operand is the 2nd one.  */
7856               gas_assert (i.imm_operands == 2
7857                           && i.tm.opcode_modifier.sae
7858                           && operand_type_check (i.types[0], imm));
7859               if (operand_type_check (i.types[1], imm))
7860                 source = 2;
7861               else if (operand_type_check (i.types[4], imm))
7862                 source = 1;
7863               else
7864                 abort ();
7865             }
7866           break;
7867         default:
7868           abort ();
7869         }
7870
7871       if (!vex_3_sources)
7872         {
7873           dest = source + 1;
7874
7875           /* RC/SAE operand could be between DEST and SRC.  That happens
7876              when one operand is GPR and the other one is XMM/YMM/ZMM
7877              register.  */
7878           if (i.rounding && i.rounding->operand == (int) dest)
7879             dest++;
7880
7881           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7882             {
7883               /* For instructions with VexNDS, the register-only source
7884                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7885                  register.  It is encoded in VEX prefix.  */
7886
7887               i386_operand_type op;
7888               unsigned int vvvv;
7889
7890               /* Check register-only source operand when two source
7891                  operands are swapped.  */
7892               if (!i.tm.operand_types[source].bitfield.baseindex
7893                   && i.tm.operand_types[dest].bitfield.baseindex)
7894                 {
7895                   vvvv = source;
7896                   source = dest;
7897                 }
7898               else
7899                 vvvv = dest;
7900
7901               op = i.tm.operand_types[vvvv];
7902               if ((dest + 1) >= i.operands
7903                   || ((op.bitfield.class != Reg
7904                        || (!op.bitfield.dword && !op.bitfield.qword))
7905                       && op.bitfield.class != RegSIMD
7906                       && !operand_type_equal (&op, &regmask)))
7907                 abort ();
7908               i.vex.register_specifier = i.op[vvvv].regs;
7909               dest++;
7910             }
7911         }
7912
7913       i.rm.mode = 3;
7914       /* One of the register operands will be encoded in the i.rm.reg
7915          field, the other in the combined i.rm.mode and i.rm.regmem
7916          fields.  If no form of this instruction supports a memory
7917          destination operand, then we assume the source operand may
7918          sometimes be a memory operand and so we need to store the
7919          destination in the i.rm.reg field.  */
7920       if (!i.tm.opcode_modifier.regmem
7921           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7922         {
7923           i.rm.reg = i.op[dest].regs->reg_num;
7924           i.rm.regmem = i.op[source].regs->reg_num;
7925           if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7926                || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7927             i.has_regmmx = TRUE;
7928           else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7929                    || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7930             {
7931               if (i.types[dest].bitfield.zmmword
7932                   || i.types[source].bitfield.zmmword)
7933                 i.has_regzmm = TRUE;
7934               else if (i.types[dest].bitfield.ymmword
7935                        || i.types[source].bitfield.ymmword)
7936                 i.has_regymm = TRUE;
7937               else
7938                 i.has_regxmm = TRUE;
7939             }
7940           set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7941           set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7942         }
7943       else
7944         {
7945           i.rm.reg = i.op[source].regs->reg_num;
7946           i.rm.regmem = i.op[dest].regs->reg_num;
7947           set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7948           set_rex_vrex (i.op[source].regs, REX_R, FALSE);
7949         }
7950       if (flag_code != CODE_64BIT && (i.rex & REX_R))
7951         {
7952           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7953             abort ();
7954           i.rex &= ~REX_R;
7955           add_prefix (LOCK_PREFIX_OPCODE);
7956         }
7957     }
7958   else
7959     {                   /* If it's not 2 reg operands...  */
7960       unsigned int mem;
7961
7962       if (i.mem_operands)
7963         {
7964           unsigned int fake_zero_displacement = 0;
7965           unsigned int op;
7966
7967           for (op = 0; op < i.operands; op++)
7968             if (i.flags[op] & Operand_Mem)
7969               break;
7970           gas_assert (op < i.operands);
7971
7972           if (i.tm.opcode_modifier.vecsib)
7973             {
7974               if (i.index_reg->reg_num == RegIZ)
7975                 abort ();
7976
7977               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7978               if (!i.base_reg)
7979                 {
7980                   i.sib.base = NO_BASE_REGISTER;
7981                   i.sib.scale = i.log2_scale_factor;
7982                   i.types[op].bitfield.disp8 = 0;
7983                   i.types[op].bitfield.disp16 = 0;
7984                   i.types[op].bitfield.disp64 = 0;
7985                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7986                     {
7987                       /* Must be 32 bit */
7988                       i.types[op].bitfield.disp32 = 1;
7989                       i.types[op].bitfield.disp32s = 0;
7990                     }
7991                   else
7992                     {
7993                       i.types[op].bitfield.disp32 = 0;
7994                       i.types[op].bitfield.disp32s = 1;
7995                     }
7996                 }
7997               i.sib.index = i.index_reg->reg_num;
7998               set_rex_vrex (i.index_reg, REX_X, FALSE);
7999             }
8000
8001           default_seg = &ds;
8002
8003           if (i.base_reg == 0)
8004             {
8005               i.rm.mode = 0;
8006               if (!i.disp_operands)
8007                 fake_zero_displacement = 1;
8008               if (i.index_reg == 0)
8009                 {
8010                   i386_operand_type newdisp;
8011
8012                   gas_assert (!i.tm.opcode_modifier.vecsib);
8013                   /* Operand is just <disp>  */
8014                   if (flag_code == CODE_64BIT)
8015                     {
8016                       /* 64bit mode overwrites the 32bit absolute
8017                          addressing by RIP relative addressing and
8018                          absolute addressing is encoded by one of the
8019                          redundant SIB forms.  */
8020                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8021                       i.sib.base = NO_BASE_REGISTER;
8022                       i.sib.index = NO_INDEX_REGISTER;
8023                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8024                     }
8025                   else if ((flag_code == CODE_16BIT)
8026                            ^ (i.prefix[ADDR_PREFIX] != 0))
8027                     {
8028                       i.rm.regmem = NO_BASE_REGISTER_16;
8029                       newdisp = disp16;
8030                     }
8031                   else
8032                     {
8033                       i.rm.regmem = NO_BASE_REGISTER;
8034                       newdisp = disp32;
8035                     }
8036                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
8037                   i.types[op] = operand_type_or (i.types[op], newdisp);
8038                 }
8039               else if (!i.tm.opcode_modifier.vecsib)
8040                 {
8041                   /* !i.base_reg && i.index_reg  */
8042                   if (i.index_reg->reg_num == RegIZ)
8043                     i.sib.index = NO_INDEX_REGISTER;
8044                   else
8045                     i.sib.index = i.index_reg->reg_num;
8046                   i.sib.base = NO_BASE_REGISTER;
8047                   i.sib.scale = i.log2_scale_factor;
8048                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8049                   i.types[op].bitfield.disp8 = 0;
8050                   i.types[op].bitfield.disp16 = 0;
8051                   i.types[op].bitfield.disp64 = 0;
8052                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8053                     {
8054                       /* Must be 32 bit */
8055                       i.types[op].bitfield.disp32 = 1;
8056                       i.types[op].bitfield.disp32s = 0;
8057                     }
8058                   else
8059                     {
8060                       i.types[op].bitfield.disp32 = 0;
8061                       i.types[op].bitfield.disp32s = 1;
8062                     }
8063                   if ((i.index_reg->reg_flags & RegRex) != 0)
8064                     i.rex |= REX_X;
8065                 }
8066             }
8067           /* RIP addressing for 64bit mode.  */
8068           else if (i.base_reg->reg_num == RegIP)
8069             {
8070               gas_assert (!i.tm.opcode_modifier.vecsib);
8071               i.rm.regmem = NO_BASE_REGISTER;
8072               i.types[op].bitfield.disp8 = 0;
8073               i.types[op].bitfield.disp16 = 0;
8074               i.types[op].bitfield.disp32 = 0;
8075               i.types[op].bitfield.disp32s = 1;
8076               i.types[op].bitfield.disp64 = 0;
8077               i.flags[op] |= Operand_PCrel;
8078               if (! i.disp_operands)
8079                 fake_zero_displacement = 1;
8080             }
8081           else if (i.base_reg->reg_type.bitfield.word)
8082             {
8083               gas_assert (!i.tm.opcode_modifier.vecsib);
8084               switch (i.base_reg->reg_num)
8085                 {
8086                 case 3: /* (%bx)  */
8087                   if (i.index_reg == 0)
8088                     i.rm.regmem = 7;
8089                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
8090                     i.rm.regmem = i.index_reg->reg_num - 6;
8091                   break;
8092                 case 5: /* (%bp)  */
8093                   default_seg = &ss;
8094                   if (i.index_reg == 0)
8095                     {
8096                       i.rm.regmem = 6;
8097                       if (operand_type_check (i.types[op], disp) == 0)
8098                         {
8099                           /* fake (%bp) into 0(%bp)  */
8100                           i.types[op].bitfield.disp8 = 1;
8101                           fake_zero_displacement = 1;
8102                         }
8103                     }
8104                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
8105                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8106                   break;
8107                 default: /* (%si) -> 4 or (%di) -> 5  */
8108                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8109                 }
8110               i.rm.mode = mode_from_disp_size (i.types[op]);
8111             }
8112           else /* i.base_reg and 32/64 bit mode  */
8113             {
8114               if (flag_code == CODE_64BIT
8115                   && operand_type_check (i.types[op], disp))
8116                 {
8117                   i.types[op].bitfield.disp16 = 0;
8118                   i.types[op].bitfield.disp64 = 0;
8119                   if (i.prefix[ADDR_PREFIX] == 0)
8120                     {
8121                       i.types[op].bitfield.disp32 = 0;
8122                       i.types[op].bitfield.disp32s = 1;
8123                     }
8124                   else
8125                     {
8126                       i.types[op].bitfield.disp32 = 1;
8127                       i.types[op].bitfield.disp32s = 0;
8128                     }
8129                 }
8130
8131               if (!i.tm.opcode_modifier.vecsib)
8132                 i.rm.regmem = i.base_reg->reg_num;
8133               if ((i.base_reg->reg_flags & RegRex) != 0)
8134                 i.rex |= REX_B;
8135               i.sib.base = i.base_reg->reg_num;
8136               /* x86-64 ignores REX prefix bit here to avoid decoder
8137                  complications.  */
8138               if (!(i.base_reg->reg_flags & RegRex)
8139                   && (i.base_reg->reg_num == EBP_REG_NUM
8140                    || i.base_reg->reg_num == ESP_REG_NUM))
8141                   default_seg = &ss;
8142               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8143                 {
8144                   fake_zero_displacement = 1;
8145                   i.types[op].bitfield.disp8 = 1;
8146                 }
8147               i.sib.scale = i.log2_scale_factor;
8148               if (i.index_reg == 0)
8149                 {
8150                   gas_assert (!i.tm.opcode_modifier.vecsib);
8151                   /* <disp>(%esp) becomes two byte modrm with no index
8152                      register.  We've already stored the code for esp
8153                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8154                      Any base register besides %esp will not use the
8155                      extra modrm byte.  */
8156                   i.sib.index = NO_INDEX_REGISTER;
8157                 }
8158               else if (!i.tm.opcode_modifier.vecsib)
8159                 {
8160                   if (i.index_reg->reg_num == RegIZ)
8161                     i.sib.index = NO_INDEX_REGISTER;
8162                   else
8163                     i.sib.index = i.index_reg->reg_num;
8164                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8165                   if ((i.index_reg->reg_flags & RegRex) != 0)
8166                     i.rex |= REX_X;
8167                 }
8168
8169               if (i.disp_operands
8170                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8171                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8172                 i.rm.mode = 0;
8173               else
8174                 {
8175                   if (!fake_zero_displacement
8176                       && !i.disp_operands
8177                       && i.disp_encoding)
8178                     {
8179                       fake_zero_displacement = 1;
8180                       if (i.disp_encoding == disp_encoding_8bit)
8181                         i.types[op].bitfield.disp8 = 1;
8182                       else
8183                         i.types[op].bitfield.disp32 = 1;
8184                     }
8185                   i.rm.mode = mode_from_disp_size (i.types[op]);
8186                 }
8187             }
8188
8189           if (fake_zero_displacement)
8190             {
8191               /* Fakes a zero displacement assuming that i.types[op]
8192                  holds the correct displacement size.  */
8193               expressionS *exp;
8194
8195               gas_assert (i.op[op].disps == 0);
8196               exp = &disp_expressions[i.disp_operands++];
8197               i.op[op].disps = exp;
8198               exp->X_op = O_constant;
8199               exp->X_add_number = 0;
8200               exp->X_add_symbol = (symbolS *) 0;
8201               exp->X_op_symbol = (symbolS *) 0;
8202             }
8203
8204           mem = op;
8205         }
8206       else
8207         mem = ~0;
8208
8209       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8210         {
8211           if (operand_type_check (i.types[0], imm))
8212             i.vex.register_specifier = NULL;
8213           else
8214             {
8215               /* VEX.vvvv encodes one of the sources when the first
8216                  operand is not an immediate.  */
8217               if (i.tm.opcode_modifier.vexw == VEXW0)
8218                 i.vex.register_specifier = i.op[0].regs;
8219               else
8220                 i.vex.register_specifier = i.op[1].regs;
8221             }
8222
8223           /* Destination is a XMM register encoded in the ModRM.reg
8224              and VEX.R bit.  */
8225           i.rm.reg = i.op[2].regs->reg_num;
8226           if ((i.op[2].regs->reg_flags & RegRex) != 0)
8227             i.rex |= REX_R;
8228
8229           /* ModRM.rm and VEX.B encodes the other source.  */
8230           if (!i.mem_operands)
8231             {
8232               i.rm.mode = 3;
8233
8234               if (i.tm.opcode_modifier.vexw == VEXW0)
8235                 i.rm.regmem = i.op[1].regs->reg_num;
8236               else
8237                 i.rm.regmem = i.op[0].regs->reg_num;
8238
8239               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8240                 i.rex |= REX_B;
8241             }
8242         }
8243       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8244         {
8245           i.vex.register_specifier = i.op[2].regs;
8246           if (!i.mem_operands)
8247             {
8248               i.rm.mode = 3;
8249               i.rm.regmem = i.op[1].regs->reg_num;
8250               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8251                 i.rex |= REX_B;
8252             }
8253         }
8254       /* Fill in i.rm.reg or i.rm.regmem field with register operand
8255          (if any) based on i.tm.extension_opcode.  Again, we must be
8256          careful to make sure that segment/control/debug/test/MMX
8257          registers are coded into the i.rm.reg field.  */
8258       else if (i.reg_operands)
8259         {
8260           unsigned int op;
8261           unsigned int vex_reg = ~0;
8262
8263           for (op = 0; op < i.operands; op++)
8264             {
8265               if (i.types[op].bitfield.class == Reg
8266                   || i.types[op].bitfield.class == RegBND
8267                   || i.types[op].bitfield.class == RegMask
8268                   || i.types[op].bitfield.class == SReg
8269                   || i.types[op].bitfield.class == RegCR
8270                   || i.types[op].bitfield.class == RegDR
8271                   || i.types[op].bitfield.class == RegTR)
8272                 break;
8273               if (i.types[op].bitfield.class == RegSIMD)
8274                 {
8275                   if (i.types[op].bitfield.zmmword)
8276                     i.has_regzmm = TRUE;
8277                   else if (i.types[op].bitfield.ymmword)
8278                     i.has_regymm = TRUE;
8279                   else
8280                     i.has_regxmm = TRUE;
8281                   break;
8282                 }
8283               if (i.types[op].bitfield.class == RegMMX)
8284                 {
8285                   i.has_regmmx = TRUE;
8286                   break;
8287                 }
8288             }
8289
8290           if (vex_3_sources)
8291             op = dest;
8292           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8293             {
8294               /* For instructions with VexNDS, the register-only
8295                  source operand is encoded in VEX prefix. */
8296               gas_assert (mem != (unsigned int) ~0);
8297
8298               if (op > mem)
8299                 {
8300                   vex_reg = op++;
8301                   gas_assert (op < i.operands);
8302                 }
8303               else
8304                 {
8305                   /* Check register-only source operand when two source
8306                      operands are swapped.  */
8307                   if (!i.tm.operand_types[op].bitfield.baseindex
8308                       && i.tm.operand_types[op + 1].bitfield.baseindex)
8309                     {
8310                       vex_reg = op;
8311                       op += 2;
8312                       gas_assert (mem == (vex_reg + 1)
8313                                   && op < i.operands);
8314                     }
8315                   else
8316                     {
8317                       vex_reg = op + 1;
8318                       gas_assert (vex_reg < i.operands);
8319                     }
8320                 }
8321             }
8322           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8323             {
8324               /* For instructions with VexNDD, the register destination
8325                  is encoded in VEX prefix.  */
8326               if (i.mem_operands == 0)
8327                 {
8328                   /* There is no memory operand.  */
8329                   gas_assert ((op + 2) == i.operands);
8330                   vex_reg = op + 1;
8331                 }
8332               else
8333                 {
8334                   /* There are only 2 non-immediate operands.  */
8335                   gas_assert (op < i.imm_operands + 2
8336                               && i.operands == i.imm_operands + 2);
8337                   vex_reg = i.imm_operands + 1;
8338                 }
8339             }
8340           else
8341             gas_assert (op < i.operands);
8342
8343           if (vex_reg != (unsigned int) ~0)
8344             {
8345               i386_operand_type *type = &i.tm.operand_types[vex_reg];
8346
8347               if ((type->bitfield.class != Reg
8348                    || (!type->bitfield.dword && !type->bitfield.qword))
8349                   && type->bitfield.class != RegSIMD
8350                   && !operand_type_equal (type, &regmask))
8351                 abort ();
8352
8353               i.vex.register_specifier = i.op[vex_reg].regs;
8354             }
8355
8356           /* Don't set OP operand twice.  */
8357           if (vex_reg != op)
8358             {
8359               /* If there is an extension opcode to put here, the
8360                  register number must be put into the regmem field.  */
8361               if (i.tm.extension_opcode != None)
8362                 {
8363                   i.rm.regmem = i.op[op].regs->reg_num;
8364                   set_rex_vrex (i.op[op].regs, REX_B,
8365                                 i.tm.opcode_modifier.sse2avx);
8366                 }
8367               else
8368                 {
8369                   i.rm.reg = i.op[op].regs->reg_num;
8370                   set_rex_vrex (i.op[op].regs, REX_R,
8371                                 i.tm.opcode_modifier.sse2avx);
8372                 }
8373             }
8374
8375           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8376              must set it to 3 to indicate this is a register operand
8377              in the regmem field.  */
8378           if (!i.mem_operands)
8379             i.rm.mode = 3;
8380         }
8381
8382       /* Fill in i.rm.reg field with extension opcode (if any).  */
8383       if (i.tm.extension_opcode != None)
8384         i.rm.reg = i.tm.extension_opcode;
8385     }
8386   return default_seg;
8387 }
8388
8389 static unsigned int
8390 flip_code16 (unsigned int code16)
8391 {
8392   gas_assert (i.tm.operands == 1);
8393
8394   return !(i.prefix[REX_PREFIX] & REX_W)
8395          && (code16 ? i.tm.operand_types[0].bitfield.disp32
8396                       || i.tm.operand_types[0].bitfield.disp32s
8397                     : i.tm.operand_types[0].bitfield.disp16)
8398          ? CODE16 : 0;
8399 }
8400
8401 static void
8402 output_branch (void)
8403 {
8404   char *p;
8405   int size;
8406   int code16;
8407   int prefix;
8408   relax_substateT subtype;
8409   symbolS *sym;
8410   offsetT off;
8411
8412   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8413   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8414
8415   prefix = 0;
8416   if (i.prefix[DATA_PREFIX] != 0)
8417     {
8418       prefix = 1;
8419       i.prefixes -= 1;
8420       code16 ^= flip_code16(code16);
8421     }
8422   /* Pentium4 branch hints.  */
8423   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8424       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8425     {
8426       prefix++;
8427       i.prefixes--;
8428     }
8429   if (i.prefix[REX_PREFIX] != 0)
8430     {
8431       prefix++;
8432       i.prefixes--;
8433     }
8434
8435   /* BND prefixed jump.  */
8436   if (i.prefix[BND_PREFIX] != 0)
8437     {
8438       prefix++;
8439       i.prefixes--;
8440     }
8441
8442   if (i.prefixes != 0)
8443     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8444
8445   /* It's always a symbol;  End frag & setup for relax.
8446      Make sure there is enough room in this frag for the largest
8447      instruction we may generate in md_convert_frag.  This is 2
8448      bytes for the opcode and room for the prefix and largest
8449      displacement.  */
8450   frag_grow (prefix + 2 + 4);
8451   /* Prefix and 1 opcode byte go in fr_fix.  */
8452   p = frag_more (prefix + 1);
8453   if (i.prefix[DATA_PREFIX] != 0)
8454     *p++ = DATA_PREFIX_OPCODE;
8455   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8456       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8457     *p++ = i.prefix[SEG_PREFIX];
8458   if (i.prefix[BND_PREFIX] != 0)
8459     *p++ = BND_PREFIX_OPCODE;
8460   if (i.prefix[REX_PREFIX] != 0)
8461     *p++ = i.prefix[REX_PREFIX];
8462   *p = i.tm.base_opcode;
8463
8464   if ((unsigned char) *p == JUMP_PC_RELATIVE)
8465     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8466   else if (cpu_arch_flags.bitfield.cpui386)
8467     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8468   else
8469     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8470   subtype |= code16;
8471
8472   sym = i.op[0].disps->X_add_symbol;
8473   off = i.op[0].disps->X_add_number;
8474
8475   if (i.op[0].disps->X_op != O_constant
8476       && i.op[0].disps->X_op != O_symbol)
8477     {
8478       /* Handle complex expressions.  */
8479       sym = make_expr_symbol (i.op[0].disps);
8480       off = 0;
8481     }
8482
8483   /* 1 possible extra opcode + 4 byte displacement go in var part.
8484      Pass reloc in fr_var.  */
8485   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8486 }
8487
8488 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8489 /* Return TRUE iff PLT32 relocation should be used for branching to
8490    symbol S.  */
8491
8492 static bfd_boolean
8493 need_plt32_p (symbolS *s)
8494 {
8495   /* PLT32 relocation is ELF only.  */
8496   if (!IS_ELF)
8497     return FALSE;
8498
8499 #ifdef TE_SOLARIS
8500   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8501      krtld support it.  */
8502   return FALSE;
8503 #endif
8504
8505   /* Since there is no need to prepare for PLT branch on x86-64, we
8506      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8507      be used as a marker for 32-bit PC-relative branches.  */
8508   if (!object_64bit)
8509     return FALSE;
8510
8511   /* Weak or undefined symbol need PLT32 relocation.  */
8512   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8513     return TRUE;
8514
8515   /* Non-global symbol doesn't need PLT32 relocation.  */
8516   if (! S_IS_EXTERNAL (s))
8517     return FALSE;
8518
8519   /* Other global symbols need PLT32 relocation.  NB: Symbol with
8520      non-default visibilities are treated as normal global symbol
8521      so that PLT32 relocation can be used as a marker for 32-bit
8522      PC-relative branches.  It is useful for linker relaxation.  */
8523   return TRUE;
8524 }
8525 #endif
8526
8527 static void
8528 output_jump (void)
8529 {
8530   char *p;
8531   int size;
8532   fixS *fixP;
8533   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8534
8535   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8536     {
8537       /* This is a loop or jecxz type instruction.  */
8538       size = 1;
8539       if (i.prefix[ADDR_PREFIX] != 0)
8540         {
8541           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8542           i.prefixes -= 1;
8543         }
8544       /* Pentium4 branch hints.  */
8545       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8546           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8547         {
8548           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8549           i.prefixes--;
8550         }
8551     }
8552   else
8553     {
8554       int code16;
8555
8556       code16 = 0;
8557       if (flag_code == CODE_16BIT)
8558         code16 = CODE16;
8559
8560       if (i.prefix[DATA_PREFIX] != 0)
8561         {
8562           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8563           i.prefixes -= 1;
8564           code16 ^= flip_code16(code16);
8565         }
8566
8567       size = 4;
8568       if (code16)
8569         size = 2;
8570     }
8571
8572   /* BND prefixed jump.  */
8573   if (i.prefix[BND_PREFIX] != 0)
8574     {
8575       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8576       i.prefixes -= 1;
8577     }
8578
8579   if (i.prefix[REX_PREFIX] != 0)
8580     {
8581       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8582       i.prefixes -= 1;
8583     }
8584
8585   if (i.prefixes != 0)
8586     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8587
8588   p = frag_more (i.tm.opcode_length + size);
8589   switch (i.tm.opcode_length)
8590     {
8591     case 2:
8592       *p++ = i.tm.base_opcode >> 8;
8593       /* Fall through.  */
8594     case 1:
8595       *p++ = i.tm.base_opcode;
8596       break;
8597     default:
8598       abort ();
8599     }
8600
8601 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8602   if (size == 4
8603       && jump_reloc == NO_RELOC
8604       && need_plt32_p (i.op[0].disps->X_add_symbol))
8605     jump_reloc = BFD_RELOC_X86_64_PLT32;
8606 #endif
8607
8608   jump_reloc = reloc (size, 1, 1, jump_reloc);
8609
8610   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8611                       i.op[0].disps, 1, jump_reloc);
8612
8613   /* All jumps handled here are signed, but don't use a signed limit
8614      check for 32 and 16 bit jumps as we want to allow wrap around at
8615      4G and 64k respectively.  */
8616   if (size == 1)
8617     fixP->fx_signed = 1;
8618 }
8619
8620 static void
8621 output_interseg_jump (void)
8622 {
8623   char *p;
8624   int size;
8625   int prefix;
8626   int code16;
8627
8628   code16 = 0;
8629   if (flag_code == CODE_16BIT)
8630     code16 = CODE16;
8631
8632   prefix = 0;
8633   if (i.prefix[DATA_PREFIX] != 0)
8634     {
8635       prefix = 1;
8636       i.prefixes -= 1;
8637       code16 ^= CODE16;
8638     }
8639
8640   gas_assert (!i.prefix[REX_PREFIX]);
8641
8642   size = 4;
8643   if (code16)
8644     size = 2;
8645
8646   if (i.prefixes != 0)
8647     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8648
8649   /* 1 opcode; 2 segment; offset  */
8650   p = frag_more (prefix + 1 + 2 + size);
8651
8652   if (i.prefix[DATA_PREFIX] != 0)
8653     *p++ = DATA_PREFIX_OPCODE;
8654
8655   if (i.prefix[REX_PREFIX] != 0)
8656     *p++ = i.prefix[REX_PREFIX];
8657
8658   *p++ = i.tm.base_opcode;
8659   if (i.op[1].imms->X_op == O_constant)
8660     {
8661       offsetT n = i.op[1].imms->X_add_number;
8662
8663       if (size == 2
8664           && !fits_in_unsigned_word (n)
8665           && !fits_in_signed_word (n))
8666         {
8667           as_bad (_("16-bit jump out of range"));
8668           return;
8669         }
8670       md_number_to_chars (p, n, size);
8671     }
8672   else
8673     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8674                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8675   if (i.op[0].imms->X_op != O_constant)
8676     as_bad (_("can't handle non absolute segment in `%s'"),
8677             i.tm.name);
8678   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8679 }
8680
8681 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8682 void
8683 x86_cleanup (void)
8684 {
8685   char *p;
8686   asection *seg = now_seg;
8687   subsegT subseg = now_subseg;
8688   asection *sec;
8689   unsigned int alignment, align_size_1;
8690   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8691   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8692   unsigned int padding;
8693
8694   if (!IS_ELF || !x86_used_note)
8695     return;
8696
8697   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8698
8699   /* The .note.gnu.property section layout:
8700
8701      Field      Length          Contents
8702      ----       ----            ----
8703      n_namsz    4               4
8704      n_descsz   4               The note descriptor size
8705      n_type     4               NT_GNU_PROPERTY_TYPE_0
8706      n_name     4               "GNU"
8707      n_desc     n_descsz        The program property array
8708      ....       ....            ....
8709    */
8710
8711   /* Create the .note.gnu.property section.  */
8712   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8713   bfd_set_section_flags (sec,
8714                          (SEC_ALLOC
8715                           | SEC_LOAD
8716                           | SEC_DATA
8717                           | SEC_HAS_CONTENTS
8718                           | SEC_READONLY));
8719
8720   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8721     {
8722       align_size_1 = 7;
8723       alignment = 3;
8724     }
8725   else
8726     {
8727       align_size_1 = 3;
8728       alignment = 2;
8729     }
8730
8731   bfd_set_section_alignment (sec, alignment);
8732   elf_section_type (sec) = SHT_NOTE;
8733
8734   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8735                                   + 4-byte data  */
8736   isa_1_descsz_raw = 4 + 4 + 4;
8737   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8738   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8739
8740   feature_2_descsz_raw = isa_1_descsz;
8741   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8742                                       + 4-byte data  */
8743   feature_2_descsz_raw += 4 + 4 + 4;
8744   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8745   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8746                       & ~align_size_1);
8747
8748   descsz = feature_2_descsz;
8749   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8750   p = frag_more (4 + 4 + 4 + 4 + descsz);
8751
8752   /* Write n_namsz.  */
8753   md_number_to_chars (p, (valueT) 4, 4);
8754
8755   /* Write n_descsz.  */
8756   md_number_to_chars (p + 4, (valueT) descsz, 4);
8757
8758   /* Write n_type.  */
8759   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8760
8761   /* Write n_name.  */
8762   memcpy (p + 4 * 3, "GNU", 4);
8763
8764   /* Write 4-byte type.  */
8765   md_number_to_chars (p + 4 * 4,
8766                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8767
8768   /* Write 4-byte data size.  */
8769   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8770
8771   /* Write 4-byte data.  */
8772   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8773
8774   /* Zero out paddings.  */
8775   padding = isa_1_descsz - isa_1_descsz_raw;
8776   if (padding)
8777     memset (p + 4 * 7, 0, padding);
8778
8779   /* Write 4-byte type.  */
8780   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8781                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8782
8783   /* Write 4-byte data size.  */
8784   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8785
8786   /* Write 4-byte data.  */
8787   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8788                       (valueT) x86_feature_2_used, 4);
8789
8790   /* Zero out paddings.  */
8791   padding = feature_2_descsz - feature_2_descsz_raw;
8792   if (padding)
8793     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8794
8795   /* We probably can't restore the current segment, for there likely
8796      isn't one yet...  */
8797   if (seg && subseg)
8798     subseg_set (seg, subseg);
8799 }
8800 #endif
8801
8802 static unsigned int
8803 encoding_length (const fragS *start_frag, offsetT start_off,
8804                  const char *frag_now_ptr)
8805 {
8806   unsigned int len = 0;
8807
8808   if (start_frag != frag_now)
8809     {
8810       const fragS *fr = start_frag;
8811
8812       do {
8813         len += fr->fr_fix;
8814         fr = fr->fr_next;
8815       } while (fr && fr != frag_now);
8816     }
8817
8818   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8819 }
8820
8821 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8822    be macro-fused with conditional jumps.
8823    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8824    or is one of the following format:
8825
8826     cmp m, imm
8827     add m, imm
8828     sub m, imm
8829    test m, imm
8830     and m, imm
8831     inc m
8832     dec m
8833
8834    it is unfusible.  */
8835
8836 static int
8837 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8838 {
8839   /* No RIP address.  */
8840   if (i.base_reg && i.base_reg->reg_num == RegIP)
8841     return 0;
8842
8843   /* No VEX/EVEX encoding.  */
8844   if (is_any_vex_encoding (&i.tm))
8845     return 0;
8846
8847   /* add, sub without add/sub m, imm.  */
8848   if (i.tm.base_opcode <= 5
8849       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8850       || ((i.tm.base_opcode | 3) == 0x83
8851           && (i.tm.extension_opcode == 0x5
8852               || i.tm.extension_opcode == 0x0)))
8853     {
8854       *mf_cmp_p = mf_cmp_alu_cmp;
8855       return !(i.mem_operands && i.imm_operands);
8856     }
8857
8858   /* and without and m, imm.  */
8859   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8860       || ((i.tm.base_opcode | 3) == 0x83
8861           && i.tm.extension_opcode == 0x4))
8862     {
8863       *mf_cmp_p = mf_cmp_test_and;
8864       return !(i.mem_operands && i.imm_operands);
8865     }
8866
8867   /* test without test m imm.  */
8868   if ((i.tm.base_opcode | 1) == 0x85
8869       || (i.tm.base_opcode | 1) == 0xa9
8870       || ((i.tm.base_opcode | 1) == 0xf7
8871           && i.tm.extension_opcode == 0))
8872     {
8873       *mf_cmp_p = mf_cmp_test_and;
8874       return !(i.mem_operands && i.imm_operands);
8875     }
8876
8877   /* cmp without cmp m, imm.  */
8878   if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8879       || ((i.tm.base_opcode | 3) == 0x83
8880           && (i.tm.extension_opcode == 0x7)))
8881     {
8882       *mf_cmp_p = mf_cmp_alu_cmp;
8883       return !(i.mem_operands && i.imm_operands);
8884     }
8885
8886   /* inc, dec without inc/dec m.   */
8887   if ((i.tm.cpu_flags.bitfield.cpuno64
8888        && (i.tm.base_opcode | 0xf) == 0x4f)
8889       || ((i.tm.base_opcode | 1) == 0xff
8890           && i.tm.extension_opcode <= 0x1))
8891     {
8892       *mf_cmp_p = mf_cmp_incdec;
8893       return !i.mem_operands;
8894     }
8895
8896   return 0;
8897 }
8898
8899 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
8900
8901 static int
8902 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8903 {
8904   /* NB: Don't work with COND_JUMP86 without i386.  */
8905   if (!align_branch_power
8906       || now_seg == absolute_section
8907       || !cpu_arch_flags.bitfield.cpui386
8908       || !(align_branch & align_branch_fused_bit))
8909     return 0;
8910
8911   if (maybe_fused_with_jcc_p (mf_cmp_p))
8912     {
8913       if (last_insn.kind == last_insn_other
8914           || last_insn.seg != now_seg)
8915         return 1;
8916       if (flag_debug)
8917         as_warn_where (last_insn.file, last_insn.line,
8918                        _("`%s` skips -malign-branch-boundary on `%s`"),
8919                        last_insn.name, i.tm.name);
8920     }
8921
8922   return 0;
8923 }
8924
8925 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
8926
8927 static int
8928 add_branch_prefix_frag_p (void)
8929 {
8930   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
8931      to PadLock instructions since they include prefixes in opcode.  */
8932   if (!align_branch_power
8933       || !align_branch_prefix_size
8934       || now_seg == absolute_section
8935       || i.tm.cpu_flags.bitfield.cpupadlock
8936       || !cpu_arch_flags.bitfield.cpui386)
8937     return 0;
8938
8939   /* Don't add prefix if it is a prefix or there is no operand in case
8940      that segment prefix is special.  */
8941   if (!i.operands || i.tm.opcode_modifier.isprefix)
8942     return 0;
8943
8944   if (last_insn.kind == last_insn_other
8945       || last_insn.seg != now_seg)
8946     return 1;
8947
8948   if (flag_debug)
8949     as_warn_where (last_insn.file, last_insn.line,
8950                    _("`%s` skips -malign-branch-boundary on `%s`"),
8951                    last_insn.name, i.tm.name);
8952
8953   return 0;
8954 }
8955
8956 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
8957
8958 static int
8959 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8960                            enum mf_jcc_kind *mf_jcc_p)
8961 {
8962   int add_padding;
8963
8964   /* NB: Don't work with COND_JUMP86 without i386.  */
8965   if (!align_branch_power
8966       || now_seg == absolute_section
8967       || !cpu_arch_flags.bitfield.cpui386)
8968     return 0;
8969
8970   add_padding = 0;
8971
8972   /* Check for jcc and direct jmp.  */
8973   if (i.tm.opcode_modifier.jump == JUMP)
8974     {
8975       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8976         {
8977           *branch_p = align_branch_jmp;
8978           add_padding = align_branch & align_branch_jmp_bit;
8979         }
8980       else
8981         {
8982           /* Because J<cc> and JN<cc> share same group in macro-fusible table,
8983              igore the lowest bit.  */
8984           *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
8985           *branch_p = align_branch_jcc;
8986           if ((align_branch & align_branch_jcc_bit))
8987             add_padding = 1;
8988         }
8989     }
8990   else if (is_any_vex_encoding (&i.tm))
8991     return 0;
8992   else if ((i.tm.base_opcode | 1) == 0xc3)
8993     {
8994       /* Near ret.  */
8995       *branch_p = align_branch_ret;
8996       if ((align_branch & align_branch_ret_bit))
8997         add_padding = 1;
8998     }
8999   else
9000     {
9001       /* Check for indirect jmp, direct and indirect calls.  */
9002       if (i.tm.base_opcode == 0xe8)
9003         {
9004           /* Direct call.  */
9005           *branch_p = align_branch_call;
9006           if ((align_branch & align_branch_call_bit))
9007             add_padding = 1;
9008         }
9009       else if (i.tm.base_opcode == 0xff
9010                && (i.tm.extension_opcode == 2
9011                    || i.tm.extension_opcode == 4))
9012         {
9013           /* Indirect call and jmp.  */
9014           *branch_p = align_branch_indirect;
9015           if ((align_branch & align_branch_indirect_bit))
9016             add_padding = 1;
9017         }
9018
9019       if (add_padding
9020           && i.disp_operands
9021           && tls_get_addr
9022           && (i.op[0].disps->X_op == O_symbol
9023               || (i.op[0].disps->X_op == O_subtract
9024                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
9025         {
9026           symbolS *s = i.op[0].disps->X_add_symbol;
9027           /* No padding to call to global or undefined tls_get_addr.  */
9028           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9029               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9030             return 0;
9031         }
9032     }
9033
9034   if (add_padding
9035       && last_insn.kind != last_insn_other
9036       && last_insn.seg == now_seg)
9037     {
9038       if (flag_debug)
9039         as_warn_where (last_insn.file, last_insn.line,
9040                        _("`%s` skips -malign-branch-boundary on `%s`"),
9041                        last_insn.name, i.tm.name);
9042       return 0;
9043     }
9044
9045   return add_padding;
9046 }
9047
9048 static void
9049 output_insn (void)
9050 {
9051   fragS *insn_start_frag;
9052   offsetT insn_start_off;
9053   fragS *fragP = NULL;
9054   enum align_branch_kind branch = align_branch_none;
9055   /* The initializer is arbitrary just to avoid uninitialized error.
9056      it's actually either assigned in add_branch_padding_frag_p
9057      or never be used.  */
9058   enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9059
9060 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9061   if (IS_ELF && x86_used_note)
9062     {
9063       if (i.tm.cpu_flags.bitfield.cpucmov)
9064         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9065       if (i.tm.cpu_flags.bitfield.cpusse)
9066         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9067       if (i.tm.cpu_flags.bitfield.cpusse2)
9068         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9069       if (i.tm.cpu_flags.bitfield.cpusse3)
9070         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9071       if (i.tm.cpu_flags.bitfield.cpussse3)
9072         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9073       if (i.tm.cpu_flags.bitfield.cpusse4_1)
9074         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9075       if (i.tm.cpu_flags.bitfield.cpusse4_2)
9076         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9077       if (i.tm.cpu_flags.bitfield.cpuavx)
9078         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9079       if (i.tm.cpu_flags.bitfield.cpuavx2)
9080         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9081       if (i.tm.cpu_flags.bitfield.cpufma)
9082         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9083       if (i.tm.cpu_flags.bitfield.cpuavx512f)
9084         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9085       if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9086         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9087       if (i.tm.cpu_flags.bitfield.cpuavx512er)
9088         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9089       if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9090         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9091       if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9092         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9093       if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9094         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9095       if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9096         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9097       if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9098         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9099       if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9100         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9101       if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9102         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9103       if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9104         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9105       if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9106         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9107       if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9108         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9109       if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9110         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9111       if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9112         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9113
9114       if (i.tm.cpu_flags.bitfield.cpu8087
9115           || i.tm.cpu_flags.bitfield.cpu287
9116           || i.tm.cpu_flags.bitfield.cpu387
9117           || i.tm.cpu_flags.bitfield.cpu687
9118           || i.tm.cpu_flags.bitfield.cpufisttp)
9119         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9120       if (i.has_regmmx
9121           || i.tm.base_opcode == 0xf77 /* emms */
9122           || i.tm.base_opcode == 0xf0e /* femms */
9123           || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9124           || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
9125         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9126       if (i.has_regxmm)
9127         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9128       if (i.has_regymm)
9129         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9130       if (i.has_regzmm)
9131         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9132       if (i.tm.cpu_flags.bitfield.cpufxsr)
9133         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9134       if (i.tm.cpu_flags.bitfield.cpuxsave)
9135         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9136       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9137         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9138       if (i.tm.cpu_flags.bitfield.cpuxsavec)
9139         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9140     }
9141 #endif
9142
9143   /* Tie dwarf2 debug info to the address at the start of the insn.
9144      We can't do this after the insn has been output as the current
9145      frag may have been closed off.  eg. by frag_var.  */
9146   dwarf2_emit_insn (0);
9147
9148   insn_start_frag = frag_now;
9149   insn_start_off = frag_now_fix ();
9150
9151   if (add_branch_padding_frag_p (&branch, &mf_jcc))
9152     {
9153       char *p;
9154       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
9155       unsigned int max_branch_padding_size = 14;
9156
9157       /* Align section to boundary.  */
9158       record_alignment (now_seg, align_branch_power);
9159
9160       /* Make room for padding.  */
9161       frag_grow (max_branch_padding_size);
9162
9163       /* Start of the padding.  */
9164       p = frag_more (0);
9165
9166       fragP = frag_now;
9167
9168       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9169                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9170                 NULL, 0, p);
9171
9172       fragP->tc_frag_data.mf_type = mf_jcc;
9173       fragP->tc_frag_data.branch_type = branch;
9174       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9175     }
9176
9177   /* Output jumps.  */
9178   if (i.tm.opcode_modifier.jump == JUMP)
9179     output_branch ();
9180   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9181            || i.tm.opcode_modifier.jump == JUMP_DWORD)
9182     output_jump ();
9183   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9184     output_interseg_jump ();
9185   else
9186     {
9187       /* Output normal instructions here.  */
9188       char *p;
9189       unsigned char *q;
9190       unsigned int j;
9191       unsigned int prefix;
9192       enum mf_cmp_kind mf_cmp;
9193
9194       if (avoid_fence
9195           && (i.tm.base_opcode == 0xfaee8
9196               || i.tm.base_opcode == 0xfaef0
9197               || i.tm.base_opcode == 0xfaef8))
9198         {
9199           /* Encode lfence, mfence, and sfence as
9200              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
9201           offsetT val = 0x240483f0ULL;
9202           p = frag_more (5);
9203           md_number_to_chars (p, val, 5);
9204           return;
9205         }
9206
9207       /* Some processors fail on LOCK prefix. This options makes
9208          assembler ignore LOCK prefix and serves as a workaround.  */
9209       if (omit_lock_prefix)
9210         {
9211           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9212             return;
9213           i.prefix[LOCK_PREFIX] = 0;
9214         }
9215
9216       if (branch)
9217         /* Skip if this is a branch.  */
9218         ;
9219       else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9220         {
9221           /* Make room for padding.  */
9222           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9223           p = frag_more (0);
9224
9225           fragP = frag_now;
9226
9227           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9228                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9229                     NULL, 0, p);
9230
9231           fragP->tc_frag_data.mf_type = mf_cmp;
9232           fragP->tc_frag_data.branch_type = align_branch_fused;
9233           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9234         }
9235       else if (add_branch_prefix_frag_p ())
9236         {
9237           unsigned int max_prefix_size = align_branch_prefix_size;
9238
9239           /* Make room for padding.  */
9240           frag_grow (max_prefix_size);
9241           p = frag_more (0);
9242
9243           fragP = frag_now;
9244
9245           frag_var (rs_machine_dependent, max_prefix_size, 0,
9246                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9247                     NULL, 0, p);
9248
9249           fragP->tc_frag_data.max_bytes = max_prefix_size;
9250         }
9251
9252       /* Since the VEX/EVEX prefix contains the implicit prefix, we
9253          don't need the explicit prefix.  */
9254       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9255         {
9256           switch (i.tm.opcode_length)
9257             {
9258             case 3:
9259               if (i.tm.base_opcode & 0xff000000)
9260                 {
9261                   prefix = (i.tm.base_opcode >> 24) & 0xff;
9262                   if (!i.tm.cpu_flags.bitfield.cpupadlock
9263                       || prefix != REPE_PREFIX_OPCODE
9264                       || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9265                     add_prefix (prefix);
9266                 }
9267               break;
9268             case 2:
9269               if ((i.tm.base_opcode & 0xff0000) != 0)
9270                 {
9271                   prefix = (i.tm.base_opcode >> 16) & 0xff;
9272                   add_prefix (prefix);
9273                 }
9274               break;
9275             case 1:
9276               break;
9277             case 0:
9278               /* Check for pseudo prefixes.  */
9279               as_bad_where (insn_start_frag->fr_file,
9280                             insn_start_frag->fr_line,
9281                              _("pseudo prefix without instruction"));
9282               return;
9283             default:
9284               abort ();
9285             }
9286
9287 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9288           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9289              R_X86_64_GOTTPOFF relocation so that linker can safely
9290              perform IE->LE optimization.  A dummy REX_OPCODE prefix
9291              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9292              relocation for GDesc -> IE/LE optimization.  */
9293           if (x86_elf_abi == X86_64_X32_ABI
9294               && i.operands == 2
9295               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9296                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9297               && i.prefix[REX_PREFIX] == 0)
9298             add_prefix (REX_OPCODE);
9299 #endif
9300
9301           /* The prefix bytes.  */
9302           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9303             if (*q)
9304               FRAG_APPEND_1_CHAR (*q);
9305         }
9306       else
9307         {
9308           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9309             if (*q)
9310               switch (j)
9311                 {
9312                 case SEG_PREFIX:
9313                 case ADDR_PREFIX:
9314                   FRAG_APPEND_1_CHAR (*q);
9315                   break;
9316                 default:
9317                   /* There should be no other prefixes for instructions
9318                      with VEX prefix.  */
9319                   abort ();
9320                 }
9321
9322           /* For EVEX instructions i.vrex should become 0 after
9323              build_evex_prefix.  For VEX instructions upper 16 registers
9324              aren't available, so VREX should be 0.  */
9325           if (i.vrex)
9326             abort ();
9327           /* Now the VEX prefix.  */
9328           p = frag_more (i.vex.length);
9329           for (j = 0; j < i.vex.length; j++)
9330             p[j] = i.vex.bytes[j];
9331         }
9332
9333       /* Now the opcode; be careful about word order here!  */
9334       if (i.tm.opcode_length == 1)
9335         {
9336           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9337         }
9338       else
9339         {
9340           switch (i.tm.opcode_length)
9341             {
9342             case 4:
9343               p = frag_more (4);
9344               *p++ = (i.tm.base_opcode >> 24) & 0xff;
9345               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9346               break;
9347             case 3:
9348               p = frag_more (3);
9349               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9350               break;
9351             case 2:
9352               p = frag_more (2);
9353               break;
9354             default:
9355               abort ();
9356               break;
9357             }
9358
9359           /* Put out high byte first: can't use md_number_to_chars!  */
9360           *p++ = (i.tm.base_opcode >> 8) & 0xff;
9361           *p = i.tm.base_opcode & 0xff;
9362         }
9363
9364       /* Now the modrm byte and sib byte (if present).  */
9365       if (i.tm.opcode_modifier.modrm)
9366         {
9367           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9368                                | i.rm.reg << 3
9369                                | i.rm.mode << 6));
9370           /* If i.rm.regmem == ESP (4)
9371              && i.rm.mode != (Register mode)
9372              && not 16 bit
9373              ==> need second modrm byte.  */
9374           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9375               && i.rm.mode != 3
9376               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9377             FRAG_APPEND_1_CHAR ((i.sib.base << 0
9378                                  | i.sib.index << 3
9379                                  | i.sib.scale << 6));
9380         }
9381
9382       if (i.disp_operands)
9383         output_disp (insn_start_frag, insn_start_off);
9384
9385       if (i.imm_operands)
9386         output_imm (insn_start_frag, insn_start_off);
9387
9388       /*
9389        * frag_now_fix () returning plain abs_section_offset when we're in the
9390        * absolute section, and abs_section_offset not getting updated as data
9391        * gets added to the frag breaks the logic below.
9392        */
9393       if (now_seg != absolute_section)
9394         {
9395           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9396           if (j > 15)
9397             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9398                      j);
9399           else if (fragP)
9400             {
9401               /* NB: Don't add prefix with GOTPC relocation since
9402                  output_disp() above depends on the fixed encoding
9403                  length.  Can't add prefix with TLS relocation since
9404                  it breaks TLS linker optimization.  */
9405               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9406               /* Prefix count on the current instruction.  */
9407               unsigned int count = i.vex.length;
9408               unsigned int k;
9409               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9410                 /* REX byte is encoded in VEX/EVEX prefix.  */
9411                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9412                   count++;
9413
9414               /* Count prefixes for extended opcode maps.  */
9415               if (!i.vex.length)
9416                 switch (i.tm.opcode_length)
9417                   {
9418                   case 3:
9419                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9420                       {
9421                         count++;
9422                         switch ((i.tm.base_opcode >> 8) & 0xff)
9423                           {
9424                           case 0x38:
9425                           case 0x3a:
9426                             count++;
9427                             break;
9428                           default:
9429                             break;
9430                           }
9431                       }
9432                     break;
9433                   case 2:
9434                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9435                       count++;
9436                     break;
9437                   case 1:
9438                     break;
9439                   default:
9440                     abort ();
9441                   }
9442
9443               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9444                   == BRANCH_PREFIX)
9445                 {
9446                   /* Set the maximum prefix size in BRANCH_PREFIX
9447                      frag.  */
9448                   if (fragP->tc_frag_data.max_bytes > max)
9449                     fragP->tc_frag_data.max_bytes = max;
9450                   if (fragP->tc_frag_data.max_bytes > count)
9451                     fragP->tc_frag_data.max_bytes -= count;
9452                   else
9453                     fragP->tc_frag_data.max_bytes = 0;
9454                 }
9455               else
9456                 {
9457                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
9458                      frag.  */
9459                   unsigned int max_prefix_size;
9460                   if (align_branch_prefix_size > max)
9461                     max_prefix_size = max;
9462                   else
9463                     max_prefix_size = align_branch_prefix_size;
9464                   if (max_prefix_size > count)
9465                     fragP->tc_frag_data.max_prefix_length
9466                       = max_prefix_size - count;
9467                 }
9468
9469               /* Use existing segment prefix if possible.  Use CS
9470                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
9471                  segment prefix with ESP/EBP base register and use DS
9472                  segment prefix without ESP/EBP base register.  */
9473               if (i.prefix[SEG_PREFIX])
9474                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9475               else if (flag_code == CODE_64BIT)
9476                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9477               else if (i.base_reg
9478                        && (i.base_reg->reg_num == 4
9479                            || i.base_reg->reg_num == 5))
9480                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9481               else
9482                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9483             }
9484         }
9485     }
9486
9487   /* NB: Don't work with COND_JUMP86 without i386.  */
9488   if (align_branch_power
9489       && now_seg != absolute_section
9490       && cpu_arch_flags.bitfield.cpui386)
9491     {
9492       /* Terminate each frag so that we can add prefix and check for
9493          fused jcc.  */
9494       frag_wane (frag_now);
9495       frag_new (0);
9496     }
9497
9498 #ifdef DEBUG386
9499   if (flag_debug)
9500     {
9501       pi ("" /*line*/, &i);
9502     }
9503 #endif /* DEBUG386  */
9504 }
9505
9506 /* Return the size of the displacement operand N.  */
9507
9508 static int
9509 disp_size (unsigned int n)
9510 {
9511   int size = 4;
9512
9513   if (i.types[n].bitfield.disp64)
9514     size = 8;
9515   else if (i.types[n].bitfield.disp8)
9516     size = 1;
9517   else if (i.types[n].bitfield.disp16)
9518     size = 2;
9519   return size;
9520 }
9521
9522 /* Return the size of the immediate operand N.  */
9523
9524 static int
9525 imm_size (unsigned int n)
9526 {
9527   int size = 4;
9528   if (i.types[n].bitfield.imm64)
9529     size = 8;
9530   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9531     size = 1;
9532   else if (i.types[n].bitfield.imm16)
9533     size = 2;
9534   return size;
9535 }
9536
9537 static void
9538 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9539 {
9540   char *p;
9541   unsigned int n;
9542
9543   for (n = 0; n < i.operands; n++)
9544     {
9545       if (operand_type_check (i.types[n], disp))
9546         {
9547           if (i.op[n].disps->X_op == O_constant)
9548             {
9549               int size = disp_size (n);
9550               offsetT val = i.op[n].disps->X_add_number;
9551
9552               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9553                                      size);
9554               p = frag_more (size);
9555               md_number_to_chars (p, val, size);
9556             }
9557           else
9558             {
9559               enum bfd_reloc_code_real reloc_type;
9560               int size = disp_size (n);
9561               int sign = i.types[n].bitfield.disp32s;
9562               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9563               fixS *fixP;
9564
9565               /* We can't have 8 bit displacement here.  */
9566               gas_assert (!i.types[n].bitfield.disp8);
9567
9568               /* The PC relative address is computed relative
9569                  to the instruction boundary, so in case immediate
9570                  fields follows, we need to adjust the value.  */
9571               if (pcrel && i.imm_operands)
9572                 {
9573                   unsigned int n1;
9574                   int sz = 0;
9575
9576                   for (n1 = 0; n1 < i.operands; n1++)
9577                     if (operand_type_check (i.types[n1], imm))
9578                       {
9579                         /* Only one immediate is allowed for PC
9580                            relative address.  */
9581                         gas_assert (sz == 0);
9582                         sz = imm_size (n1);
9583                         i.op[n].disps->X_add_number -= sz;
9584                       }
9585                   /* We should find the immediate.  */
9586                   gas_assert (sz != 0);
9587                 }
9588
9589               p = frag_more (size);
9590               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9591               if (GOT_symbol
9592                   && GOT_symbol == i.op[n].disps->X_add_symbol
9593                   && (((reloc_type == BFD_RELOC_32
9594                         || reloc_type == BFD_RELOC_X86_64_32S
9595                         || (reloc_type == BFD_RELOC_64
9596                             && object_64bit))
9597                        && (i.op[n].disps->X_op == O_symbol
9598                            || (i.op[n].disps->X_op == O_add
9599                                && ((symbol_get_value_expression
9600                                     (i.op[n].disps->X_op_symbol)->X_op)
9601                                    == O_subtract))))
9602                       || reloc_type == BFD_RELOC_32_PCREL))
9603                 {
9604                   if (!object_64bit)
9605                     {
9606                       reloc_type = BFD_RELOC_386_GOTPC;
9607                       i.has_gotpc_tls_reloc = TRUE;
9608                       i.op[n].imms->X_add_number +=
9609                         encoding_length (insn_start_frag, insn_start_off, p);
9610                     }
9611                   else if (reloc_type == BFD_RELOC_64)
9612                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9613                   else
9614                     /* Don't do the adjustment for x86-64, as there
9615                        the pcrel addressing is relative to the _next_
9616                        insn, and that is taken care of in other code.  */
9617                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9618                 }
9619               else if (align_branch_power)
9620                 {
9621                   switch (reloc_type)
9622                     {
9623                     case BFD_RELOC_386_TLS_GD:
9624                     case BFD_RELOC_386_TLS_LDM:
9625                     case BFD_RELOC_386_TLS_IE:
9626                     case BFD_RELOC_386_TLS_IE_32:
9627                     case BFD_RELOC_386_TLS_GOTIE:
9628                     case BFD_RELOC_386_TLS_GOTDESC:
9629                     case BFD_RELOC_386_TLS_DESC_CALL:
9630                     case BFD_RELOC_X86_64_TLSGD:
9631                     case BFD_RELOC_X86_64_TLSLD:
9632                     case BFD_RELOC_X86_64_GOTTPOFF:
9633                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9634                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9635                       i.has_gotpc_tls_reloc = TRUE;
9636                     default:
9637                       break;
9638                     }
9639                 }
9640               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9641                                   size, i.op[n].disps, pcrel,
9642                                   reloc_type);
9643               /* Check for "call/jmp *mem", "mov mem, %reg",
9644                  "test %reg, mem" and "binop mem, %reg" where binop
9645                  is one of adc, add, and, cmp, or, sbb, sub, xor
9646                  instructions without data prefix.  Always generate
9647                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9648               if (i.prefix[DATA_PREFIX] == 0
9649                   && (generate_relax_relocations
9650                       || (!object_64bit
9651                           && i.rm.mode == 0
9652                           && i.rm.regmem == 5))
9653                   && (i.rm.mode == 2
9654                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9655                   && !is_any_vex_encoding(&i.tm)
9656                   && ((i.operands == 1
9657                        && i.tm.base_opcode == 0xff
9658                        && (i.rm.reg == 2 || i.rm.reg == 4))
9659                       || (i.operands == 2
9660                           && (i.tm.base_opcode == 0x8b
9661                               || i.tm.base_opcode == 0x85
9662                               || (i.tm.base_opcode & ~0x38) == 0x03))))
9663                 {
9664                   if (object_64bit)
9665                     {
9666                       fixP->fx_tcbit = i.rex != 0;
9667                       if (i.base_reg
9668                           && (i.base_reg->reg_num == RegIP))
9669                       fixP->fx_tcbit2 = 1;
9670                     }
9671                   else
9672                     fixP->fx_tcbit2 = 1;
9673                 }
9674             }
9675         }
9676     }
9677 }
9678
9679 static void
9680 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9681 {
9682   char *p;
9683   unsigned int n;
9684
9685   for (n = 0; n < i.operands; n++)
9686     {
9687       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9688       if (i.rounding && (int) n == i.rounding->operand)
9689         continue;
9690
9691       if (operand_type_check (i.types[n], imm))
9692         {
9693           if (i.op[n].imms->X_op == O_constant)
9694             {
9695               int size = imm_size (n);
9696               offsetT val;
9697
9698               val = offset_in_range (i.op[n].imms->X_add_number,
9699                                      size);
9700               p = frag_more (size);
9701               md_number_to_chars (p, val, size);
9702             }
9703           else
9704             {
9705               /* Not absolute_section.
9706                  Need a 32-bit fixup (don't support 8bit
9707                  non-absolute imms).  Try to support other
9708                  sizes ...  */
9709               enum bfd_reloc_code_real reloc_type;
9710               int size = imm_size (n);
9711               int sign;
9712
9713               if (i.types[n].bitfield.imm32s
9714                   && (i.suffix == QWORD_MNEM_SUFFIX
9715                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9716                 sign = 1;
9717               else
9718                 sign = 0;
9719
9720               p = frag_more (size);
9721               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9722
9723               /*   This is tough to explain.  We end up with this one if we
9724                * have operands that look like
9725                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9726                * obtain the absolute address of the GOT, and it is strongly
9727                * preferable from a performance point of view to avoid using
9728                * a runtime relocation for this.  The actual sequence of
9729                * instructions often look something like:
9730                *
9731                *        call    .L66
9732                * .L66:
9733                *        popl    %ebx
9734                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9735                *
9736                *   The call and pop essentially return the absolute address
9737                * of the label .L66 and store it in %ebx.  The linker itself
9738                * will ultimately change the first operand of the addl so
9739                * that %ebx points to the GOT, but to keep things simple, the
9740                * .o file must have this operand set so that it generates not
9741                * the absolute address of .L66, but the absolute address of
9742                * itself.  This allows the linker itself simply treat a GOTPC
9743                * relocation as asking for a pcrel offset to the GOT to be
9744                * added in, and the addend of the relocation is stored in the
9745                * operand field for the instruction itself.
9746                *
9747                *   Our job here is to fix the operand so that it would add
9748                * the correct offset so that %ebx would point to itself.  The
9749                * thing that is tricky is that .-.L66 will point to the
9750                * beginning of the instruction, so we need to further modify
9751                * the operand so that it will point to itself.  There are
9752                * other cases where you have something like:
9753                *
9754                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9755                *
9756                * and here no correction would be required.  Internally in
9757                * the assembler we treat operands of this form as not being
9758                * pcrel since the '.' is explicitly mentioned, and I wonder
9759                * whether it would simplify matters to do it this way.  Who
9760                * knows.  In earlier versions of the PIC patches, the
9761                * pcrel_adjust field was used to store the correction, but
9762                * since the expression is not pcrel, I felt it would be
9763                * confusing to do it this way.  */
9764
9765               if ((reloc_type == BFD_RELOC_32
9766                    || reloc_type == BFD_RELOC_X86_64_32S
9767                    || reloc_type == BFD_RELOC_64)
9768                   && GOT_symbol
9769                   && GOT_symbol == i.op[n].imms->X_add_symbol
9770                   && (i.op[n].imms->X_op == O_symbol
9771                       || (i.op[n].imms->X_op == O_add
9772                           && ((symbol_get_value_expression
9773                                (i.op[n].imms->X_op_symbol)->X_op)
9774                               == O_subtract))))
9775                 {
9776                   if (!object_64bit)
9777                     reloc_type = BFD_RELOC_386_GOTPC;
9778                   else if (size == 4)
9779                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9780                   else if (size == 8)
9781                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9782                   i.has_gotpc_tls_reloc = TRUE;
9783                   i.op[n].imms->X_add_number +=
9784                     encoding_length (insn_start_frag, insn_start_off, p);
9785                 }
9786               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9787                            i.op[n].imms, 0, reloc_type);
9788             }
9789         }
9790     }
9791 }
9792 \f
9793 /* x86_cons_fix_new is called via the expression parsing code when a
9794    reloc is needed.  We use this hook to get the correct .got reloc.  */
9795 static int cons_sign = -1;
9796
9797 void
9798 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9799                   expressionS *exp, bfd_reloc_code_real_type r)
9800 {
9801   r = reloc (len, 0, cons_sign, r);
9802
9803 #ifdef TE_PE
9804   if (exp->X_op == O_secrel)
9805     {
9806       exp->X_op = O_symbol;
9807       r = BFD_RELOC_32_SECREL;
9808     }
9809 #endif
9810
9811   fix_new_exp (frag, off, len, exp, 0, r);
9812 }
9813
9814 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9815    purpose of the `.dc.a' internal pseudo-op.  */
9816
9817 int
9818 x86_address_bytes (void)
9819 {
9820   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9821     return 4;
9822   return stdoutput->arch_info->bits_per_address / 8;
9823 }
9824
9825 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9826     || defined (LEX_AT)
9827 # define lex_got(reloc, adjust, types) NULL
9828 #else
9829 /* Parse operands of the form
9830    <symbol>@GOTOFF+<nnn>
9831    and similar .plt or .got references.
9832
9833    If we find one, set up the correct relocation in RELOC and copy the
9834    input string, minus the `@GOTOFF' into a malloc'd buffer for
9835    parsing by the calling routine.  Return this buffer, and if ADJUST
9836    is non-null set it to the length of the string we removed from the
9837    input line.  Otherwise return NULL.  */
9838 static char *
9839 lex_got (enum bfd_reloc_code_real *rel,
9840          int *adjust,
9841          i386_operand_type *types)
9842 {
9843   /* Some of the relocations depend on the size of what field is to
9844      be relocated.  But in our callers i386_immediate and i386_displacement
9845      we don't yet know the operand size (this will be set by insn
9846      matching).  Hence we record the word32 relocation here,
9847      and adjust the reloc according to the real size in reloc().  */
9848   static const struct {
9849     const char *str;
9850     int len;
9851     const enum bfd_reloc_code_real rel[2];
9852     const i386_operand_type types64;
9853   } gotrel[] = {
9854 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9855     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
9856                                         BFD_RELOC_SIZE32 },
9857       OPERAND_TYPE_IMM32_64 },
9858 #endif
9859     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
9860                                        BFD_RELOC_X86_64_PLTOFF64 },
9861       OPERAND_TYPE_IMM64 },
9862     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
9863                                        BFD_RELOC_X86_64_PLT32    },
9864       OPERAND_TYPE_IMM32_32S_DISP32 },
9865     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
9866                                        BFD_RELOC_X86_64_GOTPLT64 },
9867       OPERAND_TYPE_IMM64_DISP64 },
9868     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
9869                                        BFD_RELOC_X86_64_GOTOFF64 },
9870       OPERAND_TYPE_IMM64_DISP64 },
9871     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9872                                        BFD_RELOC_X86_64_GOTPCREL },
9873       OPERAND_TYPE_IMM32_32S_DISP32 },
9874     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
9875                                        BFD_RELOC_X86_64_TLSGD    },
9876       OPERAND_TYPE_IMM32_32S_DISP32 },
9877     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
9878                                        _dummy_first_bfd_reloc_code_real },
9879       OPERAND_TYPE_NONE },
9880     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
9881                                        BFD_RELOC_X86_64_TLSLD    },
9882       OPERAND_TYPE_IMM32_32S_DISP32 },
9883     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9884                                        BFD_RELOC_X86_64_GOTTPOFF },
9885       OPERAND_TYPE_IMM32_32S_DISP32 },
9886     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
9887                                        BFD_RELOC_X86_64_TPOFF32  },
9888       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9889     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
9890                                        _dummy_first_bfd_reloc_code_real },
9891       OPERAND_TYPE_NONE },
9892     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
9893                                        BFD_RELOC_X86_64_DTPOFF32 },
9894       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9895     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9896                                        _dummy_first_bfd_reloc_code_real },
9897       OPERAND_TYPE_NONE },
9898     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9899                                        _dummy_first_bfd_reloc_code_real },
9900       OPERAND_TYPE_NONE },
9901     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
9902                                        BFD_RELOC_X86_64_GOT32    },
9903       OPERAND_TYPE_IMM32_32S_64_DISP32 },
9904     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
9905                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9906       OPERAND_TYPE_IMM32_32S_DISP32 },
9907     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
9908                                        BFD_RELOC_X86_64_TLSDESC_CALL },
9909       OPERAND_TYPE_IMM32_32S_DISP32 },
9910   };
9911   char *cp;
9912   unsigned int j;
9913
9914 #if defined (OBJ_MAYBE_ELF)
9915   if (!IS_ELF)
9916     return NULL;
9917 #endif
9918
9919   for (cp = input_line_pointer; *cp != '@'; cp++)
9920     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9921       return NULL;
9922
9923   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9924     {
9925       int len = gotrel[j].len;
9926       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9927         {
9928           if (gotrel[j].rel[object_64bit] != 0)
9929             {
9930               int first, second;
9931               char *tmpbuf, *past_reloc;
9932
9933               *rel = gotrel[j].rel[object_64bit];
9934
9935               if (types)
9936                 {
9937                   if (flag_code != CODE_64BIT)
9938                     {
9939                       types->bitfield.imm32 = 1;
9940                       types->bitfield.disp32 = 1;
9941                     }
9942                   else
9943                     *types = gotrel[j].types64;
9944                 }
9945
9946               if (j != 0 && GOT_symbol == NULL)
9947                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9948
9949               /* The length of the first part of our input line.  */
9950               first = cp - input_line_pointer;
9951
9952               /* The second part goes from after the reloc token until
9953                  (and including) an end_of_line char or comma.  */
9954               past_reloc = cp + 1 + len;
9955               cp = past_reloc;
9956               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9957                 ++cp;
9958               second = cp + 1 - past_reloc;
9959
9960               /* Allocate and copy string.  The trailing NUL shouldn't
9961                  be necessary, but be safe.  */
9962               tmpbuf = XNEWVEC (char, first + second + 2);
9963               memcpy (tmpbuf, input_line_pointer, first);
9964               if (second != 0 && *past_reloc != ' ')
9965                 /* Replace the relocation token with ' ', so that
9966                    errors like foo@GOTOFF1 will be detected.  */
9967                 tmpbuf[first++] = ' ';
9968               else
9969                 /* Increment length by 1 if the relocation token is
9970                    removed.  */
9971                 len++;
9972               if (adjust)
9973                 *adjust = len;
9974               memcpy (tmpbuf + first, past_reloc, second);
9975               tmpbuf[first + second] = '\0';
9976               return tmpbuf;
9977             }
9978
9979           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9980                   gotrel[j].str, 1 << (5 + object_64bit));
9981           return NULL;
9982         }
9983     }
9984
9985   /* Might be a symbol version string.  Don't as_bad here.  */
9986   return NULL;
9987 }
9988 #endif
9989
9990 #ifdef TE_PE
9991 #ifdef lex_got
9992 #undef lex_got
9993 #endif
9994 /* Parse operands of the form
9995    <symbol>@SECREL32+<nnn>
9996
9997    If we find one, set up the correct relocation in RELOC and copy the
9998    input string, minus the `@SECREL32' into a malloc'd buffer for
9999    parsing by the calling routine.  Return this buffer, and if ADJUST
10000    is non-null set it to the length of the string we removed from the
10001    input line.  Otherwise return NULL.
10002
10003    This function is copied from the ELF version above adjusted for PE targets.  */
10004
10005 static char *
10006 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10007          int *adjust ATTRIBUTE_UNUSED,
10008          i386_operand_type *types)
10009 {
10010   static const struct
10011   {
10012     const char *str;
10013     int len;
10014     const enum bfd_reloc_code_real rel[2];
10015     const i386_operand_type types64;
10016   }
10017   gotrel[] =
10018   {
10019     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
10020                                           BFD_RELOC_32_SECREL },
10021       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10022   };
10023
10024   char *cp;
10025   unsigned j;
10026
10027   for (cp = input_line_pointer; *cp != '@'; cp++)
10028     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10029       return NULL;
10030
10031   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10032     {
10033       int len = gotrel[j].len;
10034
10035       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10036         {
10037           if (gotrel[j].rel[object_64bit] != 0)
10038             {
10039               int first, second;
10040               char *tmpbuf, *past_reloc;
10041
10042               *rel = gotrel[j].rel[object_64bit];
10043               if (adjust)
10044                 *adjust = len;
10045
10046               if (types)
10047                 {
10048                   if (flag_code != CODE_64BIT)
10049                     {
10050                       types->bitfield.imm32 = 1;
10051                       types->bitfield.disp32 = 1;
10052                     }
10053                   else
10054                     *types = gotrel[j].types64;
10055                 }
10056
10057               /* The length of the first part of our input line.  */
10058               first = cp - input_line_pointer;
10059
10060               /* The second part goes from after the reloc token until
10061                  (and including) an end_of_line char or comma.  */
10062               past_reloc = cp + 1 + len;
10063               cp = past_reloc;
10064               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10065                 ++cp;
10066               second = cp + 1 - past_reloc;
10067
10068               /* Allocate and copy string.  The trailing NUL shouldn't
10069                  be necessary, but be safe.  */
10070               tmpbuf = XNEWVEC (char, first + second + 2);
10071               memcpy (tmpbuf, input_line_pointer, first);
10072               if (second != 0 && *past_reloc != ' ')
10073                 /* Replace the relocation token with ' ', so that
10074                    errors like foo@SECLREL321 will be detected.  */
10075                 tmpbuf[first++] = ' ';
10076               memcpy (tmpbuf + first, past_reloc, second);
10077               tmpbuf[first + second] = '\0';
10078               return tmpbuf;
10079             }
10080
10081           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10082                   gotrel[j].str, 1 << (5 + object_64bit));
10083           return NULL;
10084         }
10085     }
10086
10087   /* Might be a symbol version string.  Don't as_bad here.  */
10088   return NULL;
10089 }
10090
10091 #endif /* TE_PE */
10092
10093 bfd_reloc_code_real_type
10094 x86_cons (expressionS *exp, int size)
10095 {
10096   bfd_reloc_code_real_type got_reloc = NO_RELOC;
10097
10098   intel_syntax = -intel_syntax;
10099
10100   exp->X_md = 0;
10101   if (size == 4 || (object_64bit && size == 8))
10102     {
10103       /* Handle @GOTOFF and the like in an expression.  */
10104       char *save;
10105       char *gotfree_input_line;
10106       int adjust = 0;
10107
10108       save = input_line_pointer;
10109       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10110       if (gotfree_input_line)
10111         input_line_pointer = gotfree_input_line;
10112
10113       expression (exp);
10114
10115       if (gotfree_input_line)
10116         {
10117           /* expression () has merrily parsed up to the end of line,
10118              or a comma - in the wrong buffer.  Transfer how far
10119              input_line_pointer has moved to the right buffer.  */
10120           input_line_pointer = (save
10121                                 + (input_line_pointer - gotfree_input_line)
10122                                 + adjust);
10123           free (gotfree_input_line);
10124           if (exp->X_op == O_constant
10125               || exp->X_op == O_absent
10126               || exp->X_op == O_illegal
10127               || exp->X_op == O_register
10128               || exp->X_op == O_big)
10129             {
10130               char c = *input_line_pointer;
10131               *input_line_pointer = 0;
10132               as_bad (_("missing or invalid expression `%s'"), save);
10133               *input_line_pointer = c;
10134             }
10135           else if ((got_reloc == BFD_RELOC_386_PLT32
10136                     || got_reloc == BFD_RELOC_X86_64_PLT32)
10137                    && exp->X_op != O_symbol)
10138             {
10139               char c = *input_line_pointer;
10140               *input_line_pointer = 0;
10141               as_bad (_("invalid PLT expression `%s'"), save);
10142               *input_line_pointer = c;
10143             }
10144         }
10145     }
10146   else
10147     expression (exp);
10148
10149   intel_syntax = -intel_syntax;
10150
10151   if (intel_syntax)
10152     i386_intel_simplify (exp);
10153
10154   return got_reloc;
10155 }
10156
10157 static void
10158 signed_cons (int size)
10159 {
10160   if (flag_code == CODE_64BIT)
10161     cons_sign = 1;
10162   cons (size);
10163   cons_sign = -1;
10164 }
10165
10166 #ifdef TE_PE
10167 static void
10168 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10169 {
10170   expressionS exp;
10171
10172   do
10173     {
10174       expression (&exp);
10175       if (exp.X_op == O_symbol)
10176         exp.X_op = O_secrel;
10177
10178       emit_expr (&exp, 4);
10179     }
10180   while (*input_line_pointer++ == ',');
10181
10182   input_line_pointer--;
10183   demand_empty_rest_of_line ();
10184 }
10185 #endif
10186
10187 /* Handle Vector operations.  */
10188
10189 static char *
10190 check_VecOperations (char *op_string, char *op_end)
10191 {
10192   const reg_entry *mask;
10193   const char *saved;
10194   char *end_op;
10195
10196   while (*op_string
10197          && (op_end == NULL || op_string < op_end))
10198     {
10199       saved = op_string;
10200       if (*op_string == '{')
10201         {
10202           op_string++;
10203
10204           /* Check broadcasts.  */
10205           if (strncmp (op_string, "1to", 3) == 0)
10206             {
10207               int bcst_type;
10208
10209               if (i.broadcast)
10210                 goto duplicated_vec_op;
10211
10212               op_string += 3;
10213               if (*op_string == '8')
10214                 bcst_type = 8;
10215               else if (*op_string == '4')
10216                 bcst_type = 4;
10217               else if (*op_string == '2')
10218                 bcst_type = 2;
10219               else if (*op_string == '1'
10220                        && *(op_string+1) == '6')
10221                 {
10222                   bcst_type = 16;
10223                   op_string++;
10224                 }
10225               else
10226                 {
10227                   as_bad (_("Unsupported broadcast: `%s'"), saved);
10228                   return NULL;
10229                 }
10230               op_string++;
10231
10232               broadcast_op.type = bcst_type;
10233               broadcast_op.operand = this_operand;
10234               broadcast_op.bytes = 0;
10235               i.broadcast = &broadcast_op;
10236             }
10237           /* Check masking operation.  */
10238           else if ((mask = parse_register (op_string, &end_op)) != NULL)
10239             {
10240               if (mask == &bad_reg)
10241                 return NULL;
10242
10243               /* k0 can't be used for write mask.  */
10244               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10245                 {
10246                   as_bad (_("`%s%s' can't be used for write mask"),
10247                           register_prefix, mask->reg_name);
10248                   return NULL;
10249                 }
10250
10251               if (!i.mask)
10252                 {
10253                   mask_op.mask = mask;
10254                   mask_op.zeroing = 0;
10255                   mask_op.operand = this_operand;
10256                   i.mask = &mask_op;
10257                 }
10258               else
10259                 {
10260                   if (i.mask->mask)
10261                     goto duplicated_vec_op;
10262
10263                   i.mask->mask = mask;
10264
10265                   /* Only "{z}" is allowed here.  No need to check
10266                      zeroing mask explicitly.  */
10267                   if (i.mask->operand != this_operand)
10268                     {
10269                       as_bad (_("invalid write mask `%s'"), saved);
10270                       return NULL;
10271                     }
10272                 }
10273
10274               op_string = end_op;
10275             }
10276           /* Check zeroing-flag for masking operation.  */
10277           else if (*op_string == 'z')
10278             {
10279               if (!i.mask)
10280                 {
10281                   mask_op.mask = NULL;
10282                   mask_op.zeroing = 1;
10283                   mask_op.operand = this_operand;
10284                   i.mask = &mask_op;
10285                 }
10286               else
10287                 {
10288                   if (i.mask->zeroing)
10289                     {
10290                     duplicated_vec_op:
10291                       as_bad (_("duplicated `%s'"), saved);
10292                       return NULL;
10293                     }
10294
10295                   i.mask->zeroing = 1;
10296
10297                   /* Only "{%k}" is allowed here.  No need to check mask
10298                      register explicitly.  */
10299                   if (i.mask->operand != this_operand)
10300                     {
10301                       as_bad (_("invalid zeroing-masking `%s'"),
10302                               saved);
10303                       return NULL;
10304                     }
10305                 }
10306
10307               op_string++;
10308             }
10309           else
10310             goto unknown_vec_op;
10311
10312           if (*op_string != '}')
10313             {
10314               as_bad (_("missing `}' in `%s'"), saved);
10315               return NULL;
10316             }
10317           op_string++;
10318
10319           /* Strip whitespace since the addition of pseudo prefixes
10320              changed how the scrubber treats '{'.  */
10321           if (is_space_char (*op_string))
10322             ++op_string;
10323
10324           continue;
10325         }
10326     unknown_vec_op:
10327       /* We don't know this one.  */
10328       as_bad (_("unknown vector operation: `%s'"), saved);
10329       return NULL;
10330     }
10331
10332   if (i.mask && i.mask->zeroing && !i.mask->mask)
10333     {
10334       as_bad (_("zeroing-masking only allowed with write mask"));
10335       return NULL;
10336     }
10337
10338   return op_string;
10339 }
10340
10341 static int
10342 i386_immediate (char *imm_start)
10343 {
10344   char *save_input_line_pointer;
10345   char *gotfree_input_line;
10346   segT exp_seg = 0;
10347   expressionS *exp;
10348   i386_operand_type types;
10349
10350   operand_type_set (&types, ~0);
10351
10352   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10353     {
10354       as_bad (_("at most %d immediate operands are allowed"),
10355               MAX_IMMEDIATE_OPERANDS);
10356       return 0;
10357     }
10358
10359   exp = &im_expressions[i.imm_operands++];
10360   i.op[this_operand].imms = exp;
10361
10362   if (is_space_char (*imm_start))
10363     ++imm_start;
10364
10365   save_input_line_pointer = input_line_pointer;
10366   input_line_pointer = imm_start;
10367
10368   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10369   if (gotfree_input_line)
10370     input_line_pointer = gotfree_input_line;
10371
10372   exp_seg = expression (exp);
10373
10374   SKIP_WHITESPACE ();
10375
10376   /* Handle vector operations.  */
10377   if (*input_line_pointer == '{')
10378     {
10379       input_line_pointer = check_VecOperations (input_line_pointer,
10380                                                 NULL);
10381       if (input_line_pointer == NULL)
10382         return 0;
10383     }
10384
10385   if (*input_line_pointer)
10386     as_bad (_("junk `%s' after expression"), input_line_pointer);
10387
10388   input_line_pointer = save_input_line_pointer;
10389   if (gotfree_input_line)
10390     {
10391       free (gotfree_input_line);
10392
10393       if (exp->X_op == O_constant || exp->X_op == O_register)
10394         exp->X_op = O_illegal;
10395     }
10396
10397   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10398 }
10399
10400 static int
10401 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10402                          i386_operand_type types, const char *imm_start)
10403 {
10404   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10405     {
10406       if (imm_start)
10407         as_bad (_("missing or invalid immediate expression `%s'"),
10408                 imm_start);
10409       return 0;
10410     }
10411   else if (exp->X_op == O_constant)
10412     {
10413       /* Size it properly later.  */
10414       i.types[this_operand].bitfield.imm64 = 1;
10415       /* If not 64bit, sign extend val.  */
10416       if (flag_code != CODE_64BIT
10417           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10418         exp->X_add_number
10419           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10420     }
10421 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10422   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10423            && exp_seg != absolute_section
10424            && exp_seg != text_section
10425            && exp_seg != data_section
10426            && exp_seg != bss_section
10427            && exp_seg != undefined_section
10428            && !bfd_is_com_section (exp_seg))
10429     {
10430       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10431       return 0;
10432     }
10433 #endif
10434   else if (!intel_syntax && exp_seg == reg_section)
10435     {
10436       if (imm_start)
10437         as_bad (_("illegal immediate register operand %s"), imm_start);
10438       return 0;
10439     }
10440   else
10441     {
10442       /* This is an address.  The size of the address will be
10443          determined later, depending on destination register,
10444          suffix, or the default for the section.  */
10445       i.types[this_operand].bitfield.imm8 = 1;
10446       i.types[this_operand].bitfield.imm16 = 1;
10447       i.types[this_operand].bitfield.imm32 = 1;
10448       i.types[this_operand].bitfield.imm32s = 1;
10449       i.types[this_operand].bitfield.imm64 = 1;
10450       i.types[this_operand] = operand_type_and (i.types[this_operand],
10451                                                 types);
10452     }
10453
10454   return 1;
10455 }
10456
10457 static char *
10458 i386_scale (char *scale)
10459 {
10460   offsetT val;
10461   char *save = input_line_pointer;
10462
10463   input_line_pointer = scale;
10464   val = get_absolute_expression ();
10465
10466   switch (val)
10467     {
10468     case 1:
10469       i.log2_scale_factor = 0;
10470       break;
10471     case 2:
10472       i.log2_scale_factor = 1;
10473       break;
10474     case 4:
10475       i.log2_scale_factor = 2;
10476       break;
10477     case 8:
10478       i.log2_scale_factor = 3;
10479       break;
10480     default:
10481       {
10482         char sep = *input_line_pointer;
10483
10484         *input_line_pointer = '\0';
10485         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10486                 scale);
10487         *input_line_pointer = sep;
10488         input_line_pointer = save;
10489         return NULL;
10490       }
10491     }
10492   if (i.log2_scale_factor != 0 && i.index_reg == 0)
10493     {
10494       as_warn (_("scale factor of %d without an index register"),
10495                1 << i.log2_scale_factor);
10496       i.log2_scale_factor = 0;
10497     }
10498   scale = input_line_pointer;
10499   input_line_pointer = save;
10500   return scale;
10501 }
10502
10503 static int
10504 i386_displacement (char *disp_start, char *disp_end)
10505 {
10506   expressionS *exp;
10507   segT exp_seg = 0;
10508   char *save_input_line_pointer;
10509   char *gotfree_input_line;
10510   int override;
10511   i386_operand_type bigdisp, types = anydisp;
10512   int ret;
10513
10514   if (i.disp_operands == MAX_MEMORY_OPERANDS)
10515     {
10516       as_bad (_("at most %d displacement operands are allowed"),
10517               MAX_MEMORY_OPERANDS);
10518       return 0;
10519     }
10520
10521   operand_type_set (&bigdisp, 0);
10522   if (i.jumpabsolute
10523       || i.types[this_operand].bitfield.baseindex
10524       || (current_templates->start->opcode_modifier.jump != JUMP
10525           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10526     {
10527       i386_addressing_mode ();
10528       override = (i.prefix[ADDR_PREFIX] != 0);
10529       if (flag_code == CODE_64BIT)
10530         {
10531           if (!override)
10532             {
10533               bigdisp.bitfield.disp32s = 1;
10534               bigdisp.bitfield.disp64 = 1;
10535             }
10536           else
10537             bigdisp.bitfield.disp32 = 1;
10538         }
10539       else if ((flag_code == CODE_16BIT) ^ override)
10540           bigdisp.bitfield.disp16 = 1;
10541       else
10542           bigdisp.bitfield.disp32 = 1;
10543     }
10544   else
10545     {
10546       /* For PC-relative branches, the width of the displacement may be
10547          dependent upon data size, but is never dependent upon address size.
10548          Also make sure to not unintentionally match against a non-PC-relative
10549          branch template.  */
10550       static templates aux_templates;
10551       const insn_template *t = current_templates->start;
10552       bfd_boolean has_intel64 = FALSE;
10553
10554       aux_templates.start = t;
10555       while (++t < current_templates->end)
10556         {
10557           if (t->opcode_modifier.jump
10558               != current_templates->start->opcode_modifier.jump)
10559             break;
10560           if ((t->opcode_modifier.isa64 >= INTEL64))
10561             has_intel64 = TRUE;
10562         }
10563       if (t < current_templates->end)
10564         {
10565           aux_templates.end = t;
10566           current_templates = &aux_templates;
10567         }
10568
10569       override = (i.prefix[DATA_PREFIX] != 0);
10570       if (flag_code == CODE_64BIT)
10571         {
10572           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10573               && (!intel64 || !has_intel64))
10574             bigdisp.bitfield.disp16 = 1;
10575           else
10576             bigdisp.bitfield.disp32s = 1;
10577         }
10578       else
10579         {
10580           if (!override)
10581             override = (i.suffix == (flag_code != CODE_16BIT
10582                                      ? WORD_MNEM_SUFFIX
10583                                      : LONG_MNEM_SUFFIX));
10584           bigdisp.bitfield.disp32 = 1;
10585           if ((flag_code == CODE_16BIT) ^ override)
10586             {
10587               bigdisp.bitfield.disp32 = 0;
10588               bigdisp.bitfield.disp16 = 1;
10589             }
10590         }
10591     }
10592   i.types[this_operand] = operand_type_or (i.types[this_operand],
10593                                            bigdisp);
10594
10595   exp = &disp_expressions[i.disp_operands];
10596   i.op[this_operand].disps = exp;
10597   i.disp_operands++;
10598   save_input_line_pointer = input_line_pointer;
10599   input_line_pointer = disp_start;
10600   END_STRING_AND_SAVE (disp_end);
10601
10602 #ifndef GCC_ASM_O_HACK
10603 #define GCC_ASM_O_HACK 0
10604 #endif
10605 #if GCC_ASM_O_HACK
10606   END_STRING_AND_SAVE (disp_end + 1);
10607   if (i.types[this_operand].bitfield.baseIndex
10608       && displacement_string_end[-1] == '+')
10609     {
10610       /* This hack is to avoid a warning when using the "o"
10611          constraint within gcc asm statements.
10612          For instance:
10613
10614          #define _set_tssldt_desc(n,addr,limit,type) \
10615          __asm__ __volatile__ ( \
10616          "movw %w2,%0\n\t" \
10617          "movw %w1,2+%0\n\t" \
10618          "rorl $16,%1\n\t" \
10619          "movb %b1,4+%0\n\t" \
10620          "movb %4,5+%0\n\t" \
10621          "movb $0,6+%0\n\t" \
10622          "movb %h1,7+%0\n\t" \
10623          "rorl $16,%1" \
10624          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10625
10626          This works great except that the output assembler ends
10627          up looking a bit weird if it turns out that there is
10628          no offset.  You end up producing code that looks like:
10629
10630          #APP
10631          movw $235,(%eax)
10632          movw %dx,2+(%eax)
10633          rorl $16,%edx
10634          movb %dl,4+(%eax)
10635          movb $137,5+(%eax)
10636          movb $0,6+(%eax)
10637          movb %dh,7+(%eax)
10638          rorl $16,%edx
10639          #NO_APP
10640
10641          So here we provide the missing zero.  */
10642
10643       *displacement_string_end = '0';
10644     }
10645 #endif
10646   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10647   if (gotfree_input_line)
10648     input_line_pointer = gotfree_input_line;
10649
10650   exp_seg = expression (exp);
10651
10652   SKIP_WHITESPACE ();
10653   if (*input_line_pointer)
10654     as_bad (_("junk `%s' after expression"), input_line_pointer);
10655 #if GCC_ASM_O_HACK
10656   RESTORE_END_STRING (disp_end + 1);
10657 #endif
10658   input_line_pointer = save_input_line_pointer;
10659   if (gotfree_input_line)
10660     {
10661       free (gotfree_input_line);
10662
10663       if (exp->X_op == O_constant || exp->X_op == O_register)
10664         exp->X_op = O_illegal;
10665     }
10666
10667   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10668
10669   RESTORE_END_STRING (disp_end);
10670
10671   return ret;
10672 }
10673
10674 static int
10675 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10676                             i386_operand_type types, const char *disp_start)
10677 {
10678   i386_operand_type bigdisp;
10679   int ret = 1;
10680
10681   /* We do this to make sure that the section symbol is in
10682      the symbol table.  We will ultimately change the relocation
10683      to be relative to the beginning of the section.  */
10684   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10685       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10686       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10687     {
10688       if (exp->X_op != O_symbol)
10689         goto inv_disp;
10690
10691       if (S_IS_LOCAL (exp->X_add_symbol)
10692           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10693           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10694         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10695       exp->X_op = O_subtract;
10696       exp->X_op_symbol = GOT_symbol;
10697       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10698         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10699       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10700         i.reloc[this_operand] = BFD_RELOC_64;
10701       else
10702         i.reloc[this_operand] = BFD_RELOC_32;
10703     }
10704
10705   else if (exp->X_op == O_absent
10706            || exp->X_op == O_illegal
10707            || exp->X_op == O_big)
10708     {
10709     inv_disp:
10710       as_bad (_("missing or invalid displacement expression `%s'"),
10711               disp_start);
10712       ret = 0;
10713     }
10714
10715   else if (flag_code == CODE_64BIT
10716            && !i.prefix[ADDR_PREFIX]
10717            && exp->X_op == O_constant)
10718     {
10719       /* Since displacement is signed extended to 64bit, don't allow
10720          disp32 and turn off disp32s if they are out of range.  */
10721       i.types[this_operand].bitfield.disp32 = 0;
10722       if (!fits_in_signed_long (exp->X_add_number))
10723         {
10724           i.types[this_operand].bitfield.disp32s = 0;
10725           if (i.types[this_operand].bitfield.baseindex)
10726             {
10727               as_bad (_("0x%lx out range of signed 32bit displacement"),
10728                       (long) exp->X_add_number);
10729               ret = 0;
10730             }
10731         }
10732     }
10733
10734 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10735   else if (exp->X_op != O_constant
10736            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10737            && exp_seg != absolute_section
10738            && exp_seg != text_section
10739            && exp_seg != data_section
10740            && exp_seg != bss_section
10741            && exp_seg != undefined_section
10742            && !bfd_is_com_section (exp_seg))
10743     {
10744       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10745       ret = 0;
10746     }
10747 #endif
10748
10749   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10750       /* Constants get taken care of by optimize_disp().  */
10751       && exp->X_op != O_constant)
10752     i.types[this_operand].bitfield.disp8 = 1;
10753
10754   /* Check if this is a displacement only operand.  */
10755   bigdisp = i.types[this_operand];
10756   bigdisp.bitfield.disp8 = 0;
10757   bigdisp.bitfield.disp16 = 0;
10758   bigdisp.bitfield.disp32 = 0;
10759   bigdisp.bitfield.disp32s = 0;
10760   bigdisp.bitfield.disp64 = 0;
10761   if (operand_type_all_zero (&bigdisp))
10762     i.types[this_operand] = operand_type_and (i.types[this_operand],
10763                                               types);
10764
10765   return ret;
10766 }
10767
10768 /* Return the active addressing mode, taking address override and
10769    registers forming the address into consideration.  Update the
10770    address override prefix if necessary.  */
10771
10772 static enum flag_code
10773 i386_addressing_mode (void)
10774 {
10775   enum flag_code addr_mode;
10776
10777   if (i.prefix[ADDR_PREFIX])
10778     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10779   else if (flag_code == CODE_16BIT
10780            && current_templates->start->cpu_flags.bitfield.cpumpx
10781            /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10782               from md_assemble() by "is not a valid base/index expression"
10783               when there is a base and/or index.  */
10784            && !i.types[this_operand].bitfield.baseindex)
10785     {
10786       /* MPX insn memory operands with neither base nor index must be forced
10787          to use 32-bit addressing in 16-bit mode.  */
10788       addr_mode = CODE_32BIT;
10789       i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10790       ++i.prefixes;
10791       gas_assert (!i.types[this_operand].bitfield.disp16);
10792       gas_assert (!i.types[this_operand].bitfield.disp32);
10793     }
10794   else
10795     {
10796       addr_mode = flag_code;
10797
10798 #if INFER_ADDR_PREFIX
10799       if (i.mem_operands == 0)
10800         {
10801           /* Infer address prefix from the first memory operand.  */
10802           const reg_entry *addr_reg = i.base_reg;
10803
10804           if (addr_reg == NULL)
10805             addr_reg = i.index_reg;
10806
10807           if (addr_reg)
10808             {
10809               if (addr_reg->reg_type.bitfield.dword)
10810                 addr_mode = CODE_32BIT;
10811               else if (flag_code != CODE_64BIT
10812                        && addr_reg->reg_type.bitfield.word)
10813                 addr_mode = CODE_16BIT;
10814
10815               if (addr_mode != flag_code)
10816                 {
10817                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10818                   i.prefixes += 1;
10819                   /* Change the size of any displacement too.  At most one
10820                      of Disp16 or Disp32 is set.
10821                      FIXME.  There doesn't seem to be any real need for
10822                      separate Disp16 and Disp32 flags.  The same goes for
10823                      Imm16 and Imm32.  Removing them would probably clean
10824                      up the code quite a lot.  */
10825                   if (flag_code != CODE_64BIT
10826                       && (i.types[this_operand].bitfield.disp16
10827                           || i.types[this_operand].bitfield.disp32))
10828                     i.types[this_operand]
10829                       = operand_type_xor (i.types[this_operand], disp16_32);
10830                 }
10831             }
10832         }
10833 #endif
10834     }
10835
10836   return addr_mode;
10837 }
10838
10839 /* Make sure the memory operand we've been dealt is valid.
10840    Return 1 on success, 0 on a failure.  */
10841
10842 static int
10843 i386_index_check (const char *operand_string)
10844 {
10845   const char *kind = "base/index";
10846   enum flag_code addr_mode = i386_addressing_mode ();
10847
10848   if (current_templates->start->opcode_modifier.isstring
10849       && !current_templates->start->cpu_flags.bitfield.cpupadlock
10850       && (current_templates->end[-1].opcode_modifier.isstring
10851           || i.mem_operands))
10852     {
10853       /* Memory operands of string insns are special in that they only allow
10854          a single register (rDI, rSI, or rBX) as their memory address.  */
10855       const reg_entry *expected_reg;
10856       static const char *di_si[][2] =
10857         {
10858           { "esi", "edi" },
10859           { "si", "di" },
10860           { "rsi", "rdi" }
10861         };
10862       static const char *bx[] = { "ebx", "bx", "rbx" };
10863
10864       kind = "string address";
10865
10866       if (current_templates->start->opcode_modifier.repprefixok)
10867         {
10868           int es_op = current_templates->end[-1].opcode_modifier.isstring
10869                       - IS_STRING_ES_OP0;
10870           int op = 0;
10871
10872           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10873               || ((!i.mem_operands != !intel_syntax)
10874                   && current_templates->end[-1].operand_types[1]
10875                      .bitfield.baseindex))
10876             op = 1;
10877           expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10878         }
10879       else
10880         expected_reg = hash_find (reg_hash, bx[addr_mode]);
10881
10882       if (i.base_reg != expected_reg
10883           || i.index_reg
10884           || operand_type_check (i.types[this_operand], disp))
10885         {
10886           /* The second memory operand must have the same size as
10887              the first one.  */
10888           if (i.mem_operands
10889               && i.base_reg
10890               && !((addr_mode == CODE_64BIT
10891                     && i.base_reg->reg_type.bitfield.qword)
10892                    || (addr_mode == CODE_32BIT
10893                        ? i.base_reg->reg_type.bitfield.dword
10894                        : i.base_reg->reg_type.bitfield.word)))
10895             goto bad_address;
10896
10897           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10898                    operand_string,
10899                    intel_syntax ? '[' : '(',
10900                    register_prefix,
10901                    expected_reg->reg_name,
10902                    intel_syntax ? ']' : ')');
10903           return 1;
10904         }
10905       else
10906         return 1;
10907
10908     bad_address:
10909       as_bad (_("`%s' is not a valid %s expression"),
10910               operand_string, kind);
10911       return 0;
10912     }
10913   else
10914     {
10915       if (addr_mode != CODE_16BIT)
10916         {
10917           /* 32-bit/64-bit checks.  */
10918           if ((i.base_reg
10919                && ((addr_mode == CODE_64BIT
10920                     ? !i.base_reg->reg_type.bitfield.qword
10921                     : !i.base_reg->reg_type.bitfield.dword)
10922                    || (i.index_reg && i.base_reg->reg_num == RegIP)
10923                    || i.base_reg->reg_num == RegIZ))
10924               || (i.index_reg
10925                   && !i.index_reg->reg_type.bitfield.xmmword
10926                   && !i.index_reg->reg_type.bitfield.ymmword
10927                   && !i.index_reg->reg_type.bitfield.zmmword
10928                   && ((addr_mode == CODE_64BIT
10929                        ? !i.index_reg->reg_type.bitfield.qword
10930                        : !i.index_reg->reg_type.bitfield.dword)
10931                       || !i.index_reg->reg_type.bitfield.baseindex)))
10932             goto bad_address;
10933
10934           /* bndmk, bndldx, and bndstx have special restrictions. */
10935           if (current_templates->start->base_opcode == 0xf30f1b
10936               || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10937             {
10938               /* They cannot use RIP-relative addressing. */
10939               if (i.base_reg && i.base_reg->reg_num == RegIP)
10940                 {
10941                   as_bad (_("`%s' cannot be used here"), operand_string);
10942                   return 0;
10943                 }
10944
10945               /* bndldx and bndstx ignore their scale factor. */
10946               if (current_templates->start->base_opcode != 0xf30f1b
10947                   && i.log2_scale_factor)
10948                 as_warn (_("register scaling is being ignored here"));
10949             }
10950         }
10951       else
10952         {
10953           /* 16-bit checks.  */
10954           if ((i.base_reg
10955                && (!i.base_reg->reg_type.bitfield.word
10956                    || !i.base_reg->reg_type.bitfield.baseindex))
10957               || (i.index_reg
10958                   && (!i.index_reg->reg_type.bitfield.word
10959                       || !i.index_reg->reg_type.bitfield.baseindex
10960                       || !(i.base_reg
10961                            && i.base_reg->reg_num < 6
10962                            && i.index_reg->reg_num >= 6
10963                            && i.log2_scale_factor == 0))))
10964             goto bad_address;
10965         }
10966     }
10967   return 1;
10968 }
10969
10970 /* Handle vector immediates.  */
10971
10972 static int
10973 RC_SAE_immediate (const char *imm_start)
10974 {
10975   unsigned int match_found, j;
10976   const char *pstr = imm_start;
10977   expressionS *exp;
10978
10979   if (*pstr != '{')
10980     return 0;
10981
10982   pstr++;
10983   match_found = 0;
10984   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10985     {
10986       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10987         {
10988           if (!i.rounding)
10989             {
10990               rc_op.type = RC_NamesTable[j].type;
10991               rc_op.operand = this_operand;
10992               i.rounding = &rc_op;
10993             }
10994           else
10995             {
10996               as_bad (_("duplicated `%s'"), imm_start);
10997               return 0;
10998             }
10999           pstr += RC_NamesTable[j].len;
11000           match_found = 1;
11001           break;
11002         }
11003     }
11004   if (!match_found)
11005     return 0;
11006
11007   if (*pstr++ != '}')
11008     {
11009       as_bad (_("Missing '}': '%s'"), imm_start);
11010       return 0;
11011     }
11012   /* RC/SAE immediate string should contain nothing more.  */;
11013   if (*pstr != 0)
11014     {
11015       as_bad (_("Junk after '}': '%s'"), imm_start);
11016       return 0;
11017     }
11018
11019   exp = &im_expressions[i.imm_operands++];
11020   i.op[this_operand].imms = exp;
11021
11022   exp->X_op = O_constant;
11023   exp->X_add_number = 0;
11024   exp->X_add_symbol = (symbolS *) 0;
11025   exp->X_op_symbol = (symbolS *) 0;
11026
11027   i.types[this_operand].bitfield.imm8 = 1;
11028   return 1;
11029 }
11030
11031 /* Only string instructions can have a second memory operand, so
11032    reduce current_templates to just those if it contains any.  */
11033 static int
11034 maybe_adjust_templates (void)
11035 {
11036   const insn_template *t;
11037
11038   gas_assert (i.mem_operands == 1);
11039
11040   for (t = current_templates->start; t < current_templates->end; ++t)
11041     if (t->opcode_modifier.isstring)
11042       break;
11043
11044   if (t < current_templates->end)
11045     {
11046       static templates aux_templates;
11047       bfd_boolean recheck;
11048
11049       aux_templates.start = t;
11050       for (; t < current_templates->end; ++t)
11051         if (!t->opcode_modifier.isstring)
11052           break;
11053       aux_templates.end = t;
11054
11055       /* Determine whether to re-check the first memory operand.  */
11056       recheck = (aux_templates.start != current_templates->start
11057                  || t != current_templates->end);
11058
11059       current_templates = &aux_templates;
11060
11061       if (recheck)
11062         {
11063           i.mem_operands = 0;
11064           if (i.memop1_string != NULL
11065               && i386_index_check (i.memop1_string) == 0)
11066             return 0;
11067           i.mem_operands = 1;
11068         }
11069     }
11070
11071   return 1;
11072 }
11073
11074 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
11075    on error.  */
11076
11077 static int
11078 i386_att_operand (char *operand_string)
11079 {
11080   const reg_entry *r;
11081   char *end_op;
11082   char *op_string = operand_string;
11083
11084   if (is_space_char (*op_string))
11085     ++op_string;
11086
11087   /* We check for an absolute prefix (differentiating,
11088      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
11089   if (*op_string == ABSOLUTE_PREFIX)
11090     {
11091       ++op_string;
11092       if (is_space_char (*op_string))
11093         ++op_string;
11094       i.jumpabsolute = TRUE;
11095     }
11096
11097   /* Check if operand is a register.  */
11098   if ((r = parse_register (op_string, &end_op)) != NULL)
11099     {
11100       i386_operand_type temp;
11101
11102       if (r == &bad_reg)
11103         return 0;
11104
11105       /* Check for a segment override by searching for ':' after a
11106          segment register.  */
11107       op_string = end_op;
11108       if (is_space_char (*op_string))
11109         ++op_string;
11110       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11111         {
11112           switch (r->reg_num)
11113             {
11114             case 0:
11115               i.seg[i.mem_operands] = &es;
11116               break;
11117             case 1:
11118               i.seg[i.mem_operands] = &cs;
11119               break;
11120             case 2:
11121               i.seg[i.mem_operands] = &ss;
11122               break;
11123             case 3:
11124               i.seg[i.mem_operands] = &ds;
11125               break;
11126             case 4:
11127               i.seg[i.mem_operands] = &fs;
11128               break;
11129             case 5:
11130               i.seg[i.mem_operands] = &gs;
11131               break;
11132             }
11133
11134           /* Skip the ':' and whitespace.  */
11135           ++op_string;
11136           if (is_space_char (*op_string))
11137             ++op_string;
11138
11139           if (!is_digit_char (*op_string)
11140               && !is_identifier_char (*op_string)
11141               && *op_string != '('
11142               && *op_string != ABSOLUTE_PREFIX)
11143             {
11144               as_bad (_("bad memory operand `%s'"), op_string);
11145               return 0;
11146             }
11147           /* Handle case of %es:*foo.  */
11148           if (*op_string == ABSOLUTE_PREFIX)
11149             {
11150               ++op_string;
11151               if (is_space_char (*op_string))
11152                 ++op_string;
11153               i.jumpabsolute = TRUE;
11154             }
11155           goto do_memory_reference;
11156         }
11157
11158       /* Handle vector operations.  */
11159       if (*op_string == '{')
11160         {
11161           op_string = check_VecOperations (op_string, NULL);
11162           if (op_string == NULL)
11163             return 0;
11164         }
11165
11166       if (*op_string)
11167         {
11168           as_bad (_("junk `%s' after register"), op_string);
11169           return 0;
11170         }
11171       temp = r->reg_type;
11172       temp.bitfield.baseindex = 0;
11173       i.types[this_operand] = operand_type_or (i.types[this_operand],
11174                                                temp);
11175       i.types[this_operand].bitfield.unspecified = 0;
11176       i.op[this_operand].regs = r;
11177       i.reg_operands++;
11178     }
11179   else if (*op_string == REGISTER_PREFIX)
11180     {
11181       as_bad (_("bad register name `%s'"), op_string);
11182       return 0;
11183     }
11184   else if (*op_string == IMMEDIATE_PREFIX)
11185     {
11186       ++op_string;
11187       if (i.jumpabsolute)
11188         {
11189           as_bad (_("immediate operand illegal with absolute jump"));
11190           return 0;
11191         }
11192       if (!i386_immediate (op_string))
11193         return 0;
11194     }
11195   else if (RC_SAE_immediate (operand_string))
11196     {
11197       /* If it is a RC or SAE immediate, do nothing.  */
11198       ;
11199     }
11200   else if (is_digit_char (*op_string)
11201            || is_identifier_char (*op_string)
11202            || *op_string == '"'
11203            || *op_string == '(')
11204     {
11205       /* This is a memory reference of some sort.  */
11206       char *base_string;
11207
11208       /* Start and end of displacement string expression (if found).  */
11209       char *displacement_string_start;
11210       char *displacement_string_end;
11211       char *vop_start;
11212
11213     do_memory_reference:
11214       if (i.mem_operands == 1 && !maybe_adjust_templates ())
11215         return 0;
11216       if ((i.mem_operands == 1
11217            && !current_templates->start->opcode_modifier.isstring)
11218           || i.mem_operands == 2)
11219         {
11220           as_bad (_("too many memory references for `%s'"),
11221                   current_templates->start->name);
11222           return 0;
11223         }
11224
11225       /* Check for base index form.  We detect the base index form by
11226          looking for an ')' at the end of the operand, searching
11227          for the '(' matching it, and finding a REGISTER_PREFIX or ','
11228          after the '('.  */
11229       base_string = op_string + strlen (op_string);
11230
11231       /* Handle vector operations.  */
11232       vop_start = strchr (op_string, '{');
11233       if (vop_start && vop_start < base_string)
11234         {
11235           if (check_VecOperations (vop_start, base_string) == NULL)
11236             return 0;
11237           base_string = vop_start;
11238         }
11239
11240       --base_string;
11241       if (is_space_char (*base_string))
11242         --base_string;
11243
11244       /* If we only have a displacement, set-up for it to be parsed later.  */
11245       displacement_string_start = op_string;
11246       displacement_string_end = base_string + 1;
11247
11248       if (*base_string == ')')
11249         {
11250           char *temp_string;
11251           unsigned int parens_balanced = 1;
11252           /* We've already checked that the number of left & right ()'s are
11253              equal, so this loop will not be infinite.  */
11254           do
11255             {
11256               base_string--;
11257               if (*base_string == ')')
11258                 parens_balanced++;
11259               if (*base_string == '(')
11260                 parens_balanced--;
11261             }
11262           while (parens_balanced);
11263
11264           temp_string = base_string;
11265
11266           /* Skip past '(' and whitespace.  */
11267           ++base_string;
11268           if (is_space_char (*base_string))
11269             ++base_string;
11270
11271           if (*base_string == ','
11272               || ((i.base_reg = parse_register (base_string, &end_op))
11273                   != NULL))
11274             {
11275               displacement_string_end = temp_string;
11276
11277               i.types[this_operand].bitfield.baseindex = 1;
11278
11279               if (i.base_reg)
11280                 {
11281                   if (i.base_reg == &bad_reg)
11282                     return 0;
11283                   base_string = end_op;
11284                   if (is_space_char (*base_string))
11285                     ++base_string;
11286                 }
11287
11288               /* There may be an index reg or scale factor here.  */
11289               if (*base_string == ',')
11290                 {
11291                   ++base_string;
11292                   if (is_space_char (*base_string))
11293                     ++base_string;
11294
11295                   if ((i.index_reg = parse_register (base_string, &end_op))
11296                       != NULL)
11297                     {
11298                       if (i.index_reg == &bad_reg)
11299                         return 0;
11300                       base_string = end_op;
11301                       if (is_space_char (*base_string))
11302                         ++base_string;
11303                       if (*base_string == ',')
11304                         {
11305                           ++base_string;
11306                           if (is_space_char (*base_string))
11307                             ++base_string;
11308                         }
11309                       else if (*base_string != ')')
11310                         {
11311                           as_bad (_("expecting `,' or `)' "
11312                                     "after index register in `%s'"),
11313                                   operand_string);
11314                           return 0;
11315                         }
11316                     }
11317                   else if (*base_string == REGISTER_PREFIX)
11318                     {
11319                       end_op = strchr (base_string, ',');
11320                       if (end_op)
11321                         *end_op = '\0';
11322                       as_bad (_("bad register name `%s'"), base_string);
11323                       return 0;
11324                     }
11325
11326                   /* Check for scale factor.  */
11327                   if (*base_string != ')')
11328                     {
11329                       char *end_scale = i386_scale (base_string);
11330
11331                       if (!end_scale)
11332                         return 0;
11333
11334                       base_string = end_scale;
11335                       if (is_space_char (*base_string))
11336                         ++base_string;
11337                       if (*base_string != ')')
11338                         {
11339                           as_bad (_("expecting `)' "
11340                                     "after scale factor in `%s'"),
11341                                   operand_string);
11342                           return 0;
11343                         }
11344                     }
11345                   else if (!i.index_reg)
11346                     {
11347                       as_bad (_("expecting index register or scale factor "
11348                                 "after `,'; got '%c'"),
11349                               *base_string);
11350                       return 0;
11351                     }
11352                 }
11353               else if (*base_string != ')')
11354                 {
11355                   as_bad (_("expecting `,' or `)' "
11356                             "after base register in `%s'"),
11357                           operand_string);
11358                   return 0;
11359                 }
11360             }
11361           else if (*base_string == REGISTER_PREFIX)
11362             {
11363               end_op = strchr (base_string, ',');
11364               if (end_op)
11365                 *end_op = '\0';
11366               as_bad (_("bad register name `%s'"), base_string);
11367               return 0;
11368             }
11369         }
11370
11371       /* If there's an expression beginning the operand, parse it,
11372          assuming displacement_string_start and
11373          displacement_string_end are meaningful.  */
11374       if (displacement_string_start != displacement_string_end)
11375         {
11376           if (!i386_displacement (displacement_string_start,
11377                                   displacement_string_end))
11378             return 0;
11379         }
11380
11381       /* Special case for (%dx) while doing input/output op.  */
11382       if (i.base_reg
11383           && i.base_reg->reg_type.bitfield.instance == RegD
11384           && i.base_reg->reg_type.bitfield.word
11385           && i.index_reg == 0
11386           && i.log2_scale_factor == 0
11387           && i.seg[i.mem_operands] == 0
11388           && !operand_type_check (i.types[this_operand], disp))
11389         {
11390           i.types[this_operand] = i.base_reg->reg_type;
11391           return 1;
11392         }
11393
11394       if (i386_index_check (operand_string) == 0)
11395         return 0;
11396       i.flags[this_operand] |= Operand_Mem;
11397       if (i.mem_operands == 0)
11398         i.memop1_string = xstrdup (operand_string);
11399       i.mem_operands++;
11400     }
11401   else
11402     {
11403       /* It's not a memory operand; argh!  */
11404       as_bad (_("invalid char %s beginning operand %d `%s'"),
11405               output_invalid (*op_string),
11406               this_operand + 1,
11407               op_string);
11408       return 0;
11409     }
11410   return 1;                     /* Normal return.  */
11411 }
11412 \f
11413 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11414    that an rs_machine_dependent frag may reach.  */
11415
11416 unsigned int
11417 i386_frag_max_var (fragS *frag)
11418 {
11419   /* The only relaxable frags are for jumps.
11420      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
11421   gas_assert (frag->fr_type == rs_machine_dependent);
11422   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11423 }
11424
11425 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11426 static int
11427 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11428 {
11429   /* STT_GNU_IFUNC symbol must go through PLT.  */
11430   if ((symbol_get_bfdsym (fr_symbol)->flags
11431        & BSF_GNU_INDIRECT_FUNCTION) != 0)
11432     return 0;
11433
11434   if (!S_IS_EXTERNAL (fr_symbol))
11435     /* Symbol may be weak or local.  */
11436     return !S_IS_WEAK (fr_symbol);
11437
11438   /* Global symbols with non-default visibility can't be preempted. */
11439   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11440     return 1;
11441
11442   if (fr_var != NO_RELOC)
11443     switch ((enum bfd_reloc_code_real) fr_var)
11444       {
11445       case BFD_RELOC_386_PLT32:
11446       case BFD_RELOC_X86_64_PLT32:
11447         /* Symbol with PLT relocation may be preempted. */
11448         return 0;
11449       default:
11450         abort ();
11451       }
11452
11453   /* Global symbols with default visibility in a shared library may be
11454      preempted by another definition.  */
11455   return !shared;
11456 }
11457 #endif
11458
11459 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11460    Note also work for Skylake and Cascadelake.
11461 ---------------------------------------------------------------------
11462 |   JCC   | ADD/SUB/CMP | INC/DEC | TEST/AND |
11463 | ------  | ----------- | ------- | -------- |
11464 |   Jo    |      N      |    N    |     Y    |
11465 |   Jno   |      N      |    N    |     Y    |
11466 |  Jc/Jb  |      Y      |    N    |     Y    |
11467 | Jae/Jnb |      Y      |    N    |     Y    |
11468 |  Je/Jz  |      Y      |    Y    |     Y    |
11469 | Jne/Jnz |      Y      |    Y    |     Y    |
11470 | Jna/Jbe |      Y      |    N    |     Y    |
11471 | Ja/Jnbe |      Y      |    N    |     Y    |
11472 |   Js    |      N      |    N    |     Y    |
11473 |   Jns   |      N      |    N    |     Y    |
11474 |  Jp/Jpe |      N      |    N    |     Y    |
11475 | Jnp/Jpo |      N      |    N    |     Y    |
11476 | Jl/Jnge |      Y      |    Y    |     Y    |
11477 | Jge/Jnl |      Y      |    Y    |     Y    |
11478 | Jle/Jng |      Y      |    Y    |     Y    |
11479 | Jg/Jnle |      Y      |    Y    |     Y    |
11480 ---------------------------------------------------------------------  */
11481 static int
11482 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11483 {
11484   if (mf_cmp == mf_cmp_alu_cmp)
11485     return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11486             || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11487   if (mf_cmp == mf_cmp_incdec)
11488     return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11489             || mf_jcc == mf_jcc_jle);
11490   if (mf_cmp == mf_cmp_test_and)
11491     return 1;
11492   return 0;
11493 }
11494
11495 /* Return the next non-empty frag.  */
11496
11497 static fragS *
11498 i386_next_non_empty_frag (fragS *fragP)
11499 {
11500   /* There may be a frag with a ".fill 0" when there is no room in
11501      the current frag for frag_grow in output_insn.  */
11502   for (fragP = fragP->fr_next;
11503        (fragP != NULL
11504         && fragP->fr_type == rs_fill
11505         && fragP->fr_fix == 0);
11506        fragP = fragP->fr_next)
11507     ;
11508   return fragP;
11509 }
11510
11511 /* Return the next jcc frag after BRANCH_PADDING.  */
11512
11513 static fragS *
11514 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11515 {
11516   fragS *branch_fragP;
11517   if (!pad_fragP)
11518     return NULL;
11519
11520   if (pad_fragP->fr_type == rs_machine_dependent
11521       && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11522           == BRANCH_PADDING))
11523     {
11524       branch_fragP = i386_next_non_empty_frag (pad_fragP);
11525       if (branch_fragP->fr_type != rs_machine_dependent)
11526         return NULL;
11527       if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11528           && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11529                                    pad_fragP->tc_frag_data.mf_type))
11530         return branch_fragP;
11531     }
11532
11533   return NULL;
11534 }
11535
11536 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
11537
11538 static void
11539 i386_classify_machine_dependent_frag (fragS *fragP)
11540 {
11541   fragS *cmp_fragP;
11542   fragS *pad_fragP;
11543   fragS *branch_fragP;
11544   fragS *next_fragP;
11545   unsigned int max_prefix_length;
11546
11547   if (fragP->tc_frag_data.classified)
11548     return;
11549
11550   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
11551      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
11552   for (next_fragP = fragP;
11553        next_fragP != NULL;
11554        next_fragP = next_fragP->fr_next)
11555     {
11556       next_fragP->tc_frag_data.classified = 1;
11557       if (next_fragP->fr_type == rs_machine_dependent)
11558         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11559           {
11560           case BRANCH_PADDING:
11561             /* The BRANCH_PADDING frag must be followed by a branch
11562                frag.  */
11563             branch_fragP = i386_next_non_empty_frag (next_fragP);
11564             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11565             break;
11566           case FUSED_JCC_PADDING:
11567             /* Check if this is a fused jcc:
11568                FUSED_JCC_PADDING
11569                CMP like instruction
11570                BRANCH_PADDING
11571                COND_JUMP
11572                */
11573             cmp_fragP = i386_next_non_empty_frag (next_fragP);
11574             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11575             branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11576             if (branch_fragP)
11577               {
11578                 /* The BRANCH_PADDING frag is merged with the
11579                    FUSED_JCC_PADDING frag.  */
11580                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11581                 /* CMP like instruction size.  */
11582                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11583                 frag_wane (pad_fragP);
11584                 /* Skip to branch_fragP.  */
11585                 next_fragP = branch_fragP;
11586               }
11587             else if (next_fragP->tc_frag_data.max_prefix_length)
11588               {
11589                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11590                    a fused jcc.  */
11591                 next_fragP->fr_subtype
11592                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11593                 next_fragP->tc_frag_data.max_bytes
11594                   = next_fragP->tc_frag_data.max_prefix_length;
11595                 /* This will be updated in the BRANCH_PREFIX scan.  */
11596                 next_fragP->tc_frag_data.max_prefix_length = 0;
11597               }
11598             else
11599               frag_wane (next_fragP);
11600             break;
11601           }
11602     }
11603
11604   /* Stop if there is no BRANCH_PREFIX.  */
11605   if (!align_branch_prefix_size)
11606     return;
11607
11608   /* Scan for BRANCH_PREFIX.  */
11609   for (; fragP != NULL; fragP = fragP->fr_next)
11610     {
11611       if (fragP->fr_type != rs_machine_dependent
11612           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11613               != BRANCH_PREFIX))
11614         continue;
11615
11616       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11617          COND_JUMP_PREFIX.  */
11618       max_prefix_length = 0;
11619       for (next_fragP = fragP;
11620            next_fragP != NULL;
11621            next_fragP = next_fragP->fr_next)
11622         {
11623           if (next_fragP->fr_type == rs_fill)
11624             /* Skip rs_fill frags.  */
11625             continue;
11626           else if (next_fragP->fr_type != rs_machine_dependent)
11627             /* Stop for all other frags.  */
11628             break;
11629
11630           /* rs_machine_dependent frags.  */
11631           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11632               == BRANCH_PREFIX)
11633             {
11634               /* Count BRANCH_PREFIX frags.  */
11635               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11636                 {
11637                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11638                   frag_wane (next_fragP);
11639                 }
11640               else
11641                 max_prefix_length
11642                   += next_fragP->tc_frag_data.max_bytes;
11643             }
11644           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11645                     == BRANCH_PADDING)
11646                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11647                        == FUSED_JCC_PADDING))
11648             {
11649               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11650               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11651               break;
11652             }
11653           else
11654             /* Stop for other rs_machine_dependent frags.  */
11655             break;
11656         }
11657
11658       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11659
11660       /* Skip to the next frag.  */
11661       fragP = next_fragP;
11662     }
11663 }
11664
11665 /* Compute padding size for
11666
11667         FUSED_JCC_PADDING
11668         CMP like instruction
11669         BRANCH_PADDING
11670         COND_JUMP/UNCOND_JUMP
11671
11672    or
11673
11674         BRANCH_PADDING
11675         COND_JUMP/UNCOND_JUMP
11676  */
11677
11678 static int
11679 i386_branch_padding_size (fragS *fragP, offsetT address)
11680 {
11681   unsigned int offset, size, padding_size;
11682   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11683
11684   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11685   if (!address)
11686     address = fragP->fr_address;
11687   address += fragP->fr_fix;
11688
11689   /* CMP like instrunction size.  */
11690   size = fragP->tc_frag_data.cmp_size;
11691
11692   /* The base size of the branch frag.  */
11693   size += branch_fragP->fr_fix;
11694
11695   /* Add opcode and displacement bytes for the rs_machine_dependent
11696      branch frag.  */
11697   if (branch_fragP->fr_type == rs_machine_dependent)
11698     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11699
11700   /* Check if branch is within boundary and doesn't end at the last
11701      byte.  */
11702   offset = address & ((1U << align_branch_power) - 1);
11703   if ((offset + size) >= (1U << align_branch_power))
11704     /* Padding needed to avoid crossing boundary.  */
11705     padding_size = (1U << align_branch_power) - offset;
11706   else
11707     /* No padding needed.  */
11708     padding_size = 0;
11709
11710   /* The return value may be saved in tc_frag_data.length which is
11711      unsigned byte.  */
11712   if (!fits_in_unsigned_byte (padding_size))
11713     abort ();
11714
11715   return padding_size;
11716 }
11717
11718 /* i386_generic_table_relax_frag()
11719
11720    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11721    grow/shrink padding to align branch frags.  Hand others to
11722    relax_frag().  */
11723
11724 long
11725 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11726 {
11727   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11728       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11729     {
11730       long padding_size = i386_branch_padding_size (fragP, 0);
11731       long grow = padding_size - fragP->tc_frag_data.length;
11732
11733       /* When the BRANCH_PREFIX frag is used, the computed address
11734          must match the actual address and there should be no padding.  */
11735       if (fragP->tc_frag_data.padding_address
11736           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11737               || padding_size))
11738         abort ();
11739
11740       /* Update the padding size.  */
11741       if (grow)
11742         fragP->tc_frag_data.length = padding_size;
11743
11744       return grow;
11745     }
11746   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11747     {
11748       fragS *padding_fragP, *next_fragP;
11749       long padding_size, left_size, last_size;
11750
11751       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11752       if (!padding_fragP)
11753         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11754         return (fragP->tc_frag_data.length
11755                 - fragP->tc_frag_data.last_length);
11756
11757       /* Compute the relative address of the padding frag in the very
11758         first time where the BRANCH_PREFIX frag sizes are zero.  */
11759       if (!fragP->tc_frag_data.padding_address)
11760         fragP->tc_frag_data.padding_address
11761           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11762
11763       /* First update the last length from the previous interation.  */
11764       left_size = fragP->tc_frag_data.prefix_length;
11765       for (next_fragP = fragP;
11766            next_fragP != padding_fragP;
11767            next_fragP = next_fragP->fr_next)
11768         if (next_fragP->fr_type == rs_machine_dependent
11769             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11770                 == BRANCH_PREFIX))
11771           {
11772             if (left_size)
11773               {
11774                 int max = next_fragP->tc_frag_data.max_bytes;
11775                 if (max)
11776                   {
11777                     int size;
11778                     if (max > left_size)
11779                       size = left_size;
11780                     else
11781                       size = max;
11782                     left_size -= size;
11783                     next_fragP->tc_frag_data.last_length = size;
11784                   }
11785               }
11786             else
11787               next_fragP->tc_frag_data.last_length = 0;
11788           }
11789
11790       /* Check the padding size for the padding frag.  */
11791       padding_size = i386_branch_padding_size
11792         (padding_fragP, (fragP->fr_address
11793                          + fragP->tc_frag_data.padding_address));
11794
11795       last_size = fragP->tc_frag_data.prefix_length;
11796       /* Check if there is change from the last interation.  */
11797       if (padding_size == last_size)
11798         {
11799           /* Update the expected address of the padding frag.  */
11800           padding_fragP->tc_frag_data.padding_address
11801             = (fragP->fr_address + padding_size
11802                + fragP->tc_frag_data.padding_address);
11803           return 0;
11804         }
11805
11806       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11807         {
11808           /* No padding if there is no sufficient room.  Clear the
11809              expected address of the padding frag.  */
11810           padding_fragP->tc_frag_data.padding_address = 0;
11811           padding_size = 0;
11812         }
11813       else
11814         /* Store the expected address of the padding frag.  */
11815         padding_fragP->tc_frag_data.padding_address
11816           = (fragP->fr_address + padding_size
11817              + fragP->tc_frag_data.padding_address);
11818
11819       fragP->tc_frag_data.prefix_length = padding_size;
11820
11821       /* Update the length for the current interation.  */
11822       left_size = padding_size;
11823       for (next_fragP = fragP;
11824            next_fragP != padding_fragP;
11825            next_fragP = next_fragP->fr_next)
11826         if (next_fragP->fr_type == rs_machine_dependent
11827             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11828                 == BRANCH_PREFIX))
11829           {
11830             if (left_size)
11831               {
11832                 int max = next_fragP->tc_frag_data.max_bytes;
11833                 if (max)
11834                   {
11835                     int size;
11836                     if (max > left_size)
11837                       size = left_size;
11838                     else
11839                       size = max;
11840                     left_size -= size;
11841                     next_fragP->tc_frag_data.length = size;
11842                   }
11843               }
11844             else
11845               next_fragP->tc_frag_data.length = 0;
11846           }
11847
11848       return (fragP->tc_frag_data.length
11849               - fragP->tc_frag_data.last_length);
11850     }
11851   return relax_frag (segment, fragP, stretch);
11852 }
11853
11854 /* md_estimate_size_before_relax()
11855
11856    Called just before relax() for rs_machine_dependent frags.  The x86
11857    assembler uses these frags to handle variable size jump
11858    instructions.
11859
11860    Any symbol that is now undefined will not become defined.
11861    Return the correct fr_subtype in the frag.
11862    Return the initial "guess for variable size of frag" to caller.
11863    The guess is actually the growth beyond the fixed part.  Whatever
11864    we do to grow the fixed or variable part contributes to our
11865    returned value.  */
11866
11867 int
11868 md_estimate_size_before_relax (fragS *fragP, segT segment)
11869 {
11870   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11871       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11872       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11873     {
11874       i386_classify_machine_dependent_frag (fragP);
11875       return fragP->tc_frag_data.length;
11876     }
11877
11878   /* We've already got fragP->fr_subtype right;  all we have to do is
11879      check for un-relaxable symbols.  On an ELF system, we can't relax
11880      an externally visible symbol, because it may be overridden by a
11881      shared library.  */
11882   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11883 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11884       || (IS_ELF
11885           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11886                                                 fragP->fr_var))
11887 #endif
11888 #if defined (OBJ_COFF) && defined (TE_PE)
11889       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11890           && S_IS_WEAK (fragP->fr_symbol))
11891 #endif
11892       )
11893     {
11894       /* Symbol is undefined in this segment, or we need to keep a
11895          reloc so that weak symbols can be overridden.  */
11896       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11897       enum bfd_reloc_code_real reloc_type;
11898       unsigned char *opcode;
11899       int old_fr_fix;
11900
11901       if (fragP->fr_var != NO_RELOC)
11902         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11903       else if (size == 2)
11904         reloc_type = BFD_RELOC_16_PCREL;
11905 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11906       else if (need_plt32_p (fragP->fr_symbol))
11907         reloc_type = BFD_RELOC_X86_64_PLT32;
11908 #endif
11909       else
11910         reloc_type = BFD_RELOC_32_PCREL;
11911
11912       old_fr_fix = fragP->fr_fix;
11913       opcode = (unsigned char *) fragP->fr_opcode;
11914
11915       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11916         {
11917         case UNCOND_JUMP:
11918           /* Make jmp (0xeb) a (d)word displacement jump.  */
11919           opcode[0] = 0xe9;
11920           fragP->fr_fix += size;
11921           fix_new (fragP, old_fr_fix, size,
11922                    fragP->fr_symbol,
11923                    fragP->fr_offset, 1,
11924                    reloc_type);
11925           break;
11926
11927         case COND_JUMP86:
11928           if (size == 2
11929               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11930             {
11931               /* Negate the condition, and branch past an
11932                  unconditional jump.  */
11933               opcode[0] ^= 1;
11934               opcode[1] = 3;
11935               /* Insert an unconditional jump.  */
11936               opcode[2] = 0xe9;
11937               /* We added two extra opcode bytes, and have a two byte
11938                  offset.  */
11939               fragP->fr_fix += 2 + 2;
11940               fix_new (fragP, old_fr_fix + 2, 2,
11941                        fragP->fr_symbol,
11942                        fragP->fr_offset, 1,
11943                        reloc_type);
11944               break;
11945             }
11946           /* Fall through.  */
11947
11948         case COND_JUMP:
11949           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11950             {
11951               fixS *fixP;
11952
11953               fragP->fr_fix += 1;
11954               fixP = fix_new (fragP, old_fr_fix, 1,
11955                               fragP->fr_symbol,
11956                               fragP->fr_offset, 1,
11957                               BFD_RELOC_8_PCREL);
11958               fixP->fx_signed = 1;
11959               break;
11960             }
11961
11962           /* This changes the byte-displacement jump 0x7N
11963              to the (d)word-displacement jump 0x0f,0x8N.  */
11964           opcode[1] = opcode[0] + 0x10;
11965           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11966           /* We've added an opcode byte.  */
11967           fragP->fr_fix += 1 + size;
11968           fix_new (fragP, old_fr_fix + 1, size,
11969                    fragP->fr_symbol,
11970                    fragP->fr_offset, 1,
11971                    reloc_type);
11972           break;
11973
11974         default:
11975           BAD_CASE (fragP->fr_subtype);
11976           break;
11977         }
11978       frag_wane (fragP);
11979       return fragP->fr_fix - old_fr_fix;
11980     }
11981
11982   /* Guess size depending on current relax state.  Initially the relax
11983      state will correspond to a short jump and we return 1, because
11984      the variable part of the frag (the branch offset) is one byte
11985      long.  However, we can relax a section more than once and in that
11986      case we must either set fr_subtype back to the unrelaxed state,
11987      or return the value for the appropriate branch.  */
11988   return md_relax_table[fragP->fr_subtype].rlx_length;
11989 }
11990
11991 /* Called after relax() is finished.
11992
11993    In:  Address of frag.
11994         fr_type == rs_machine_dependent.
11995         fr_subtype is what the address relaxed to.
11996
11997    Out: Any fixSs and constants are set up.
11998         Caller will turn frag into a ".space 0".  */
11999
12000 void
12001 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12002                  fragS *fragP)
12003 {
12004   unsigned char *opcode;
12005   unsigned char *where_to_put_displacement = NULL;
12006   offsetT target_address;
12007   offsetT opcode_address;
12008   unsigned int extension = 0;
12009   offsetT displacement_from_opcode_start;
12010
12011   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12012       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12013       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12014     {
12015       /* Generate nop padding.  */
12016       unsigned int size = fragP->tc_frag_data.length;
12017       if (size)
12018         {
12019           if (size > fragP->tc_frag_data.max_bytes)
12020             abort ();
12021
12022           if (flag_debug)
12023             {
12024               const char *msg;
12025               const char *branch = "branch";
12026               const char *prefix = "";
12027               fragS *padding_fragP;
12028               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12029                   == BRANCH_PREFIX)
12030                 {
12031                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12032                   switch (fragP->tc_frag_data.default_prefix)
12033                     {
12034                     default:
12035                       abort ();
12036                       break;
12037                     case CS_PREFIX_OPCODE:
12038                       prefix = " cs";
12039                       break;
12040                     case DS_PREFIX_OPCODE:
12041                       prefix = " ds";
12042                       break;
12043                     case ES_PREFIX_OPCODE:
12044                       prefix = " es";
12045                       break;
12046                     case FS_PREFIX_OPCODE:
12047                       prefix = " fs";
12048                       break;
12049                     case GS_PREFIX_OPCODE:
12050                       prefix = " gs";
12051                       break;
12052                     case SS_PREFIX_OPCODE:
12053                       prefix = " ss";
12054                       break;
12055                     }
12056                   if (padding_fragP)
12057                     msg = _("%s:%u: add %d%s at 0x%llx to align "
12058                             "%s within %d-byte boundary\n");
12059                   else
12060                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
12061                             "align %s within %d-byte boundary\n");
12062                 }
12063               else
12064                 {
12065                   padding_fragP = fragP;
12066                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12067                           "%s within %d-byte boundary\n");
12068                 }
12069
12070               if (padding_fragP)
12071                 switch (padding_fragP->tc_frag_data.branch_type)
12072                   {
12073                   case align_branch_jcc:
12074                     branch = "jcc";
12075                     break;
12076                   case align_branch_fused:
12077                     branch = "fused jcc";
12078                     break;
12079                   case align_branch_jmp:
12080                     branch = "jmp";
12081                     break;
12082                   case align_branch_call:
12083                     branch = "call";
12084                     break;
12085                   case align_branch_indirect:
12086                     branch = "indiret branch";
12087                     break;
12088                   case align_branch_ret:
12089                     branch = "ret";
12090                     break;
12091                   default:
12092                     break;
12093                   }
12094
12095               fprintf (stdout, msg,
12096                        fragP->fr_file, fragP->fr_line, size, prefix,
12097                        (long long) fragP->fr_address, branch,
12098                        1 << align_branch_power);
12099             }
12100           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12101             memset (fragP->fr_opcode,
12102                     fragP->tc_frag_data.default_prefix, size);
12103           else
12104             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12105                                 size, 0);
12106           fragP->fr_fix += size;
12107         }
12108       return;
12109     }
12110
12111   opcode = (unsigned char *) fragP->fr_opcode;
12112
12113   /* Address we want to reach in file space.  */
12114   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12115
12116   /* Address opcode resides at in file space.  */
12117   opcode_address = fragP->fr_address + fragP->fr_fix;
12118
12119   /* Displacement from opcode start to fill into instruction.  */
12120   displacement_from_opcode_start = target_address - opcode_address;
12121
12122   if ((fragP->fr_subtype & BIG) == 0)
12123     {
12124       /* Don't have to change opcode.  */
12125       extension = 1;            /* 1 opcode + 1 displacement  */
12126       where_to_put_displacement = &opcode[1];
12127     }
12128   else
12129     {
12130       if (no_cond_jump_promotion
12131           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12132         as_warn_where (fragP->fr_file, fragP->fr_line,
12133                        _("long jump required"));
12134
12135       switch (fragP->fr_subtype)
12136         {
12137         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12138           extension = 4;                /* 1 opcode + 4 displacement  */
12139           opcode[0] = 0xe9;
12140           where_to_put_displacement = &opcode[1];
12141           break;
12142
12143         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12144           extension = 2;                /* 1 opcode + 2 displacement  */
12145           opcode[0] = 0xe9;
12146           where_to_put_displacement = &opcode[1];
12147           break;
12148
12149         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12150         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12151           extension = 5;                /* 2 opcode + 4 displacement  */
12152           opcode[1] = opcode[0] + 0x10;
12153           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12154           where_to_put_displacement = &opcode[2];
12155           break;
12156
12157         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12158           extension = 3;                /* 2 opcode + 2 displacement  */
12159           opcode[1] = opcode[0] + 0x10;
12160           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12161           where_to_put_displacement = &opcode[2];
12162           break;
12163
12164         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12165           extension = 4;
12166           opcode[0] ^= 1;
12167           opcode[1] = 3;
12168           opcode[2] = 0xe9;
12169           where_to_put_displacement = &opcode[3];
12170           break;
12171
12172         default:
12173           BAD_CASE (fragP->fr_subtype);
12174           break;
12175         }
12176     }
12177
12178   /* If size if less then four we are sure that the operand fits,
12179      but if it's 4, then it could be that the displacement is larger
12180      then -/+ 2GB.  */
12181   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12182       && object_64bit
12183       && ((addressT) (displacement_from_opcode_start - extension
12184                       + ((addressT) 1 << 31))
12185           > (((addressT) 2 << 31) - 1)))
12186     {
12187       as_bad_where (fragP->fr_file, fragP->fr_line,
12188                     _("jump target out of range"));
12189       /* Make us emit 0.  */
12190       displacement_from_opcode_start = extension;
12191     }
12192   /* Now put displacement after opcode.  */
12193   md_number_to_chars ((char *) where_to_put_displacement,
12194                       (valueT) (displacement_from_opcode_start - extension),
12195                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12196   fragP->fr_fix += extension;
12197 }
12198 \f
12199 /* Apply a fixup (fixP) to segment data, once it has been determined
12200    by our caller that we have all the info we need to fix it up.
12201
12202    Parameter valP is the pointer to the value of the bits.
12203
12204    On the 386, immediates, displacements, and data pointers are all in
12205    the same (little-endian) format, so we don't need to care about which
12206    we are handling.  */
12207
12208 void
12209 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12210 {
12211   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12212   valueT value = *valP;
12213
12214 #if !defined (TE_Mach)
12215   if (fixP->fx_pcrel)
12216     {
12217       switch (fixP->fx_r_type)
12218         {
12219         default:
12220           break;
12221
12222         case BFD_RELOC_64:
12223           fixP->fx_r_type = BFD_RELOC_64_PCREL;
12224           break;
12225         case BFD_RELOC_32:
12226         case BFD_RELOC_X86_64_32S:
12227           fixP->fx_r_type = BFD_RELOC_32_PCREL;
12228           break;
12229         case BFD_RELOC_16:
12230           fixP->fx_r_type = BFD_RELOC_16_PCREL;
12231           break;
12232         case BFD_RELOC_8:
12233           fixP->fx_r_type = BFD_RELOC_8_PCREL;
12234           break;
12235         }
12236     }
12237
12238   if (fixP->fx_addsy != NULL
12239       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12240           || fixP->fx_r_type == BFD_RELOC_64_PCREL
12241           || fixP->fx_r_type == BFD_RELOC_16_PCREL
12242           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12243       && !use_rela_relocations)
12244     {
12245       /* This is a hack.  There should be a better way to handle this.
12246          This covers for the fact that bfd_install_relocation will
12247          subtract the current location (for partial_inplace, PC relative
12248          relocations); see more below.  */
12249 #ifndef OBJ_AOUT
12250       if (IS_ELF
12251 #ifdef TE_PE
12252           || OUTPUT_FLAVOR == bfd_target_coff_flavour
12253 #endif
12254           )
12255         value += fixP->fx_where + fixP->fx_frag->fr_address;
12256 #endif
12257 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12258       if (IS_ELF)
12259         {
12260           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12261
12262           if ((sym_seg == seg
12263                || (symbol_section_p (fixP->fx_addsy)
12264                    && sym_seg != absolute_section))
12265               && !generic_force_reloc (fixP))
12266             {
12267               /* Yes, we add the values in twice.  This is because
12268                  bfd_install_relocation subtracts them out again.  I think
12269                  bfd_install_relocation is broken, but I don't dare change
12270                  it.  FIXME.  */
12271               value += fixP->fx_where + fixP->fx_frag->fr_address;
12272             }
12273         }
12274 #endif
12275 #if defined (OBJ_COFF) && defined (TE_PE)
12276       /* For some reason, the PE format does not store a
12277          section address offset for a PC relative symbol.  */
12278       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12279           || S_IS_WEAK (fixP->fx_addsy))
12280         value += md_pcrel_from (fixP);
12281 #endif
12282     }
12283 #if defined (OBJ_COFF) && defined (TE_PE)
12284   if (fixP->fx_addsy != NULL
12285       && S_IS_WEAK (fixP->fx_addsy)
12286       /* PR 16858: Do not modify weak function references.  */
12287       && ! fixP->fx_pcrel)
12288     {
12289 #if !defined (TE_PEP)
12290       /* For x86 PE weak function symbols are neither PC-relative
12291          nor do they set S_IS_FUNCTION.  So the only reliable way
12292          to detect them is to check the flags of their containing
12293          section.  */
12294       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12295           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12296         ;
12297       else
12298 #endif
12299       value -= S_GET_VALUE (fixP->fx_addsy);
12300     }
12301 #endif
12302
12303   /* Fix a few things - the dynamic linker expects certain values here,
12304      and we must not disappoint it.  */
12305 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12306   if (IS_ELF && fixP->fx_addsy)
12307     switch (fixP->fx_r_type)
12308       {
12309       case BFD_RELOC_386_PLT32:
12310       case BFD_RELOC_X86_64_PLT32:
12311         /* Make the jump instruction point to the address of the operand.
12312            At runtime we merely add the offset to the actual PLT entry.
12313            NB: Subtract the offset size only for jump instructions.  */
12314         if (fixP->fx_pcrel)
12315           value = -4;
12316         break;
12317
12318       case BFD_RELOC_386_TLS_GD:
12319       case BFD_RELOC_386_TLS_LDM:
12320       case BFD_RELOC_386_TLS_IE_32:
12321       case BFD_RELOC_386_TLS_IE:
12322       case BFD_RELOC_386_TLS_GOTIE:
12323       case BFD_RELOC_386_TLS_GOTDESC:
12324       case BFD_RELOC_X86_64_TLSGD:
12325       case BFD_RELOC_X86_64_TLSLD:
12326       case BFD_RELOC_X86_64_GOTTPOFF:
12327       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12328         value = 0; /* Fully resolved at runtime.  No addend.  */
12329         /* Fallthrough */
12330       case BFD_RELOC_386_TLS_LE:
12331       case BFD_RELOC_386_TLS_LDO_32:
12332       case BFD_RELOC_386_TLS_LE_32:
12333       case BFD_RELOC_X86_64_DTPOFF32:
12334       case BFD_RELOC_X86_64_DTPOFF64:
12335       case BFD_RELOC_X86_64_TPOFF32:
12336       case BFD_RELOC_X86_64_TPOFF64:
12337         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12338         break;
12339
12340       case BFD_RELOC_386_TLS_DESC_CALL:
12341       case BFD_RELOC_X86_64_TLSDESC_CALL:
12342         value = 0; /* Fully resolved at runtime.  No addend.  */
12343         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12344         fixP->fx_done = 0;
12345         return;
12346
12347       case BFD_RELOC_VTABLE_INHERIT:
12348       case BFD_RELOC_VTABLE_ENTRY:
12349         fixP->fx_done = 0;
12350         return;
12351
12352       default:
12353         break;
12354       }
12355 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
12356   *valP = value;
12357 #endif /* !defined (TE_Mach)  */
12358
12359   /* Are we finished with this relocation now?  */
12360   if (fixP->fx_addsy == NULL)
12361     fixP->fx_done = 1;
12362 #if defined (OBJ_COFF) && defined (TE_PE)
12363   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12364     {
12365       fixP->fx_done = 0;
12366       /* Remember value for tc_gen_reloc.  */
12367       fixP->fx_addnumber = value;
12368       /* Clear out the frag for now.  */
12369       value = 0;
12370     }
12371 #endif
12372   else if (use_rela_relocations)
12373     {
12374       fixP->fx_no_overflow = 1;
12375       /* Remember value for tc_gen_reloc.  */
12376       fixP->fx_addnumber = value;
12377       value = 0;
12378     }
12379
12380   md_number_to_chars (p, value, fixP->fx_size);
12381 }
12382 \f
12383 const char *
12384 md_atof (int type, char *litP, int *sizeP)
12385 {
12386   /* This outputs the LITTLENUMs in REVERSE order;
12387      in accord with the bigendian 386.  */
12388   return ieee_md_atof (type, litP, sizeP, FALSE);
12389 }
12390 \f
12391 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12392
12393 static char *
12394 output_invalid (int c)
12395 {
12396   if (ISPRINT (c))
12397     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12398               "'%c'", c);
12399   else
12400     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12401               "(0x%x)", (unsigned char) c);
12402   return output_invalid_buf;
12403 }
12404
12405 /* Verify that @r can be used in the current context.  */
12406
12407 static bfd_boolean check_register (const reg_entry *r)
12408 {
12409   if (allow_pseudo_reg)
12410     return TRUE;
12411
12412   if (operand_type_all_zero (&r->reg_type))
12413     return FALSE;
12414
12415   if ((r->reg_type.bitfield.dword
12416        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12417        || r->reg_type.bitfield.class == RegCR
12418        || r->reg_type.bitfield.class == RegDR)
12419       && !cpu_arch_flags.bitfield.cpui386)
12420     return FALSE;
12421
12422   if (r->reg_type.bitfield.class == RegTR
12423       && (flag_code == CODE_64BIT
12424           || !cpu_arch_flags.bitfield.cpui386
12425           || cpu_arch_isa_flags.bitfield.cpui586
12426           || cpu_arch_isa_flags.bitfield.cpui686))
12427     return FALSE;
12428
12429   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12430     return FALSE;
12431
12432   if (!cpu_arch_flags.bitfield.cpuavx512f)
12433     {
12434       if (r->reg_type.bitfield.zmmword
12435           || r->reg_type.bitfield.class == RegMask)
12436         return FALSE;
12437
12438       if (!cpu_arch_flags.bitfield.cpuavx)
12439         {
12440           if (r->reg_type.bitfield.ymmword)
12441             return FALSE;
12442
12443           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12444             return FALSE;
12445         }
12446     }
12447
12448   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12449     return FALSE;
12450
12451   /* Don't allow fake index register unless allow_index_reg isn't 0. */
12452   if (!allow_index_reg && r->reg_num == RegIZ)
12453     return FALSE;
12454
12455   /* Upper 16 vector registers are only available with VREX in 64bit
12456      mode, and require EVEX encoding.  */
12457   if (r->reg_flags & RegVRex)
12458     {
12459       if (!cpu_arch_flags.bitfield.cpuavx512f
12460           || flag_code != CODE_64BIT)
12461         return FALSE;
12462
12463       if (i.vec_encoding == vex_encoding_default)
12464         i.vec_encoding = vex_encoding_evex;
12465       else if (i.vec_encoding != vex_encoding_evex)
12466         i.vec_encoding = vex_encoding_error;
12467     }
12468
12469   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12470       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12471       && flag_code != CODE_64BIT)
12472     return FALSE;
12473
12474   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12475       && !intel_syntax)
12476     return FALSE;
12477
12478   return TRUE;
12479 }
12480
12481 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12482
12483 static const reg_entry *
12484 parse_real_register (char *reg_string, char **end_op)
12485 {
12486   char *s = reg_string;
12487   char *p;
12488   char reg_name_given[MAX_REG_NAME_SIZE + 1];
12489   const reg_entry *r;
12490
12491   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
12492   if (*s == REGISTER_PREFIX)
12493     ++s;
12494
12495   if (is_space_char (*s))
12496     ++s;
12497
12498   p = reg_name_given;
12499   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12500     {
12501       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12502         return (const reg_entry *) NULL;
12503       s++;
12504     }
12505
12506   /* For naked regs, make sure that we are not dealing with an identifier.
12507      This prevents confusing an identifier like `eax_var' with register
12508      `eax'.  */
12509   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12510     return (const reg_entry *) NULL;
12511
12512   *end_op = s;
12513
12514   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12515
12516   /* Handle floating point regs, allowing spaces in the (i) part.  */
12517   if (r == i386_regtab /* %st is first entry of table  */)
12518     {
12519       if (!cpu_arch_flags.bitfield.cpu8087
12520           && !cpu_arch_flags.bitfield.cpu287
12521           && !cpu_arch_flags.bitfield.cpu387
12522           && !allow_pseudo_reg)
12523         return (const reg_entry *) NULL;
12524
12525       if (is_space_char (*s))
12526         ++s;
12527       if (*s == '(')
12528         {
12529           ++s;
12530           if (is_space_char (*s))
12531             ++s;
12532           if (*s >= '0' && *s <= '7')
12533             {
12534               int fpr = *s - '0';
12535               ++s;
12536               if (is_space_char (*s))
12537                 ++s;
12538               if (*s == ')')
12539                 {
12540                   *end_op = s + 1;
12541                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
12542                   know (r);
12543                   return r + fpr;
12544                 }
12545             }
12546           /* We have "%st(" then garbage.  */
12547           return (const reg_entry *) NULL;
12548         }
12549     }
12550
12551   return r && check_register (r) ? r : NULL;
12552 }
12553
12554 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12555
12556 static const reg_entry *
12557 parse_register (char *reg_string, char **end_op)
12558 {
12559   const reg_entry *r;
12560
12561   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12562     r = parse_real_register (reg_string, end_op);
12563   else
12564     r = NULL;
12565   if (!r)
12566     {
12567       char *save = input_line_pointer;
12568       char c;
12569       symbolS *symbolP;
12570
12571       input_line_pointer = reg_string;
12572       c = get_symbol_name (&reg_string);
12573       symbolP = symbol_find (reg_string);
12574       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12575         {
12576           const expressionS *e = symbol_get_value_expression (symbolP);
12577
12578           know (e->X_op == O_register);
12579           know (e->X_add_number >= 0
12580                 && (valueT) e->X_add_number < i386_regtab_size);
12581           r = i386_regtab + e->X_add_number;
12582           if (!check_register (r))
12583             {
12584               as_bad (_("register '%s%s' cannot be used here"),
12585                       register_prefix, r->reg_name);
12586               r = &bad_reg;
12587             }
12588           *end_op = input_line_pointer;
12589         }
12590       *input_line_pointer = c;
12591       input_line_pointer = save;
12592     }
12593   return r;
12594 }
12595
12596 int
12597 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12598 {
12599   const reg_entry *r;
12600   char *end = input_line_pointer;
12601
12602   *end = *nextcharP;
12603   r = parse_register (name, &input_line_pointer);
12604   if (r && end <= input_line_pointer)
12605     {
12606       *nextcharP = *input_line_pointer;
12607       *input_line_pointer = 0;
12608       if (r != &bad_reg)
12609         {
12610           e->X_op = O_register;
12611           e->X_add_number = r - i386_regtab;
12612         }
12613       else
12614           e->X_op = O_illegal;
12615       return 1;
12616     }
12617   input_line_pointer = end;
12618   *end = 0;
12619   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12620 }
12621
12622 void
12623 md_operand (expressionS *e)
12624 {
12625   char *end;
12626   const reg_entry *r;
12627
12628   switch (*input_line_pointer)
12629     {
12630     case REGISTER_PREFIX:
12631       r = parse_real_register (input_line_pointer, &end);
12632       if (r)
12633         {
12634           e->X_op = O_register;
12635           e->X_add_number = r - i386_regtab;
12636           input_line_pointer = end;
12637         }
12638       break;
12639
12640     case '[':
12641       gas_assert (intel_syntax);
12642       end = input_line_pointer++;
12643       expression (e);
12644       if (*input_line_pointer == ']')
12645         {
12646           ++input_line_pointer;
12647           e->X_op_symbol = make_expr_symbol (e);
12648           e->X_add_symbol = NULL;
12649           e->X_add_number = 0;
12650           e->X_op = O_index;
12651         }
12652       else
12653         {
12654           e->X_op = O_absent;
12655           input_line_pointer = end;
12656         }
12657       break;
12658     }
12659 }
12660
12661 \f
12662 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12663 const char *md_shortopts = "kVQ:sqnO::";
12664 #else
12665 const char *md_shortopts = "qnO::";
12666 #endif
12667
12668 #define OPTION_32 (OPTION_MD_BASE + 0)
12669 #define OPTION_64 (OPTION_MD_BASE + 1)
12670 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12671 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12672 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12673 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12674 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12675 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12676 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12677 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12678 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12679 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12680 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12681 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12682 #define OPTION_X32 (OPTION_MD_BASE + 14)
12683 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12684 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12685 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12686 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12687 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12688 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12689 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12690 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12691 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12692 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12693 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12694 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12695 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12696 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12697 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12698 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12699 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12700 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12701 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12702
12703 struct option md_longopts[] =
12704 {
12705   {"32", no_argument, NULL, OPTION_32},
12706 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12707      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12708   {"64", no_argument, NULL, OPTION_64},
12709 #endif
12710 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12711   {"x32", no_argument, NULL, OPTION_X32},
12712   {"mshared", no_argument, NULL, OPTION_MSHARED},
12713   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12714 #endif
12715   {"divide", no_argument, NULL, OPTION_DIVIDE},
12716   {"march", required_argument, NULL, OPTION_MARCH},
12717   {"mtune", required_argument, NULL, OPTION_MTUNE},
12718   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12719   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12720   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12721   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12722   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12723   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12724   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12725   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12726   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12727   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12728   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12729   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12730 # if defined (TE_PE) || defined (TE_PEP)
12731   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12732 #endif
12733   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12734   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12735   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12736   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12737   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12738   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12739   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12740   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12741   {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12742   {"mlfence-before-indirect-branch", required_argument, NULL,
12743    OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12744   {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12745   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12746   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12747   {NULL, no_argument, NULL, 0}
12748 };
12749 size_t md_longopts_size = sizeof (md_longopts);
12750
12751 int
12752 md_parse_option (int c, const char *arg)
12753 {
12754   unsigned int j;
12755   char *arch, *next, *saved, *type;
12756
12757   switch (c)
12758     {
12759     case 'n':
12760       optimize_align_code = 0;
12761       break;
12762
12763     case 'q':
12764       quiet_warnings = 1;
12765       break;
12766
12767 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12768       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12769          should be emitted or not.  FIXME: Not implemented.  */
12770     case 'Q':
12771       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12772         return 0;
12773       break;
12774
12775       /* -V: SVR4 argument to print version ID.  */
12776     case 'V':
12777       print_version_id ();
12778       break;
12779
12780       /* -k: Ignore for FreeBSD compatibility.  */
12781     case 'k':
12782       break;
12783
12784     case 's':
12785       /* -s: On i386 Solaris, this tells the native assembler to use
12786          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12787       break;
12788
12789     case OPTION_MSHARED:
12790       shared = 1;
12791       break;
12792
12793     case OPTION_X86_USED_NOTE:
12794       if (strcasecmp (arg, "yes") == 0)
12795         x86_used_note = 1;
12796       else if (strcasecmp (arg, "no") == 0)
12797         x86_used_note = 0;
12798       else
12799         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12800       break;
12801
12802
12803 #endif
12804 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12805      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12806     case OPTION_64:
12807       {
12808         const char **list, **l;
12809
12810         list = bfd_target_list ();
12811         for (l = list; *l != NULL; l++)
12812           if (CONST_STRNEQ (*l, "elf64-x86-64")
12813               || strcmp (*l, "coff-x86-64") == 0
12814               || strcmp (*l, "pe-x86-64") == 0
12815               || strcmp (*l, "pei-x86-64") == 0
12816               || strcmp (*l, "mach-o-x86-64") == 0)
12817             {
12818               default_arch = "x86_64";
12819               break;
12820             }
12821         if (*l == NULL)
12822           as_fatal (_("no compiled in support for x86_64"));
12823         free (list);
12824       }
12825       break;
12826 #endif
12827
12828 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12829     case OPTION_X32:
12830       if (IS_ELF)
12831         {
12832           const char **list, **l;
12833
12834           list = bfd_target_list ();
12835           for (l = list; *l != NULL; l++)
12836             if (CONST_STRNEQ (*l, "elf32-x86-64"))
12837               {
12838                 default_arch = "x86_64:32";
12839                 break;
12840               }
12841           if (*l == NULL)
12842             as_fatal (_("no compiled in support for 32bit x86_64"));
12843           free (list);
12844         }
12845       else
12846         as_fatal (_("32bit x86_64 is only supported for ELF"));
12847       break;
12848 #endif
12849
12850     case OPTION_32:
12851       default_arch = "i386";
12852       break;
12853
12854     case OPTION_DIVIDE:
12855 #ifdef SVR4_COMMENT_CHARS
12856       {
12857         char *n, *t;
12858         const char *s;
12859
12860         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12861         t = n;
12862         for (s = i386_comment_chars; *s != '\0'; s++)
12863           if (*s != '/')
12864             *t++ = *s;
12865         *t = '\0';
12866         i386_comment_chars = n;
12867       }
12868 #endif
12869       break;
12870
12871     case OPTION_MARCH:
12872       saved = xstrdup (arg);
12873       arch = saved;
12874       /* Allow -march=+nosse.  */
12875       if (*arch == '+')
12876         arch++;
12877       do
12878         {
12879           if (*arch == '.')
12880             as_fatal (_("invalid -march= option: `%s'"), arg);
12881           next = strchr (arch, '+');
12882           if (next)
12883             *next++ = '\0';
12884           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12885             {
12886               if (strcmp (arch, cpu_arch [j].name) == 0)
12887                 {
12888                   /* Processor.  */
12889                   if (! cpu_arch[j].flags.bitfield.cpui386)
12890                     continue;
12891
12892                   cpu_arch_name = cpu_arch[j].name;
12893                   cpu_sub_arch_name = NULL;
12894                   cpu_arch_flags = cpu_arch[j].flags;
12895                   cpu_arch_isa = cpu_arch[j].type;
12896                   cpu_arch_isa_flags = cpu_arch[j].flags;
12897                   if (!cpu_arch_tune_set)
12898                     {
12899                       cpu_arch_tune = cpu_arch_isa;
12900                       cpu_arch_tune_flags = cpu_arch_isa_flags;
12901                     }
12902                   break;
12903                 }
12904               else if (*cpu_arch [j].name == '.'
12905                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
12906                 {
12907                   /* ISA extension.  */
12908                   i386_cpu_flags flags;
12909
12910                   flags = cpu_flags_or (cpu_arch_flags,
12911                                         cpu_arch[j].flags);
12912
12913                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12914                     {
12915                       if (cpu_sub_arch_name)
12916                         {
12917                           char *name = cpu_sub_arch_name;
12918                           cpu_sub_arch_name = concat (name,
12919                                                       cpu_arch[j].name,
12920                                                       (const char *) NULL);
12921                           free (name);
12922                         }
12923                       else
12924                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12925                       cpu_arch_flags = flags;
12926                       cpu_arch_isa_flags = flags;
12927                     }
12928                   else
12929                     cpu_arch_isa_flags
12930                       = cpu_flags_or (cpu_arch_isa_flags,
12931                                       cpu_arch[j].flags);
12932                   break;
12933                 }
12934             }
12935
12936           if (j >= ARRAY_SIZE (cpu_arch))
12937             {
12938               /* Disable an ISA extension.  */
12939               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12940                 if (strcmp (arch, cpu_noarch [j].name) == 0)
12941                   {
12942                     i386_cpu_flags flags;
12943
12944                     flags = cpu_flags_and_not (cpu_arch_flags,
12945                                                cpu_noarch[j].flags);
12946                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12947                       {
12948                         if (cpu_sub_arch_name)
12949                           {
12950                             char *name = cpu_sub_arch_name;
12951                             cpu_sub_arch_name = concat (arch,
12952                                                         (const char *) NULL);
12953                             free (name);
12954                           }
12955                         else
12956                           cpu_sub_arch_name = xstrdup (arch);
12957                         cpu_arch_flags = flags;
12958                         cpu_arch_isa_flags = flags;
12959                       }
12960                     break;
12961                   }
12962
12963               if (j >= ARRAY_SIZE (cpu_noarch))
12964                 j = ARRAY_SIZE (cpu_arch);
12965             }
12966
12967           if (j >= ARRAY_SIZE (cpu_arch))
12968             as_fatal (_("invalid -march= option: `%s'"), arg);
12969
12970           arch = next;
12971         }
12972       while (next != NULL);
12973       free (saved);
12974       break;
12975
12976     case OPTION_MTUNE:
12977       if (*arg == '.')
12978         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12979       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12980         {
12981           if (strcmp (arg, cpu_arch [j].name) == 0)
12982             {
12983               cpu_arch_tune_set = 1;
12984               cpu_arch_tune = cpu_arch [j].type;
12985               cpu_arch_tune_flags = cpu_arch[j].flags;
12986               break;
12987             }
12988         }
12989       if (j >= ARRAY_SIZE (cpu_arch))
12990         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12991       break;
12992
12993     case OPTION_MMNEMONIC:
12994       if (strcasecmp (arg, "att") == 0)
12995         intel_mnemonic = 0;
12996       else if (strcasecmp (arg, "intel") == 0)
12997         intel_mnemonic = 1;
12998       else
12999         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13000       break;
13001
13002     case OPTION_MSYNTAX:
13003       if (strcasecmp (arg, "att") == 0)
13004         intel_syntax = 0;
13005       else if (strcasecmp (arg, "intel") == 0)
13006         intel_syntax = 1;
13007       else
13008         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13009       break;
13010
13011     case OPTION_MINDEX_REG:
13012       allow_index_reg = 1;
13013       break;
13014
13015     case OPTION_MNAKED_REG:
13016       allow_naked_reg = 1;
13017       break;
13018
13019     case OPTION_MSSE2AVX:
13020       sse2avx = 1;
13021       break;
13022
13023     case OPTION_MSSE_CHECK:
13024       if (strcasecmp (arg, "error") == 0)
13025         sse_check = check_error;
13026       else if (strcasecmp (arg, "warning") == 0)
13027         sse_check = check_warning;
13028       else if (strcasecmp (arg, "none") == 0)
13029         sse_check = check_none;
13030       else
13031         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13032       break;
13033
13034     case OPTION_MOPERAND_CHECK:
13035       if (strcasecmp (arg, "error") == 0)
13036         operand_check = check_error;
13037       else if (strcasecmp (arg, "warning") == 0)
13038         operand_check = check_warning;
13039       else if (strcasecmp (arg, "none") == 0)
13040         operand_check = check_none;
13041       else
13042         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13043       break;
13044
13045     case OPTION_MAVXSCALAR:
13046       if (strcasecmp (arg, "128") == 0)
13047         avxscalar = vex128;
13048       else if (strcasecmp (arg, "256") == 0)
13049         avxscalar = vex256;
13050       else
13051         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13052       break;
13053
13054     case OPTION_MVEXWIG:
13055       if (strcmp (arg, "0") == 0)
13056         vexwig = vexw0;
13057       else if (strcmp (arg, "1") == 0)
13058         vexwig = vexw1;
13059       else
13060         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13061       break;
13062
13063     case OPTION_MADD_BND_PREFIX:
13064       add_bnd_prefix = 1;
13065       break;
13066
13067     case OPTION_MEVEXLIG:
13068       if (strcmp (arg, "128") == 0)
13069         evexlig = evexl128;
13070       else if (strcmp (arg, "256") == 0)
13071         evexlig = evexl256;
13072       else  if (strcmp (arg, "512") == 0)
13073         evexlig = evexl512;
13074       else
13075         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13076       break;
13077
13078     case OPTION_MEVEXRCIG:
13079       if (strcmp (arg, "rne") == 0)
13080         evexrcig = rne;
13081       else if (strcmp (arg, "rd") == 0)
13082         evexrcig = rd;
13083       else if (strcmp (arg, "ru") == 0)
13084         evexrcig = ru;
13085       else if (strcmp (arg, "rz") == 0)
13086         evexrcig = rz;
13087       else
13088         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13089       break;
13090
13091     case OPTION_MEVEXWIG:
13092       if (strcmp (arg, "0") == 0)
13093         evexwig = evexw0;
13094       else if (strcmp (arg, "1") == 0)
13095         evexwig = evexw1;
13096       else
13097         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13098       break;
13099
13100 # if defined (TE_PE) || defined (TE_PEP)
13101     case OPTION_MBIG_OBJ:
13102       use_big_obj = 1;
13103       break;
13104 #endif
13105
13106     case OPTION_MOMIT_LOCK_PREFIX:
13107       if (strcasecmp (arg, "yes") == 0)
13108         omit_lock_prefix = 1;
13109       else if (strcasecmp (arg, "no") == 0)
13110         omit_lock_prefix = 0;
13111       else
13112         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13113       break;
13114
13115     case OPTION_MFENCE_AS_LOCK_ADD:
13116       if (strcasecmp (arg, "yes") == 0)
13117         avoid_fence = 1;
13118       else if (strcasecmp (arg, "no") == 0)
13119         avoid_fence = 0;
13120       else
13121         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13122       break;
13123
13124     case OPTION_MLFENCE_AFTER_LOAD:
13125       if (strcasecmp (arg, "yes") == 0)
13126         lfence_after_load = 1;
13127       else if (strcasecmp (arg, "no") == 0)
13128         lfence_after_load = 0;
13129       else
13130         as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13131       break;
13132
13133     case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13134       if (strcasecmp (arg, "all") == 0)
13135         {
13136           lfence_before_indirect_branch = lfence_branch_all;
13137           if (lfence_before_ret == lfence_before_ret_none)
13138             lfence_before_ret = lfence_before_ret_shl;
13139         }
13140       else if (strcasecmp (arg, "memory") == 0)
13141         lfence_before_indirect_branch = lfence_branch_memory;
13142       else if (strcasecmp (arg, "register") == 0)
13143         lfence_before_indirect_branch = lfence_branch_register;
13144       else if (strcasecmp (arg, "none") == 0)
13145         lfence_before_indirect_branch = lfence_branch_none;
13146       else
13147         as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13148                   arg);
13149       break;
13150
13151     case OPTION_MLFENCE_BEFORE_RET:
13152       if (strcasecmp (arg, "or") == 0)
13153         lfence_before_ret = lfence_before_ret_or;
13154       else if (strcasecmp (arg, "not") == 0)
13155         lfence_before_ret = lfence_before_ret_not;
13156       else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13157         lfence_before_ret = lfence_before_ret_shl;
13158       else if (strcasecmp (arg, "none") == 0)
13159         lfence_before_ret = lfence_before_ret_none;
13160       else
13161         as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13162                   arg);
13163       break;
13164
13165     case OPTION_MRELAX_RELOCATIONS:
13166       if (strcasecmp (arg, "yes") == 0)
13167         generate_relax_relocations = 1;
13168       else if (strcasecmp (arg, "no") == 0)
13169         generate_relax_relocations = 0;
13170       else
13171         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13172       break;
13173
13174     case OPTION_MALIGN_BRANCH_BOUNDARY:
13175       {
13176         char *end;
13177         long int align = strtoul (arg, &end, 0);
13178         if (*end == '\0')
13179           {
13180             if (align == 0)
13181               {
13182                 align_branch_power = 0;
13183                 break;
13184               }
13185             else if (align >= 16)
13186               {
13187                 int align_power;
13188                 for (align_power = 0;
13189                      (align & 1) == 0;
13190                      align >>= 1, align_power++)
13191                   continue;
13192                 /* Limit alignment power to 31.  */
13193                 if (align == 1 && align_power < 32)
13194                   {
13195                     align_branch_power = align_power;
13196                     break;
13197                   }
13198               }
13199           }
13200         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13201       }
13202       break;
13203
13204     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13205       {
13206         char *end;
13207         int align = strtoul (arg, &end, 0);
13208         /* Some processors only support 5 prefixes.  */
13209         if (*end == '\0' && align >= 0 && align < 6)
13210           {
13211             align_branch_prefix_size = align;
13212             break;
13213           }
13214         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13215                   arg);
13216       }
13217       break;
13218
13219     case OPTION_MALIGN_BRANCH:
13220       align_branch = 0;
13221       saved = xstrdup (arg);
13222       type = saved;
13223       do
13224         {
13225           next = strchr (type, '+');
13226           if (next)
13227             *next++ = '\0';
13228           if (strcasecmp (type, "jcc") == 0)
13229             align_branch |= align_branch_jcc_bit;
13230           else if (strcasecmp (type, "fused") == 0)
13231             align_branch |= align_branch_fused_bit;
13232           else if (strcasecmp (type, "jmp") == 0)
13233             align_branch |= align_branch_jmp_bit;
13234           else if (strcasecmp (type, "call") == 0)
13235             align_branch |= align_branch_call_bit;
13236           else if (strcasecmp (type, "ret") == 0)
13237             align_branch |= align_branch_ret_bit;
13238           else if (strcasecmp (type, "indirect") == 0)
13239             align_branch |= align_branch_indirect_bit;
13240           else
13241             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13242           type = next;
13243         }
13244       while (next != NULL);
13245       free (saved);
13246       break;
13247
13248     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13249       align_branch_power = 5;
13250       align_branch_prefix_size = 5;
13251       align_branch = (align_branch_jcc_bit
13252                       | align_branch_fused_bit
13253                       | align_branch_jmp_bit);
13254       break;
13255
13256     case OPTION_MAMD64:
13257       isa64 = amd64;
13258       break;
13259
13260     case OPTION_MINTEL64:
13261       isa64 = intel64;
13262       break;
13263
13264     case 'O':
13265       if (arg == NULL)
13266         {
13267           optimize = 1;
13268           /* Turn off -Os.  */
13269           optimize_for_space = 0;
13270         }
13271       else if (*arg == 's')
13272         {
13273           optimize_for_space = 1;
13274           /* Turn on all encoding optimizations.  */
13275           optimize = INT_MAX;
13276         }
13277       else
13278         {
13279           optimize = atoi (arg);
13280           /* Turn off -Os.  */
13281           optimize_for_space = 0;
13282         }
13283       break;
13284
13285     default:
13286       return 0;
13287     }
13288   return 1;
13289 }
13290
13291 #define MESSAGE_TEMPLATE \
13292 "                                                                                "
13293
13294 static char *
13295 output_message (FILE *stream, char *p, char *message, char *start,
13296                 int *left_p, const char *name, int len)
13297 {
13298   int size = sizeof (MESSAGE_TEMPLATE);
13299   int left = *left_p;
13300
13301   /* Reserve 2 spaces for ", " or ",\0" */
13302   left -= len + 2;
13303
13304   /* Check if there is any room.  */
13305   if (left >= 0)
13306     {
13307       if (p != start)
13308         {
13309           *p++ = ',';
13310           *p++ = ' ';
13311         }
13312       p = mempcpy (p, name, len);
13313     }
13314   else
13315     {
13316       /* Output the current message now and start a new one.  */
13317       *p++ = ',';
13318       *p = '\0';
13319       fprintf (stream, "%s\n", message);
13320       p = start;
13321       left = size - (start - message) - len - 2;
13322
13323       gas_assert (left >= 0);
13324
13325       p = mempcpy (p, name, len);
13326     }
13327
13328   *left_p = left;
13329   return p;
13330 }
13331
13332 static void
13333 show_arch (FILE *stream, int ext, int check)
13334 {
13335   static char message[] = MESSAGE_TEMPLATE;
13336   char *start = message + 27;
13337   char *p;
13338   int size = sizeof (MESSAGE_TEMPLATE);
13339   int left;
13340   const char *name;
13341   int len;
13342   unsigned int j;
13343
13344   p = start;
13345   left = size - (start - message);
13346   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13347     {
13348       /* Should it be skipped?  */
13349       if (cpu_arch [j].skip)
13350         continue;
13351
13352       name = cpu_arch [j].name;
13353       len = cpu_arch [j].len;
13354       if (*name == '.')
13355         {
13356           /* It is an extension.  Skip if we aren't asked to show it.  */
13357           if (ext)
13358             {
13359               name++;
13360               len--;
13361             }
13362           else
13363             continue;
13364         }
13365       else if (ext)
13366         {
13367           /* It is an processor.  Skip if we show only extension.  */
13368           continue;
13369         }
13370       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13371         {
13372           /* It is an impossible processor - skip.  */
13373           continue;
13374         }
13375
13376       p = output_message (stream, p, message, start, &left, name, len);
13377     }
13378
13379   /* Display disabled extensions.  */
13380   if (ext)
13381     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13382       {
13383         name = cpu_noarch [j].name;
13384         len = cpu_noarch [j].len;
13385         p = output_message (stream, p, message, start, &left, name,
13386                             len);
13387       }
13388
13389   *p = '\0';
13390   fprintf (stream, "%s\n", message);
13391 }
13392
13393 void
13394 md_show_usage (FILE *stream)
13395 {
13396 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13397   fprintf (stream, _("\
13398   -Qy, -Qn                ignored\n\
13399   -V                      print assembler version number\n\
13400   -k                      ignored\n"));
13401 #endif
13402   fprintf (stream, _("\
13403   -n                      Do not optimize code alignment\n\
13404   -q                      quieten some warnings\n"));
13405 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13406   fprintf (stream, _("\
13407   -s                      ignored\n"));
13408 #endif
13409 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13410                       || defined (TE_PE) || defined (TE_PEP))
13411   fprintf (stream, _("\
13412   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
13413 #endif
13414 #ifdef SVR4_COMMENT_CHARS
13415   fprintf (stream, _("\
13416   --divide                do not treat `/' as a comment character\n"));
13417 #else
13418   fprintf (stream, _("\
13419   --divide                ignored\n"));
13420 #endif
13421   fprintf (stream, _("\
13422   -march=CPU[,+EXTENSION...]\n\
13423                           generate code for CPU and EXTENSION, CPU is one of:\n"));
13424   show_arch (stream, 0, 1);
13425   fprintf (stream, _("\
13426                           EXTENSION is combination of:\n"));
13427   show_arch (stream, 1, 0);
13428   fprintf (stream, _("\
13429   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
13430   show_arch (stream, 0, 0);
13431   fprintf (stream, _("\
13432   -msse2avx               encode SSE instructions with VEX prefix\n"));
13433   fprintf (stream, _("\
13434   -msse-check=[none|error|warning] (default: warning)\n\
13435                           check SSE instructions\n"));
13436   fprintf (stream, _("\
13437   -moperand-check=[none|error|warning] (default: warning)\n\
13438                           check operand combinations for validity\n"));
13439   fprintf (stream, _("\
13440   -mavxscalar=[128|256] (default: 128)\n\
13441                           encode scalar AVX instructions with specific vector\n\
13442                            length\n"));
13443   fprintf (stream, _("\
13444   -mvexwig=[0|1] (default: 0)\n\
13445                           encode VEX instructions with specific VEX.W value\n\
13446                            for VEX.W bit ignored instructions\n"));
13447   fprintf (stream, _("\
13448   -mevexlig=[128|256|512] (default: 128)\n\
13449                           encode scalar EVEX instructions with specific vector\n\
13450                            length\n"));
13451   fprintf (stream, _("\
13452   -mevexwig=[0|1] (default: 0)\n\
13453                           encode EVEX instructions with specific EVEX.W value\n\
13454                            for EVEX.W bit ignored instructions\n"));
13455   fprintf (stream, _("\
13456   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13457                           encode EVEX instructions with specific EVEX.RC value\n\
13458                            for SAE-only ignored instructions\n"));
13459   fprintf (stream, _("\
13460   -mmnemonic=[att|intel] "));
13461   if (SYSV386_COMPAT)
13462     fprintf (stream, _("(default: att)\n"));
13463   else
13464     fprintf (stream, _("(default: intel)\n"));
13465   fprintf (stream, _("\
13466                           use AT&T/Intel mnemonic\n"));
13467   fprintf (stream, _("\
13468   -msyntax=[att|intel] (default: att)\n\
13469                           use AT&T/Intel syntax\n"));
13470   fprintf (stream, _("\
13471   -mindex-reg             support pseudo index registers\n"));
13472   fprintf (stream, _("\
13473   -mnaked-reg             don't require `%%' prefix for registers\n"));
13474   fprintf (stream, _("\
13475   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
13476 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13477   fprintf (stream, _("\
13478   -mshared                disable branch optimization for shared code\n"));
13479   fprintf (stream, _("\
13480   -mx86-used-note=[no|yes] "));
13481   if (DEFAULT_X86_USED_NOTE)
13482     fprintf (stream, _("(default: yes)\n"));
13483   else
13484     fprintf (stream, _("(default: no)\n"));
13485   fprintf (stream, _("\
13486                           generate x86 used ISA and feature properties\n"));
13487 #endif
13488 #if defined (TE_PE) || defined (TE_PEP)
13489   fprintf (stream, _("\
13490   -mbig-obj               generate big object files\n"));
13491 #endif
13492   fprintf (stream, _("\
13493   -momit-lock-prefix=[no|yes] (default: no)\n\
13494                           strip all lock prefixes\n"));
13495   fprintf (stream, _("\
13496   -mfence-as-lock-add=[no|yes] (default: no)\n\
13497                           encode lfence, mfence and sfence as\n\
13498                            lock addl $0x0, (%%{re}sp)\n"));
13499   fprintf (stream, _("\
13500   -mrelax-relocations=[no|yes] "));
13501   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13502     fprintf (stream, _("(default: yes)\n"));
13503   else
13504     fprintf (stream, _("(default: no)\n"));
13505   fprintf (stream, _("\
13506                           generate relax relocations\n"));
13507   fprintf (stream, _("\
13508   -malign-branch-boundary=NUM (default: 0)\n\
13509                           align branches within NUM byte boundary\n"));
13510   fprintf (stream, _("\
13511   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13512                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
13513                            indirect\n\
13514                           specify types of branches to align\n"));
13515   fprintf (stream, _("\
13516   -malign-branch-prefix-size=NUM (default: 5)\n\
13517                           align branches with NUM prefixes per instruction\n"));
13518   fprintf (stream, _("\
13519   -mbranches-within-32B-boundaries\n\
13520                           align branches within 32 byte boundary\n"));
13521   fprintf (stream, _("\
13522   -mlfence-after-load=[no|yes] (default: no)\n\
13523                           generate lfence after load\n"));
13524   fprintf (stream, _("\
13525   -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13526                           generate lfence before indirect near branch\n"));
13527   fprintf (stream, _("\
13528   -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13529                           generate lfence before ret\n"));
13530   fprintf (stream, _("\
13531   -mamd64                 accept only AMD64 ISA [default]\n"));
13532   fprintf (stream, _("\
13533   -mintel64               accept only Intel64 ISA\n"));
13534 }
13535
13536 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13537      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13538      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13539
13540 /* Pick the target format to use.  */
13541
13542 const char *
13543 i386_target_format (void)
13544 {
13545   if (!strncmp (default_arch, "x86_64", 6))
13546     {
13547       update_code_flag (CODE_64BIT, 1);
13548       if (default_arch[6] == '\0')
13549         x86_elf_abi = X86_64_ABI;
13550       else
13551         x86_elf_abi = X86_64_X32_ABI;
13552     }
13553   else if (!strcmp (default_arch, "i386"))
13554     update_code_flag (CODE_32BIT, 1);
13555   else if (!strcmp (default_arch, "iamcu"))
13556     {
13557       update_code_flag (CODE_32BIT, 1);
13558       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13559         {
13560           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13561           cpu_arch_name = "iamcu";
13562           cpu_sub_arch_name = NULL;
13563           cpu_arch_flags = iamcu_flags;
13564           cpu_arch_isa = PROCESSOR_IAMCU;
13565           cpu_arch_isa_flags = iamcu_flags;
13566           if (!cpu_arch_tune_set)
13567             {
13568               cpu_arch_tune = cpu_arch_isa;
13569               cpu_arch_tune_flags = cpu_arch_isa_flags;
13570             }
13571         }
13572       else if (cpu_arch_isa != PROCESSOR_IAMCU)
13573         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13574                   cpu_arch_name);
13575     }
13576   else
13577     as_fatal (_("unknown architecture"));
13578
13579   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13580     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13581   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13582     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13583
13584   switch (OUTPUT_FLAVOR)
13585     {
13586 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13587     case bfd_target_aout_flavour:
13588       return AOUT_TARGET_FORMAT;
13589 #endif
13590 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13591 # if defined (TE_PE) || defined (TE_PEP)
13592     case bfd_target_coff_flavour:
13593       if (flag_code == CODE_64BIT)
13594         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13595       else
13596         return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13597 # elif defined (TE_GO32)
13598     case bfd_target_coff_flavour:
13599       return "coff-go32";
13600 # else
13601     case bfd_target_coff_flavour:
13602       return "coff-i386";
13603 # endif
13604 #endif
13605 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13606     case bfd_target_elf_flavour:
13607       {
13608         const char *format;
13609
13610         switch (x86_elf_abi)
13611           {
13612           default:
13613             format = ELF_TARGET_FORMAT;
13614 #ifndef TE_SOLARIS
13615             tls_get_addr = "___tls_get_addr";
13616 #endif
13617             break;
13618           case X86_64_ABI:
13619             use_rela_relocations = 1;
13620             object_64bit = 1;
13621 #ifndef TE_SOLARIS
13622             tls_get_addr = "__tls_get_addr";
13623 #endif
13624             format = ELF_TARGET_FORMAT64;
13625             break;
13626           case X86_64_X32_ABI:
13627             use_rela_relocations = 1;
13628             object_64bit = 1;
13629 #ifndef TE_SOLARIS
13630             tls_get_addr = "__tls_get_addr";
13631 #endif
13632             disallow_64bit_reloc = 1;
13633             format = ELF_TARGET_FORMAT32;
13634             break;
13635           }
13636         if (cpu_arch_isa == PROCESSOR_L1OM)
13637           {
13638             if (x86_elf_abi != X86_64_ABI)
13639               as_fatal (_("Intel L1OM is 64bit only"));
13640             return ELF_TARGET_L1OM_FORMAT;
13641           }
13642         else if (cpu_arch_isa == PROCESSOR_K1OM)
13643           {
13644             if (x86_elf_abi != X86_64_ABI)
13645               as_fatal (_("Intel K1OM is 64bit only"));
13646             return ELF_TARGET_K1OM_FORMAT;
13647           }
13648         else if (cpu_arch_isa == PROCESSOR_IAMCU)
13649           {
13650             if (x86_elf_abi != I386_ABI)
13651               as_fatal (_("Intel MCU is 32bit only"));
13652             return ELF_TARGET_IAMCU_FORMAT;
13653           }
13654         else
13655           return format;
13656       }
13657 #endif
13658 #if defined (OBJ_MACH_O)
13659     case bfd_target_mach_o_flavour:
13660       if (flag_code == CODE_64BIT)
13661         {
13662           use_rela_relocations = 1;
13663           object_64bit = 1;
13664           return "mach-o-x86-64";
13665         }
13666       else
13667         return "mach-o-i386";
13668 #endif
13669     default:
13670       abort ();
13671       return NULL;
13672     }
13673 }
13674
13675 #endif /* OBJ_MAYBE_ more than one  */
13676 \f
13677 symbolS *
13678 md_undefined_symbol (char *name)
13679 {
13680   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13681       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13682       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13683       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13684     {
13685       if (!GOT_symbol)
13686         {
13687           if (symbol_find (name))
13688             as_bad (_("GOT already in symbol table"));
13689           GOT_symbol = symbol_new (name, undefined_section,
13690                                    (valueT) 0, &zero_address_frag);
13691         };
13692       return GOT_symbol;
13693     }
13694   return 0;
13695 }
13696
13697 /* Round up a section size to the appropriate boundary.  */
13698
13699 valueT
13700 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13701 {
13702 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13703   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13704     {
13705       /* For a.out, force the section size to be aligned.  If we don't do
13706          this, BFD will align it for us, but it will not write out the
13707          final bytes of the section.  This may be a bug in BFD, but it is
13708          easier to fix it here since that is how the other a.out targets
13709          work.  */
13710       int align;
13711
13712       align = bfd_section_alignment (segment);
13713       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13714     }
13715 #endif
13716
13717   return size;
13718 }
13719
13720 /* On the i386, PC-relative offsets are relative to the start of the
13721    next instruction.  That is, the address of the offset, plus its
13722    size, since the offset is always the last part of the insn.  */
13723
13724 long
13725 md_pcrel_from (fixS *fixP)
13726 {
13727   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13728 }
13729
13730 #ifndef I386COFF
13731
13732 static void
13733 s_bss (int ignore ATTRIBUTE_UNUSED)
13734 {
13735   int temp;
13736
13737 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13738   if (IS_ELF)
13739     obj_elf_section_change_hook ();
13740 #endif
13741   temp = get_absolute_expression ();
13742   subseg_set (bss_section, (subsegT) temp);
13743   demand_empty_rest_of_line ();
13744 }
13745
13746 #endif
13747
13748 /* Remember constant directive.  */
13749
13750 void
13751 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13752 {
13753   if (last_insn.kind != last_insn_directive
13754       && (bfd_section_flags (now_seg) & SEC_CODE))
13755     {
13756       last_insn.seg = now_seg;
13757       last_insn.kind = last_insn_directive;
13758       last_insn.name = "constant directive";
13759       last_insn.file = as_where (&last_insn.line);
13760       if (lfence_before_ret != lfence_before_ret_none)
13761         {
13762           if (lfence_before_indirect_branch != lfence_branch_none)
13763             as_warn (_("constant directive skips -mlfence-before-ret "
13764                        "and -mlfence-before-indirect-branch"));
13765           else
13766             as_warn (_("constant directive skips -mlfence-before-ret"));
13767         }
13768       else if (lfence_before_indirect_branch != lfence_branch_none)
13769         as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13770     }
13771 }
13772
13773 void
13774 i386_validate_fix (fixS *fixp)
13775 {
13776   if (fixp->fx_subsy)
13777     {
13778       if (fixp->fx_subsy == GOT_symbol)
13779         {
13780           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13781             {
13782               if (!object_64bit)
13783                 abort ();
13784 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13785               if (fixp->fx_tcbit2)
13786                 fixp->fx_r_type = (fixp->fx_tcbit
13787                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13788                                    : BFD_RELOC_X86_64_GOTPCRELX);
13789               else
13790 #endif
13791                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13792             }
13793           else
13794             {
13795               if (!object_64bit)
13796                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13797               else
13798                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13799             }
13800           fixp->fx_subsy = 0;
13801         }
13802     }
13803 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13804   else if (!object_64bit)
13805     {
13806       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13807           && fixp->fx_tcbit2)
13808         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13809     }
13810 #endif
13811 }
13812
13813 arelent *
13814 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13815 {
13816   arelent *rel;
13817   bfd_reloc_code_real_type code;
13818
13819   switch (fixp->fx_r_type)
13820     {
13821 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13822     case BFD_RELOC_SIZE32:
13823     case BFD_RELOC_SIZE64:
13824       if (S_IS_DEFINED (fixp->fx_addsy)
13825           && !S_IS_EXTERNAL (fixp->fx_addsy))
13826         {
13827           /* Resolve size relocation against local symbol to size of
13828              the symbol plus addend.  */
13829           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13830           if (fixp->fx_r_type == BFD_RELOC_SIZE32
13831               && !fits_in_unsigned_long (value))
13832             as_bad_where (fixp->fx_file, fixp->fx_line,
13833                           _("symbol size computation overflow"));
13834           fixp->fx_addsy = NULL;
13835           fixp->fx_subsy = NULL;
13836           md_apply_fix (fixp, (valueT *) &value, NULL);
13837           return NULL;
13838         }
13839 #endif
13840       /* Fall through.  */
13841
13842     case BFD_RELOC_X86_64_PLT32:
13843     case BFD_RELOC_X86_64_GOT32:
13844     case BFD_RELOC_X86_64_GOTPCREL:
13845     case BFD_RELOC_X86_64_GOTPCRELX:
13846     case BFD_RELOC_X86_64_REX_GOTPCRELX:
13847     case BFD_RELOC_386_PLT32:
13848     case BFD_RELOC_386_GOT32:
13849     case BFD_RELOC_386_GOT32X:
13850     case BFD_RELOC_386_GOTOFF:
13851     case BFD_RELOC_386_GOTPC:
13852     case BFD_RELOC_386_TLS_GD:
13853     case BFD_RELOC_386_TLS_LDM:
13854     case BFD_RELOC_386_TLS_LDO_32:
13855     case BFD_RELOC_386_TLS_IE_32:
13856     case BFD_RELOC_386_TLS_IE:
13857     case BFD_RELOC_386_TLS_GOTIE:
13858     case BFD_RELOC_386_TLS_LE_32:
13859     case BFD_RELOC_386_TLS_LE:
13860     case BFD_RELOC_386_TLS_GOTDESC:
13861     case BFD_RELOC_386_TLS_DESC_CALL:
13862     case BFD_RELOC_X86_64_TLSGD:
13863     case BFD_RELOC_X86_64_TLSLD:
13864     case BFD_RELOC_X86_64_DTPOFF32:
13865     case BFD_RELOC_X86_64_DTPOFF64:
13866     case BFD_RELOC_X86_64_GOTTPOFF:
13867     case BFD_RELOC_X86_64_TPOFF32:
13868     case BFD_RELOC_X86_64_TPOFF64:
13869     case BFD_RELOC_X86_64_GOTOFF64:
13870     case BFD_RELOC_X86_64_GOTPC32:
13871     case BFD_RELOC_X86_64_GOT64:
13872     case BFD_RELOC_X86_64_GOTPCREL64:
13873     case BFD_RELOC_X86_64_GOTPC64:
13874     case BFD_RELOC_X86_64_GOTPLT64:
13875     case BFD_RELOC_X86_64_PLTOFF64:
13876     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13877     case BFD_RELOC_X86_64_TLSDESC_CALL:
13878     case BFD_RELOC_RVA:
13879     case BFD_RELOC_VTABLE_ENTRY:
13880     case BFD_RELOC_VTABLE_INHERIT:
13881 #ifdef TE_PE
13882     case BFD_RELOC_32_SECREL:
13883 #endif
13884       code = fixp->fx_r_type;
13885       break;
13886     case BFD_RELOC_X86_64_32S:
13887       if (!fixp->fx_pcrel)
13888         {
13889           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
13890           code = fixp->fx_r_type;
13891           break;
13892         }
13893       /* Fall through.  */
13894     default:
13895       if (fixp->fx_pcrel)
13896         {
13897           switch (fixp->fx_size)
13898             {
13899             default:
13900               as_bad_where (fixp->fx_file, fixp->fx_line,
13901                             _("can not do %d byte pc-relative relocation"),
13902                             fixp->fx_size);
13903               code = BFD_RELOC_32_PCREL;
13904               break;
13905             case 1: code = BFD_RELOC_8_PCREL;  break;
13906             case 2: code = BFD_RELOC_16_PCREL; break;
13907             case 4: code = BFD_RELOC_32_PCREL; break;
13908 #ifdef BFD64
13909             case 8: code = BFD_RELOC_64_PCREL; break;
13910 #endif
13911             }
13912         }
13913       else
13914         {
13915           switch (fixp->fx_size)
13916             {
13917             default:
13918               as_bad_where (fixp->fx_file, fixp->fx_line,
13919                             _("can not do %d byte relocation"),
13920                             fixp->fx_size);
13921               code = BFD_RELOC_32;
13922               break;
13923             case 1: code = BFD_RELOC_8;  break;
13924             case 2: code = BFD_RELOC_16; break;
13925             case 4: code = BFD_RELOC_32; break;
13926 #ifdef BFD64
13927             case 8: code = BFD_RELOC_64; break;
13928 #endif
13929             }
13930         }
13931       break;
13932     }
13933
13934   if ((code == BFD_RELOC_32
13935        || code == BFD_RELOC_32_PCREL
13936        || code == BFD_RELOC_X86_64_32S)
13937       && GOT_symbol
13938       && fixp->fx_addsy == GOT_symbol)
13939     {
13940       if (!object_64bit)
13941         code = BFD_RELOC_386_GOTPC;
13942       else
13943         code = BFD_RELOC_X86_64_GOTPC32;
13944     }
13945   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13946       && GOT_symbol
13947       && fixp->fx_addsy == GOT_symbol)
13948     {
13949       code = BFD_RELOC_X86_64_GOTPC64;
13950     }
13951
13952   rel = XNEW (arelent);
13953   rel->sym_ptr_ptr = XNEW (asymbol *);
13954   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13955
13956   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13957
13958   if (!use_rela_relocations)
13959     {
13960       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13961          vtable entry to be used in the relocation's section offset.  */
13962       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13963         rel->address = fixp->fx_offset;
13964 #if defined (OBJ_COFF) && defined (TE_PE)
13965       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13966         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13967       else
13968 #endif
13969       rel->addend = 0;
13970     }
13971   /* Use the rela in 64bit mode.  */
13972   else
13973     {
13974       if (disallow_64bit_reloc)
13975         switch (code)
13976           {
13977           case BFD_RELOC_X86_64_DTPOFF64:
13978           case BFD_RELOC_X86_64_TPOFF64:
13979           case BFD_RELOC_64_PCREL:
13980           case BFD_RELOC_X86_64_GOTOFF64:
13981           case BFD_RELOC_X86_64_GOT64:
13982           case BFD_RELOC_X86_64_GOTPCREL64:
13983           case BFD_RELOC_X86_64_GOTPC64:
13984           case BFD_RELOC_X86_64_GOTPLT64:
13985           case BFD_RELOC_X86_64_PLTOFF64:
13986             as_bad_where (fixp->fx_file, fixp->fx_line,
13987                           _("cannot represent relocation type %s in x32 mode"),
13988                           bfd_get_reloc_code_name (code));
13989             break;
13990           default:
13991             break;
13992           }
13993
13994       if (!fixp->fx_pcrel)
13995         rel->addend = fixp->fx_offset;
13996       else
13997         switch (code)
13998           {
13999           case BFD_RELOC_X86_64_PLT32:
14000           case BFD_RELOC_X86_64_GOT32:
14001           case BFD_RELOC_X86_64_GOTPCREL:
14002           case BFD_RELOC_X86_64_GOTPCRELX:
14003           case BFD_RELOC_X86_64_REX_GOTPCRELX:
14004           case BFD_RELOC_X86_64_TLSGD:
14005           case BFD_RELOC_X86_64_TLSLD:
14006           case BFD_RELOC_X86_64_GOTTPOFF:
14007           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14008           case BFD_RELOC_X86_64_TLSDESC_CALL:
14009             rel->addend = fixp->fx_offset - fixp->fx_size;
14010             break;
14011           default:
14012             rel->addend = (section->vma
14013                            - fixp->fx_size
14014                            + fixp->fx_addnumber
14015                            + md_pcrel_from (fixp));
14016             break;
14017           }
14018     }
14019
14020   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14021   if (rel->howto == NULL)
14022     {
14023       as_bad_where (fixp->fx_file, fixp->fx_line,
14024                     _("cannot represent relocation type %s"),
14025                     bfd_get_reloc_code_name (code));
14026       /* Set howto to a garbage value so that we can keep going.  */
14027       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14028       gas_assert (rel->howto != NULL);
14029     }
14030
14031   return rel;
14032 }
14033
14034 #include "tc-i386-intel.c"
14035
14036 void
14037 tc_x86_parse_to_dw2regnum (expressionS *exp)
14038 {
14039   int saved_naked_reg;
14040   char saved_register_dot;
14041
14042   saved_naked_reg = allow_naked_reg;
14043   allow_naked_reg = 1;
14044   saved_register_dot = register_chars['.'];
14045   register_chars['.'] = '.';
14046   allow_pseudo_reg = 1;
14047   expression_and_evaluate (exp);
14048   allow_pseudo_reg = 0;
14049   register_chars['.'] = saved_register_dot;
14050   allow_naked_reg = saved_naked_reg;
14051
14052   if (exp->X_op == O_register && exp->X_add_number >= 0)
14053     {
14054       if ((addressT) exp->X_add_number < i386_regtab_size)
14055         {
14056           exp->X_op = O_constant;
14057           exp->X_add_number = i386_regtab[exp->X_add_number]
14058                               .dw2_regnum[flag_code >> 1];
14059         }
14060       else
14061         exp->X_op = O_illegal;
14062     }
14063 }
14064
14065 void
14066 tc_x86_frame_initial_instructions (void)
14067 {
14068   static unsigned int sp_regno[2];
14069
14070   if (!sp_regno[flag_code >> 1])
14071     {
14072       char *saved_input = input_line_pointer;
14073       char sp[][4] = {"esp", "rsp"};
14074       expressionS exp;
14075
14076       input_line_pointer = sp[flag_code >> 1];
14077       tc_x86_parse_to_dw2regnum (&exp);
14078       gas_assert (exp.X_op == O_constant);
14079       sp_regno[flag_code >> 1] = exp.X_add_number;
14080       input_line_pointer = saved_input;
14081     }
14082
14083   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14084   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14085 }
14086
14087 int
14088 x86_dwarf2_addr_size (void)
14089 {
14090 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14091   if (x86_elf_abi == X86_64_X32_ABI)
14092     return 4;
14093 #endif
14094   return bfd_arch_bits_per_address (stdoutput) / 8;
14095 }
14096
14097 int
14098 i386_elf_section_type (const char *str, size_t len)
14099 {
14100   if (flag_code == CODE_64BIT
14101       && len == sizeof ("unwind") - 1
14102       && strncmp (str, "unwind", 6) == 0)
14103     return SHT_X86_64_UNWIND;
14104
14105   return -1;
14106 }
14107
14108 #ifdef TE_SOLARIS
14109 void
14110 i386_solaris_fix_up_eh_frame (segT sec)
14111 {
14112   if (flag_code == CODE_64BIT)
14113     elf_section_type (sec) = SHT_X86_64_UNWIND;
14114 }
14115 #endif
14116
14117 #ifdef TE_PE
14118 void
14119 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14120 {
14121   expressionS exp;
14122
14123   exp.X_op = O_secrel;
14124   exp.X_add_symbol = symbol;
14125   exp.X_add_number = 0;
14126   emit_expr (&exp, size);
14127 }
14128 #endif
14129
14130 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14131 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
14132
14133 bfd_vma
14134 x86_64_section_letter (int letter, const char **ptr_msg)
14135 {
14136   if (flag_code == CODE_64BIT)
14137     {
14138       if (letter == 'l')
14139         return SHF_X86_64_LARGE;
14140
14141       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14142     }
14143   else
14144     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14145   return -1;
14146 }
14147
14148 bfd_vma
14149 x86_64_section_word (char *str, size_t len)
14150 {
14151   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14152     return SHF_X86_64_LARGE;
14153
14154   return -1;
14155 }
14156
14157 static void
14158 handle_large_common (int small ATTRIBUTE_UNUSED)
14159 {
14160   if (flag_code != CODE_64BIT)
14161     {
14162       s_comm_internal (0, elf_common_parse);
14163       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14164     }
14165   else
14166     {
14167       static segT lbss_section;
14168       asection *saved_com_section_ptr = elf_com_section_ptr;
14169       asection *saved_bss_section = bss_section;
14170
14171       if (lbss_section == NULL)
14172         {
14173           flagword applicable;
14174           segT seg = now_seg;
14175           subsegT subseg = now_subseg;
14176
14177           /* The .lbss section is for local .largecomm symbols.  */
14178           lbss_section = subseg_new (".lbss", 0);
14179           applicable = bfd_applicable_section_flags (stdoutput);
14180           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14181           seg_info (lbss_section)->bss = 1;
14182
14183           subseg_set (seg, subseg);
14184         }
14185
14186       elf_com_section_ptr = &_bfd_elf_large_com_section;
14187       bss_section = lbss_section;
14188
14189       s_comm_internal (0, elf_common_parse);
14190
14191       elf_com_section_ptr = saved_com_section_ptr;
14192       bss_section = saved_bss_section;
14193     }
14194 }
14195 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */