gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2019 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef REGISTER_WARNINGS
  48 #define REGISTER_WARNINGS 1
  49 #endif
  50
  51 #ifndef INFER_ADDR_PREFIX
  52 #define INFER_ADDR_PREFIX 1
  53 #endif
  54
  55 #ifndef DEFAULT_ARCH
  56 #define DEFAULT_ARCH "i386"
  57 #endif
  58
  59 #ifndef INLINE
  60 #if __GNUC__ >= 2
  61 #define INLINE __inline__
  62 #else
  63 #define INLINE
  64 #endif
  65 #endif
  66
  67 /* Prefixes will be emitted in the order defined below.
  68    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  69    instruction, and so must come before any prefixes.
  70    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  71    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  72 #define WAIT_PREFIX     0
  73 #define SEG_PREFIX      1
  74 #define ADDR_PREFIX     2
  75 #define DATA_PREFIX     3
  76 #define REP_PREFIX      4
  77 #define HLE_PREFIX      REP_PREFIX
  78 #define BND_PREFIX      REP_PREFIX
  79 #define LOCK_PREFIX     5
  80 #define REX_PREFIX      6       /* must come last.  */
  81 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  82
  83 /* we define the syntax here (modulo base,index,scale syntax) */
  84 #define REGISTER_PREFIX '%'
  85 #define IMMEDIATE_PREFIX '$'
  86 #define ABSOLUTE_PREFIX '*'
  87
  88 /* these are the instruction mnemonic suffixes in AT&T syntax or
  89    memory operand size in Intel syntax.  */
  90 #define WORD_MNEM_SUFFIX  'w'
  91 #define BYTE_MNEM_SUFFIX  'b'
  92 #define SHORT_MNEM_SUFFIX 's'
  93 #define LONG_MNEM_SUFFIX  'l'
  94 #define QWORD_MNEM_SUFFIX  'q'
  95 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  96    in instructions.  */
  97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  98
  99 #define END_OF_INSN '\0'
 100
 101 /* This matches the C -> StaticRounding alias in the opcode table.  */
 102 #define commutative staticrounding
 103
 104 /*
 105   'templates' is for grouping together 'template' structures for opcodes
 106   of the same name.  This is only used for storing the insns in the grand
 107   ole hash table of insns.
 108   The templates themselves start at START and range up to (but not including)
 109   END.
 110   */
 111 typedef struct
 112 {
 113   const insn_template *start;
 114   const insn_template *end;
 115 }
 116 templates;
 117
 118 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 119 typedef struct
 120 {
 121   unsigned int regmem;  /* codes register or memory operand */
 122   unsigned int reg;     /* codes register operand (or extended opcode) */
 123   unsigned int mode;    /* how to interpret regmem & reg */
 124 }
 125 modrm_byte;
 126
 127 /* x86-64 extension prefix.  */
 128 typedef int rex_byte;
 129
 130 /* 386 opcode byte to code indirect addressing.  */
 131 typedef struct
 132 {
 133   unsigned base;
 134   unsigned index;
 135   unsigned scale;
 136 }
 137 sib_byte;
 138
 139 /* x86 arch names, types and features */
 140 typedef struct
 141 {
 142   const char *name;             /* arch name */
 143   unsigned int len;             /* arch string length */
 144   enum processor_type type;     /* arch type */
 145   i386_cpu_flags flags;         /* cpu feature flags */
 146   unsigned int skip;            /* show_arch should skip this. */
 147 }
 148 arch_entry;
 149
 150 /* Used to turn off indicated flags.  */
 151 typedef struct
 152 {
 153   const char *name;             /* arch name */
 154   unsigned int len;             /* arch string length */
 155   i386_cpu_flags flags;         /* cpu feature flags */
 156 }
 157 noarch_entry;
 158
 159 static void update_code_flag (int, int);
 160 static void set_code_flag (int);
 161 static void set_16bit_gcc_code_flag (int);
 162 static void set_intel_syntax (int);
 163 static void set_intel_mnemonic (int);
 164 static void set_allow_index_reg (int);
 165 static void set_check (int);
 166 static void set_cpu_arch (int);
 167 #ifdef TE_PE
 168 static void pe_directive_secrel (int);
 169 #endif
 170 static void signed_cons (int);
 171 static char *output_invalid (int c);
 172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 173                                     const char *);
 174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 175                                        const char *);
 176 static int i386_att_operand (char *);
 177 static int i386_intel_operand (char *, int);
 178 static int i386_intel_simplify (expressionS *);
 179 static int i386_intel_parse_name (const char *, expressionS *);
 180 static const reg_entry *parse_register (char *, char **);
 181 static char *parse_insn (char *, char *);
 182 static char *parse_operands (char *, const char *);
 183 static void swap_operands (void);
 184 static void swap_2_operands (int, int);
 185 static void optimize_imm (void);
 186 static void optimize_disp (void);
 187 static const insn_template *match_template (char);
 188 static int check_string (void);
 189 static int process_suffix (void);
 190 static int check_byte_reg (void);
 191 static int check_long_reg (void);
 192 static int check_qword_reg (void);
 193 static int check_word_reg (void);
 194 static int finalize_imm (void);
 195 static int process_operands (void);
 196 static const seg_entry *build_modrm_byte (void);
 197 static void output_insn (void);
 198 static void output_imm (fragS *, offsetT);
 199 static void output_disp (fragS *, offsetT);
 200 #ifndef I386COFF
 201 static void s_bss (int);
 202 #endif
 203 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 204 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 205
 206 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 207 static unsigned int x86_isa_1_used;
 208 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 209 static unsigned int x86_feature_2_used;
 210 /* Generate x86 used ISA and feature properties.  */
 211 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 212 #endif
 213
 214 static const char *default_arch = DEFAULT_ARCH;
 215
 216 /* This struct describes rounding control and SAE in the instruction.  */
 217 struct RC_Operation
 218 {
 219   enum rc_type
 220     {
 221       rne = 0,
 222       rd,
 223       ru,
 224       rz,
 225       saeonly
 226     } type;
 227   int operand;
 228 };
 229
 230 static struct RC_Operation rc_op;
 231
 232 /* The struct describes masking, applied to OPERAND in the instruction.
 233    MASK is a pointer to the corresponding mask register.  ZEROING tells
 234    whether merging or zeroing mask is used.  */
 235 struct Mask_Operation
 236 {
 237   const reg_entry *mask;
 238   unsigned int zeroing;
 239   /* The operand where this operation is associated.  */
 240   int operand;
 241 };
 242
 243 static struct Mask_Operation mask_op;
 244
 245 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 246    broadcast factor.  */
 247 struct Broadcast_Operation
 248 {
 249   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 250   int type;
 251
 252   /* Index of broadcasted operand.  */
 253   int operand;
 254
 255   /* Number of bytes to broadcast.  */
 256   int bytes;
 257 };
 258
 259 static struct Broadcast_Operation broadcast_op;
 260
 261 /* VEX prefix.  */
 262 typedef struct
 263 {
 264   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 265   unsigned char bytes[4];
 266   unsigned int length;
 267   /* Destination or source register specifier.  */
 268   const reg_entry *register_specifier;
 269 } vex_prefix;
 270
 271 /* 'md_assemble ()' gathers together information and puts it into a
 272    i386_insn.  */
 273
 274 union i386_op
 275   {
 276     expressionS *disps;
 277     expressionS *imms;
 278     const reg_entry *regs;
 279   };
 280
 281 enum i386_error
 282   {
 283     operand_size_mismatch,
 284     operand_type_mismatch,
 285     register_type_mismatch,
 286     number_of_operands_mismatch,
 287     invalid_instruction_suffix,
 288     bad_imm4,
 289     unsupported_with_intel_mnemonic,
 290     unsupported_syntax,
 291     unsupported,
 292     invalid_vsib_address,
 293     invalid_vector_register_set,
 294     unsupported_vector_index_register,
 295     unsupported_broadcast,
 296     broadcast_needed,
 297     unsupported_masking,
 298     mask_not_on_destination,
 299     no_default_mask,
 300     unsupported_rc_sae,
 301     rc_sae_operand_not_last_imm,
 302     invalid_register_operand,
 303   };
 304
 305 struct _i386_insn
 306   {
 307     /* TM holds the template for the insn were currently assembling.  */
 308     insn_template tm;
 309
 310     /* SUFFIX holds the instruction size suffix for byte, word, dword
 311        or qword, if given.  */
 312     char suffix;
 313
 314     /* OPERANDS gives the number of given operands.  */
 315     unsigned int operands;
 316
 317     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 318        of given register, displacement, memory operands and immediate
 319        operands.  */
 320     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 321
 322     /* TYPES [i] is the type (see above #defines) which tells us how to
 323        use OP[i] for the corresponding operand.  */
 324     i386_operand_type types[MAX_OPERANDS];
 325
 326     /* Displacement expression, immediate expression, or register for each
 327        operand.  */
 328     union i386_op op[MAX_OPERANDS];
 329
 330     /* Flags for operands.  */
 331     unsigned int flags[MAX_OPERANDS];
 332 #define Operand_PCrel 1
 333 #define Operand_Mem   2
 334
 335     /* Relocation type for operand */
 336     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 337
 338     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 339        the base index byte below.  */
 340     const reg_entry *base_reg;
 341     const reg_entry *index_reg;
 342     unsigned int log2_scale_factor;
 343
 344     /* SEG gives the seg_entries of this insn.  They are zero unless
 345        explicit segment overrides are given.  */
 346     const seg_entry *seg[2];
 347
 348     /* Copied first memory operand string, for re-checking.  */
 349     char *memop1_string;
 350
 351     /* PREFIX holds all the given prefix opcodes (usually null).
 352        PREFIXES is the number of prefix opcodes.  */
 353     unsigned int prefixes;
 354     unsigned char prefix[MAX_PREFIXES];
 355
 356     /* Has MMX register operands.  */
 357     bfd_boolean has_regmmx;
 358
 359     /* Has XMM register operands.  */
 360     bfd_boolean has_regxmm;
 361
 362     /* Has YMM register operands.  */
 363     bfd_boolean has_regymm;
 364
 365     /* Has ZMM register operands.  */
 366     bfd_boolean has_regzmm;
 367
 368     /* RM and SIB are the modrm byte and the sib byte where the
 369        addressing modes of this insn are encoded.  */
 370     modrm_byte rm;
 371     rex_byte rex;
 372     rex_byte vrex;
 373     sib_byte sib;
 374     vex_prefix vex;
 375
 376     /* Masking attributes.  */
 377     struct Mask_Operation *mask;
 378
 379     /* Rounding control and SAE attributes.  */
 380     struct RC_Operation *rounding;
 381
 382     /* Broadcasting attributes.  */
 383     struct Broadcast_Operation *broadcast;
 384
 385     /* Compressed disp8*N attribute.  */
 386     unsigned int memshift;
 387
 388     /* Prefer load or store in encoding.  */
 389     enum
 390       {
 391         dir_encoding_default = 0,
 392         dir_encoding_load,
 393         dir_encoding_store,
 394         dir_encoding_swap
 395       } dir_encoding;
 396
 397     /* Prefer 8bit or 32bit displacement in encoding.  */
 398     enum
 399       {
 400         disp_encoding_default = 0,
 401         disp_encoding_8bit,
 402         disp_encoding_32bit
 403       } disp_encoding;
 404
 405     /* Prefer the REX byte in encoding.  */
 406     bfd_boolean rex_encoding;
 407
 408     /* Disable instruction size optimization.  */
 409     bfd_boolean no_optimize;
 410
 411     /* How to encode vector instructions.  */
 412     enum
 413       {
 414         vex_encoding_default = 0,
 415         vex_encoding_vex2,
 416         vex_encoding_vex3,
 417         vex_encoding_evex
 418       } vec_encoding;
 419
 420     /* REP prefix.  */
 421     const char *rep_prefix;
 422
 423     /* HLE prefix.  */
 424     const char *hle_prefix;
 425
 426     /* Have BND prefix.  */
 427     const char *bnd_prefix;
 428
 429     /* Have NOTRACK prefix.  */
 430     const char *notrack_prefix;
 431
 432     /* Error message.  */
 433     enum i386_error error;
 434   };
 435
 436 typedef struct _i386_insn i386_insn;
 437
 438 /* Link RC type with corresponding string, that'll be looked for in
 439    asm.  */
 440 struct RC_name
 441 {
 442   enum rc_type type;
 443   const char *name;
 444   unsigned int len;
 445 };
 446
 447 static const struct RC_name RC_NamesTable[] =
 448 {
 449   {  rne, STRING_COMMA_LEN ("rn-sae") },
 450   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 451   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 452   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 453   {  saeonly,  STRING_COMMA_LEN ("sae") },
 454 };
 455
 456 /* List of chars besides those in app.c:symbol_chars that can start an
 457    operand.  Used to prevent the scrubber eating vital white-space.  */
 458 const char extra_symbol_chars[] = "*%-([{}"
 459 #ifdef LEX_AT
 460         "@"
 461 #endif
 462 #ifdef LEX_QM
 463         "?"
 464 #endif
 465         ;
 466
 467 #if (defined (TE_I386AIX)                               \
 468      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 469          && !defined (TE_GNU)                           \
 470          && !defined (TE_LINUX)                         \
 471          && !defined (TE_NACL)                          \
 472          && !defined (TE_FreeBSD)                       \
 473          && !defined (TE_DragonFly)                     \
 474          && !defined (TE_NetBSD)))
 475 /* This array holds the chars that always start a comment.  If the
 476    pre-processor is disabled, these aren't very useful.  The option
 477    --divide will remove '/' from this list.  */
 478 const char *i386_comment_chars = "#/";
 479 #define SVR4_COMMENT_CHARS 1
 480 #define PREFIX_SEPARATOR '\\'
 481
 482 #else
 483 const char *i386_comment_chars = "#";
 484 #define PREFIX_SEPARATOR '/'
 485 #endif
 486
 487 /* This array holds the chars that only start a comment at the beginning of
 488    a line.  If the line seems to have the form '# 123 filename'
 489    .line and .file directives will appear in the pre-processed output.
 490    Note that input_file.c hand checks for '#' at the beginning of the
 491    first line of the input file.  This is because the compiler outputs
 492    #NO_APP at the beginning of its output.
 493    Also note that comments started like this one will always work if
 494    '/' isn't otherwise defined.  */
 495 const char line_comment_chars[] = "#/";
 496
 497 const char line_separator_chars[] = ";";
 498
 499 /* Chars that can be used to separate mant from exp in floating point
 500    nums.  */
 501 const char EXP_CHARS[] = "eE";
 502
 503 /* Chars that mean this number is a floating point constant
 504    As in 0f12.456
 505    or    0d1.2345e12.  */
 506 const char FLT_CHARS[] = "fFdDxX";
 507
 508 /* Tables for lexical analysis.  */
 509 static char mnemonic_chars[256];
 510 static char register_chars[256];
 511 static char operand_chars[256];
 512 static char identifier_chars[256];
 513 static char digit_chars[256];
 514
 515 /* Lexical macros.  */
 516 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 517 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 518 #define is_register_char(x) (register_chars[(unsigned char) x])
 519 #define is_space_char(x) ((x) == ' ')
 520 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 521 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 522
 523 /* All non-digit non-letter characters that may occur in an operand.  */
 524 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 525
 526 /* md_assemble() always leaves the strings it's passed unaltered.  To
 527    effect this we maintain a stack of saved characters that we've smashed
 528    with '\0's (indicating end of strings for various sub-fields of the
 529    assembler instruction).  */
 530 static char save_stack[32];
 531 static char *save_stack_p;
 532 #define END_STRING_AND_SAVE(s) \
 533         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 534 #define RESTORE_END_STRING(s) \
 535         do { *(s) = *--save_stack_p; } while (0)
 536
 537 /* The instruction we're assembling.  */
 538 static i386_insn i;
 539
 540 /* Possible templates for current insn.  */
 541 static const templates *current_templates;
 542
 543 /* Per instruction expressionS buffers: max displacements & immediates.  */
 544 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 545 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 546
 547 /* Current operand we are working on.  */
 548 static int this_operand = -1;
 549
 550 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 551    these.  */
 552
 553 enum flag_code {
 554         CODE_32BIT,
 555         CODE_16BIT,
 556         CODE_64BIT };
 557
 558 static enum flag_code flag_code;
 559 static unsigned int object_64bit;
 560 static unsigned int disallow_64bit_reloc;
 561 static int use_rela_relocations = 0;
 562
 563 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 564      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 565      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 566
 567 /* The ELF ABI to use.  */
 568 enum x86_elf_abi
 569 {
 570   I386_ABI,
 571   X86_64_ABI,
 572   X86_64_X32_ABI
 573 };
 574
 575 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 576 #endif
 577
 578 #if defined (TE_PE) || defined (TE_PEP)
 579 /* Use big object file format.  */
 580 static int use_big_obj = 0;
 581 #endif
 582
 583 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 584 /* 1 if generating code for a shared library.  */
 585 static int shared = 0;
 586 #endif
 587
 588 /* 1 for intel syntax,
 589    0 if att syntax.  */
 590 static int intel_syntax = 0;
 591
 592 /* 1 for Intel64 ISA,
 593    0 if AMD64 ISA.  */
 594 static int intel64;
 595
 596 /* 1 for intel mnemonic,
 597    0 if att mnemonic.  */
 598 static int intel_mnemonic = !SYSV386_COMPAT;
 599
 600 /* 1 if pseudo registers are permitted.  */
 601 static int allow_pseudo_reg = 0;
 602
 603 /* 1 if register prefix % not required.  */
 604 static int allow_naked_reg = 0;
 605
 606 /* 1 if the assembler should add BND prefix for all control-transferring
 607    instructions supporting it, even if this prefix wasn't specified
 608    explicitly.  */
 609 static int add_bnd_prefix = 0;
 610
 611 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 612 static int allow_index_reg = 0;
 613
 614 /* 1 if the assembler should ignore LOCK prefix, even if it was
 615    specified explicitly.  */
 616 static int omit_lock_prefix = 0;
 617
 618 /* 1 if the assembler should encode lfence, mfence, and sfence as
 619    "lock addl $0, (%{re}sp)".  */
 620 static int avoid_fence = 0;
 621
 622 /* 1 if the assembler should generate relax relocations.  */
 623
 624 static int generate_relax_relocations
 625   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 626
 627 static enum check_kind
 628   {
 629     check_none = 0,
 630     check_warning,
 631     check_error
 632   }
 633 sse_check, operand_check = check_warning;
 634
 635 /* Optimization:
 636    1. Clear the REX_W bit with register operand if possible.
 637    2. Above plus use 128bit vector instruction to clear the full vector
 638       register.
 639  */
 640 static int optimize = 0;
 641
 642 /* Optimization:
 643    1. Clear the REX_W bit with register operand if possible.
 644    2. Above plus use 128bit vector instruction to clear the full vector
 645       register.
 646    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 647       "testb $imm7,%r8".
 648  */
 649 static int optimize_for_space = 0;
 650
 651 /* Register prefix used for error message.  */
 652 static const char *register_prefix = "%";
 653
 654 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 655    leave, push, and pop instructions so that gcc has the same stack
 656    frame as in 32 bit mode.  */
 657 static char stackop_size = '\0';
 658
 659 /* Non-zero to optimize code alignment.  */
 660 int optimize_align_code = 1;
 661
 662 /* Non-zero to quieten some warnings.  */
 663 static int quiet_warnings = 0;
 664
 665 /* CPU name.  */
 666 static const char *cpu_arch_name = NULL;
 667 static char *cpu_sub_arch_name = NULL;
 668
 669 /* CPU feature flags.  */
 670 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 671
 672 /* If we have selected a cpu we are generating instructions for.  */
 673 static int cpu_arch_tune_set = 0;
 674
 675 /* Cpu we are generating instructions for.  */
 676 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 677
 678 /* CPU feature flags of cpu we are generating instructions for.  */
 679 static i386_cpu_flags cpu_arch_tune_flags;
 680
 681 /* CPU instruction set architecture used.  */
 682 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 683
 684 /* CPU feature flags of instruction set architecture used.  */
 685 i386_cpu_flags cpu_arch_isa_flags;
 686
 687 /* If set, conditional jumps are not automatically promoted to handle
 688    larger than a byte offset.  */
 689 static unsigned int no_cond_jump_promotion = 0;
 690
 691 /* Encode SSE instructions with VEX prefix.  */
 692 static unsigned int sse2avx;
 693
 694 /* Encode scalar AVX instructions with specific vector length.  */
 695 static enum
 696   {
 697     vex128 = 0,
 698     vex256
 699   } avxscalar;
 700
 701 /* Encode VEX WIG instructions with specific vex.w.  */
 702 static enum
 703   {
 704     vexw0 = 0,
 705     vexw1
 706   } vexwig;
 707
 708 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 709 static enum
 710   {
 711     evexl128 = 0,
 712     evexl256,
 713     evexl512
 714   } evexlig;
 715
 716 /* Encode EVEX WIG instructions with specific evex.w.  */
 717 static enum
 718   {
 719     evexw0 = 0,
 720     evexw1
 721   } evexwig;
 722
 723 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 724 static enum rc_type evexrcig = rne;
 725
 726 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 727 static symbolS *GOT_symbol;
 728
 729 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 730 unsigned int x86_dwarf2_return_column;
 731
 732 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 733 int x86_cie_data_alignment;
 734
 735 /* Interface to relax_segment.
 736    There are 3 major relax states for 386 jump insns because the
 737    different types of jumps add different sizes to frags when we're
 738    figuring out what sort of jump to choose to reach a given label.  */
 739
 740 /* Types.  */
 741 #define UNCOND_JUMP 0
 742 #define COND_JUMP 1
 743 #define COND_JUMP86 2
 744
 745 /* Sizes.  */
 746 #define CODE16  1
 747 #define SMALL   0
 748 #define SMALL16 (SMALL | CODE16)
 749 #define BIG     2
 750 #define BIG16   (BIG | CODE16)
 751
 752 #ifndef INLINE
 753 #ifdef __GNUC__
 754 #define INLINE __inline__
 755 #else
 756 #define INLINE
 757 #endif
 758 #endif
 759
 760 #define ENCODE_RELAX_STATE(type, size) \
 761   ((relax_substateT) (((type) << 2) | (size)))
 762 #define TYPE_FROM_RELAX_STATE(s) \
 763   ((s) >> 2)
 764 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 765     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 766
 767 /* This table is used by relax_frag to promote short jumps to long
 768    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 769    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 770    don't allow a short jump in a 32 bit code segment to be promoted to
 771    a 16 bit offset jump because it's slower (requires data size
 772    prefix), and doesn't work, unless the destination is in the bottom
 773    64k of the code segment (The top 16 bits of eip are zeroed).  */
 774
 775 const relax_typeS md_relax_table[] =
 776 {
 777   /* The fields are:
 778      1) most positive reach of this state,
 779      2) most negative reach of this state,
 780      3) how many bytes this mode will have in the variable part of the frag
 781      4) which index into the table to try if we can't fit into this one.  */
 782
 783   /* UNCOND_JUMP states.  */
 784   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 785   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 786   /* dword jmp adds 4 bytes to frag:
 787      0 extra opcode bytes, 4 displacement bytes.  */
 788   {0, 0, 4, 0},
 789   /* word jmp adds 2 byte2 to frag:
 790      0 extra opcode bytes, 2 displacement bytes.  */
 791   {0, 0, 2, 0},
 792
 793   /* COND_JUMP states.  */
 794   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 795   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 796   /* dword conditionals adds 5 bytes to frag:
 797      1 extra opcode byte, 4 displacement bytes.  */
 798   {0, 0, 5, 0},
 799   /* word conditionals add 3 bytes to frag:
 800      1 extra opcode byte, 2 displacement bytes.  */
 801   {0, 0, 3, 0},
 802
 803   /* COND_JUMP86 states.  */
 804   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 805   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 806   /* dword conditionals adds 5 bytes to frag:
 807      1 extra opcode byte, 4 displacement bytes.  */
 808   {0, 0, 5, 0},
 809   /* word conditionals add 4 bytes to frag:
 810      1 displacement byte and a 3 byte long branch insn.  */
 811   {0, 0, 4, 0}
 812 };
 813
 814 static const arch_entry cpu_arch[] =
 815 {
 816   /* Do not replace the first two entries - i386_target_format()
 817      relies on them being there in this order.  */
 818   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 819     CPU_GENERIC32_FLAGS, 0 },
 820   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 821     CPU_GENERIC64_FLAGS, 0 },
 822   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 823     CPU_NONE_FLAGS, 0 },
 824   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 825     CPU_I186_FLAGS, 0 },
 826   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 827     CPU_I286_FLAGS, 0 },
 828   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 829     CPU_I386_FLAGS, 0 },
 830   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 831     CPU_I486_FLAGS, 0 },
 832   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 833     CPU_I586_FLAGS, 0 },
 834   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 835     CPU_I686_FLAGS, 0 },
 836   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 837     CPU_I586_FLAGS, 0 },
 838   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 839     CPU_PENTIUMPRO_FLAGS, 0 },
 840   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 841     CPU_P2_FLAGS, 0 },
 842   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 843     CPU_P3_FLAGS, 0 },
 844   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 845     CPU_P4_FLAGS, 0 },
 846   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 847     CPU_CORE_FLAGS, 0 },
 848   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 849     CPU_NOCONA_FLAGS, 0 },
 850   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 851     CPU_CORE_FLAGS, 1 },
 852   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 853     CPU_CORE_FLAGS, 0 },
 854   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 855     CPU_CORE2_FLAGS, 1 },
 856   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 857     CPU_CORE2_FLAGS, 0 },
 858   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 859     CPU_COREI7_FLAGS, 0 },
 860   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 861     CPU_L1OM_FLAGS, 0 },
 862   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 863     CPU_K1OM_FLAGS, 0 },
 864   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 865     CPU_IAMCU_FLAGS, 0 },
 866   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 867     CPU_K6_FLAGS, 0 },
 868   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 869     CPU_K6_2_FLAGS, 0 },
 870   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 871     CPU_ATHLON_FLAGS, 0 },
 872   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 873     CPU_K8_FLAGS, 1 },
 874   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 875     CPU_K8_FLAGS, 0 },
 876   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 877     CPU_K8_FLAGS, 0 },
 878   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 879     CPU_AMDFAM10_FLAGS, 0 },
 880   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 881     CPU_BDVER1_FLAGS, 0 },
 882   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 883     CPU_BDVER2_FLAGS, 0 },
 884   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 885     CPU_BDVER3_FLAGS, 0 },
 886   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 887     CPU_BDVER4_FLAGS, 0 },
 888   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
 889     CPU_ZNVER1_FLAGS, 0 },
 890   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
 891     CPU_ZNVER2_FLAGS, 0 },
 892   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 893     CPU_BTVER1_FLAGS, 0 },
 894   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 895     CPU_BTVER2_FLAGS, 0 },
 896   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 897     CPU_8087_FLAGS, 0 },
 898   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 899     CPU_287_FLAGS, 0 },
 900   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 901     CPU_387_FLAGS, 0 },
 902   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
 903     CPU_687_FLAGS, 0 },
 904   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
 905     CPU_CMOV_FLAGS, 0 },
 906   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
 907     CPU_FXSR_FLAGS, 0 },
 908   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 909     CPU_MMX_FLAGS, 0 },
 910   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 911     CPU_SSE_FLAGS, 0 },
 912   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 913     CPU_SSE2_FLAGS, 0 },
 914   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 915     CPU_SSE3_FLAGS, 0 },
 916   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 917     CPU_SSSE3_FLAGS, 0 },
 918   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 919     CPU_SSE4_1_FLAGS, 0 },
 920   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 921     CPU_SSE4_2_FLAGS, 0 },
 922   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 923     CPU_SSE4_2_FLAGS, 0 },
 924   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 925     CPU_AVX_FLAGS, 0 },
 926   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 927     CPU_AVX2_FLAGS, 0 },
 928   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 929     CPU_AVX512F_FLAGS, 0 },
 930   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
 931     CPU_AVX512CD_FLAGS, 0 },
 932   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
 933     CPU_AVX512ER_FLAGS, 0 },
 934   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
 935     CPU_AVX512PF_FLAGS, 0 },
 936   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
 937     CPU_AVX512DQ_FLAGS, 0 },
 938   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
 939     CPU_AVX512BW_FLAGS, 0 },
 940   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
 941     CPU_AVX512VL_FLAGS, 0 },
 942   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
 943     CPU_VMX_FLAGS, 0 },
 944   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
 945     CPU_VMFUNC_FLAGS, 0 },
 946   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
 947     CPU_SMX_FLAGS, 0 },
 948   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
 949     CPU_XSAVE_FLAGS, 0 },
 950   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
 951     CPU_XSAVEOPT_FLAGS, 0 },
 952   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
 953     CPU_XSAVEC_FLAGS, 0 },
 954   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
 955     CPU_XSAVES_FLAGS, 0 },
 956   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
 957     CPU_AES_FLAGS, 0 },
 958   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
 959     CPU_PCLMUL_FLAGS, 0 },
 960   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
 961     CPU_PCLMUL_FLAGS, 1 },
 962   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
 963     CPU_FSGSBASE_FLAGS, 0 },
 964   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
 965     CPU_RDRND_FLAGS, 0 },
 966   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
 967     CPU_F16C_FLAGS, 0 },
 968   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
 969     CPU_BMI2_FLAGS, 0 },
 970   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
 971     CPU_FMA_FLAGS, 0 },
 972   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
 973     CPU_FMA4_FLAGS, 0 },
 974   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
 975     CPU_XOP_FLAGS, 0 },
 976   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
 977     CPU_LWP_FLAGS, 0 },
 978   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
 979     CPU_MOVBE_FLAGS, 0 },
 980   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
 981     CPU_CX16_FLAGS, 0 },
 982   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
 983     CPU_EPT_FLAGS, 0 },
 984   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
 985     CPU_LZCNT_FLAGS, 0 },
 986   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
 987     CPU_HLE_FLAGS, 0 },
 988   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
 989     CPU_RTM_FLAGS, 0 },
 990   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
 991     CPU_INVPCID_FLAGS, 0 },
 992   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
 993     CPU_CLFLUSH_FLAGS, 0 },
 994   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
 995     CPU_NOP_FLAGS, 0 },
 996   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
 997     CPU_SYSCALL_FLAGS, 0 },
 998   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
 999     CPU_RDTSCP_FLAGS, 0 },
1000   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1001     CPU_3DNOW_FLAGS, 0 },
1002   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1003     CPU_3DNOWA_FLAGS, 0 },
1004   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1005     CPU_PADLOCK_FLAGS, 0 },
1006   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1007     CPU_SVME_FLAGS, 1 },
1008   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1009     CPU_SVME_FLAGS, 0 },
1010   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1011     CPU_SSE4A_FLAGS, 0 },
1012   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1013     CPU_ABM_FLAGS, 0 },
1014   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1015     CPU_BMI_FLAGS, 0 },
1016   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1017     CPU_TBM_FLAGS, 0 },
1018   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1019     CPU_ADX_FLAGS, 0 },
1020   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1021     CPU_RDSEED_FLAGS, 0 },
1022   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1023     CPU_PRFCHW_FLAGS, 0 },
1024   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1025     CPU_SMAP_FLAGS, 0 },
1026   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1027     CPU_MPX_FLAGS, 0 },
1028   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1029     CPU_SHA_FLAGS, 0 },
1030   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1031     CPU_CLFLUSHOPT_FLAGS, 0 },
1032   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1033     CPU_PREFETCHWT1_FLAGS, 0 },
1034   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1035     CPU_SE1_FLAGS, 0 },
1036   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1037     CPU_CLWB_FLAGS, 0 },
1038   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1039     CPU_AVX512IFMA_FLAGS, 0 },
1040   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1041     CPU_AVX512VBMI_FLAGS, 0 },
1042   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1043     CPU_AVX512_4FMAPS_FLAGS, 0 },
1044   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1045     CPU_AVX512_4VNNIW_FLAGS, 0 },
1046   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1047     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1048   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1049     CPU_AVX512_VBMI2_FLAGS, 0 },
1050   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1051     CPU_AVX512_VNNI_FLAGS, 0 },
1052   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1053     CPU_AVX512_BITALG_FLAGS, 0 },
1054   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1055     CPU_CLZERO_FLAGS, 0 },
1056   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1057     CPU_MWAITX_FLAGS, 0 },
1058   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1059     CPU_OSPKE_FLAGS, 0 },
1060   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1061     CPU_RDPID_FLAGS, 0 },
1062   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1063     CPU_PTWRITE_FLAGS, 0 },
1064   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1065     CPU_IBT_FLAGS, 0 },
1066   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1067     CPU_SHSTK_FLAGS, 0 },
1068   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1069     CPU_GFNI_FLAGS, 0 },
1070   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1071     CPU_VAES_FLAGS, 0 },
1072   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1073     CPU_VPCLMULQDQ_FLAGS, 0 },
1074   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1075     CPU_WBNOINVD_FLAGS, 0 },
1076   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1077     CPU_PCONFIG_FLAGS, 0 },
1078   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1079     CPU_WAITPKG_FLAGS, 0 },
1080   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1081     CPU_CLDEMOTE_FLAGS, 0 },
1082   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1083     CPU_MOVDIRI_FLAGS, 0 },
1084   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1085     CPU_MOVDIR64B_FLAGS, 0 },
1086   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1087     CPU_AVX512_BF16_FLAGS, 0 },
1088   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1089     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1090   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1091     CPU_ENQCMD_FLAGS, 0 },
1092 };
1093
1094 static const noarch_entry cpu_noarch[] =
1095 {
       /* Each entry pairs a "no<feature>" name with the CPU_ANY_*_FLAGS
          initializer for that same feature.  Keep the two halves of an
          entry in step: a name paired with another feature's flags makes
          that name act on the wrong feature bits.
          NOTE(review): the CPU_ANY_*_FLAGS macros are defined outside this
          file (presumably opcodes/i386-init.h) -- confirm that
          CPU_ANY_AVX512_VP2INTERSECT_FLAGS is provided there.  */
1096   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1097   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1098   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1099   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1100   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1101   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1102   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1103   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1104   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1105   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1106   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1107   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1108   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1109   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1110   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1111   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1112   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1113   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1114   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1115   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1116   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1117   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1118   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1119   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1120   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1121   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1122   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1123   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1124   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1125   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1126   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1127   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1128   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1129   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1130   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1131   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1132   { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1133   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1134 };
1135
1136 #ifdef I386COFF
1137 /* PE variant of s_lcomm_internal (gas/read.c) whose alignment operand
1138    may be left out.  Gives SYMBOLP SIZE bytes through bss_alloc and
1139    returns it, or returns NULL when parse_align yields (addressT) -1.  */
1140
1141 static symbolS *
1142 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1143 {
1144   addressT align;
1145
1146   SKIP_WHITESPACE ();
1147
1148   if (!needs_align || *input_line_pointer != ',')
1149     {
1150       /* No alignment operand to read: pick one from SIZE.  */
1151       align = size >= 8 ? 3 : size >= 4 ? 2 : size >= 2 ? 1 : 0;
1152     }
1153   else
1154     {
1155       align = parse_align (needs_align - 1);
1156       if (align == (addressT) -1)
1157         return NULL;
1158     }
1159
1160   bss_alloc (symbolP, size, align);
1161   return symbolP;
1162 }
1163
1164 /* Pseudo-op handler (see "lcomm" in md_pseudo_table): call
1165    s_comm_internal with twice NEEDS_ALIGN and pe_lcomm_internal.  */
1166
1167 static void
1168 pe_lcomm (int needs_align)
1169 {
1170   s_comm_internal (2 * needs_align, pe_lcomm_internal);
1171 }
1172 #endif
1177
1178 const pseudo_typeS md_pseudo_table[] =
1179 {
       /* Pseudo-ops specific to this target.  Every entry is
          { name, handler, integer }; the name carries no leading dot.
          NOTE(review): the integer is presumably handed to the handler as
          its int argument (pe_lcomm above takes one) -- confirm against
          the pseudo_typeS declaration.  */

       /* "align" uses s_align_bytes unless OBJ_AOUT or USE_ALIGN_PTWO is
          defined, in which case s_align_ptwo is used.  */
1180 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1181   {"align", s_align_bytes, 0},
1182 #else
1183   {"align", s_align_ptwo, 0},
1184 #endif
1185   {"arch", set_cpu_arch, 0},
       /* I386COFF builds provide "lcomm" (pe_lcomm) and no "bss" entry;
          all other builds provide "bss" only.  */
1186 #ifndef I386COFF
1187   {"bss", s_bss, 0},
1188 #else
1189   {"lcomm", pe_lcomm, 1},
1190 #endif
1191   {"ffloat", float_cons, 'f'},
1192   {"dfloat", float_cons, 'd'},
1193   {"tfloat", float_cons, 'x'},
1194   {"value", cons, 2},
1195   {"slong", signed_cons, 4},
1196   {"noopt", s_ignore, 0},
1197   {"optim", s_ignore, 0},
1198   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1199   {"code16", set_code_flag, CODE_16BIT},
1200   {"code32", set_code_flag, CODE_32BIT},
       /* "code64" exists only when BFD64 is defined.  */
1201 #ifdef BFD64
1202   {"code64", set_code_flag, CODE_64BIT},
1203 #endif
1204   {"intel_syntax", set_intel_syntax, 1},
1205   {"att_syntax", set_intel_syntax, 0},
1206   {"intel_mnemonic", set_intel_mnemonic, 1},
1207   {"att_mnemonic", set_intel_mnemonic, 0},
1208   {"allow_index_reg", set_allow_index_reg, 1},
1209   {"disallow_index_reg", set_allow_index_reg, 0},
1210   {"sse_check", set_check, 0},
1211   {"operand_check", set_check, 1},
       /* ELF-capable builds add "largecomm"; every other build adds the
          DWARF2 "file", "loc" and "loc_mark_labels" entries here.  */
1212 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1213   {"largecomm", handle_large_common, 0},
1214 #else
1215   {"file", dwarf2_directive_file, 0},
1216   {"loc", dwarf2_directive_loc, 0},
1217   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1218 #endif
1219 #ifdef TE_PE
1220   {"secrel32", pe_directive_secrel, 0},
1221 #endif
       /* All-zero entry closing the table (presumably the end marker the
          table's reader looks for -- confirm).  */
1222   {0, 0, 0}
1223 };
1224
1225 /* For interface with expression ().
        NOTE(review): pe_lcomm_internal, defined earlier in this file under
        I386COFF, already reads input_line_pointer, so a declaration
        presumably also arrives through an included header -- confirm
        whether this extern is still needed.  */
1226 extern char *input_line_pointer;
1227
1228 /* Hash table for instruction mnemonic lookup.  It has no initializer,
        so it starts out as a null pointer.  */
1229 static struct hash_control *op_hash;
1230
1231 /* Hash table for register lookup.  It likewise starts out as a null
        pointer.  */
1232 static struct hash_control *reg_hash;
1233 \f
1234   /* Various efficient no-op patterns for aligning code labels.
1235      Note: Don't try to assemble the instructions in the comments.
1236      0L and 0w are not legal.
          Each fNN_K / alt_K array holds one K-byte instruction.  */
1237 static const unsigned char f32_1[] =
1238   {0x90};                               /* nop                  */
1239 static const unsigned char f32_2[] =
1240   {0x66,0x90};                          /* xchg %ax,%ax         */
1241 static const unsigned char f32_3[] =
1242   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1243 static const unsigned char f32_4[] =
1244   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1245 static const unsigned char f32_6[] =
1246   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1247 static const unsigned char f32_7[] =
1248   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1249 static const unsigned char f16_3[] =
1250   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1251 static const unsigned char f16_4[] =
1252   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
     /* Opcode bytes only; i386_generate_nops writes the displacement that
        follows them.  jump16_disp32 is the form it uses when flag_code is
        CODE_16BIT.  */
1253 static const unsigned char jump_disp8[] =
1254   {0xeb};                               /* jmp disp8           */
1255 static const unsigned char jump32_disp32[] =
1256   {0xe9};                               /* jmp disp32          */
1257 static const unsigned char jump16_disp32[] =
1258   {0x66,0xe9};                          /* jmp disp32          */
1259 /* 32-bit NOP patterns.  Entry N - 1 is the N-byte pattern; there is no
        5-byte pattern, so that slot is NULL and i386_output_nops falls
        back to a shorter one.  */
1260 static const unsigned char *const f32_patt[] = {
1261   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1262 };
1263 /* 16-bit NOP patterns, indexed the same way.  The 1- and 2-byte
        entries are shared with the 32-bit table.  */
1264 static const unsigned char *const f16_patt[] = {
1265   f32_1, f32_2, f16_3, f16_4
1266 };
1267 /* nopl (%[re]ax) */
1268 static const unsigned char alt_3[] =
1269   {0x0f,0x1f,0x00};
1270 /* nopl 0(%[re]ax) */
1271 static const unsigned char alt_4[] =
1272   {0x0f,0x1f,0x40,0x00};
1273 /* nopl 0(%[re]ax,%[re]ax,1) */
1274 static const unsigned char alt_5[] =
1275   {0x0f,0x1f,0x44,0x00,0x00};
1276 /* nopw 0(%[re]ax,%[re]ax,1) */
1277 static const unsigned char alt_6[] =
1278   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1279 /* nopl 0L(%[re]ax) */
1280 static const unsigned char alt_7[] =
1281   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1282 /* nopl 0L(%[re]ax,%[re]ax,1) */
1283 static const unsigned char alt_8[] =
1284   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1285 /* nopw 0L(%[re]ax,%[re]ax,1) */
1286 static const unsigned char alt_9[] =
1287   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1288 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1289 static const unsigned char alt_10[] =
1290   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1291 /* data16 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1292 static const unsigned char alt_11[] =
1293   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1294 /* 32-bit and 64-bit NOP patterns, 1 to 11 bytes long.  Entry N - 1 is
        the N-byte pattern; this table has no NULL slot.  */
1295 static const unsigned char *const alt_patt[] = {
1296   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1297   alt_9, alt_10, alt_11
1298 };
1299
1300 /* Write COUNT bytes of NOP padding at WHERE using the table PATT, in
1301    which entry N - 1 is the N-byte NOP or NULL when that length has no
1302    pattern.  No single NOP is longer than MAX_SINGLE_NOP_SIZE bytes.  */
1303
1304 static void
1305 i386_output_nops (char *where, const unsigned char *const *patt,
1306                   int count, int max_single_nop_size)
1307 {
1308   const unsigned char *pattern;
1309   int tail;
1310   int pos = 0;
1311   int bulk;
1312
1313   if (max_single_nop_size < 1)
1314     {
1315       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1316                 max_single_nop_size);
1317       return;
1318     }
1319
1320   /* Step down one size when the requested length has no pattern.  */
1321   if (patt[max_single_nop_size - 1] == NULL)
1322     max_single_nop_size--;
1323   pattern = patt[max_single_nop_size - 1];
1324
1325   /* The longest NOPs go first; TAIL is whatever is left over.  */
1326   tail = count % max_single_nop_size;
1327   bulk = count - tail;
1328   while (pos < bulk)
1329     {
1330       memcpy (where + pos, pattern, max_single_nop_size);
1331       pos += max_single_nop_size;
1332     }
1333
1334   if (tail == 0)
1335     return;
1336
1337   pattern = patt[tail - 1];
1338   if (pattern != NULL)
1339     {
1340       memcpy (where + pos, pattern, tail);
1341       return;
1342     }
1343
1344   /* No TAIL-byte pattern: use the next shorter one plus a one-byte NOP.  */
1345   tail--;
1346   memcpy (where + pos, patt[tail - 1], tail);
1347   where[pos + tail] = *patt[0];
1348 }
1351
1352 static INLINE int
1353 fits_in_imm7 (offsetT num)
1354 {
1355   return (num & ~(offsetT) 0x7f) == 0;  /* Only bits 0-6 may be set.  */
1356 }
1357
1358 static INLINE int
1359 fits_in_imm31 (offsetT num)
1360 {
1361   return (num & ~(offsetT) 0x7fffffff) == 0;  /* Only bits 0-30 may be set.  */
1362 }
1363
1364 /* Generate COUNT bytes of NOP padding at WHERE for frag FRAGP.  LIMIT
1365    is the maximum size of a single NOP instruction; 0 selects the
        largest size in the chosen pattern table.  Only rs_fill_nop and
        rs_align_code frags are handled; any other frag type returns
        without writing anything.  For rs_align_code frags FRAGP->fr_var
        is set to COUNT.  When COUNT divided by the table's largest NOP
        size exceeds the per-table NOP limit, a jump over the padding is
        written first and only the bytes after it are filled with NOPs.
        Errors are reported through as_bad_where and leave the padding
        unwritten.  */
1366
1367 void
1368 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1369 {
1370   const unsigned char *const *patt = NULL;
1371   int max_single_nop_size;
1372   /* Maximum number of NOPs before switching to jump over NOPs.  */
1373   int max_number_of_nops;
1374
1375   switch (fragP->fr_type)
1376     {
1377     case rs_fill_nop:
1378     case rs_align_code:
1379       break;
1380     default:
1381       return;
1382     }
1383
1384   /* We need to decide which NOP sequence to use for 32bit and
1385      64bit. When -mtune= is used:
1386
1387      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM,
1388      PROCESSOR_PENTIUMPRO, PROCESSOR_IAMCU and PROCESSOR_GENERIC32,
          f32_patt will be used.
1389      2. For the rest, alt_patt will be used.
1390
1391      When -mtune= isn't used, alt_patt will be used if
1392      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1393      be used.
1394
1395      When -march= or .arch is used, we can't use anything beyond
1396      cpu_arch_isa_flags.   */
1397
1398   if (flag_code == CODE_16BIT)
1399     {
1400       patt = f16_patt;
1401       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1402       /* Limit number of NOPs to 2 in 16-bit mode.  */
1403       max_number_of_nops = 2;
1404     }
1405   else
1406     {
1407       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1408         {
1409           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1410           switch (cpu_arch_tune)
1411             {
1412             case PROCESSOR_UNKNOWN:
1413               /* We use cpu_arch_isa_flags to check if we SHOULD
1414                  optimize with nops.  */
1415               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1416                 patt = alt_patt;
1417               else
1418                 patt = f32_patt;
1419               break;
1420             case PROCESSOR_PENTIUM4:
1421             case PROCESSOR_NOCONA:
1422             case PROCESSOR_CORE:
1423             case PROCESSOR_CORE2:
1424             case PROCESSOR_COREI7:
1425             case PROCESSOR_L1OM:
1426             case PROCESSOR_K1OM:
1427             case PROCESSOR_GENERIC64:
1428             case PROCESSOR_K6:
1429             case PROCESSOR_ATHLON:
1430             case PROCESSOR_K8:
1431             case PROCESSOR_AMDFAM10:
1432             case PROCESSOR_BD:
1433             case PROCESSOR_ZNVER:
1434             case PROCESSOR_BT:
1435               patt = alt_patt;
1436               break;
1437             case PROCESSOR_I386:
1438             case PROCESSOR_I486:
1439             case PROCESSOR_PENTIUM:
1440             case PROCESSOR_PENTIUMPRO:
1441             case PROCESSOR_IAMCU:
1442             case PROCESSOR_GENERIC32:
1443               patt = f32_patt;
1444               break;
1445             }
1446         }
1447       else
1448         {
                /* The frag recorded a specific ISA: choose by the tuning
                   recorded in the frag, and use alt_patt only when the
                   frag's ISA flags include cpunop (PROCESSOR_GENERIC64
                   excepted).  */
1449           switch (fragP->tc_frag_data.tune)
1450             {
1451             case PROCESSOR_UNKNOWN:
1452               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1453                  PROCESSOR_UNKNOWN.  */
1454               abort ();
1455               break;
1456
1457             case PROCESSOR_I386:
1458             case PROCESSOR_I486:
1459             case PROCESSOR_PENTIUM:
1460             case PROCESSOR_IAMCU:
1461             case PROCESSOR_K6:
1462             case PROCESSOR_ATHLON:
1463             case PROCESSOR_K8:
1464             case PROCESSOR_AMDFAM10:
1465             case PROCESSOR_BD:
1466             case PROCESSOR_ZNVER:
1467             case PROCESSOR_BT:
1468             case PROCESSOR_GENERIC32:
1469               /* We use cpu_arch_isa_flags to check if we CAN optimize
1470                  with nops.  */
1471               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1472                 patt = alt_patt;
1473               else
1474                 patt = f32_patt;
1475               break;
1476             case PROCESSOR_PENTIUMPRO:
1477             case PROCESSOR_PENTIUM4:
1478             case PROCESSOR_NOCONA:
1479             case PROCESSOR_CORE:
1480             case PROCESSOR_CORE2:
1481             case PROCESSOR_COREI7:
1482             case PROCESSOR_L1OM:
1483             case PROCESSOR_K1OM:
1484               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1485                 patt = alt_patt;
1486               else
1487                 patt = f32_patt;
1488               break;
1489             case PROCESSOR_GENERIC64:
1490               patt = alt_patt;
1491               break;
1492             }
1493         }
1494
            /* NOTE(review): neither switch above has a default label, so
               PATT is still NULL here for any processor value they do not
               list.  That case takes the alt_patt sizes below and NULL is
               then passed on to i386_output_nops -- confirm every
               processor value is covered.  */
1495       if (patt == f32_patt)
1496         {
1497           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1498           /* Limit number of NOPs to 2 for older processors.  */
1499           max_number_of_nops = 2;
1500         }
1501       else
1502         {
1503           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1504           /* Limit number of NOPs to 7 for newer processors.  */
1505           max_number_of_nops = 7;
1506         }
1507     }
1508
        /* A LIMIT of 0 means "no explicit limit": use the table maximum.  */
1509   if (limit == 0)
1510     limit = max_single_nop_size;
1511
1512   if (fragP->fr_type == rs_fill_nop)
1513     {
1514       /* Output NOPs for .nop directive.  */
1515       if (limit > max_single_nop_size)
1516         {
1517           as_bad_where (fragP->fr_file, fragP->fr_line,
1518                         _("invalid single nop size: %d "
1519                           "(expect within [0, %d])"),
1520                         limit, max_single_nop_size);
1521           return;
1522         }
1523     }
1524   else
1525     fragP->fr_var = count;
1526
        /* The threshold divides by the table's largest NOP size, not by
           LIMIT, so a smaller LIMIT does not make the jump more likely.  */
1527   if ((count / max_single_nop_size) > max_number_of_nops)
1528     {
1529       /* Generate jump over NOPs.  */
            /* The 2 is the size of "jmp disp8": opcode plus displacement.  */
1530       offsetT disp = count - 2;
1531       if (fits_in_imm7 (disp))
1532         {
1533           /* Use "jmp disp8" if possible.  */
1534           count = disp;
1535           where[0] = jump_disp8[0];
1536           where[1] = count;
1537           where += 2;
1538         }
1539       else
1540         {
1541           unsigned int size_of_jump;
1542
1543           if (flag_code == CODE_16BIT)
1544             {
1545               where[0] = jump16_disp32[0];
1546               where[1] = jump16_disp32[1];
1547               size_of_jump = 2;
1548             }
1549           else
1550             {
1551               where[0] = jump32_disp32[0];
1552               size_of_jump = 1;
1553             }
1554
                /* The 4 is the displacement written by md_number_to_chars
                   below; COUNT becomes the number of bytes jumped over.  */
1555           count -= size_of_jump + 4;
1556           if (!fits_in_imm31 (count))
1557             {
1558               as_bad_where (fragP->fr_file, fragP->fr_line,
1559                             _("jump over nop padding out of range"));
1560               return;
1561             }
1562
1563           md_number_to_chars (where + size_of_jump, count, 4);
1564           where += size_of_jump + 4;
1565         }
1566     }
1567
1568   /* Generate multiple NOPs.  */
1569   i386_output_nops (where, patt, count, limit);
1570 }
1571
1572 /* Return nonzero iff every word of X->array is zero.  Aborts unless
1573    the array has 1, 2 or 3 words.  */
1574 static INLINE int
1575 operand_type_all_zero (const union i386_operand_type *x)
1576 {
1577   unsigned int n = ARRAY_SIZE (x->array);
1578
1579   if (n < 1 || n > 3)
1580     abort ();
1581
1582   /* Scan from the top word down; the first non-zero word decides.  */
1583   while (n-- > 0)
1584     if (x->array[n])
1585       return 0;
1586   return 1;
1587 }
1591
1592 /* Store V into every word of X->array.  Aborts unless the array has
1593    1, 2 or 3 words.  */
1594 static INLINE void
1595 operand_type_set (union i386_operand_type *x, unsigned int v)
1596 {
1597   unsigned int n = ARRAY_SIZE (x->array);
1598
1599   if (n < 1 || n > 3)
1600     abort ();
1601
1602   /* Fill from the top word down to word 0.  */
1603   while (n-- > 0)
1604     x->array[n] = v;
1605 }
1611
1612 /* Return nonzero iff X and Y hold the same value in every array word.
1613    Aborts unless the array has 1, 2 or 3 words.  */
1614 static INLINE int
1615 operand_type_equal (const union i386_operand_type *x,
1616                     const union i386_operand_type *y)
1617 {
1618   unsigned int n = ARRAY_SIZE (x->array);
1619
1620   if (n < 1 || n > 3)
1621     abort ();
1622
1623   /* Compare from the top word down; the first mismatch decides.  */
1624   while (n-- > 0)
1625     if (x->array[n] != y->array[n])
1626       return 0;
1627   return 1;
1628 }
1633
1634 /* Return nonzero iff every word of X->array is zero.  Aborts unless
1635    the array has between 1 and 4 words.  */
1636 static INLINE int
1637 cpu_flags_all_zero (const union i386_cpu_flags *x)
1638 {
1639   unsigned int n = ARRAY_SIZE (x->array);
1640
1641   if (n < 1 || n > 4)
1642     abort ();
1643
1644   /* Scan from the top word down; the first non-zero word decides.  */
1645   while (n-- > 0)
1646     if (x->array[n])
1647       return 0;
1648   return 1;
1649 }
1657
1658 /* Return nonzero iff X and Y hold the same value in every array word.
1659    Aborts unless the array has between 1 and 4 words.  */
1660 static INLINE int
1661 cpu_flags_equal (const union i386_cpu_flags *x,
1662                  const union i386_cpu_flags *y)
1663 {
1664   unsigned int n = ARRAY_SIZE (x->array);
1665
1666   if (n < 1 || n > 4)
1667     abort ();
1668
1669   /* Compare from the top word down; the first mismatch decides.  */
1670   while (n-- > 0)
1671     if (x->array[n] != y->array[n])
1672       return 0;
1673   return 1;
1674 }
1683
1684 /* Return 0 if F is cpuno64 in 64-bit code, or cpu64 outside it; else 1.  */
1685 static INLINE int
1686 cpu_flags_check_cpu64 (i386_cpu_flags f)
1687 {
1688   return flag_code == CODE_64BIT ? !f.bitfield.cpuno64 : !f.bitfield.cpu64;
1689 }
1690
1691 /* Return X with each array word ANDed with the matching word of Y.
1692    Aborts unless the array has between 1 and 4 words.  */
1693 static INLINE i386_cpu_flags
1694 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1695 {
1696   unsigned int n = ARRAY_SIZE (x.array);
1697
1698   if (n < 1 || n > 4)
1699     abort ();
1700
1701   /* X is a by-value copy, so it doubles as the result.  */
1702   while (n-- > 0)
1703     x.array[n] &= y.array[n];
1704   return x;
1705 }
1713
1714 /* Return X with each array word ORed with the matching word of Y.
1715    Aborts unless the array has between 1 and 4 words.  */
1716 static INLINE i386_cpu_flags
1717 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1718 {
1719   unsigned int n = ARRAY_SIZE (x.array);
1720
1721   if (n < 1 || n > 4)
1722     abort ();
1723
1724   /* X is a by-value copy, so it doubles as the result.  */
1725   while (n-- > 0)
1726     x.array[n] |= y.array[n];
1727   return x;
1728 }
1736
1737 /* Return X with every bit that is set in Y cleared.  Aborts unless the
1738    array has between 1 and 4 words.  */
1739 static INLINE i386_cpu_flags
1740 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1741 {
1742   unsigned int n = ARRAY_SIZE (x.array);
1743
1744   if (n < 1 || n > 4)
1745     abort ();
1746
1747   /* X is a by-value copy, so it doubles as the result.  */
1748   while (n-- > 0)
1749     x.array[n] &= ~y.array[n];
1750   return x;
1751 }
1759
1760 #define CPU_FLAGS_ARCH_MATCH            0x1 /* Feature flags accepted.  */
1761 #define CPU_FLAGS_64BIT_MATCH           0x2 /* cpu_flags_check_cpu64 passed.  */
1762
     /* Both result bits of cpu_flags_match set.  */
1763 #define CPU_FLAGS_PERFECT_MATCH \
1764   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1765
1766 /* Return the CPU_FLAGS_*_MATCH bits for template T.
1767    CPU_FLAGS_64BIT_MATCH is set when cpu_flags_check_cpu64 accepts T's
1768    flags.  CPU_FLAGS_ARCH_MATCH is set when T's remaining flags are all
1769    zero, or overlap cpu_arch_flags and pass the extra checks below.  */
1770
1771 static int
1772 cpu_flags_match (const insn_template *t)
1773 {
1774   i386_cpu_flags want = t->cpu_flags;
1775   i386_cpu_flags have;
1776   int result = 0;
1777
1778   if (cpu_flags_check_cpu64 (want))
1779     result = CPU_FLAGS_64BIT_MATCH;
1780
1781   /* The 64-bit mode markers were handled above; drop them.  */
1782   want.bitfield.cpu64 = 0;
1783   want.bitfield.cpuno64 = 0;
1784
1785   /* Nothing else requested: available on all archs.  */
1786   if (cpu_flags_all_zero (&want))
1787     return result | CPU_FLAGS_ARCH_MATCH;
1788
1789   /* AVX512VL is no standalone feature - match it and then strip it.  */
1790   if (want.bitfield.cpuavx512vl && !cpu_arch_flags.bitfield.cpuavx512vl)
1791     return result;
1792   want.bitfield.cpuavx512vl = 0;
1793
1794   have = cpu_flags_and (want, cpu_arch_flags);
1795   if (cpu_flags_all_zero (&have))
1796     return result;
1797
1798   if (want.bitfield.cpuavx)
1799     {
1800       /* AVX templates also depend on a few companion flags.  */
1801       if (!have.bitfield.cpuavx
1802           || (t->opcode_modifier.sse2avx && !sse2avx)
1803           || (want.bitfield.cpuaes && !have.bitfield.cpuaes)
1804           || (want.bitfield.cpugfni && !have.bitfield.cpugfni)
1805           || (want.bitfield.cpupclmul && !have.bitfield.cpupclmul))
1806         return result;
1807     }
1808   else if (want.bitfield.cpuavx512f)
1809     {
1810       /* Likewise for AVX512F templates.  */
1811       if (!have.bitfield.cpuavx512f
1812           || (want.bitfield.cpugfni && !have.bitfield.cpugfni)
1813           || (want.bitfield.cpuvaes && !have.bitfield.cpuvaes)
1814           || (want.bitfield.cpuvpclmulqdq && !have.bitfield.cpuvpclmulqdq))
1815         return result;
1816     }
1817
1818   return result | CPU_FLAGS_ARCH_MATCH;
1819 }
1820
1821 static INLINE i386_operand_type
1822 operand_type_and (i386_operand_type x, i386_operand_type y)
1823 {
1824   switch (ARRAY_SIZE (x.array))
1825     {
1826     case 3:
1827       x.array [2] &= y.array [2];
1828       /* Fall through.  */
1829     case 2:
1830       x.array [1] &= y.array [1];
1831       /* Fall through.  */
1832     case 1:
1833       x.array [0] &= y.array [0];
1834       break;
1835     default:
1836       abort ();
1837     }
1838   return x;
1839 }
1840
1841 static INLINE i386_operand_type
1842 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1843 {
1844   switch (ARRAY_SIZE (x.array))
1845     {
1846     case 3:
1847       x.array [2] &= ~y.array [2];
1848       /* Fall through.  */
1849     case 2:
1850       x.array [1] &= ~y.array [1];
1851       /* Fall through.  */
1852     case 1:
1853       x.array [0] &= ~y.array [0];
1854       break;
1855     default:
1856       abort ();
1857     }
1858   return x;
1859 }
1860
1861 static INLINE i386_operand_type
1862 operand_type_or (i386_operand_type x, i386_operand_type y)
1863 {
1864   switch (ARRAY_SIZE (x.array))
1865     {
1866     case 3:
1867       x.array [2] |= y.array [2];
1868       /* Fall through.  */
1869     case 2:
1870       x.array [1] |= y.array [1];
1871       /* Fall through.  */
1872     case 1:
1873       x.array [0] |= y.array [0];
1874       break;
1875     default:
1876       abort ();
1877     }
1878   return x;
1879 }
1880
1881 static INLINE i386_operand_type
1882 operand_type_xor (i386_operand_type x, i386_operand_type y)
1883 {
1884   switch (ARRAY_SIZE (x.array))
1885     {
1886     case 3:
1887       x.array [2] ^= y.array [2];
1888       /* Fall through.  */
1889     case 2:
1890       x.array [1] ^= y.array [1];
1891       /* Fall through.  */
1892     case 1:
1893       x.array [0] ^= y.array [0];
1894       break;
1895     default:
1896       abort ();
1897     }
1898   return x;
1899 }
1900
1901 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1902 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1903 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1904 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1905 static const i386_operand_type anydisp
1906   = OPERAND_TYPE_ANYDISP;
1907 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1908 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1909 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1910 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1911 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1912 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1913 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1914 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1915 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1916 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1917 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1918
/* Operand classes that operand_type_check can test for.  */
enum operand_type
{
  reg = 0,      /* The reg bit.  */
  imm = 1,      /* Any immediate bit.  */
  disp = 2,     /* Any displacement bit.  */
  anymem = 3    /* Any displacement bit or baseindex.  */
};
1926
1927 static INLINE int
1928 operand_type_check (i386_operand_type t, enum operand_type c)
1929 {
1930   switch (c)
1931     {
1932     case reg:
1933       return t.bitfield.reg;
1934
1935     case imm:
1936       return (t.bitfield.imm8
1937               || t.bitfield.imm8s
1938               || t.bitfield.imm16
1939               || t.bitfield.imm32
1940               || t.bitfield.imm32s
1941               || t.bitfield.imm64);
1942
1943     case disp:
1944       return (t.bitfield.disp8
1945               || t.bitfield.disp16
1946               || t.bitfield.disp32
1947               || t.bitfield.disp32s
1948               || t.bitfield.disp64);
1949
1950     case anymem:
1951       return (t.bitfield.disp8
1952               || t.bitfield.disp16
1953               || t.bitfield.disp32
1954               || t.bitfield.disp32s
1955               || t.bitfield.disp64
1956               || t.bitfield.baseindex);
1957
1958     default:
1959       abort ();
1960     }
1961
1962   return 0;
1963 }
1964
1965 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
1966    between operand GIVEN and opeand WANTED for instruction template T.  */
1967
1968 static INLINE int
1969 match_operand_size (const insn_template *t, unsigned int wanted,
1970                     unsigned int given)
1971 {
1972   return !((i.types[given].bitfield.byte
1973             && !t->operand_types[wanted].bitfield.byte)
1974            || (i.types[given].bitfield.word
1975                && !t->operand_types[wanted].bitfield.word)
1976            || (i.types[given].bitfield.dword
1977                && !t->operand_types[wanted].bitfield.dword)
1978            || (i.types[given].bitfield.qword
1979                && !t->operand_types[wanted].bitfield.qword)
1980            || (i.types[given].bitfield.tbyte
1981                && !t->operand_types[wanted].bitfield.tbyte));
1982 }
1983
1984 /* Return 1 if there is no conflict in SIMD register between operand
1985    GIVEN and opeand WANTED for instruction template T.  */
1986
1987 static INLINE int
1988 match_simd_size (const insn_template *t, unsigned int wanted,
1989                  unsigned int given)
1990 {
1991   return !((i.types[given].bitfield.xmmword
1992             && !t->operand_types[wanted].bitfield.xmmword)
1993            || (i.types[given].bitfield.ymmword
1994                && !t->operand_types[wanted].bitfield.ymmword)
1995            || (i.types[given].bitfield.zmmword
1996                && !t->operand_types[wanted].bitfield.zmmword));
1997 }
1998
1999 /* Return 1 if there is no conflict in any size between operand GIVEN
2000    and opeand WANTED for instruction template T.  */
2001
2002 static INLINE int
2003 match_mem_size (const insn_template *t, unsigned int wanted,
2004                 unsigned int given)
2005 {
2006   return (match_operand_size (t, wanted, given)
2007           && !((i.types[given].bitfield.unspecified
2008                 && !i.broadcast
2009                 && !t->operand_types[wanted].bitfield.unspecified)
2010                || (i.types[given].bitfield.fword
2011                    && !t->operand_types[wanted].bitfield.fword)
2012                /* For scalar opcode templates to allow register and memory
2013                   operands at the same time, some special casing is needed
2014                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2015                   down-conversion vpmov*.  */
2016                || ((t->operand_types[wanted].bitfield.regsimd
2017                     && !t->opcode_modifier.broadcast
2018                     && (t->operand_types[wanted].bitfield.byte
2019                         || t->operand_types[wanted].bitfield.word
2020                         || t->operand_types[wanted].bitfield.dword
2021                         || t->operand_types[wanted].bitfield.qword))
2022                    ? (i.types[given].bitfield.xmmword
2023                       || i.types[given].bitfield.ymmword
2024                       || i.types[given].bitfield.zmmword)
2025                    : !match_simd_size(t, wanted, given))));
2026 }
2027
2028 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2029    operands for instruction template T, and it has MATCH_REVERSE set if there
2030    is no size conflict on any operands for the template with operands reversed
2031    (and the template allows for reversing in the first place).  */
2032
2033 #define MATCH_STRAIGHT 1
2034 #define MATCH_REVERSE  2
2035
2036 static INLINE unsigned int
2037 operand_size_match (const insn_template *t)
2038 {
2039   unsigned int j, match = MATCH_STRAIGHT;
2040
2041   /* Don't check jump instructions.  */
2042   if (t->opcode_modifier.jump
2043       || t->opcode_modifier.jumpbyte
2044       || t->opcode_modifier.jumpdword
2045       || t->opcode_modifier.jumpintersegment)
2046     return match;
2047
2048   /* Check memory and accumulator operand size.  */
2049   for (j = 0; j < i.operands; j++)
2050     {
2051       if (!i.types[j].bitfield.reg && !i.types[j].bitfield.regsimd
2052           && t->operand_types[j].bitfield.anysize)
2053         continue;
2054
2055       if (t->operand_types[j].bitfield.reg
2056           && !match_operand_size (t, j, j))
2057         {
2058           match = 0;
2059           break;
2060         }
2061
2062       if (t->operand_types[j].bitfield.regsimd
2063           && !match_simd_size (t, j, j))
2064         {
2065           match = 0;
2066           break;
2067         }
2068
2069       if (t->operand_types[j].bitfield.acc
2070           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2071         {
2072           match = 0;
2073           break;
2074         }
2075
2076       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2077         {
2078           match = 0;
2079           break;
2080         }
2081     }
2082
2083   if (!t->opcode_modifier.d)
2084     {
2085 mismatch:
2086       if (!match)
2087         i.error = operand_size_mismatch;
2088       return match;
2089     }
2090
2091   /* Check reverse.  */
2092   gas_assert (i.operands >= 2 && i.operands <= 3);
2093
2094   for (j = 0; j < i.operands; j++)
2095     {
2096       unsigned int given = i.operands - j - 1;
2097
2098       if (t->operand_types[j].bitfield.reg
2099           && !match_operand_size (t, j, given))
2100         goto mismatch;
2101
2102       if (t->operand_types[j].bitfield.regsimd
2103           && !match_simd_size (t, j, given))
2104         goto mismatch;
2105
2106       if (t->operand_types[j].bitfield.acc
2107           && (!match_operand_size (t, j, given)
2108               || !match_simd_size (t, j, given)))
2109         goto mismatch;
2110
2111       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2112         goto mismatch;
2113     }
2114
2115   return match | MATCH_REVERSE;
2116 }
2117
2118 static INLINE int
2119 operand_type_match (i386_operand_type overlap,
2120                     i386_operand_type given)
2121 {
2122   i386_operand_type temp = overlap;
2123
2124   temp.bitfield.jumpabsolute = 0;
2125   temp.bitfield.unspecified = 0;
2126   temp.bitfield.byte = 0;
2127   temp.bitfield.word = 0;
2128   temp.bitfield.dword = 0;
2129   temp.bitfield.fword = 0;
2130   temp.bitfield.qword = 0;
2131   temp.bitfield.tbyte = 0;
2132   temp.bitfield.xmmword = 0;
2133   temp.bitfield.ymmword = 0;
2134   temp.bitfield.zmmword = 0;
2135   if (operand_type_all_zero (&temp))
2136     goto mismatch;
2137
2138   if (given.bitfield.baseindex == overlap.bitfield.baseindex
2139       && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2140     return 1;
2141
2142 mismatch:
2143   i.error = operand_type_mismatch;
2144   return 0;
2145 }
2146
2147 /* If given types g0 and g1 are registers they must be of the same type
2148    unless the expected operand type register overlap is null.
2149    Memory operand size of certain SIMD instructions is also being checked
2150    here.  */
2151
2152 static INLINE int
2153 operand_type_register_match (i386_operand_type g0,
2154                              i386_operand_type t0,
2155                              i386_operand_type g1,
2156                              i386_operand_type t1)
2157 {
2158   if (!g0.bitfield.reg
2159       && !g0.bitfield.regsimd
2160       && (!operand_type_check (g0, anymem)
2161           || g0.bitfield.unspecified
2162           || !t0.bitfield.regsimd))
2163     return 1;
2164
2165   if (!g1.bitfield.reg
2166       && !g1.bitfield.regsimd
2167       && (!operand_type_check (g1, anymem)
2168           || g1.bitfield.unspecified
2169           || !t1.bitfield.regsimd))
2170     return 1;
2171
2172   if (g0.bitfield.byte == g1.bitfield.byte
2173       && g0.bitfield.word == g1.bitfield.word
2174       && g0.bitfield.dword == g1.bitfield.dword
2175       && g0.bitfield.qword == g1.bitfield.qword
2176       && g0.bitfield.xmmword == g1.bitfield.xmmword
2177       && g0.bitfield.ymmword == g1.bitfield.ymmword
2178       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2179     return 1;
2180
2181   if (!(t0.bitfield.byte & t1.bitfield.byte)
2182       && !(t0.bitfield.word & t1.bitfield.word)
2183       && !(t0.bitfield.dword & t1.bitfield.dword)
2184       && !(t0.bitfield.qword & t1.bitfield.qword)
2185       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2186       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2187       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2188     return 1;
2189
2190   i.error = register_type_mismatch;
2191
2192   return 0;
2193 }
2194
2195 static INLINE unsigned int
2196 register_number (const reg_entry *r)
2197 {
2198   unsigned int nr = r->reg_num;
2199
2200   if (r->reg_flags & RegRex)
2201     nr += 8;
2202
2203   if (r->reg_flags & RegVRex)
2204     nr += 16;
2205
2206   return nr;
2207 }
2208
2209 static INLINE unsigned int
2210 mode_from_disp_size (i386_operand_type t)
2211 {
2212   if (t.bitfield.disp8)
2213     return 1;
2214   else if (t.bitfield.disp16
2215            || t.bitfield.disp32
2216            || t.bitfield.disp32s)
2217     return 2;
2218   else
2219     return 0;
2220 }
2221
2222 static INLINE int
2223 fits_in_signed_byte (addressT num)
2224 {
2225   return num + 0x80 <= 0xff;
2226 }
2227
2228 static INLINE int
2229 fits_in_unsigned_byte (addressT num)
2230 {
2231   return num <= 0xff;
2232 }
2233
2234 static INLINE int
2235 fits_in_unsigned_word (addressT num)
2236 {
2237   return num <= 0xffff;
2238 }
2239
2240 static INLINE int
2241 fits_in_signed_word (addressT num)
2242 {
2243   return num + 0x8000 <= 0xffff;
2244 }
2245
2246 static INLINE int
2247 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2248 {
2249 #ifndef BFD64
2250   return 1;
2251 #else
2252   return num + 0x80000000 <= 0xffffffff;
2253 #endif
2254 }                               /* fits_in_signed_long() */
2255
2256 static INLINE int
2257 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2258 {
2259 #ifndef BFD64
2260   return 1;
2261 #else
2262   return num <= 0xffffffff;
2263 #endif
2264 }                               /* fits_in_unsigned_long() */
2265
2266 static INLINE int
2267 fits_in_disp8 (offsetT num)
2268 {
2269   int shift = i.memshift;
2270   unsigned int mask;
2271
2272   if (shift == -1)
2273     abort ();
2274
2275   mask = (1 << shift) - 1;
2276
2277   /* Return 0 if NUM isn't properly aligned.  */
2278   if ((num & mask))
2279     return 0;
2280
2281   /* Check if NUM will fit in 8bit after shift.  */
2282   return fits_in_signed_byte (num >> shift);
2283 }
2284
2285 static INLINE int
2286 fits_in_imm4 (offsetT num)
2287 {
2288   return (num & 0xf) == num;
2289 }
2290
2291 static i386_operand_type
2292 smallest_imm_type (offsetT num)
2293 {
2294   i386_operand_type t;
2295
2296   operand_type_set (&t, 0);
2297   t.bitfield.imm64 = 1;
2298
2299   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2300     {
2301       /* This code is disabled on the 486 because all the Imm1 forms
2302          in the opcode table are slower on the i486.  They're the
2303          versions with the implicitly specified single-position
2304          displacement, which has another syntax if you really want to
2305          use that form.  */
2306       t.bitfield.imm1 = 1;
2307       t.bitfield.imm8 = 1;
2308       t.bitfield.imm8s = 1;
2309       t.bitfield.imm16 = 1;
2310       t.bitfield.imm32 = 1;
2311       t.bitfield.imm32s = 1;
2312     }
2313   else if (fits_in_signed_byte (num))
2314     {
2315       t.bitfield.imm8 = 1;
2316       t.bitfield.imm8s = 1;
2317       t.bitfield.imm16 = 1;
2318       t.bitfield.imm32 = 1;
2319       t.bitfield.imm32s = 1;
2320     }
2321   else if (fits_in_unsigned_byte (num))
2322     {
2323       t.bitfield.imm8 = 1;
2324       t.bitfield.imm16 = 1;
2325       t.bitfield.imm32 = 1;
2326       t.bitfield.imm32s = 1;
2327     }
2328   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2329     {
2330       t.bitfield.imm16 = 1;
2331       t.bitfield.imm32 = 1;
2332       t.bitfield.imm32s = 1;
2333     }
2334   else if (fits_in_signed_long (num))
2335     {
2336       t.bitfield.imm32 = 1;
2337       t.bitfield.imm32s = 1;
2338     }
2339   else if (fits_in_unsigned_long (num))
2340     t.bitfield.imm32 = 1;
2341
2342   return t;
2343 }
2344
2345 static offsetT
2346 offset_in_range (offsetT val, int size)
2347 {
2348   addressT mask;
2349
2350   switch (size)
2351     {
2352     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2353     case 2: mask = ((addressT) 1 << 16) - 1; break;
2354     case 4: mask = ((addressT) 2 << 31) - 1; break;
2355 #ifdef BFD64
2356     case 8: mask = ((addressT) 2 << 63) - 1; break;
2357 #endif
2358     default: abort ();
2359     }
2360
2361 #ifdef BFD64
2362   /* If BFD64, sign extend val for 32bit address mode.  */
2363   if (flag_code != CODE_64BIT
2364       || i.prefix[ADDR_PREFIX])
2365     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2366       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2367 #endif
2368
2369   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2370     {
2371       char buf1[40], buf2[40];
2372
2373       sprint_value (buf1, val);
2374       sprint_value (buf2, val & mask);
2375       as_warn (_("%s shortened to %s"), buf1, buf2);
2376     }
2377   return val & mask;
2378 }
2379
/* Result codes of add_prefix.  PREFIX_EXIST must stay zero: add_prefix
   tests its result for being nonzero.  */
enum PREFIX_GROUP
{
  PREFIX_EXIST = 0,
  PREFIX_LOCK = 1,
  PREFIX_REP = 2,
  PREFIX_DS = 3,
  PREFIX_OTHER = 4
};
2388
2389 /* Returns
2390    a. PREFIX_EXIST if attempting to add a prefix where one from the
2391    same class already exists.
2392    b. PREFIX_LOCK if lock prefix is added.
2393    c. PREFIX_REP if rep/repne prefix is added.
2394    d. PREFIX_DS if ds prefix is added.
2395    e. PREFIX_OTHER if other prefix is added.
2396  */
2397
2398 static enum PREFIX_GROUP
2399 add_prefix (unsigned int prefix)
2400 {
2401   enum PREFIX_GROUP ret = PREFIX_OTHER;
2402   unsigned int q;
2403
2404   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2405       && flag_code == CODE_64BIT)
2406     {
2407       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2408           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2409           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2410           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2411         ret = PREFIX_EXIST;
2412       q = REX_PREFIX;
2413     }
2414   else
2415     {
2416       switch (prefix)
2417         {
2418         default:
2419           abort ();
2420
2421         case DS_PREFIX_OPCODE:
2422           ret = PREFIX_DS;
2423           /* Fall through.  */
2424         case CS_PREFIX_OPCODE:
2425         case ES_PREFIX_OPCODE:
2426         case FS_PREFIX_OPCODE:
2427         case GS_PREFIX_OPCODE:
2428         case SS_PREFIX_OPCODE:
2429           q = SEG_PREFIX;
2430           break;
2431
2432         case REPNE_PREFIX_OPCODE:
2433         case REPE_PREFIX_OPCODE:
2434           q = REP_PREFIX;
2435           ret = PREFIX_REP;
2436           break;
2437
2438         case LOCK_PREFIX_OPCODE:
2439           q = LOCK_PREFIX;
2440           ret = PREFIX_LOCK;
2441           break;
2442
2443         case FWAIT_OPCODE:
2444           q = WAIT_PREFIX;
2445           break;
2446
2447         case ADDR_PREFIX_OPCODE:
2448           q = ADDR_PREFIX;
2449           break;
2450
2451         case DATA_PREFIX_OPCODE:
2452           q = DATA_PREFIX;
2453           break;
2454         }
2455       if (i.prefix[q] != 0)
2456         ret = PREFIX_EXIST;
2457     }
2458
2459   if (ret)
2460     {
2461       if (!i.prefix[q])
2462         ++i.prefixes;
2463       i.prefix[q] |= prefix;
2464     }
2465   else
2466     as_bad (_("same type of prefix used twice"));
2467
2468   return ret;
2469 }
2470
2471 static void
2472 update_code_flag (int value, int check)
2473 {
2474   PRINTF_LIKE ((*as_error));
2475
2476   flag_code = (enum flag_code) value;
2477   if (flag_code == CODE_64BIT)
2478     {
2479       cpu_arch_flags.bitfield.cpu64 = 1;
2480       cpu_arch_flags.bitfield.cpuno64 = 0;
2481     }
2482   else
2483     {
2484       cpu_arch_flags.bitfield.cpu64 = 0;
2485       cpu_arch_flags.bitfield.cpuno64 = 1;
2486     }
2487   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2488     {
2489       if (check)
2490         as_error = as_fatal;
2491       else
2492         as_error = as_bad;
2493       (*as_error) (_("64bit mode not supported on `%s'."),
2494                    cpu_arch_name ? cpu_arch_name : default_arch);
2495     }
2496   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2497     {
2498       if (check)
2499         as_error = as_fatal;
2500       else
2501         as_error = as_bad;
2502       (*as_error) (_("32bit mode not supported on `%s'."),
2503                    cpu_arch_name ? cpu_arch_name : default_arch);
2504     }
2505   stackop_size = '\0';
2506 }
2507
/* Switch to code mode VALUE via update_code_flag with CHECK zero, so an
   unsupported mode is reported through as_bad.  */

static void
set_code_flag (int value)
{
  update_code_flag (value, 0);
}
2513
2514 static void
2515 set_16bit_gcc_code_flag (int new_code_flag)
2516 {
2517   flag_code = (enum flag_code) new_code_flag;
2518   if (flag_code != CODE_16BIT)
2519     abort ();
2520   cpu_arch_flags.bitfield.cpu64 = 0;
2521   cpu_arch_flags.bitfield.cpuno64 = 1;
2522   stackop_size = LONG_MNEM_SUFFIX;
2523 }
2524
2525 static void
2526 set_intel_syntax (int syntax_flag)
2527 {
2528   /* Find out if register prefixing is specified.  */
2529   int ask_naked_reg = 0;
2530
2531   SKIP_WHITESPACE ();
2532   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2533     {
2534       char *string;
2535       int e = get_symbol_name (&string);
2536
2537       if (strcmp (string, "prefix") == 0)
2538         ask_naked_reg = 1;
2539       else if (strcmp (string, "noprefix") == 0)
2540         ask_naked_reg = -1;
2541       else
2542         as_bad (_("bad argument to syntax directive."));
2543       (void) restore_line_pointer (e);
2544     }
2545   demand_empty_rest_of_line ();
2546
2547   intel_syntax = syntax_flag;
2548
2549   if (ask_naked_reg == 0)
2550     allow_naked_reg = (intel_syntax
2551                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2552   else
2553     allow_naked_reg = (ask_naked_reg < 0);
2554
2555   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2556
2557   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2558   identifier_chars['$'] = intel_syntax ? '$' : 0;
2559   register_prefix = allow_naked_reg ? "" : "%";
2560 }
2561
2562 static void
2563 set_intel_mnemonic (int mnemonic_flag)
2564 {
2565   intel_mnemonic = mnemonic_flag;
2566 }
2567
2568 static void
2569 set_allow_index_reg (int flag)
2570 {
2571   allow_index_reg = flag;
2572 }
2573
2574 static void
2575 set_check (int what)
2576 {
2577   enum check_kind *kind;
2578   const char *str;
2579
2580   if (what)
2581     {
2582       kind = &operand_check;
2583       str = "operand";
2584     }
2585   else
2586     {
2587       kind = &sse_check;
2588       str = "sse";
2589     }
2590
2591   SKIP_WHITESPACE ();
2592
2593   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2594     {
2595       char *string;
2596       int e = get_symbol_name (&string);
2597
2598       if (strcmp (string, "none") == 0)
2599         *kind = check_none;
2600       else if (strcmp (string, "warning") == 0)
2601         *kind = check_warning;
2602       else if (strcmp (string, "error") == 0)
2603         *kind = check_error;
2604       else
2605         as_bad (_("bad argument to %s_check directive."), str);
2606       (void) restore_line_pointer (e);
2607     }
2608   else
2609     as_bad (_("missing argument for %s_check directive"), str);
2610
2611   demand_empty_rest_of_line ();
2612 }
2613
2614 static void
2615 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2616                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2617 {
2618 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2619   static const char *arch;
2620
2621   /* Intel LIOM is only supported on ELF.  */
2622   if (!IS_ELF)
2623     return;
2624
2625   if (!arch)
2626     {
2627       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2628          use default_arch.  */
2629       arch = cpu_arch_name;
2630       if (!arch)
2631         arch = default_arch;
2632     }
2633
2634   /* If we are targeting Intel MCU, we must enable it.  */
2635   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2636       || new_flag.bitfield.cpuiamcu)
2637     return;
2638
2639   /* If we are targeting Intel L1OM, we must enable it.  */
2640   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2641       || new_flag.bitfield.cpul1om)
2642     return;
2643
2644   /* If we are targeting Intel K1OM, we must enable it.  */
2645   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2646       || new_flag.bitfield.cpuk1om)
2647     return;
2648
2649   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2650 #endif
2651 }
2652
2653 static void
2654 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2655 {
2656   SKIP_WHITESPACE ();
2657
2658   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2659     {
2660       char *string;
2661       int e = get_symbol_name (&string);
2662       unsigned int j;
2663       i386_cpu_flags flags;
2664
2665       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2666         {
2667           if (strcmp (string, cpu_arch[j].name) == 0)
2668             {
2669               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2670
2671               if (*string != '.')
2672                 {
2673                   cpu_arch_name = cpu_arch[j].name;
2674                   cpu_sub_arch_name = NULL;
2675                   cpu_arch_flags = cpu_arch[j].flags;
2676                   if (flag_code == CODE_64BIT)
2677                     {
2678                       cpu_arch_flags.bitfield.cpu64 = 1;
2679                       cpu_arch_flags.bitfield.cpuno64 = 0;
2680                     }
2681                   else
2682                     {
2683                       cpu_arch_flags.bitfield.cpu64 = 0;
2684                       cpu_arch_flags.bitfield.cpuno64 = 1;
2685                     }
2686                   cpu_arch_isa = cpu_arch[j].type;
2687                   cpu_arch_isa_flags = cpu_arch[j].flags;
2688                   if (!cpu_arch_tune_set)
2689                     {
2690                       cpu_arch_tune = cpu_arch_isa;
2691                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2692                     }
2693                   break;
2694                 }
2695
2696               flags = cpu_flags_or (cpu_arch_flags,
2697                                     cpu_arch[j].flags);
2698
2699               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2700                 {
2701                   if (cpu_sub_arch_name)
2702                     {
2703                       char *name = cpu_sub_arch_name;
2704                       cpu_sub_arch_name = concat (name,
2705                                                   cpu_arch[j].name,
2706                                                   (const char *) NULL);
2707                       free (name);
2708                     }
2709                   else
2710                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2711                   cpu_arch_flags = flags;
2712                   cpu_arch_isa_flags = flags;
2713                 }
2714               else
2715                 cpu_arch_isa_flags
2716                   = cpu_flags_or (cpu_arch_isa_flags,
2717                                   cpu_arch[j].flags);
2718               (void) restore_line_pointer (e);
2719               demand_empty_rest_of_line ();
2720               return;
2721             }
2722         }
2723
2724       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2725         {
2726           /* Disable an ISA extension.  */
2727           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2728             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2729               {
2730                 flags = cpu_flags_and_not (cpu_arch_flags,
2731                                            cpu_noarch[j].flags);
2732                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2733                   {
2734                     if (cpu_sub_arch_name)
2735                       {
2736                         char *name = cpu_sub_arch_name;
2737                         cpu_sub_arch_name = concat (name, string,
2738                                                     (const char *) NULL);
2739                         free (name);
2740                       }
2741                     else
2742                       cpu_sub_arch_name = xstrdup (string);
2743                     cpu_arch_flags = flags;
2744                     cpu_arch_isa_flags = flags;
2745                   }
2746                 (void) restore_line_pointer (e);
2747                 demand_empty_rest_of_line ();
2748                 return;
2749               }
2750
2751           j = ARRAY_SIZE (cpu_arch);
2752         }
2753
2754       if (j >= ARRAY_SIZE (cpu_arch))
2755         as_bad (_("no such architecture: `%s'"), string);
2756
2757       *input_line_pointer = e;
2758     }
2759   else
2760     as_bad (_("missing cpu architecture"));
2761
2762   no_cond_jump_promotion = 0;
2763   if (*input_line_pointer == ','
2764       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2765     {
2766       char *string;
2767       char e;
2768
2769       ++input_line_pointer;
2770       e = get_symbol_name (&string);
2771
2772       if (strcmp (string, "nojumps") == 0)
2773         no_cond_jump_promotion = 1;
2774       else if (strcmp (string, "jumps") == 0)
2775         ;
2776       else
2777         as_bad (_("no such architecture modifier: `%s'"), string);
2778
2779       (void) restore_line_pointer (e);
2780     }
2781
2782   demand_empty_rest_of_line ();
2783 }
2784
2785 enum bfd_architecture
2786 i386_arch (void)
2787 {
2788   if (cpu_arch_isa == PROCESSOR_L1OM)
2789     {
2790       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2791           || flag_code != CODE_64BIT)
2792         as_fatal (_("Intel L1OM is 64bit ELF only"));
2793       return bfd_arch_l1om;
2794     }
2795   else if (cpu_arch_isa == PROCESSOR_K1OM)
2796     {
2797       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2798           || flag_code != CODE_64BIT)
2799         as_fatal (_("Intel K1OM is 64bit ELF only"));
2800       return bfd_arch_k1om;
2801     }
2802   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2803     {
2804       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2805           || flag_code == CODE_64BIT)
2806         as_fatal (_("Intel MCU is 32bit ELF only"));
2807       return bfd_arch_iamcu;
2808     }
2809   else
2810     return bfd_arch_i386;
2811 }
2812
2813 unsigned long
2814 i386_mach (void)
2815 {
2816   if (!strncmp (default_arch, "x86_64", 6))
2817     {
2818       if (cpu_arch_isa == PROCESSOR_L1OM)
2819         {
2820           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2821               || default_arch[6] != '\0')
2822             as_fatal (_("Intel L1OM is 64bit ELF only"));
2823           return bfd_mach_l1om;
2824         }
2825       else if (cpu_arch_isa == PROCESSOR_K1OM)
2826         {
2827           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2828               || default_arch[6] != '\0')
2829             as_fatal (_("Intel K1OM is 64bit ELF only"));
2830           return bfd_mach_k1om;
2831         }
2832       else if (default_arch[6] == '\0')
2833         return bfd_mach_x86_64;
2834       else
2835         return bfd_mach_x64_32;
2836     }
2837   else if (!strcmp (default_arch, "i386")
2838            || !strcmp (default_arch, "iamcu"))
2839     {
2840       if (cpu_arch_isa == PROCESSOR_IAMCU)
2841         {
2842           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2843             as_fatal (_("Intel MCU is 32bit ELF only"));
2844           return bfd_mach_i386_iamcu;
2845         }
2846       else
2847         return bfd_mach_i386_i386;
2848     }
2849   else
2850     as_fatal (_("unknown architecture"));
2851 }
2852 \f
2853 void
2854 md_begin (void)
2855 {
2856   const char *hash_err;
2857
2858   /* Support pseudo prefixes like {disp32}.  */
2859   lex_type ['{'] = LEX_BEGIN_NAME;
2860
2861   /* Initialize op_hash hash table.  */
2862   op_hash = hash_new ();
2863
2864   {
2865     const insn_template *optab;
2866     templates *core_optab;
2867
2868     /* Setup for loop.  */
2869     optab = i386_optab;
2870     core_optab = XNEW (templates);
2871     core_optab->start = optab;
2872
2873     while (1)
2874       {
2875         ++optab;
2876         if (optab->name == NULL
2877             || strcmp (optab->name, (optab - 1)->name) != 0)
2878           {
2879             /* different name --> ship out current template list;
2880                add to hash table; & begin anew.  */
2881             core_optab->end = optab;
2882             hash_err = hash_insert (op_hash,
2883                                     (optab - 1)->name,
2884                                     (void *) core_optab);
2885             if (hash_err)
2886               {
2887                 as_fatal (_("can't hash %s: %s"),
2888                           (optab - 1)->name,
2889                           hash_err);
2890               }
2891             if (optab->name == NULL)
2892               break;
2893             core_optab = XNEW (templates);
2894             core_optab->start = optab;
2895           }
2896       }
2897   }
2898
2899   /* Initialize reg_hash hash table.  */
2900   reg_hash = hash_new ();
2901   {
2902     const reg_entry *regtab;
2903     unsigned int regtab_size = i386_regtab_size;
2904
2905     for (regtab = i386_regtab; regtab_size--; regtab++)
2906       {
2907         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2908         if (hash_err)
2909           as_fatal (_("can't hash %s: %s"),
2910                     regtab->reg_name,
2911                     hash_err);
2912       }
2913   }
2914
2915   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
2916   {
2917     int c;
2918     char *p;
2919
2920     for (c = 0; c < 256; c++)
2921       {
2922         if (ISDIGIT (c))
2923           {
2924             digit_chars[c] = c;
2925             mnemonic_chars[c] = c;
2926             register_chars[c] = c;
2927             operand_chars[c] = c;
2928           }
2929         else if (ISLOWER (c))
2930           {
2931             mnemonic_chars[c] = c;
2932             register_chars[c] = c;
2933             operand_chars[c] = c;
2934           }
2935         else if (ISUPPER (c))
2936           {
2937             mnemonic_chars[c] = TOLOWER (c);
2938             register_chars[c] = mnemonic_chars[c];
2939             operand_chars[c] = c;
2940           }
2941         else if (c == '{' || c == '}')
2942           {
2943             mnemonic_chars[c] = c;
2944             operand_chars[c] = c;
2945           }
2946
2947         if (ISALPHA (c) || ISDIGIT (c))
2948           identifier_chars[c] = c;
2949         else if (c >= 128)
2950           {
2951             identifier_chars[c] = c;
2952             operand_chars[c] = c;
2953           }
2954       }
2955
2956 #ifdef LEX_AT
2957     identifier_chars['@'] = '@';
2958 #endif
2959 #ifdef LEX_QM
2960     identifier_chars['?'] = '?';
2961     operand_chars['?'] = '?';
2962 #endif
2963     digit_chars['-'] = '-';
2964     mnemonic_chars['_'] = '_';
2965     mnemonic_chars['-'] = '-';
2966     mnemonic_chars['.'] = '.';
2967     identifier_chars['_'] = '_';
2968     identifier_chars['.'] = '.';
2969
2970     for (p = operand_special_chars; *p != '\0'; p++)
2971       operand_chars[(unsigned char) *p] = *p;
2972   }
2973
2974   if (flag_code == CODE_64BIT)
2975     {
2976 #if defined (OBJ_COFF) && defined (TE_PE)
2977       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2978                                   ? 32 : 16);
2979 #else
2980       x86_dwarf2_return_column = 16;
2981 #endif
2982       x86_cie_data_alignment = -8;
2983     }
2984   else
2985     {
2986       x86_dwarf2_return_column = 8;
2987       x86_cie_data_alignment = -4;
2988     }
2989 }
2990
2991 void
2992 i386_print_statistics (FILE *file)
2993 {
2994   hash_print_statistics (file, "i386 opcode", op_hash);
2995   hash_print_statistics (file, "i386 register", reg_hash);
2996 }
2997 \f
2998 #ifdef DEBUG386
2999
3000 /* Debugging routines for md_assemble.  */
3001 static void pte (insn_template *);
3002 static void pt (i386_operand_type);
3003 static void pe (expressionS *);
3004 static void ps (symbolS *);
3005
3006 static void
3007 pi (const char *line, i386_insn *x)
3008 {
3009   unsigned int j;
3010
3011   fprintf (stdout, "%s: template ", line);
3012   pte (&x->tm);
3013   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3014            x->base_reg ? x->base_reg->reg_name : "none",
3015            x->index_reg ? x->index_reg->reg_name : "none",
3016            x->log2_scale_factor);
3017   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3018            x->rm.mode, x->rm.reg, x->rm.regmem);
3019   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3020            x->sib.base, x->sib.index, x->sib.scale);
3021   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3022            (x->rex & REX_W) != 0,
3023            (x->rex & REX_R) != 0,
3024            (x->rex & REX_X) != 0,
3025            (x->rex & REX_B) != 0);
3026   for (j = 0; j < x->operands; j++)
3027     {
3028       fprintf (stdout, "    #%d:  ", j + 1);
3029       pt (x->types[j]);
3030       fprintf (stdout, "\n");
3031       if (x->types[j].bitfield.reg
3032           || x->types[j].bitfield.regmmx
3033           || x->types[j].bitfield.regsimd
3034           || x->types[j].bitfield.sreg
3035           || x->types[j].bitfield.control
3036           || x->types[j].bitfield.debug
3037           || x->types[j].bitfield.test)
3038         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3039       if (operand_type_check (x->types[j], imm))
3040         pe (x->op[j].imms);
3041       if (operand_type_check (x->types[j], disp))
3042         pe (x->op[j].disps);
3043     }
3044 }
3045
3046 static void
3047 pte (insn_template *t)
3048 {
3049   unsigned int j;
3050   fprintf (stdout, " %d operands ", t->operands);
3051   fprintf (stdout, "opcode %x ", t->base_opcode);
3052   if (t->extension_opcode != None)
3053     fprintf (stdout, "ext %x ", t->extension_opcode);
3054   if (t->opcode_modifier.d)
3055     fprintf (stdout, "D");
3056   if (t->opcode_modifier.w)
3057     fprintf (stdout, "W");
3058   fprintf (stdout, "\n");
3059   for (j = 0; j < t->operands; j++)
3060     {
3061       fprintf (stdout, "    #%d type ", j + 1);
3062       pt (t->operand_types[j]);
3063       fprintf (stdout, "\n");
3064     }
3065 }
3066
3067 static void
3068 pe (expressionS *e)
3069 {
3070   fprintf (stdout, "    operation     %d\n", e->X_op);
3071   fprintf (stdout, "    add_number    %ld (%lx)\n",
3072            (long) e->X_add_number, (long) e->X_add_number);
3073   if (e->X_add_symbol)
3074     {
3075       fprintf (stdout, "    add_symbol    ");
3076       ps (e->X_add_symbol);
3077       fprintf (stdout, "\n");
3078     }
3079   if (e->X_op_symbol)
3080     {
3081       fprintf (stdout, "    op_symbol    ");
3082       ps (e->X_op_symbol);
3083       fprintf (stdout, "\n");
3084     }
3085 }
3086
3087 static void
3088 ps (symbolS *s)
3089 {
3090   fprintf (stdout, "%s type %s%s",
3091            S_GET_NAME (s),
3092            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3093            segment_name (S_GET_SEGMENT (s)));
3094 }
3095
3096 static struct type_name
3097   {
3098     i386_operand_type mask;
3099     const char *name;
3100   }
3101 const type_names[] =
3102 {
3103   { OPERAND_TYPE_REG8, "r8" },
3104   { OPERAND_TYPE_REG16, "r16" },
3105   { OPERAND_TYPE_REG32, "r32" },
3106   { OPERAND_TYPE_REG64, "r64" },
3107   { OPERAND_TYPE_ACC8, "acc8" },
3108   { OPERAND_TYPE_ACC16, "acc16" },
3109   { OPERAND_TYPE_ACC32, "acc32" },
3110   { OPERAND_TYPE_ACC64, "acc64" },
3111   { OPERAND_TYPE_IMM8, "i8" },
3112   { OPERAND_TYPE_IMM8, "i8s" },
3113   { OPERAND_TYPE_IMM16, "i16" },
3114   { OPERAND_TYPE_IMM32, "i32" },
3115   { OPERAND_TYPE_IMM32S, "i32s" },
3116   { OPERAND_TYPE_IMM64, "i64" },
3117   { OPERAND_TYPE_IMM1, "i1" },
3118   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3119   { OPERAND_TYPE_DISP8, "d8" },
3120   { OPERAND_TYPE_DISP16, "d16" },
3121   { OPERAND_TYPE_DISP32, "d32" },
3122   { OPERAND_TYPE_DISP32S, "d32s" },
3123   { OPERAND_TYPE_DISP64, "d64" },
3124   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3125   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3126   { OPERAND_TYPE_CONTROL, "control reg" },
3127   { OPERAND_TYPE_TEST, "test reg" },
3128   { OPERAND_TYPE_DEBUG, "debug reg" },
3129   { OPERAND_TYPE_FLOATREG, "FReg" },
3130   { OPERAND_TYPE_FLOATACC, "FAcc" },
3131   { OPERAND_TYPE_SREG, "SReg" },
3132   { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3133   { OPERAND_TYPE_REGMMX, "rMMX" },
3134   { OPERAND_TYPE_REGXMM, "rXMM" },
3135   { OPERAND_TYPE_REGYMM, "rYMM" },
3136   { OPERAND_TYPE_REGZMM, "rZMM" },
3137   { OPERAND_TYPE_REGMASK, "Mask reg" },
3138   { OPERAND_TYPE_ESSEG, "es" },
3139 };
3140
3141 static void
3142 pt (i386_operand_type t)
3143 {
3144   unsigned int j;
3145   i386_operand_type a;
3146
3147   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3148     {
3149       a = operand_type_and (t, type_names[j].mask);
3150       if (operand_type_equal (&a, &type_names[j].mask))
3151         fprintf (stdout, "%s, ",  type_names[j].name);
3152     }
3153   fflush (stdout);
3154 }
3155
3156 #endif /* DEBUG386 */
3157 \f
3158 static bfd_reloc_code_real_type
3159 reloc (unsigned int size,
3160        int pcrel,
3161        int sign,
3162        bfd_reloc_code_real_type other)
3163 {
3164   if (other != NO_RELOC)
3165     {
3166       reloc_howto_type *rel;
3167
3168       if (size == 8)
3169         switch (other)
3170           {
3171           case BFD_RELOC_X86_64_GOT32:
3172             return BFD_RELOC_X86_64_GOT64;
3173             break;
3174           case BFD_RELOC_X86_64_GOTPLT64:
3175             return BFD_RELOC_X86_64_GOTPLT64;
3176             break;
3177           case BFD_RELOC_X86_64_PLTOFF64:
3178             return BFD_RELOC_X86_64_PLTOFF64;
3179             break;
3180           case BFD_RELOC_X86_64_GOTPC32:
3181             other = BFD_RELOC_X86_64_GOTPC64;
3182             break;
3183           case BFD_RELOC_X86_64_GOTPCREL:
3184             other = BFD_RELOC_X86_64_GOTPCREL64;
3185             break;
3186           case BFD_RELOC_X86_64_TPOFF32:
3187             other = BFD_RELOC_X86_64_TPOFF64;
3188             break;
3189           case BFD_RELOC_X86_64_DTPOFF32:
3190             other = BFD_RELOC_X86_64_DTPOFF64;
3191             break;
3192           default:
3193             break;
3194           }
3195
3196 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3197       if (other == BFD_RELOC_SIZE32)
3198         {
3199           if (size == 8)
3200             other = BFD_RELOC_SIZE64;
3201           if (pcrel)
3202             {
3203               as_bad (_("there are no pc-relative size relocations"));
3204               return NO_RELOC;
3205             }
3206         }
3207 #endif
3208
3209       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3210       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3211         sign = -1;
3212
3213       rel = bfd_reloc_type_lookup (stdoutput, other);
3214       if (!rel)
3215         as_bad (_("unknown relocation (%u)"), other);
3216       else if (size != bfd_get_reloc_size (rel))
3217         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3218                 bfd_get_reloc_size (rel),
3219                 size);
3220       else if (pcrel && !rel->pc_relative)
3221         as_bad (_("non-pc-relative relocation for pc-relative field"));
3222       else if ((rel->complain_on_overflow == complain_overflow_signed
3223                 && !sign)
3224                || (rel->complain_on_overflow == complain_overflow_unsigned
3225                    && sign > 0))
3226         as_bad (_("relocated field and relocation type differ in signedness"));
3227       else
3228         return other;
3229       return NO_RELOC;
3230     }
3231
3232   if (pcrel)
3233     {
3234       if (!sign)
3235         as_bad (_("there are no unsigned pc-relative relocations"));
3236       switch (size)
3237         {
3238         case 1: return BFD_RELOC_8_PCREL;
3239         case 2: return BFD_RELOC_16_PCREL;
3240         case 4: return BFD_RELOC_32_PCREL;
3241         case 8: return BFD_RELOC_64_PCREL;
3242         }
3243       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3244     }
3245   else
3246     {
3247       if (sign > 0)
3248         switch (size)
3249           {
3250           case 4: return BFD_RELOC_X86_64_32S;
3251           }
3252       else
3253         switch (size)
3254           {
3255           case 1: return BFD_RELOC_8;
3256           case 2: return BFD_RELOC_16;
3257           case 4: return BFD_RELOC_32;
3258           case 8: return BFD_RELOC_64;
3259           }
3260       as_bad (_("cannot do %s %u byte relocation"),
3261               sign > 0 ? "signed" : "unsigned", size);
3262     }
3263
3264   return NO_RELOC;
3265 }
3266
3267 /* Here we decide which fixups can be adjusted to make them relative to
3268    the beginning of the section instead of the symbol.  Basically we need
3269    to make sure that the dynamic relocations are done correctly, so in
3270    some cases we force the original symbol to be used.  */
3271
3272 int
3273 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3274 {
3275 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3276   if (!IS_ELF)
3277     return 1;
3278
3279   /* Don't adjust pc-relative references to merge sections in 64-bit
3280      mode.  */
3281   if (use_rela_relocations
3282       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3283       && fixP->fx_pcrel)
3284     return 0;
3285
3286   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3287      and changed later by validate_fix.  */
3288   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3289       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3290     return 0;
3291
3292   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3293      for size relocations.  */
3294   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3295       || fixP->fx_r_type == BFD_RELOC_SIZE64
3296       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3297       || fixP->fx_r_type == BFD_RELOC_386_PLT32
3298       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3299       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3300       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3301       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3302       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3303       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3304       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3305       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3306       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3307       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3308       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3309       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3310       || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3311       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3312       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3313       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3314       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3315       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3316       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3317       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3318       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3319       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3320       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3321       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3322       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3323       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3324       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3325       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3326       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3327     return 0;
3328 #endif
3329   return 1;
3330 }
3331
/* Classify MNEMONIC by how its memory operand is to be treated:
     0 - not a floating point math instruction (no leading `f', or
         fxsave/fxrstor style `fxr'/`fxs' mnemonics),
     1 - ordinary floating point operation,
     2 - integer operation (`fi...'),
     3 - control/state operation (fldcw, fldenv, non-waiting `fn...'
         forms other than fnop, frstor, fsave, fstcw, fstenv, ...).

   The result is only meaningful for opcodes that take (memory)
   operands; operand-less opcodes may be classified arbitrarily.  */

static int
intel_float_operand (const char *mnemonic)
{
  char kind;

  if (mnemonic[0] != 'f')
    return 0; /* non-math */

  /* Later characters are read only after the earlier ones have matched,
     so the scan never runs past the terminating NUL.  */
  kind = mnemonic[1];

  if (kind == 'i')
    return 2; /* integer op */

  if (kind == 'l')
    {
      /* fldcw/fldenv */
      if (mnemonic[2] == 'd'
          && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
        return 3;
    }
  else if (kind == 'n')
    {
      /* Non-waiting control op, but not fnop.  */
      if (mnemonic[2] != 'o')
        return 3;
    }
  else if (kind == 'r')
    {
      /* frstor/frstpm */
      if (mnemonic[2] == 's')
        return 3;
    }
  else if (kind == 's')
    {
      /* fsave */
      if (mnemonic[2] == 'a')
        return 3;
      /* fstcw, fstdw, fstenv, fsts[gw] */
      if (mnemonic[2] == 't'
          && (mnemonic[3] == 'c'
              || mnemonic[3] == 'd'
              || mnemonic[3] == 'e'
              || mnemonic[3] == 's'))
        return 3;
    }
  else if (kind == 'x')
    {
      /* fxsave/fxrstor are not really math ops.  */
      if (mnemonic[2] == 'r' || mnemonic[2] == 's')
        return 0;
    }

  return 1;
}
3384
3385 /* Build the VEX prefix.  */
3386
3387 static void
3388 build_vex_prefix (const insn_template *t)
3389 {
3390   unsigned int register_specifier;
3391   unsigned int implied_prefix;
3392   unsigned int vector_length;
3393   unsigned int w;
3394
3395   /* Check register specifier.  */
3396   if (i.vex.register_specifier)
3397     {
3398       register_specifier =
3399         ~register_number (i.vex.register_specifier) & 0xf;
3400       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3401     }
3402   else
3403     register_specifier = 0xf;
3404
3405   /* Use 2-byte VEX prefix by swapping destination and source operand
3406      if there are more than 1 register operand.  */
3407   if (i.reg_operands > 1
3408       && i.vec_encoding != vex_encoding_vex3
3409       && i.dir_encoding == dir_encoding_default
3410       && i.operands == i.reg_operands
3411       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3412       && i.tm.opcode_modifier.vexopcode == VEX0F
3413       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3414       && i.rex == REX_B)
3415     {
3416       unsigned int xchg = i.operands - 1;
3417       union i386_op temp_op;
3418       i386_operand_type temp_type;
3419
3420       temp_type = i.types[xchg];
3421       i.types[xchg] = i.types[0];
3422       i.types[0] = temp_type;
3423       temp_op = i.op[xchg];
3424       i.op[xchg] = i.op[0];
3425       i.op[0] = temp_op;
3426
3427       gas_assert (i.rm.mode == 3);
3428
3429       i.rex = REX_R;
3430       xchg = i.rm.regmem;
3431       i.rm.regmem = i.rm.reg;
3432       i.rm.reg = xchg;
3433
3434       if (i.tm.opcode_modifier.d)
3435         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3436                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3437       else /* Use the next insn.  */
3438         i.tm = t[1];
3439     }
3440
3441   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3442      are no memory operands and at least 3 register ones.  */
3443   if (i.reg_operands >= 3
3444       && i.vec_encoding != vex_encoding_vex3
3445       && i.reg_operands == i.operands - i.imm_operands
3446       && i.tm.opcode_modifier.vex
3447       && i.tm.opcode_modifier.commutative
3448       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3449       && i.rex == REX_B
3450       && i.vex.register_specifier
3451       && !(i.vex.register_specifier->reg_flags & RegRex))
3452     {
3453       unsigned int xchg = i.operands - i.reg_operands;
3454       union i386_op temp_op;
3455       i386_operand_type temp_type;
3456
3457       gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3458       gas_assert (!i.tm.opcode_modifier.sae);
3459       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3460                                       &i.types[i.operands - 3]));
3461       gas_assert (i.rm.mode == 3);
3462
3463       temp_type = i.types[xchg];
3464       i.types[xchg] = i.types[xchg + 1];
3465       i.types[xchg + 1] = temp_type;
3466       temp_op = i.op[xchg];
3467       i.op[xchg] = i.op[xchg + 1];
3468       i.op[xchg + 1] = temp_op;
3469
3470       i.rex = 0;
3471       xchg = i.rm.regmem | 8;
3472       i.rm.regmem = ~register_specifier & 0xf;
3473       gas_assert (!(i.rm.regmem & 8));
3474       i.vex.register_specifier += xchg - i.rm.regmem;
3475       register_specifier = ~xchg & 0xf;
3476     }
3477
3478   if (i.tm.opcode_modifier.vex == VEXScalar)
3479     vector_length = avxscalar;
3480   else if (i.tm.opcode_modifier.vex == VEX256)
3481     vector_length = 1;
3482   else
3483     {
3484       unsigned int op;
3485
3486       /* Determine vector length from the last multi-length vector
3487          operand.  */
3488       vector_length = 0;
3489       for (op = t->operands; op--;)
3490         if (t->operand_types[op].bitfield.xmmword
3491             && t->operand_types[op].bitfield.ymmword
3492             && i.types[op].bitfield.ymmword)
3493           {
3494             vector_length = 1;
3495             break;
3496           }
3497     }
3498
3499   switch ((i.tm.base_opcode >> 8) & 0xff)
3500     {
3501     case 0:
3502       implied_prefix = 0;
3503       break;
3504     case DATA_PREFIX_OPCODE:
3505       implied_prefix = 1;
3506       break;
3507     case REPE_PREFIX_OPCODE:
3508       implied_prefix = 2;
3509       break;
3510     case REPNE_PREFIX_OPCODE:
3511       implied_prefix = 3;
3512       break;
3513     default:
3514       abort ();
3515     }
3516
3517   /* Check the REX.W bit and VEXW.  */
3518   if (i.tm.opcode_modifier.vexw == VEXWIG)
3519     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3520   else if (i.tm.opcode_modifier.vexw)
3521     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3522   else
3523     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3524
3525   /* Use 2-byte VEX prefix if possible.  */
3526   if (w == 0
3527       && i.vec_encoding != vex_encoding_vex3
3528       && i.tm.opcode_modifier.vexopcode == VEX0F
3529       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3530     {
3531       /* 2-byte VEX prefix.  */
3532       unsigned int r;
3533
3534       i.vex.length = 2;
3535       i.vex.bytes[0] = 0xc5;
3536
3537       /* Check the REX.R bit.  */
3538       r = (i.rex & REX_R) ? 0 : 1;
3539       i.vex.bytes[1] = (r << 7
3540                         | register_specifier << 3
3541                         | vector_length << 2
3542                         | implied_prefix);
3543     }
3544   else
3545     {
3546       /* 3-byte VEX prefix.  */
3547       unsigned int m;
3548
3549       i.vex.length = 3;
3550
3551       switch (i.tm.opcode_modifier.vexopcode)
3552         {
3553         case VEX0F:
3554           m = 0x1;
3555           i.vex.bytes[0] = 0xc4;
3556           break;
3557         case VEX0F38:
3558           m = 0x2;
3559           i.vex.bytes[0] = 0xc4;
3560           break;
3561         case VEX0F3A:
3562           m = 0x3;
3563           i.vex.bytes[0] = 0xc4;
3564           break;
3565         case XOP08:
3566           m = 0x8;
3567           i.vex.bytes[0] = 0x8f;
3568           break;
3569         case XOP09:
3570           m = 0x9;
3571           i.vex.bytes[0] = 0x8f;
3572           break;
3573         case XOP0A:
3574           m = 0xa;
3575           i.vex.bytes[0] = 0x8f;
3576           break;
3577         default:
3578           abort ();
3579         }
3580
3581       /* The high 3 bits of the second VEX byte are 1's compliment
3582          of RXB bits from REX.  */
3583       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3584
3585       i.vex.bytes[2] = (w << 7
3586                         | register_specifier << 3
3587                         | vector_length << 2
3588                         | implied_prefix);
3589     }
3590 }
3591
3592 static INLINE bfd_boolean
3593 is_evex_encoding (const insn_template *t)
3594 {
3595   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3596          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3597          || t->opcode_modifier.sae;
3598 }
3599
3600 static INLINE bfd_boolean
3601 is_any_vex_encoding (const insn_template *t)
3602 {
3603   return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3604          || is_evex_encoding (t);
3605 }
3606
3607 /* Build the EVEX prefix.  */
3608
3609 static void
3610 build_evex_prefix (void)
3611 {
3612   unsigned int register_specifier;
3613   unsigned int implied_prefix;
3614   unsigned int m, w;
3615   rex_byte vrex_used = 0;
3616
3617   /* Check register specifier.  */
3618   if (i.vex.register_specifier)
3619     {
3620       gas_assert ((i.vrex & REX_X) == 0);
3621
3622       register_specifier = i.vex.register_specifier->reg_num;
3623       if ((i.vex.register_specifier->reg_flags & RegRex))
3624         register_specifier += 8;
3625       /* The upper 16 registers are encoded in the fourth byte of the
3626          EVEX prefix.  */
3627       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3628         i.vex.bytes[3] = 0x8;
3629       register_specifier = ~register_specifier & 0xf;
3630     }
3631   else
3632     {
3633       register_specifier = 0xf;
3634
3635       /* Encode upper 16 vector index register in the fourth byte of
3636          the EVEX prefix.  */
3637       if (!(i.vrex & REX_X))
3638         i.vex.bytes[3] = 0x8;
3639       else
3640         vrex_used |= REX_X;
3641     }
3642
3643   switch ((i.tm.base_opcode >> 8) & 0xff)
3644     {
3645     case 0:
3646       implied_prefix = 0;
3647       break;
3648     case DATA_PREFIX_OPCODE:
3649       implied_prefix = 1;
3650       break;
3651     case REPE_PREFIX_OPCODE:
3652       implied_prefix = 2;
3653       break;
3654     case REPNE_PREFIX_OPCODE:
3655       implied_prefix = 3;
3656       break;
3657     default:
3658       abort ();
3659     }
3660
3661   /* 4 byte EVEX prefix.  */
3662   i.vex.length = 4;
3663   i.vex.bytes[0] = 0x62;
3664
3665   /* mmmm bits.  */
3666   switch (i.tm.opcode_modifier.vexopcode)
3667     {
3668     case VEX0F:
3669       m = 1;
3670       break;
3671     case VEX0F38:
3672       m = 2;
3673       break;
3674     case VEX0F3A:
3675       m = 3;
3676       break;
3677     default:
3678       abort ();
3679       break;
3680     }
3681
3682   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3683      bits from REX.  */
3684   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3685
3686   /* The fifth bit of the second EVEX byte is 1's compliment of the
3687      REX_R bit in VREX.  */
3688   if (!(i.vrex & REX_R))
3689     i.vex.bytes[1] |= 0x10;
3690   else
3691     vrex_used |= REX_R;
3692
3693   if ((i.reg_operands + i.imm_operands) == i.operands)
3694     {
3695       /* When all operands are registers, the REX_X bit in REX is not
3696          used.  We reuse it to encode the upper 16 registers, which is
3697          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3698          as 1's compliment.  */
3699       if ((i.vrex & REX_B))
3700         {
3701           vrex_used |= REX_B;
3702           i.vex.bytes[1] &= ~0x40;
3703         }
3704     }
3705
3706   /* EVEX instructions shouldn't need the REX prefix.  */
3707   i.vrex &= ~vrex_used;
3708   gas_assert (i.vrex == 0);
3709
3710   /* Check the REX.W bit and VEXW.  */
3711   if (i.tm.opcode_modifier.vexw == VEXWIG)
3712     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3713   else if (i.tm.opcode_modifier.vexw)
3714     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3715   else
3716     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3717
3718   /* Encode the U bit.  */
3719   implied_prefix |= 0x4;
3720
3721   /* The third byte of the EVEX prefix.  */
3722   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3723
3724   /* The fourth byte of the EVEX prefix.  */
3725   /* The zeroing-masking bit.  */
3726   if (i.mask && i.mask->zeroing)
3727     i.vex.bytes[3] |= 0x80;
3728
3729   /* Don't always set the broadcast bit if there is no RC.  */
3730   if (!i.rounding)
3731     {
3732       /* Encode the vector length.  */
3733       unsigned int vec_length;
3734
3735       if (!i.tm.opcode_modifier.evex
3736           || i.tm.opcode_modifier.evex == EVEXDYN)
3737         {
3738           unsigned int op;
3739
3740           /* Determine vector length from the last multi-length vector
3741              operand.  */
3742           vec_length = 0;
3743           for (op = i.operands; op--;)
3744             if (i.tm.operand_types[op].bitfield.xmmword
3745                 + i.tm.operand_types[op].bitfield.ymmword
3746                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3747               {
3748                 if (i.types[op].bitfield.zmmword)
3749                   {
3750                     i.tm.opcode_modifier.evex = EVEX512;
3751                     break;
3752                   }
3753                 else if (i.types[op].bitfield.ymmword)
3754                   {
3755                     i.tm.opcode_modifier.evex = EVEX256;
3756                     break;
3757                   }
3758                 else if (i.types[op].bitfield.xmmword)
3759                   {
3760                     i.tm.opcode_modifier.evex = EVEX128;
3761                     break;
3762                   }
3763                 else if (i.broadcast && (int) op == i.broadcast->operand)
3764                   {
3765                     switch (i.broadcast->bytes)
3766                       {
3767                         case 64:
3768                           i.tm.opcode_modifier.evex = EVEX512;
3769                           break;
3770                         case 32:
3771                           i.tm.opcode_modifier.evex = EVEX256;
3772                           break;
3773                         case 16:
3774                           i.tm.opcode_modifier.evex = EVEX128;
3775                           break;
3776                         default:
3777                           abort ();
3778                       }
3779                     break;
3780                   }
3781               }
3782
3783           if (op >= MAX_OPERANDS)
3784             abort ();
3785         }
3786
3787       switch (i.tm.opcode_modifier.evex)
3788         {
3789         case EVEXLIG: /* LL' is ignored */
3790           vec_length = evexlig << 5;
3791           break;
3792         case EVEX128:
3793           vec_length = 0 << 5;
3794           break;
3795         case EVEX256:
3796           vec_length = 1 << 5;
3797           break;
3798         case EVEX512:
3799           vec_length = 2 << 5;
3800           break;
3801         default:
3802           abort ();
3803           break;
3804         }
3805       i.vex.bytes[3] |= vec_length;
3806       /* Encode the broadcast bit.  */
3807       if (i.broadcast)
3808         i.vex.bytes[3] |= 0x10;
3809     }
3810   else
3811     {
3812       if (i.rounding->type != saeonly)
3813         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3814       else
3815         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3816     }
3817
3818   if (i.mask && i.mask->mask)
3819     i.vex.bytes[3] |= i.mask->mask->reg_num;
3820 }
3821 /* Process a template carrying the ImmExt modifier (see the call in
        md_assemble).  For SSE3/SVME and MWAITX templates that were given
        explicit operands, diagnose any operand that is not the expected
        fixed register and then drop all operands.  Finally append a
        constant 8-bit immediate operand holding i.tm.extension_opcode and
        reset i.tm.extension_opcode to None.  Works on the global insn
        state I; takes no arguments and returns nothing.  */
3822 static void
3823 process_immext (void)
3824 {
3825   expressionS *exp;
3826
3827   if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3828       && i.operands > 0)
3829     {
3830       /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3831          with an opcode suffix which is coded in the same place as an
3832          8-bit immediate field would be.
3833          Here we check those operands and remove them afterwards.  */
3834       unsigned int x;
3835
           /* Operand number X has to be the register whose number is X;
              every mismatch is reported, the loop does not stop early.  */
3836       for (x = 0; x < i.operands; x++)
3837         if (register_number (i.op[x].regs) != x)
3838           as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3839                   register_prefix, i.op[x].regs->reg_name, x + 1,
3840                   i.tm.name);
3841
           /* All operands have been checked; none of them is kept.  */
3842       i.operands = 0;
3843     }
3844
3845   if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3846     {
3847       /* MONITORX/MWAITX instructions have fixed operands with an opcode
3848          suffix which is coded in the same place as an 8-bit immediate
3849          field would be.
3850          Here we check those operands and remove them afterwards.  */
3851       unsigned int x;
3852
           /* Only the three-operand form is expected to reach this point.  */
3853       if (i.operands != 3)
3854         abort();
3855
           /* The first two operands must be registers number 0 and 1.  */
3856       for (x = 0; x < 2; x++)
3857         if (register_number (i.op[x].regs) != x)
3858           goto bad_register_operand;
3859
3860       /* Check for third operand for mwaitx/monitorx insn.  */
           /* X is 2 here.  The required register number is 2, or 3 when
              the opcode suffix (extension_opcode) is 0xfb.  */
3861       if (register_number (i.op[x].regs)
3862           != (x + (i.tm.extension_opcode == 0xfb)))
3863         {
           /* Also entered by the goto in the loop above; X then indexes the
              first offending operand.  Only one error is reported.  */
3864 bad_register_operand:
3865           as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3866                   register_prefix, i.op[x].regs->reg_name, x+1,
3867                   i.tm.name);
3868         }
3869
3870       i.operands = 0;
3871     }
3872
3873   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3874      which is coded in the same place as an 8-bit immediate field
3875      would be.  Here we fake an 8-bit immediate operand from the
3876      opcode suffix stored in tm.extension_opcode.
3877
3878      AVX instructions also use this encoding, for some of
3879      3 argument instructions.  */
3880
       /* At most one immediate may already be present, and at most two
          operands (four for VEX-family encodings), before the fake one is
          appended.  */
3881   gas_assert (i.imm_operands <= 1
3882               && (i.operands <= 2
3883                   || (is_any_vex_encoding (&i.tm)
3884                       && i.operands <= 4)));
3885
       /* Take the next free immediate expression slot and make it the new
          last operand, typed as imm8 and holding the opcode suffix.  */
3886   exp = &im_expressions[i.imm_operands++];
3887   i.op[i.operands].imms = exp;
3888   i.types[i.operands] = imm8;
3889   i.operands++;
3890   exp->X_op = O_constant;
3891   exp->X_add_number = i.tm.extension_opcode;
       /* The suffix now lives in the immediate; clear it in the template.  */
3892   i.tm.extension_opcode = None;
3893 }
3894
3895 /* Check whether the HLE prefix recorded in i.hle_prefix may be combined
        with the matched template, as described by the template's
        hleprefixok modifier.  Return 1 if the combination is accepted;
        otherwise report the problem with as_bad and return 0.  An
        unexpected hleprefixok value aborts.  */
3896 static int
3897 check_hle (void)
3898 {
3899   switch (i.tm.opcode_modifier.hleprefixok)
3900     {
3901     default:
3902       abort ();
         /* The template accepts no HLE prefix at all.  */
3903     case HLEPrefixNone:
3904       as_bad (_("invalid instruction `%s' after `%s'"),
3905               i.tm.name, i.hle_prefix);
3906       return 0;
         /* Accepted only when a lock prefix is present as well.  */
3907     case HLEPrefixLock:
3908       if (i.prefix[LOCK_PREFIX])
3909         return 1;
3910       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3911       return 0;
         /* Accepted unconditionally.  */
3912     case HLEPrefixAny:
3913       return 1;
         /* Accepted only for the xrelease prefix, and only when the last
            operand is a memory operand.  */
3914     case HLEPrefixRelease:
3915       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3916         {
3917           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3918                   i.tm.name);
3919           return 0;
3920         }
3921       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3922         {
3923           as_bad (_("memory destination needed for instruction `%s'"
3924                     " after `xrelease'"), i.tm.name);
3925           return 0;
3926         }
3927       return 1;
3928     }
3929 }
3930
3931 /* Try the shortest encoding by shortening operand size.
        The matched template (i.tm) and the operand types of the global
        insn state I are rewritten in place.  The cases below form a single
        if / else-if chain, so at most one of them is applied per insn.
        md_assemble calls this only when OPTIMIZE is nonzero, i.no_optimize
        is clear and the template's optimize modifier is set.  */
3932
3933 static void
3934 optimize_encoding (void)
3935 {
3936   unsigned int j;
3937
3938   if (optimize_for_space
3939       && i.reg_operands == 1
3940       && i.imm_operands == 1
3941       && !i.types[1].bitfield.byte
3942       && i.op[0].imms->X_op == O_constant
3943       && fits_in_imm7 (i.op[0].imms->X_add_number)
3944       && ((i.tm.base_opcode == 0xa8
3945            && i.tm.extension_opcode == None)
3946           || (i.tm.base_opcode == 0xf6
3947               && i.tm.extension_opcode == 0x0)))
3948     {
3949       /* Optimize: -Os:
3950            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
3951        */
3952       unsigned int base_regnum = i.op[1].regs->reg_num;
           /* Outside 64-bit mode only register numbers 0-3 are converted.  */
3953       if (flag_code == CODE_64BIT || base_regnum < 4)
3954         {
               /* Only the byte bit is added here; the word/dword bits
                  tested below still describe the original register.  */
3955           i.types[1].bitfield.byte = 1;
3956           /* Ignore the suffix.  */
3957           i.suffix = 0;
3958           if (base_regnum >= 4
3959               && !(i.op[1].regs->reg_flags & RegRex))
3960             {
3961               /* Handle SP, BP, SI and DI registers.  */
3962               if (i.types[1].bitfield.word)
3963                 j = 16;
3964               else if (i.types[1].bitfield.dword)
3965                 j = 32;
3966               else
3967                 j = 48;
                   /* NOTE(review): steps the register pointer back J
                      entries, presumably onto the matching byte register;
                      this relies on the layout of the register table,
                      which is not visible here -- confirm.  */
3968               i.op[1].regs -= j;
3969             }
3970         }
3971     }
3972   else if (flag_code == CODE_64BIT
3973            && ((i.types[1].bitfield.qword
3974                 && i.reg_operands == 1
3975                 && i.imm_operands == 1
3976                 && i.op[0].imms->X_op == O_constant
3977                 && ((i.tm.base_opcode == 0xb8
3978                      && i.tm.extension_opcode == None
3979                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3980                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
3981                         && (((i.tm.base_opcode == 0x24
3982                               || i.tm.base_opcode == 0xa8)
3983                              && i.tm.extension_opcode == None)
3984                             || (i.tm.base_opcode == 0x80
3985                                 && i.tm.extension_opcode == 0x4)
3986                             || ((i.tm.base_opcode == 0xf6
3987                                  || (i.tm.base_opcode | 1) == 0xc7)
3988                                 && i.tm.extension_opcode == 0x0)))
3989                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
3990                         && i.tm.base_opcode == 0x83
3991                         && i.tm.extension_opcode == 0x4)))
3992                || (i.types[0].bitfield.qword
3993                    && ((i.reg_operands == 2
3994                         && i.op[0].regs == i.op[1].regs
3995                         && ((i.tm.base_opcode == 0x30
3996                              || i.tm.base_opcode == 0x28)
3997                             && i.tm.extension_opcode == None))
3998                        || (i.reg_operands == 1
3999                            && i.operands == 1
4000                            && i.tm.base_opcode == 0x30
4001                            && i.tm.extension_opcode == None)))))
4002     {
4003       /* Optimize: -O:
4004            andq $imm31, %r64   -> andl $imm31, %r32
4005            andq $imm7, %r64    -> andl $imm7, %r32
4006            testq $imm31, %r64  -> testl $imm31, %r32
4007            xorq %r64, %r64     -> xorl %r32, %r32
4008            subq %r64, %r64     -> subl %r32, %r32
4009            movq $imm31, %r64   -> movl $imm31, %r32
4010            movq $imm32, %r64   -> movl $imm32, %r32
4011         */
4012       i.tm.opcode_modifier.norex64 = 1;
           /* (base_opcode | 1) == 0xc7 accepts both 0xc6 and 0xc7.  */
4013       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4014         {
4015           /* Handle
4016                movq $imm31, %r64   -> movl $imm31, %r32
4017                movq $imm32, %r64   -> movl $imm32, %r32
4018            */
               /* Retype the immediate as imm32 and the register as dword,
                  both in the template and in the parsed operands.  */
4019           i.tm.operand_types[0].bitfield.imm32 = 1;
4020           i.tm.operand_types[0].bitfield.imm32s = 0;
4021           i.tm.operand_types[0].bitfield.imm64 = 0;
4022           i.types[0].bitfield.imm32 = 1;
4023           i.types[0].bitfield.imm32s = 0;
4024           i.types[0].bitfield.imm64 = 0;
4025           i.types[1].bitfield.dword = 1;
4026           i.types[1].bitfield.qword = 0;
4027           if ((i.tm.base_opcode | 1) == 0xc7)
4028             {
4029               /* Handle
4030                    movq $imm31, %r64   -> movl $imm31, %r32
4031                */
                   /* Replace the ModRM form by the 0xb8 short form: no
                      extension opcode, no W bit, no ModRM byte.  */
4032               i.tm.base_opcode = 0xb8;
4033               i.tm.extension_opcode = None;
4034               i.tm.opcode_modifier.w = 0;
4035               i.tm.opcode_modifier.shortform = 1;
4036               i.tm.opcode_modifier.modrm = 0;
4037             }
4038         }
4039     }
4040   else if (optimize > 1
4041            && !optimize_for_space
4042            && i.reg_operands == 2
4043            && i.op[0].regs == i.op[1].regs
4044            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4045                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4046            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4047     {
4048       /* Optimize: -O2:
4049            andb %rN, %rN  -> testb %rN, %rN
4050            andw %rN, %rN  -> testw %rN, %rN
4051            andq %rN, %rN  -> testq %rN, %rN
4052            orb %rN, %rN   -> testb %rN, %rN
4053            orw %rN, %rN   -> testw %rN, %rN
4054            orq %rN, %rN   -> testq %rN, %rN
4055
4056            and outside of 64-bit mode
4057
4058            andl %rN, %rN  -> testl %rN, %rN
4059            orl %rN, %rN   -> testl %rN, %rN
4060        */
           /* Only the lowest bit of the original opcode is carried over.  */
4061       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4062     }
4063   else if (i.reg_operands == 3
4064            && i.op[0].regs == i.op[1].regs
4065            && !i.types[2].bitfield.xmmword
4066            && (i.tm.opcode_modifier.vex
4067                || ((!i.mask || i.mask->zeroing)
4068                    && !i.rounding
4069                    && is_evex_encoding (&i.tm)
4070                    && (i.vec_encoding != vex_encoding_evex
4071                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4072                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4073                        || (i.tm.operand_types[2].bitfield.zmmword
4074                            && i.types[2].bitfield.ymmword))))
4075            && ((i.tm.base_opcode == 0x55
4076                 || i.tm.base_opcode == 0x6655
4077                 || i.tm.base_opcode == 0x66df
4078                 || i.tm.base_opcode == 0x57
4079                 || i.tm.base_opcode == 0x6657
4080                 || i.tm.base_opcode == 0x66ef
4081                 || i.tm.base_opcode == 0x66f8
4082                 || i.tm.base_opcode == 0x66f9
4083                 || i.tm.base_opcode == 0x66fa
4084                 || i.tm.base_opcode == 0x66fb
4085                 || i.tm.base_opcode == 0x42
4086                 || i.tm.base_opcode == 0x6642
4087                 || i.tm.base_opcode == 0x47
4088                 || i.tm.base_opcode == 0x6647)
4089                && i.tm.extension_opcode == None))
4090     {
4091       /* Optimize: -O1:
4092            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4093            vpsubq and vpsubw:
4094              EVEX VOP %zmmM, %zmmM, %zmmN
4095                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4096                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4097              EVEX VOP %ymmM, %ymmM, %ymmN
4098                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4099                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4100              VEX VOP %ymmM, %ymmM, %ymmN
4101                -> VEX VOP %xmmM, %xmmM, %xmmN
4102            VOP, one of vpandn and vpxor:
4103              VEX VOP %ymmM, %ymmM, %ymmN
4104                -> VEX VOP %xmmM, %xmmM, %xmmN
4105            VOP, one of vpandnd and vpandnq:
4106              EVEX VOP %zmmM, %zmmM, %zmmN
4107                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4108                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4109              EVEX VOP %ymmM, %ymmM, %ymmN
4110                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4111                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4112            VOP, one of vpxord and vpxorq:
4113              EVEX VOP %zmmM, %zmmM, %zmmN
4114                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4115                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4116              EVEX VOP %ymmM, %ymmM, %ymmN
4117                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4118                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4119            VOP, one of kxord and kxorq:
4120              VEX VOP %kM, %kM, %kN
4121                -> VEX kxorw %kM, %kM, %kN
4122            VOP, one of kandnd and kandnq:
4123              VEX VOP %kM, %kM, %kN
4124                -> VEX kandnw %kM, %kM, %kN
4125        */
4126       if (is_evex_encoding (&i.tm))
4127         {
               /* EVEX template: switch to a 128-bit VEX encoding unless
                  i.vec_encoding is vex_encoding_evex; in that case shrink
                  to EVEX128 when OPTIMIZE > 1, else leave the insn
                  untouched.  */
4128           if (i.vec_encoding != vex_encoding_evex)
4129             {
4130               i.tm.opcode_modifier.vex = VEX128;
4131               i.tm.opcode_modifier.vexw = VEXW0;
4132               i.tm.opcode_modifier.evex = 0;
4133             }
4134           else if (optimize > 1)
4135             i.tm.opcode_modifier.evex = EVEX128;
4136           else
4137             return;
4138         }
4139       else if (i.tm.operand_types[0].bitfield.regmask)
4140         {
               /* Mask register form: keep only the low 8 bits of the
                  opcode and select VEXW0.  */
4141           i.tm.base_opcode &= 0xff;
4142           i.tm.opcode_modifier.vexw = VEXW0;
4143         }
4144       else
4145         i.tm.opcode_modifier.vex = VEX128;
4146
           /* With a VEX encoding in effect, retag all three operands as
              xmmword instead of ymmword.  */
4147       if (i.tm.opcode_modifier.vex)
4148         for (j = 0; j < 3; j++)
4149           {
4150             i.types[j].bitfield.xmmword = 1;
4151             i.types[j].bitfield.ymmword = 0;
4152           }
4153     }
4154   else if (i.vec_encoding != vex_encoding_evex
4155            && !i.types[0].bitfield.zmmword
4156            && !i.types[1].bitfield.zmmword
4157            && !i.mask
4158            && !i.broadcast
4159            && is_evex_encoding (&i.tm)
4160            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4161                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4162                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4163                || (i.tm.base_opcode & ~4) == 0x66db
4164                || (i.tm.base_opcode & ~4) == 0x66eb)
4165            && i.tm.extension_opcode == None)
4166     {
4167       /* Optimize: -O1:
4168            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4169            vmovdqu32 and vmovdqu64:
4170              EVEX VOP %xmmM, %xmmN
4171                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4172              EVEX VOP %ymmM, %ymmN
4173                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4174              EVEX VOP %xmmM, mem
4175                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4176              EVEX VOP %ymmM, mem
4177                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4178              EVEX VOP mem, %xmmN
4179                -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4180              EVEX VOP mem, %ymmN
4181                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4182            VOP, one of vpand, vpandn, vpor, vpxor:
4183              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4184                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4185              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4186                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4187              EVEX VOP{d,q} mem, %xmmM, %xmmN
4188                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4189              EVEX VOP{d,q} mem, %ymmM, %ymmN
4190                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4191        */
           /* Look for the first operand with a constant displacement.  J is
              left pointing at it, or equals i.operands if there is none.  */
4192       for (j = 0; j < i.operands; j++)
4193         if (operand_type_check (i.types[j], disp)
4194             && i.op[j].disps->X_op == O_constant)
4195           {
4196             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4197                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4198                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4199             int evex_disp8, vex_disp8;
4200             unsigned int memshift = i.memshift;
4201             offsetT n = i.op[j].disps->X_add_number;
4202
                 /* fits_in_disp8 is evaluated once with the current
                    i.memshift and once with i.memshift cleared
                    (presumably it consults i.memshift -- confirm).  If the
                    answers differ, i.memshift is restored and the insn is
                    left as it is.  */
4203             evex_disp8 = fits_in_disp8 (n);
4204             i.memshift = 0;
4205             vex_disp8 = fits_in_disp8 (n);
4206             if (evex_disp8 != vex_disp8)
4207               {
4208                 i.memshift = memshift;
4209                 return;
4210               }
4211
4212             i.types[j].bitfield.disp8 = vex_disp8;
4213             break;
4214           }
           /* Turn opcode 0xf26f into 0xf36f; the XOR leaves the
              Opcode_SIMD_IntD bit as it was.  */
4215       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4216         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4217       i.tm.opcode_modifier.vex
4218         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4219       i.tm.opcode_modifier.vexw = VEXW0;
4220       /* VPAND, VPOR, and VPXOR are commutative.  */
4221       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4222         i.tm.opcode_modifier.commutative = 1;
           /* Clear the EVEX-only template properties.  */
4223       i.tm.opcode_modifier.evex = 0;
4224       i.tm.opcode_modifier.masking = 0;
4225       i.tm.opcode_modifier.broadcast = 0;
4226       i.tm.opcode_modifier.disp8memshift = 0;
4227       i.memshift = 0;
           /* Recompute disp8 for the displacement operand found above, now
              that i.memshift is 0.  */
4228       if (j < i.operands)
4229         i.types[j].bitfield.disp8
4230           = fits_in_disp8 (i.op[j].disps->X_add_number);
4231     }
4232 }
4233
4234 /* This is the guts of the machine-dependent assembler.  LINE points to a
4235    machine dependent instruction.  This function is supposed to emit
4236    the frags/bytes it assembles to.

        The global insn state I and the displacement/immediate expression
        arrays are cleared first.  Then the mnemonic and the operands are
        parsed, a template is matched, prefixes and operands are checked
        and adjusted, and finally output_insn is called.  Several failure
        paths return before output_insn is reached.  */
4237
4238 void
4239 md_assemble (char *line)
4240 {
4241   unsigned int j;
4242   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4243   const insn_template *t;
4244
4245   /* Initialize globals.  */
4246   memset (&i, '\0', sizeof (i));
4247   for (j = 0; j < MAX_OPERANDS; j++)
4248     i.reloc[j] = NO_RELOC;
4249   memset (disp_expressions, '\0', sizeof (disp_expressions));
4250   memset (im_expressions, '\0', sizeof (im_expressions));
4251   save_stack_p = save_stack;
4252
4253   /* First parse an instruction mnemonic & call i386_operand for the operands.
4254      We assume that the scrubber has arranged it so that line[0] is the valid
4255      start of a (possibly prefixed) mnemonic.  */
4256
4257   line = parse_insn (line, mnemonic);
4258   if (line == NULL)
4259     return;
       /* Keep the suffix as it is right after parsing the mnemonic; it is
          handed to match_template below.  */
4260   mnem_suffix = i.suffix;
4261
4262   line = parse_operands (line, mnemonic);
4263   this_operand = -1;
       /* i.memop1_string is released before the error check, so it is
          freed whether or not operand parsing succeeded.  */
4264   xfree (i.memop1_string);
4265   i.memop1_string = NULL;
4266   if (line == NULL)
4267     return;
4268
4269   /* Now we've parsed the mnemonic into a set of templates, and have the
4270      operands at hand.  */
4271
4272   /* All intel opcodes have reversed operands except for "bound" and
4273      "enter".  We also don't reverse intersegment "jmp" and "call"
4274      instructions with 2 immediate operands so that the immediate segment
4275      precedes the offset, as it does when in AT&T mode.
        NOTE: the mnemonics exempted by name in the test below are "bound"
        and "invlpga"; any insn whose first two operands are both
        immediates is exempted by the operand type check.  */
4276   if (intel_syntax
4277       && i.operands > 1
4278       && (strcmp (mnemonic, "bound") != 0)
4279       && (strcmp (mnemonic, "invlpga") != 0)
4280       && !(operand_type_check (i.types[0], imm)
4281            && operand_type_check (i.types[1], imm)))
4282     swap_operands ();
4283
4284   /* The order of the immediates should be reversed
4285      for 2 immediates extrq and insertq instructions */
4286   if (i.imm_operands == 2
4287       && (strcmp (mnemonic, "extrq") == 0
4288           || strcmp (mnemonic, "insertq") == 0))
4289       swap_2_operands (0, 1);
4290
4291   if (i.imm_operands)
4292     optimize_imm ();
4293
4294   /* Don't optimize displacement for movabs since it only takes 64bit
4295      displacement.  */
4296   if (i.disp_operands
4297       && i.disp_encoding != disp_encoding_32bit
4298       && (flag_code != CODE_64BIT
4299           || strcmp (mnemonic, "movabs") != 0))
4300     optimize_disp ();
4301
4302   /* Next, we find a template that matches the given insn,
4303      making sure the overlap of the given operands types is consistent
4304      with the template operand types.  */
4305
4306   if (!(t = match_template (mnem_suffix)))
4307     return;
4308
       /* Report use of a non-AVX SSE-family insn as a warning or an error,
          as selected by sse_check.  */
4309   if (sse_check != check_none
4310       && !i.tm.opcode_modifier.noavx
4311       && !i.tm.cpu_flags.bitfield.cpuavx
4312       && (i.tm.cpu_flags.bitfield.cpusse
4313           || i.tm.cpu_flags.bitfield.cpusse2
4314           || i.tm.cpu_flags.bitfield.cpusse3
4315           || i.tm.cpu_flags.bitfield.cpussse3
4316           || i.tm.cpu_flags.bitfield.cpusse4_1
4317           || i.tm.cpu_flags.bitfield.cpusse4_2
4318           || i.tm.cpu_flags.bitfield.cpupclmul
4319           || i.tm.cpu_flags.bitfield.cpuaes
4320           || i.tm.cpu_flags.bitfield.cpugfni))
4321     {
4322       (sse_check == check_warning
4323        ? as_warn
4324        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4325     }
4326
4327   /* Zap movzx and movsx suffix.  The suffix has been set from
4328      "word ptr" or "byte ptr" on the source operand in Intel syntax
4329      or extracted from mnemonic in AT&T syntax.  But we'll use
4330      the destination register to choose the suffix for encoding.  */
       /* Masking with ~9 ignores bits 0 and 3, so base opcodes 0x0fb6,
          0x0fb7, 0x0fbe and 0x0fbf all match.  */
4331   if ((i.tm.base_opcode & ~9) == 0x0fb6)
4332     {
4333       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
4334          there is no suffix, the default will be byte extension.  */
4335       if (i.reg_operands != 2
4336           && !i.suffix
4337           && intel_syntax)
4338         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4339
4340       i.suffix = 0;
4341     }
4342
4343   if (i.tm.opcode_modifier.fwait)
4344     if (!add_prefix (FWAIT_OPCODE))
4345       return;
4346
4347   /* Check if REP prefix is OK.  */
4348   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4349     {
4350       as_bad (_("invalid instruction `%s' after `%s'"),
4351                 i.tm.name, i.rep_prefix);
4352       return;
4353     }
4354
4355   /* Check for lock without a lockable instruction.  Destination operand
4356      must be memory unless it is xchg (0x86).  */
4357   if (i.prefix[LOCK_PREFIX]
4358       && (!i.tm.opcode_modifier.islockable
4359           || i.mem_operands == 0
4360           || (i.tm.base_opcode != 0x86
4361               && !(i.flags[i.operands - 1] & Operand_Mem))))
4362     {
4363       as_bad (_("expecting lockable instruction after `lock'"));
4364       return;
4365     }
4366
4367   /* Check for data size prefix on VEX/XOP/EVEX encoded insns.  */
4368   if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4369     {
4370       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4371       return;
4372     }
4373
4374   /* Check if HLE prefix is OK.  */
4375   if (i.hle_prefix && !check_hle ())
4376     return;
4377
       /* The BND, NOTRACK and MPX checks below only report the problem;
          this function does not return on them.  */
4378   /* Check BND prefix.  */
4379   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4380     as_bad (_("expecting valid branch instruction after `bnd'"));
4381
4382   /* Check NOTRACK prefix.  */
4383   if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4384     as_bad (_("expecting indirect branch instruction after `notrack'"));
4385
4386   if (i.tm.cpu_flags.bitfield.cpumpx)
4387     {
4388       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4389         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4390       else if (flag_code != CODE_16BIT
4391                ? i.prefix[ADDR_PREFIX]
4392                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4393         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4394     }
4395
4396   /* Insert BND prefix.  */
4397   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4398     {
4399       if (!i.prefix[BND_PREFIX])
4400         add_prefix (BND_PREFIX_OPCODE);
4401       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4402         {
4403           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4404           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4405         }
4406     }
4407
4408   /* Check string instruction segment overrides.  */
4409   if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4410     {
4411       if (!check_string ())
4412         return;
           /* After a successful check no displacement operands are
              counted for the string insn.  */
4413       i.disp_operands = 0;
4414     }
4415
       /* Encoding optimization needs a nonzero OPTIMIZE, no per-insn
          opt-out (i.no_optimize) and a template marked as optimizable.  */
4416   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4417     optimize_encoding ();
4418
4419   if (!process_suffix ())
4420     return;
4421
4422   /* Update operand types.  */
4423   for (j = 0; j < i.operands; j++)
4424     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4425
4426   /* Make still unresolved immediate matches conform to size of immediate
4427      given in i.suffix.  */
4428   if (!finalize_imm ())
4429     return;
4430
4431   if (i.types[0].bitfield.imm1)
4432     i.imm_operands = 0; /* kludge for shift insns.  */
4433
4434   /* We only need to check those implicit registers for instructions
4435      with 3 operands or less.  */
       /* Operands typed as in/out port register, shift count or non-XMM
          accumulator are taken out of the register operand count.  */
4436   if (i.operands <= 3)
4437     for (j = 0; j < i.operands; j++)
4438       if (i.types[j].bitfield.inoutportreg
4439           || i.types[j].bitfield.shiftcount
4440           || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4441         i.reg_operands--;
4442
4443   /* ImmExt should be processed after SSE2AVX.  */
4444   if (!i.tm.opcode_modifier.sse2avx
4445       && i.tm.opcode_modifier.immext)
4446     process_immext ();
4447
4448   /* For insns with operands there are more diddles to do to the opcode.  */
4449   if (i.operands)
4450     {
4451       if (!process_operands ())
4452         return;
4453     }
4454   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4455     {
4456       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4457       as_warn (_("translating to `%sp'"), i.tm.name);
4458     }
4459
4460   if (is_any_vex_encoding (&i.tm))
4461     {
4462       if (!cpu_arch_flags.bitfield.cpui286)
4463         {
4464           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4465                   i.tm.name);
4466           return;
4467         }
4468
           /* Templates with the vex modifier set get a VEX prefix;
              everything else accepted by is_any_vex_encoding goes to
              build_evex_prefix.  */
4469       if (i.tm.opcode_modifier.vex)
4470         build_vex_prefix (t);
4471       else
4472         build_evex_prefix ();
4473     }
4474
4475   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4476      instructions may define INT_OPCODE as well, so avoid this corner
4477      case for those instructions that use MODRM.  */
4478   if (i.tm.base_opcode == INT_OPCODE
4479       && !i.tm.opcode_modifier.modrm
4480       && i.op[0].imms->X_add_number == 3)
4481     {
4482       i.tm.base_opcode = INT3_OPCODE;
4483       i.imm_operands = 0;
4484     }
4485
4486   if ((i.tm.opcode_modifier.jump
4487        || i.tm.opcode_modifier.jumpbyte
4488        || i.tm.opcode_modifier.jumpdword)
4489       && i.op[0].disps->X_op == O_constant)
4490     {
4491       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4492          the absolute address given by the constant.  Since ix86 jumps and
4493          calls are pc relative, we need to generate a reloc.  */
4494       i.op[0].disps->X_add_symbol = &abs_symbol;
4495       i.op[0].disps->X_op = O_symbol;
4496     }
4497
4498   if (i.tm.opcode_modifier.rex64)
4499     i.rex |= REX_W;
4500
4501   /* For 8 bit registers we need an empty rex prefix.  Also if the
4502      instruction already has a prefix, we need to convert old
4503      registers to new ones.  */
4504
       /* Only operands 0 and 1 are examined here and in the loops below.  */
4505   if ((i.types[0].bitfield.reg && i.types[0].bitfield.byte
4506        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4507       || (i.types[1].bitfield.reg && i.types[1].bitfield.byte
4508           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4509       || (((i.types[0].bitfield.reg && i.types[0].bitfield.byte)
4510            || (i.types[1].bitfield.reg && i.types[1].bitfield.byte))
4511           && i.rex != 0))
4512     {
4513       int x;
4514
4515       i.rex |= REX_OPCODE;
4516       for (x = 0; x < 2; x++)
4517         {
4518           /* Look for 8 bit operand that uses old registers.  */
4519           if (i.types[x].bitfield.reg && i.types[x].bitfield.byte
4520               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4521             {
4522               /* In case it is "hi" register, give up.  */
4523               if (i.op[x].regs->reg_num > 3)
4524                 as_bad (_("can't encode register '%s%s' in an "
4525                           "instruction requiring REX prefix."),
4526                         register_prefix, i.op[x].regs->reg_name);
4527
4528               /* Otherwise it is equivalent to the extended register.
4529                  Since the encoding doesn't change this is merely
4530                  cosmetic cleanup for debug output.  */
4531
4532               i.op[x].regs = i.op[x].regs + 8;
4533             }
4534         }
4535     }
4536
4537   if (i.rex == 0 && i.rex_encoding)
4538     {
4539       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4540          that uses legacy register.  If it is "hi" register, don't add
4541          the REX_OPCODE byte.  */
4542       int x;
4543       for (x = 0; x < 2; x++)
4544         if (i.types[x].bitfield.reg
4545             && i.types[x].bitfield.byte
4546             && (i.op[x].regs->reg_flags & RegRex64) == 0
4547             && i.op[x].regs->reg_num > 3)
4548           {
4549             i.rex_encoding = FALSE;
4550             break;
4551           }
4552
4553       if (i.rex_encoding)
4554         i.rex = REX_OPCODE;
4555     }
4556
       /* Record the accumulated REX bits as a prefix.  */
4557   if (i.rex != 0)
4558     add_prefix (REX_OPCODE | i.rex);
4559
4560   /* We are ready to output the insn.  */
4561   output_insn ();
4562 }
4563
/* Parse any leading prefixes and the mnemonic of the instruction text
   at LINE.

   Each token is copied into MNEMONIC one character at a time through
   the mnemonic_chars[] translation table and then looked up in op_hash.
   A token that names a prefix and is followed by more text is consumed
   inside the loop: real prefixes are recorded with add_prefix, pseudo
   prefixes (templates with opcode_length == 0) set the corresponding
   encoding request in `i'.  The first token that is not such a prefix
   is taken as the mnemonic.  If the mnemonic is not found as written,
   the deprecated ".s" / ".d8" / ".d32" endings and then a trailing
   size suffix character are stripped and the lookup is retried.

   On success current_templates refers to the templates found for the
   mnemonic and the returned pointer is just past the mnemonic (and
   past a ",pt" / ",pn" branch hint if one was accepted).  On failure
   NULL is returned; the failures detected directly in this function
   are reported with as_bad first (failures signalled by add_prefix are
   presumably reported there -- that function is not visible here).  */

static char *
parse_insn (char *line, char *mnemonic)
{
  char *l = line;
  char *token_start = l;
  char *mnem_p;
  int supported;
  const insn_template *t;
  /* Last '.' stored into MNEMONIC, if any; used for the deprecated
     ".s" / ".d8" / ".d32" endings below.  */
  char *dot_p = NULL;

  /* One iteration per token: every iteration but the last consumes a
     prefix, the last one leaves the mnemonic in MNEMONIC.  */
  while (1)
    {
      mnem_p = mnemonic;
      /* Copy the token.  A zero entry in mnemonic_chars[] ends it and
         doubles as the string terminator written to MNEMONIC.  */
      while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
        {
          if (*mnem_p == '.')
            dot_p = mnem_p;
          mnem_p++;
          /* Leave room for the terminator: at most MAX_MNEM_SIZE - 1
             characters are accepted.  */
          if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
            {
              as_bad (_("no such instruction: `%s'"), token_start);
              return NULL;
            }
          l++;
        }
      /* The token must be followed by white space or the end of the
         insn; outside Intel syntax PREFIX_SEPARATOR and ',' are also
         accepted here.  */
      if (!is_space_char (*l)
          && *l != END_OF_INSN
          && (intel_syntax
              || (*l != PREFIX_SEPARATOR
                  && *l != ',')))
        {
          as_bad (_("invalid character %s in mnemonic"),
                  output_invalid (*l));
          return NULL;
        }
      /* Empty token.  */
      if (token_start == l)
        {
          if (!intel_syntax && *l == PREFIX_SEPARATOR)
            as_bad (_("expecting prefix; got nothing"));
          else
            as_bad (_("expecting mnemonic; got nothing"));
          return NULL;
        }

      /* Look up instruction (or prefix) via hash table.  */
      current_templates = (const templates *) hash_find (op_hash, mnemonic);

      /* Treat the token as a prefix only if something other than a
         single trailing space follows it; a prefix standing alone is
         left to be handled as the instruction itself.  */
      if (*l != END_OF_INSN
          && (!is_space_char (*l) || l[1] != END_OF_INSN)
          && current_templates
          && current_templates->start->opcode_modifier.isprefix)
        {
          if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
            {
              as_bad ((flag_code != CODE_64BIT
                       ? _("`%s' is only supported in 64-bit mode")
                       : _("`%s' is not supported in 64-bit mode")),
                      current_templates->start->name);
              return NULL;
            }
          /* If we are in 16-bit mode, do not allow addr16 or data16.
             Similarly, in 32-bit mode, do not allow addr32 or data32.  */
          if ((current_templates->start->opcode_modifier.size == SIZE16
               || current_templates->start->opcode_modifier.size == SIZE32)
              && flag_code != CODE_64BIT
              && ((current_templates->start->opcode_modifier.size == SIZE32)
                  ^ (flag_code == CODE_16BIT)))
            {
              as_bad (_("redundant %s prefix"),
                      current_templates->start->name);
              return NULL;
            }
          if (current_templates->start->opcode_length == 0)
            {
              /* Handle pseudo prefixes.  They emit nothing themselves;
                 base_opcode merely selects which request to record.  */
              switch (current_templates->start->base_opcode)
                {
                case 0x0:
                  /* {disp8} */
                  i.disp_encoding = disp_encoding_8bit;
                  break;
                case 0x1:
                  /* {disp32} */
                  i.disp_encoding = disp_encoding_32bit;
                  break;
                case 0x2:
                  /* {load} */
                  i.dir_encoding = dir_encoding_load;
                  break;
                case 0x3:
                  /* {store} */
                  i.dir_encoding = dir_encoding_store;
                  break;
                case 0x4:
                  /* {vex2} */
                  i.vec_encoding = vex_encoding_vex2;
                  break;
                case 0x5:
                  /* {vex3} */
                  i.vec_encoding = vex_encoding_vex3;
                  break;
                case 0x6:
                  /* {evex} */
                  i.vec_encoding = vex_encoding_evex;
                  break;
                case 0x7:
                  /* {rex} */
                  i.rex_encoding = TRUE;
                  break;
                case 0x8:
                  /* {nooptimize} */
                  i.no_optimize = TRUE;
                  break;
                default:
                  abort ();
                }
            }
          else
            {
              /* Add prefix, checking for repeated prefixes.  For the
                 DS and REP classes also remember the name the prefix
                 was written with, keyed on the template's CPU flag.  */
              switch (add_prefix (current_templates->start->base_opcode))
                {
                case PREFIX_EXIST:
                  return NULL;
                case PREFIX_DS:
                  if (current_templates->start->cpu_flags.bitfield.cpuibt)
                    i.notrack_prefix = current_templates->start->name;
                  break;
                case PREFIX_REP:
                  if (current_templates->start->cpu_flags.bitfield.cpuhle)
                    i.hle_prefix = current_templates->start->name;
                  else if (current_templates->start->cpu_flags.bitfield.cpumpx)
                    i.bnd_prefix = current_templates->start->name;
                  else
                    i.rep_prefix = current_templates->start->name;
                  break;
                default:
                  break;
                }
            }
          /* Skip past PREFIX_SEPARATOR and reset token_start.  */
          token_start = ++l;
        }
      else
        break;
    }

  if (!current_templates)
    {
      /* Deprecated functionality (new code should use pseudo-prefixes instead):
         Check if we should swap operand or force 32bit displacement in
         encoding.  */
      if (mnem_p - 2 == dot_p && dot_p[1] == 's')
        i.dir_encoding = dir_encoding_swap;
      else if (mnem_p - 3 == dot_p
               && dot_p[1] == 'd'
               && dot_p[2] == '8')
        i.disp_encoding = disp_encoding_8bit;
      else if (mnem_p - 4 == dot_p
               && dot_p[1] == 'd'
               && dot_p[2] == '3'
               && dot_p[3] == '2')
        i.disp_encoding = disp_encoding_32bit;
      else
        goto check_suffix;
      /* Cut the recognised ending off MNEMONIC and retry the lookup.  */
      mnem_p = dot_p;
      *dot_p = '\0';
      current_templates = (const templates *) hash_find (op_hash, mnemonic);
    }

  if (!current_templates)
    {
      /* Also entered by the goto above when no deprecated ending was
         recognised.  */
check_suffix:
      if (mnem_p > mnemonic)
        {
          /* See if we can get a match by trimming off a suffix.  */
          switch (mnem_p[-1])
            {
            /* Note the unusual layout: the `else' arm of the word case
               is the statement labelled by the byte and qword cases, so
               all three share the assignment of the literal suffix
               character and the retry that follows it.  */
            case WORD_MNEM_SUFFIX:
              if (intel_syntax && (intel_float_operand (mnemonic) & 2))
                i.suffix = SHORT_MNEM_SUFFIX;
              else
                /* Fall through.  */
              case BYTE_MNEM_SUFFIX:
              case QWORD_MNEM_SUFFIX:
                i.suffix = mnem_p[-1];
              mnem_p[-1] = '\0';
              current_templates = (const templates *) hash_find (op_hash,
                                                                 mnemonic);
              break;
            /* These two are only stripped outside Intel syntax.  */
            case SHORT_MNEM_SUFFIX:
            case LONG_MNEM_SUFFIX:
              if (!intel_syntax)
                {
                  i.suffix = mnem_p[-1];
                  mnem_p[-1] = '\0';
                  current_templates = (const templates *) hash_find (op_hash,
                                                                     mnemonic);
                }
              break;

              /* Intel Syntax.  A trailing 'd' becomes the short suffix
                 when intel_float_operand returns 1 for the mnemonic and
                 the long suffix otherwise.  */
            case 'd':
              if (intel_syntax)
                {
                  if (intel_float_operand (mnemonic) == 1)
                    i.suffix = SHORT_MNEM_SUFFIX;
                  else
                    i.suffix = LONG_MNEM_SUFFIX;
                  mnem_p[-1] = '\0';
                  current_templates = (const templates *) hash_find (op_hash,
                                                                     mnemonic);
                }
              break;
            }
        }

      if (!current_templates)
        {
          as_bad (_("no such instruction: `%s'"), token_start);
          return NULL;
        }
    }

  if (current_templates->start->opcode_modifier.jump
      || current_templates->start->opcode_modifier.jumpbyte)
    {
      /* Check for a branch hint.  We allow ",pt" and ",pn" for
         predict taken and predict not taken respectively.
         I'm not sure that branch hints actually do anything on loop
         and jcxz insns (JumpByte) for current Pentium4 chips.  They
         may work in the future and it doesn't hurt to accept them
         now.  */
      if (l[0] == ',' && l[1] == 'p')
        {
          if (l[2] == 't')
            {
              if (!add_prefix (DS_PREFIX_OPCODE))
                return NULL;
              l += 3;
            }
          else if (l[2] == 'n')
            {
              if (!add_prefix (CS_PREFIX_OPCODE))
                return NULL;
              l += 3;
            }
        }
    }
  /* Any other comma loses.  */
  if (*l == ',')
    {
      as_bad (_("invalid character %s in mnemonic"),
              output_invalid (*l));
      return NULL;
    }

  /* Check if instruction is supported on specified architecture.  The
     match bits of the templates are accumulated; as soon as they add
     up to a perfect match the mnemonic is accepted.  */
  supported = 0;
  for (t = current_templates->start; t < current_templates->end; ++t)
    {
      supported |= cpu_flags_match (t);
      if (supported == CPU_FLAGS_PERFECT_MATCH)
        {
          /* Warn when the selected architecture lacks the i386 feature
             bit but the current code size is not 16-bit.  */
          if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
            as_warn (_("use .code16 to ensure correct addressing mode"));

          return l;
        }
    }

  /* No perfect match: tell a code-size mismatch apart from an
     unsupported architecture in the diagnostic.  */
  if (!(supported & CPU_FLAGS_64BIT_MATCH))
    as_bad (flag_code == CODE_64BIT
            ? _("`%s' is not supported in 64-bit mode")
            : _("`%s' is only supported in 64-bit mode"),
            current_templates->start->name);
  else
    as_bad (_("`%s' is not supported on `%s%s'"),
            current_templates->start->name,
            cpu_arch_name ? cpu_arch_name : default_arch,
            cpu_sub_arch_name ? cpu_sub_arch_name : "");

  return NULL;
}
4848
4849 static char *
4850 parse_operands (char *l, const char *mnemonic)
4851 {
4852   char *token_start;
4853
4854   /* 1 if operand is pending after ','.  */
4855   unsigned int expecting_operand = 0;
4856
4857   /* Non-zero if operand parens not balanced.  */
4858   unsigned int paren_not_balanced;
4859
4860   while (*l != END_OF_INSN)
4861     {
4862       /* Skip optional white space before operand.  */
4863       if (is_space_char (*l))
4864         ++l;
4865       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4866         {
4867           as_bad (_("invalid character %s before operand %d"),
4868                   output_invalid (*l),
4869                   i.operands + 1);
4870           return NULL;
4871         }
4872       token_start = l;  /* After white space.  */
4873       paren_not_balanced = 0;
4874       while (paren_not_balanced || *l != ',')
4875         {
4876           if (*l == END_OF_INSN)
4877             {
4878               if (paren_not_balanced)
4879                 {
4880                   if (!intel_syntax)
4881                     as_bad (_("unbalanced parenthesis in operand %d."),
4882                             i.operands + 1);
4883                   else
4884                     as_bad (_("unbalanced brackets in operand %d."),
4885                             i.operands + 1);
4886                   return NULL;
4887                 }
4888               else
4889                 break;  /* we are done */
4890             }
4891           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4892             {
4893               as_bad (_("invalid character %s in operand %d"),
4894                       output_invalid (*l),
4895                       i.operands + 1);
4896               return NULL;
4897             }
4898           if (!intel_syntax)
4899             {
4900               if (*l == '(')
4901                 ++paren_not_balanced;
4902               if (*l == ')')
4903                 --paren_not_balanced;
4904             }
4905           else
4906             {
4907               if (*l == '[')
4908                 ++paren_not_balanced;
4909               if (*l == ']')
4910                 --paren_not_balanced;
4911             }
4912           l++;
4913         }
4914       if (l != token_start)
4915         {                       /* Yes, we've read in another operand.  */
4916           unsigned int operand_ok;
4917           this_operand = i.operands++;
4918           if (i.operands > MAX_OPERANDS)
4919             {
4920               as_bad (_("spurious operands; (%d operands/instruction max)"),
4921                       MAX_OPERANDS);
4922               return NULL;
4923             }
4924           i.types[this_operand].bitfield.unspecified = 1;
4925           /* Now parse operand adding info to 'i' as we go along.  */
4926           END_STRING_AND_SAVE (l);
4927
4928           if (i.mem_operands > 1)
4929             {
4930               as_bad (_("too many memory references for `%s'"),
4931                       mnemonic);
4932               return 0;
4933             }
4934
4935           if (intel_syntax)
4936             operand_ok =
4937               i386_intel_operand (token_start,
4938                                   intel_float_operand (mnemonic));
4939           else
4940             operand_ok = i386_att_operand (token_start);
4941
4942           RESTORE_END_STRING (l);
4943           if (!operand_ok)
4944             return NULL;
4945         }
4946       else
4947         {
4948           if (expecting_operand)
4949             {
4950             expecting_operand_after_comma:
4951               as_bad (_("expecting operand after ','; got nothing"));
4952               return NULL;
4953             }
4954           if (*l == ',')
4955             {
4956               as_bad (_("expecting operand before ','; got nothing"));
4957               return NULL;
4958             }
4959         }
4960
4961       /* Now *l must be either ',' or END_OF_INSN.  */
4962       if (*l == ',')
4963         {
4964           if (*++l == END_OF_INSN)
4965             {
4966               /* Just skip it, if it's \n complain.  */
4967               goto expecting_operand_after_comma;
4968             }
4969           expecting_operand = 1;
4970         }
4971     }
4972   return l;
4973 }
4974
4975 static void
4976 swap_2_operands (int xchg1, int xchg2)
4977 {
4978   union i386_op temp_op;
4979   i386_operand_type temp_type;
4980   unsigned int temp_flags;
4981   enum bfd_reloc_code_real temp_reloc;
4982
4983   temp_type = i.types[xchg2];
4984   i.types[xchg2] = i.types[xchg1];
4985   i.types[xchg1] = temp_type;
4986
4987   temp_flags = i.flags[xchg2];
4988   i.flags[xchg2] = i.flags[xchg1];
4989   i.flags[xchg1] = temp_flags;
4990
4991   temp_op = i.op[xchg2];
4992   i.op[xchg2] = i.op[xchg1];
4993   i.op[xchg1] = temp_op;
4994
4995   temp_reloc = i.reloc[xchg2];
4996   i.reloc[xchg2] = i.reloc[xchg1];
4997   i.reloc[xchg1] = temp_reloc;
4998
4999   if (i.mask)
5000     {
5001       if (i.mask->operand == xchg1)
5002         i.mask->operand = xchg2;
5003       else if (i.mask->operand == xchg2)
5004         i.mask->operand = xchg1;
5005     }
5006   if (i.broadcast)
5007     {
5008       if (i.broadcast->operand == xchg1)
5009         i.broadcast->operand = xchg2;
5010       else if (i.broadcast->operand == xchg2)
5011         i.broadcast->operand = xchg1;
5012     }
5013   if (i.rounding)
5014     {
5015       if (i.rounding->operand == xchg1)
5016         i.rounding->operand = xchg2;
5017       else if (i.rounding->operand == xchg2)
5018         i.rounding->operand = xchg1;
5019     }
5020 }
5021
5022 static void
5023 swap_operands (void)
5024 {
5025   switch (i.operands)
5026     {
5027     case 5:
5028     case 4:
5029       swap_2_operands (1, i.operands - 2);
5030       /* Fall through.  */
5031     case 3:
5032     case 2:
5033       swap_2_operands (0, i.operands - 1);
5034       break;
5035     default:
5036       abort ();
5037     }
5038
5039   if (i.mem_operands == 2)
5040     {
5041       const seg_entry *temp_seg;
5042       temp_seg = i.seg[0];
5043       i.seg[0] = i.seg[1];
5044       i.seg[1] = temp_seg;
5045     }
5046 }
5047
5048 /* Try to ensure constant immediates are represented in the smallest
5049    opcode possible.  */
5050 static void
5051 optimize_imm (void)
5052 {
5053   char guess_suffix = 0;
5054   int op;
5055
5056   if (i.suffix)
5057     guess_suffix = i.suffix;
5058   else if (i.reg_operands)
5059     {
5060       /* Figure out a suffix from the last register operand specified.
5061          We can't do this properly yet, ie. excluding InOutPortReg,
5062          but the following works for instructions with immediates.
5063          In any case, we can't set i.suffix yet.  */
5064       for (op = i.operands; --op >= 0;)
5065         if (i.types[op].bitfield.reg && i.types[op].bitfield.byte)
5066           {
5067             guess_suffix = BYTE_MNEM_SUFFIX;
5068             break;
5069           }
5070         else if (i.types[op].bitfield.reg && i.types[op].bitfield.word)
5071           {
5072             guess_suffix = WORD_MNEM_SUFFIX;
5073             break;
5074           }
5075         else if (i.types[op].bitfield.reg && i.types[op].bitfield.dword)
5076           {
5077             guess_suffix = LONG_MNEM_SUFFIX;
5078             break;
5079           }
5080         else if (i.types[op].bitfield.reg && i.types[op].bitfield.qword)
5081           {
5082             guess_suffix = QWORD_MNEM_SUFFIX;
5083             break;
5084           }
5085     }
5086   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5087     guess_suffix = WORD_MNEM_SUFFIX;
5088
5089   for (op = i.operands; --op >= 0;)
5090     if (operand_type_check (i.types[op], imm))
5091       {
5092         switch (i.op[op].imms->X_op)
5093           {
5094           case O_constant:
5095             /* If a suffix is given, this operand may be shortened.  */
5096             switch (guess_suffix)
5097               {
5098               case LONG_MNEM_SUFFIX:
5099                 i.types[op].bitfield.imm32 = 1;
5100                 i.types[op].bitfield.imm64 = 1;
5101                 break;
5102               case WORD_MNEM_SUFFIX:
5103                 i.types[op].bitfield.imm16 = 1;
5104                 i.types[op].bitfield.imm32 = 1;
5105                 i.types[op].bitfield.imm32s = 1;
5106                 i.types[op].bitfield.imm64 = 1;
5107                 break;
5108               case BYTE_MNEM_SUFFIX:
5109                 i.types[op].bitfield.imm8 = 1;
5110                 i.types[op].bitfield.imm8s = 1;
5111                 i.types[op].bitfield.imm16 = 1;
5112                 i.types[op].bitfield.imm32 = 1;
5113                 i.types[op].bitfield.imm32s = 1;
5114                 i.types[op].bitfield.imm64 = 1;
5115                 break;
5116               }
5117
5118             /* If this operand is at most 16 bits, convert it
5119                to a signed 16 bit number before trying to see
5120                whether it will fit in an even smaller size.
5121                This allows a 16-bit operand such as $0xffe0 to
5122                be recognised as within Imm8S range.  */
5123             if ((i.types[op].bitfield.imm16)
5124                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5125               {
5126                 i.op[op].imms->X_add_number =
5127                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5128               }
5129 #ifdef BFD64
5130             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5131             if ((i.types[op].bitfield.imm32)
5132                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5133                     == 0))
5134               {
5135                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5136                                                 ^ ((offsetT) 1 << 31))
5137                                                - ((offsetT) 1 << 31));
5138               }
5139 #endif
5140             i.types[op]
5141               = operand_type_or (i.types[op],
5142                                  smallest_imm_type (i.op[op].imms->X_add_number));
5143
5144             /* We must avoid matching of Imm32 templates when 64bit
5145                only immediate is available.  */
5146             if (guess_suffix == QWORD_MNEM_SUFFIX)
5147               i.types[op].bitfield.imm32 = 0;
5148             break;
5149
5150           case O_absent:
5151           case O_register:
5152             abort ();
5153
5154             /* Symbols and expressions.  */
5155           default:
5156             /* Convert symbolic operand to proper sizes for matching, but don't
5157                prevent matching a set of insns that only supports sizes other
5158                than those matching the insn suffix.  */
5159             {
5160               i386_operand_type mask, allowed;
5161               const insn_template *t;
5162
5163               operand_type_set (&mask, 0);
5164               operand_type_set (&allowed, 0);
5165
5166               for (t = current_templates->start;
5167                    t < current_templates->end;
5168                    ++t)
5169                 allowed = operand_type_or (allowed,
5170                                            t->operand_types[op]);
5171               switch (guess_suffix)
5172                 {
5173                 case QWORD_MNEM_SUFFIX:
5174                   mask.bitfield.imm64 = 1;
5175                   mask.bitfield.imm32s = 1;
5176                   break;
5177                 case LONG_MNEM_SUFFIX:
5178                   mask.bitfield.imm32 = 1;
5179                   break;
5180                 case WORD_MNEM_SUFFIX:
5181                   mask.bitfield.imm16 = 1;
5182                   break;
5183                 case BYTE_MNEM_SUFFIX:
5184                   mask.bitfield.imm8 = 1;
5185                   break;
5186                 default:
5187                   break;
5188                 }
5189               allowed = operand_type_and (mask, allowed);
5190               if (!operand_type_all_zero (&allowed))
5191                 i.types[op] = operand_type_and (i.types[op], mask);
5192             }
5193             break;
5194           }
5195       }
5196 }
5197
5198 /* Try to use the smallest displacement type too.  */
5199 static void
5200 optimize_disp (void)
5201 {
5202   int op;
5203
5204   for (op = i.operands; --op >= 0;)
5205     if (operand_type_check (i.types[op], disp))
5206       {
5207         if (i.op[op].disps->X_op == O_constant)
5208           {
5209             offsetT op_disp = i.op[op].disps->X_add_number;
5210
5211             if (i.types[op].bitfield.disp16
5212                 && (op_disp & ~(offsetT) 0xffff) == 0)
5213               {
5214                 /* If this operand is at most 16 bits, convert
5215                    to a signed 16 bit number and don't use 64bit
5216                    displacement.  */
5217                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5218                 i.types[op].bitfield.disp64 = 0;
5219               }
5220 #ifdef BFD64
5221             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5222             if (i.types[op].bitfield.disp32
5223                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5224               {
5225                 /* If this operand is at most 32 bits, convert
5226                    to a signed 32 bit number and don't use 64bit
5227                    displacement.  */
5228                 op_disp &= (((offsetT) 2 << 31) - 1);
5229                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5230                 i.types[op].bitfield.disp64 = 0;
5231               }
5232 #endif
5233             if (!op_disp && i.types[op].bitfield.baseindex)
5234               {
5235                 i.types[op].bitfield.disp8 = 0;
5236                 i.types[op].bitfield.disp16 = 0;
5237                 i.types[op].bitfield.disp32 = 0;
5238                 i.types[op].bitfield.disp32s = 0;
5239                 i.types[op].bitfield.disp64 = 0;
5240                 i.op[op].disps = 0;
5241                 i.disp_operands--;
5242               }
5243             else if (flag_code == CODE_64BIT)
5244               {
5245                 if (fits_in_signed_long (op_disp))
5246                   {
5247                     i.types[op].bitfield.disp64 = 0;
5248                     i.types[op].bitfield.disp32s = 1;
5249                   }
5250                 if (i.prefix[ADDR_PREFIX]
5251                     && fits_in_unsigned_long (op_disp))
5252                   i.types[op].bitfield.disp32 = 1;
5253               }
5254             if ((i.types[op].bitfield.disp32
5255                  || i.types[op].bitfield.disp32s
5256                  || i.types[op].bitfield.disp16)
5257                 && fits_in_disp8 (op_disp))
5258               i.types[op].bitfield.disp8 = 1;
5259           }
5260         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5261                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5262           {
5263             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5264                          i.op[op].disps, 0, i.reloc[op]);
5265             i.types[op].bitfield.disp8 = 0;
5266             i.types[op].bitfield.disp16 = 0;
5267             i.types[op].bitfield.disp32 = 0;
5268             i.types[op].bitfield.disp32s = 0;
5269             i.types[op].bitfield.disp64 = 0;
5270           }
5271         else
5272           /* We only support 64bit displacement on constants.  */
5273           i.types[op].bitfield.disp64 = 0;
5274       }
5275 }
5276
5277 /* Return 1 if there is a match in broadcast bytes between operand
5278    GIVEN and instruction template T.   */
5279
5280 static INLINE int
5281 match_broadcast_size (const insn_template *t, unsigned int given)
5282 {
5283   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5284            && i.types[given].bitfield.byte)
5285           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5286               && i.types[given].bitfield.word)
5287           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5288               && i.types[given].bitfield.dword)
5289           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5290               && i.types[given].bitfield.qword));
5291 }
5292
5293 /* Check if operands are valid for the instruction.  */
5294
5295 static int
5296 check_VecOperands (const insn_template *t)
5297 {
5298   unsigned int op;
5299   i386_cpu_flags cpu;
5300   static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5301
5302   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
     any one operand are implicitly requiring AVX512VL support if the actual
5304      operand size is YMMword or XMMword.  Since this function runs after
5305      template matching, there's no need to check for YMMword/XMMword in
5306      the template.  */
5307   cpu = cpu_flags_and (t->cpu_flags, avx512);
5308   if (!cpu_flags_all_zero (&cpu)
5309       && !t->cpu_flags.bitfield.cpuavx512vl
5310       && !cpu_arch_flags.bitfield.cpuavx512vl)
5311     {
5312       for (op = 0; op < t->operands; ++op)
5313         {
5314           if (t->operand_types[op].bitfield.zmmword
5315               && (i.types[op].bitfield.ymmword
5316                   || i.types[op].bitfield.xmmword))
5317             {
5318               i.error = unsupported;
5319               return 1;
5320             }
5321         }
5322     }
5323
5324   /* Without VSIB byte, we can't have a vector register for index.  */
5325   if (!t->opcode_modifier.vecsib
5326       && i.index_reg
5327       && (i.index_reg->reg_type.bitfield.xmmword
5328           || i.index_reg->reg_type.bitfield.ymmword
5329           || i.index_reg->reg_type.bitfield.zmmword))
5330     {
5331       i.error = unsupported_vector_index_register;
5332       return 1;
5333     }
5334
5335   /* Check if default mask is allowed.  */
5336   if (t->opcode_modifier.nodefmask
5337       && (!i.mask || i.mask->mask->reg_num == 0))
5338     {
5339       i.error = no_default_mask;
5340       return 1;
5341     }
5342
5343   /* For VSIB byte, we need a vector register for index, and all vector
5344      registers must be distinct.  */
5345   if (t->opcode_modifier.vecsib)
5346     {
5347       if (!i.index_reg
5348           || !((t->opcode_modifier.vecsib == VecSIB128
5349                 && i.index_reg->reg_type.bitfield.xmmword)
5350                || (t->opcode_modifier.vecsib == VecSIB256
5351                    && i.index_reg->reg_type.bitfield.ymmword)
5352                || (t->opcode_modifier.vecsib == VecSIB512
5353                    && i.index_reg->reg_type.bitfield.zmmword)))
5354       {
5355         i.error = invalid_vsib_address;
5356         return 1;
5357       }
5358
5359       gas_assert (i.reg_operands == 2 || i.mask);
5360       if (i.reg_operands == 2 && !i.mask)
5361         {
5362           gas_assert (i.types[0].bitfield.regsimd);
5363           gas_assert (i.types[0].bitfield.xmmword
5364                       || i.types[0].bitfield.ymmword);
5365           gas_assert (i.types[2].bitfield.regsimd);
5366           gas_assert (i.types[2].bitfield.xmmword
5367                       || i.types[2].bitfield.ymmword);
5368           if (operand_check == check_none)
5369             return 0;
5370           if (register_number (i.op[0].regs)
5371               != register_number (i.index_reg)
5372               && register_number (i.op[2].regs)
5373                  != register_number (i.index_reg)
5374               && register_number (i.op[0].regs)
5375                  != register_number (i.op[2].regs))
5376             return 0;
5377           if (operand_check == check_error)
5378             {
5379               i.error = invalid_vector_register_set;
5380               return 1;
5381             }
5382           as_warn (_("mask, index, and destination registers should be distinct"));
5383         }
5384       else if (i.reg_operands == 1 && i.mask)
5385         {
5386           if (i.types[1].bitfield.regsimd
5387               && (i.types[1].bitfield.xmmword
5388                   || i.types[1].bitfield.ymmword
5389                   || i.types[1].bitfield.zmmword)
5390               && (register_number (i.op[1].regs)
5391                   == register_number (i.index_reg)))
5392             {
5393               if (operand_check == check_error)
5394                 {
5395                   i.error = invalid_vector_register_set;
5396                   return 1;
5397                 }
5398               if (operand_check != check_none)
5399                 as_warn (_("index and destination registers should be distinct"));
5400             }
5401         }
5402     }
5403
5404   /* Check if broadcast is supported by the instruction and is applied
5405      to the memory operand.  */
5406   if (i.broadcast)
5407     {
5408       i386_operand_type type, overlap;
5409
5410       /* Check if specified broadcast is supported in this instruction,
5411          and its broadcast bytes match the memory operand.  */
5412       op = i.broadcast->operand;
5413       if (!t->opcode_modifier.broadcast
5414           || !(i.flags[op] & Operand_Mem)
5415           || (!i.types[op].bitfield.unspecified
5416               && !match_broadcast_size (t, op)))
5417         {
5418         bad_broadcast:
5419           i.error = unsupported_broadcast;
5420           return 1;
5421         }
5422
5423       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5424                             * i.broadcast->type);
5425       operand_type_set (&type, 0);
5426       switch (i.broadcast->bytes)
5427         {
5428         case 2:
5429           type.bitfield.word = 1;
5430           break;
5431         case 4:
5432           type.bitfield.dword = 1;
5433           break;
5434         case 8:
5435           type.bitfield.qword = 1;
5436           break;
5437         case 16:
5438           type.bitfield.xmmword = 1;
5439           break;
5440         case 32:
5441           type.bitfield.ymmword = 1;
5442           break;
5443         case 64:
5444           type.bitfield.zmmword = 1;
5445           break;
5446         default:
5447           goto bad_broadcast;
5448         }
5449
5450       overlap = operand_type_and (type, t->operand_types[op]);
5451       if (operand_type_all_zero (&overlap))
5452           goto bad_broadcast;
5453
5454       if (t->opcode_modifier.checkregsize)
5455         {
5456           unsigned int j;
5457
5458           type.bitfield.baseindex = 1;
5459           for (j = 0; j < i.operands; ++j)
5460             {
5461               if (j != op
5462                   && !operand_type_register_match(i.types[j],
5463                                                   t->operand_types[j],
5464                                                   type,
5465                                                   t->operand_types[op]))
5466                 goto bad_broadcast;
5467             }
5468         }
5469     }
5470   /* If broadcast is supported in this instruction, we need to check if
5471      operand of one-element size isn't specified without broadcast.  */
5472   else if (t->opcode_modifier.broadcast && i.mem_operands)
5473     {
5474       /* Find memory operand.  */
5475       for (op = 0; op < i.operands; op++)
5476         if (i.flags[op] & Operand_Mem)
5477           break;
5478       gas_assert (op < i.operands);
5479       /* Check size of the memory operand.  */
5480       if (match_broadcast_size (t, op))
5481         {
5482           i.error = broadcast_needed;
5483           return 1;
5484         }
5485     }
5486   else
5487     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5488
5489   /* Check if requested masking is supported.  */
5490   if (i.mask)
5491     {
5492       switch (t->opcode_modifier.masking)
5493         {
5494         case BOTH_MASKING:
5495           break;
5496         case MERGING_MASKING:
5497           if (i.mask->zeroing)
5498             {
5499         case 0:
5500               i.error = unsupported_masking;
5501               return 1;
5502             }
5503           break;
5504         case DYNAMIC_MASKING:
5505           /* Memory destinations allow only merging masking.  */
5506           if (i.mask->zeroing && i.mem_operands)
5507             {
5508               /* Find memory operand.  */
5509               for (op = 0; op < i.operands; op++)
5510                 if (i.flags[op] & Operand_Mem)
5511                   break;
5512               gas_assert (op < i.operands);
5513               if (op == i.operands - 1)
5514                 {
5515                   i.error = unsupported_masking;
5516                   return 1;
5517                 }
5518             }
5519           break;
5520         default:
5521           abort ();
5522         }
5523     }
5524
5525   /* Check if masking is applied to dest operand.  */
5526   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5527     {
5528       i.error = mask_not_on_destination;
5529       return 1;
5530     }
5531
5532   /* Check RC/SAE.  */
5533   if (i.rounding)
5534     {
5535       if (!t->opcode_modifier.sae
5536           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5537         {
5538           i.error = unsupported_rc_sae;
5539           return 1;
5540         }
5541       /* If the instruction has several immediate operands and one of
5542          them is rounding, the rounding operand should be the last
5543          immediate operand.  */
5544       if (i.imm_operands > 1
5545           && i.rounding->operand != (int) (i.imm_operands - 1))
5546         {
5547           i.error = rc_sae_operand_not_last_imm;
5548           return 1;
5549         }
5550     }
5551
5552   /* Check vector Disp8 operand.  */
5553   if (t->opcode_modifier.disp8memshift
5554       && i.disp_encoding != disp_encoding_32bit)
5555     {
5556       if (i.broadcast)
5557         i.memshift = t->opcode_modifier.broadcast - 1;
5558       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5559         i.memshift = t->opcode_modifier.disp8memshift;
5560       else
5561         {
5562           const i386_operand_type *type = NULL;
5563
5564           i.memshift = 0;
5565           for (op = 0; op < i.operands; op++)
5566             if (i.flags[op] & Operand_Mem)
5567               {
5568                 if (t->opcode_modifier.evex == EVEXLIG)
5569                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5570                 else if (t->operand_types[op].bitfield.xmmword
5571                          + t->operand_types[op].bitfield.ymmword
5572                          + t->operand_types[op].bitfield.zmmword <= 1)
5573                   type = &t->operand_types[op];
5574                 else if (!i.types[op].bitfield.unspecified)
5575                   type = &i.types[op];
5576               }
5577             else if (i.types[op].bitfield.regsimd
5578                      && t->opcode_modifier.evex != EVEXLIG)
5579               {
5580                 if (i.types[op].bitfield.zmmword)
5581                   i.memshift = 6;
5582                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5583                   i.memshift = 5;
5584                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5585                   i.memshift = 4;
5586               }
5587
5588           if (type)
5589             {
5590               if (type->bitfield.zmmword)
5591                 i.memshift = 6;
5592               else if (type->bitfield.ymmword)
5593                 i.memshift = 5;
5594               else if (type->bitfield.xmmword)
5595                 i.memshift = 4;
5596             }
5597
5598           /* For the check in fits_in_disp8().  */
5599           if (i.memshift == 0)
5600             i.memshift = -1;
5601         }
5602
5603       for (op = 0; op < i.operands; op++)
5604         if (operand_type_check (i.types[op], disp)
5605             && i.op[op].disps->X_op == O_constant)
5606           {
5607             if (fits_in_disp8 (i.op[op].disps->X_add_number))
5608               {
5609                 i.types[op].bitfield.disp8 = 1;
5610                 return 0;
5611               }
5612             i.types[op].bitfield.disp8 = 0;
5613           }
5614     }
5615
5616   i.memshift = 0;
5617
5618   return 0;
5619 }
5620
5621 /* Check if operands are valid for the instruction.  Update VEX
5622    operand types.  */
5623
5624 static int
5625 VEX_check_operands (const insn_template *t)
5626 {
5627   if (i.vec_encoding == vex_encoding_evex)
5628     {
5629       /* This instruction must be encoded with EVEX prefix.  */
5630       if (!is_evex_encoding (t))
5631         {
5632           i.error = unsupported;
5633           return 1;
5634         }
5635       return 0;
5636     }
5637
5638   if (!t->opcode_modifier.vex)
5639     {
5640       /* This instruction template doesn't have VEX prefix.  */
5641       if (i.vec_encoding != vex_encoding_default)
5642         {
5643           i.error = unsupported;
5644           return 1;
5645         }
5646       return 0;
5647     }
5648
5649   /* Check the special Imm4 cases; must be the first operand.  */
5650   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5651     {
5652       if (i.op[0].imms->X_op != O_constant
5653           || !fits_in_imm4 (i.op[0].imms->X_add_number))
5654         {
5655           i.error = bad_imm4;
5656           return 1;
5657         }
5658
5659       /* Turn off Imm<N> so that update_imm won't complain.  */
5660       operand_type_set (&i.types[0], 0);
5661     }
5662
5663   return 0;
5664 }
5665
5666 static const insn_template *
5667 match_template (char mnem_suffix)
5668 {
5669   /* Points to template once we've found it.  */
5670   const insn_template *t;
5671   i386_operand_type overlap0, overlap1, overlap2, overlap3;
5672   i386_operand_type overlap4;
5673   unsigned int found_reverse_match;
5674   i386_opcode_modifier suffix_check, mnemsuf_check;
5675   i386_operand_type operand_types [MAX_OPERANDS];
5676   int addr_prefix_disp;
5677   unsigned int j;
5678   unsigned int found_cpu_match, size_match;
5679   unsigned int check_register;
5680   enum i386_error specific_error = 0;
5681
5682 #if MAX_OPERANDS != 5
5683 # error "MAX_OPERANDS must be 5."
5684 #endif
5685
5686   found_reverse_match = 0;
5687   addr_prefix_disp = -1;
5688
5689   memset (&suffix_check, 0, sizeof (suffix_check));
5690   if (intel_syntax && i.broadcast)
5691     /* nothing */;
5692   else if (i.suffix == BYTE_MNEM_SUFFIX)
5693     suffix_check.no_bsuf = 1;
5694   else if (i.suffix == WORD_MNEM_SUFFIX)
5695     suffix_check.no_wsuf = 1;
5696   else if (i.suffix == SHORT_MNEM_SUFFIX)
5697     suffix_check.no_ssuf = 1;
5698   else if (i.suffix == LONG_MNEM_SUFFIX)
5699     suffix_check.no_lsuf = 1;
5700   else if (i.suffix == QWORD_MNEM_SUFFIX)
5701     suffix_check.no_qsuf = 1;
5702   else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5703     suffix_check.no_ldsuf = 1;
5704
5705   memset (&mnemsuf_check, 0, sizeof (mnemsuf_check));
5706   if (intel_syntax)
5707     {
5708       switch (mnem_suffix)
5709         {
5710         case BYTE_MNEM_SUFFIX:  mnemsuf_check.no_bsuf = 1; break;
5711         case WORD_MNEM_SUFFIX:  mnemsuf_check.no_wsuf = 1; break;
5712         case SHORT_MNEM_SUFFIX: mnemsuf_check.no_ssuf = 1; break;
5713         case LONG_MNEM_SUFFIX:  mnemsuf_check.no_lsuf = 1; break;
5714         case QWORD_MNEM_SUFFIX: mnemsuf_check.no_qsuf = 1; break;
5715         }
5716     }
5717
5718   /* Must have right number of operands.  */
5719   i.error = number_of_operands_mismatch;
5720
5721   for (t = current_templates->start; t < current_templates->end; t++)
5722     {
5723       addr_prefix_disp = -1;
5724       found_reverse_match = 0;
5725
5726       if (i.operands != t->operands)
5727         continue;
5728
5729       /* Check processor support.  */
5730       i.error = unsupported;
5731       found_cpu_match = (cpu_flags_match (t)
5732                          == CPU_FLAGS_PERFECT_MATCH);
5733       if (!found_cpu_match)
5734         continue;
5735
5736       /* Check AT&T mnemonic.   */
5737       i.error = unsupported_with_intel_mnemonic;
5738       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5739         continue;
5740
5741       /* Check AT&T/Intel syntax and Intel64/AMD64 ISA.   */
5742       i.error = unsupported_syntax;
5743       if ((intel_syntax && t->opcode_modifier.attsyntax)
5744           || (!intel_syntax && t->opcode_modifier.intelsyntax)
5745           || (intel64 && t->opcode_modifier.amd64)
5746           || (!intel64 && t->opcode_modifier.intel64))
5747         continue;
5748
5749       /* Check the suffix, except for some instructions in intel mode.  */
5750       i.error = invalid_instruction_suffix;
5751       if ((!intel_syntax || !t->opcode_modifier.ignoresize)
5752           && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5753               || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5754               || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5755               || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5756               || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5757               || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
5758         continue;
5759       /* In Intel mode all mnemonic suffixes must be explicitly allowed.  */
5760       if ((t->opcode_modifier.no_bsuf && mnemsuf_check.no_bsuf)
5761           || (t->opcode_modifier.no_wsuf && mnemsuf_check.no_wsuf)
5762           || (t->opcode_modifier.no_lsuf && mnemsuf_check.no_lsuf)
5763           || (t->opcode_modifier.no_ssuf && mnemsuf_check.no_ssuf)
5764           || (t->opcode_modifier.no_qsuf && mnemsuf_check.no_qsuf)
5765           || (t->opcode_modifier.no_ldsuf && mnemsuf_check.no_ldsuf))
5766         continue;
5767
5768       size_match = operand_size_match (t);
5769       if (!size_match)
5770         continue;
5771
5772       for (j = 0; j < MAX_OPERANDS; j++)
5773         operand_types[j] = t->operand_types[j];
5774
5775       /* In general, don't allow 64-bit operands in 32-bit mode.  */
5776       if (i.suffix == QWORD_MNEM_SUFFIX
5777           && flag_code != CODE_64BIT
5778           && (intel_syntax
5779               ? (!t->opcode_modifier.ignoresize
5780                  && !t->opcode_modifier.broadcast
5781                  && !intel_float_operand (t->name))
5782               : intel_float_operand (t->name) != 2)
5783           && ((!operand_types[0].bitfield.regmmx
5784                && !operand_types[0].bitfield.regsimd)
5785               || (!operand_types[t->operands > 1].bitfield.regmmx
5786                   && !operand_types[t->operands > 1].bitfield.regsimd))
5787           && (t->base_opcode != 0x0fc7
5788               || t->extension_opcode != 1 /* cmpxchg8b */))
5789         continue;
5790
5791       /* In general, don't allow 32-bit operands on pre-386.  */
5792       else if (i.suffix == LONG_MNEM_SUFFIX
5793                && !cpu_arch_flags.bitfield.cpui386
5794                && (intel_syntax
5795                    ? (!t->opcode_modifier.ignoresize
5796                       && !intel_float_operand (t->name))
5797                    : intel_float_operand (t->name) != 2)
5798                && ((!operand_types[0].bitfield.regmmx
5799                     && !operand_types[0].bitfield.regsimd)
5800                    || (!operand_types[t->operands > 1].bitfield.regmmx
5801                        && !operand_types[t->operands > 1].bitfield.regsimd)))
5802         continue;
5803
5804       /* Do not verify operands when there are none.  */
5805       else
5806         {
5807           if (!t->operands)
5808             /* We've found a match; break out of loop.  */
5809             break;
5810         }
5811
5812       /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5813          into Disp32/Disp16/Disp32 operand.  */
5814       if (i.prefix[ADDR_PREFIX] != 0)
5815           {
5816             /* There should be only one Disp operand.  */
5817             switch (flag_code)
5818             {
5819             case CODE_16BIT:
5820               for (j = 0; j < MAX_OPERANDS; j++)
5821                 {
5822                   if (operand_types[j].bitfield.disp16)
5823                     {
5824                       addr_prefix_disp = j;
5825                       operand_types[j].bitfield.disp32 = 1;
5826                       operand_types[j].bitfield.disp16 = 0;
5827                       break;
5828                     }
5829                 }
5830               break;
5831             case CODE_32BIT:
5832               for (j = 0; j < MAX_OPERANDS; j++)
5833                 {
5834                   if (operand_types[j].bitfield.disp32)
5835                     {
5836                       addr_prefix_disp = j;
5837                       operand_types[j].bitfield.disp32 = 0;
5838                       operand_types[j].bitfield.disp16 = 1;
5839                       break;
5840                     }
5841                 }
5842               break;
5843             case CODE_64BIT:
5844               for (j = 0; j < MAX_OPERANDS; j++)
5845                 {
5846                   if (operand_types[j].bitfield.disp64)
5847                     {
5848                       addr_prefix_disp = j;
5849                       operand_types[j].bitfield.disp64 = 0;
5850                       operand_types[j].bitfield.disp32 = 1;
5851                       break;
5852                     }
5853                 }
5854               break;
5855             }
5856           }
5857
5858       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
5859       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5860         continue;
5861
5862       /* We check register size if needed.  */
5863       if (t->opcode_modifier.checkregsize)
5864         {
5865           check_register = (1 << t->operands) - 1;
5866           if (i.broadcast)
5867             check_register &= ~(1 << i.broadcast->operand);
5868         }
5869       else
5870         check_register = 0;
5871
5872       overlap0 = operand_type_and (i.types[0], operand_types[0]);
5873       switch (t->operands)
5874         {
5875         case 1:
5876           if (!operand_type_match (overlap0, i.types[0]))
5877             continue;
5878           break;
5879         case 2:
5880           /* xchg %eax, %eax is a special case. It is an alias for nop
5881              only in 32bit mode and we can use opcode 0x90.  In 64bit
5882              mode, we can't use 0x90 for xchg %eax, %eax since it should
5883              zero-extend %eax to %rax.  */
5884           if (flag_code == CODE_64BIT
5885               && t->base_opcode == 0x90
5886               && i.types[0].bitfield.acc && i.types[0].bitfield.dword
5887               && i.types[1].bitfield.acc && i.types[1].bitfield.dword)
5888             continue;
5889           /* xrelease mov %eax, <disp> is another special case. It must not
5890              match the accumulator-only encoding of mov.  */
5891           if (flag_code != CODE_64BIT
5892               && i.hle_prefix
5893               && t->base_opcode == 0xa0
5894               && i.types[0].bitfield.acc
5895               && (i.flags[1] & Operand_Mem))
5896             continue;
5897           /* Fall through.  */
5898
5899         case 3:
5900           if (!(size_match & MATCH_STRAIGHT))
5901             goto check_reverse;
5902           /* Reverse direction of operands if swapping is possible in the first
5903              place (operands need to be symmetric) and
5904              - the load form is requested, and the template is a store form,
5905              - the store form is requested, and the template is a load form,
5906              - the non-default (swapped) form is requested.  */
5907           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5908           if (t->opcode_modifier.d && i.reg_operands == i.operands
5909               && !operand_type_all_zero (&overlap1))
5910             switch (i.dir_encoding)
5911               {
5912               case dir_encoding_load:
5913                 if (operand_type_check (operand_types[i.operands - 1], anymem)
5914                     || t->opcode_modifier.regmem)
5915                   goto check_reverse;
5916                 break;
5917
5918               case dir_encoding_store:
5919                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5920                     && !t->opcode_modifier.regmem)
5921                   goto check_reverse;
5922                 break;
5923
5924               case dir_encoding_swap:
5925                 goto check_reverse;
5926
5927               case dir_encoding_default:
5928                 break;
5929               }
5930           /* If we want store form, we skip the current load.  */
5931           if ((i.dir_encoding == dir_encoding_store
5932                || i.dir_encoding == dir_encoding_swap)
5933               && i.mem_operands == 0
5934               && t->opcode_modifier.load)
5935             continue;
5936           /* Fall through.  */
5937         case 4:
5938         case 5:
5939           overlap1 = operand_type_and (i.types[1], operand_types[1]);
5940           if (!operand_type_match (overlap0, i.types[0])
5941               || !operand_type_match (overlap1, i.types[1])
5942               || ((check_register & 3) == 3
5943                   && !operand_type_register_match (i.types[0],
5944                                                    operand_types[0],
5945                                                    i.types[1],
5946                                                    operand_types[1])))
5947             {
5948               /* Check if other direction is valid ...  */
5949               if (!t->opcode_modifier.d)
5950                 continue;
5951
5952 check_reverse:
5953               if (!(size_match & MATCH_REVERSE))
5954                 continue;
5955               /* Try reversing direction of operands.  */
5956               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
5957               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
5958               if (!operand_type_match (overlap0, i.types[0])
5959                   || !operand_type_match (overlap1, i.types[i.operands - 1])
5960                   || (check_register
5961                       && !operand_type_register_match (i.types[0],
5962                                                        operand_types[i.operands - 1],
5963                                                        i.types[i.operands - 1],
5964                                                        operand_types[0])))
5965                 {
5966                   /* Does not match either direction.  */
5967                   continue;
5968                 }
5969               /* found_reverse_match holds which of D or FloatR
5970                  we've found.  */
5971               if (!t->opcode_modifier.d)
5972                 found_reverse_match = 0;
5973               else if (operand_types[0].bitfield.tbyte)
5974                 found_reverse_match = Opcode_FloatD;
5975               else if (operand_types[0].bitfield.xmmword
5976                        || operand_types[i.operands - 1].bitfield.xmmword
5977                        || operand_types[0].bitfield.regmmx
5978                        || operand_types[i.operands - 1].bitfield.regmmx
5979                        || is_any_vex_encoding(t))
5980                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
5981                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
5982               else
5983                 found_reverse_match = Opcode_D;
5984               if (t->opcode_modifier.floatr)
5985                 found_reverse_match |= Opcode_FloatR;
5986             }
5987           else
5988             {
5989               /* Found a forward 2 operand match here.  */
5990               switch (t->operands)
5991                 {
5992                 case 5:
5993                   overlap4 = operand_type_and (i.types[4],
5994                                                operand_types[4]);
5995                   /* Fall through.  */
5996                 case 4:
5997                   overlap3 = operand_type_and (i.types[3],
5998                                                operand_types[3]);
5999                   /* Fall through.  */
6000                 case 3:
6001                   overlap2 = operand_type_and (i.types[2],
6002                                                operand_types[2]);
6003                   break;
6004                 }
6005
6006               switch (t->operands)
6007                 {
6008                 case 5:
6009                   if (!operand_type_match (overlap4, i.types[4])
6010                       || !operand_type_register_match (i.types[3],
6011                                                        operand_types[3],
6012                                                        i.types[4],
6013                                                        operand_types[4]))
6014                     continue;
6015                   /* Fall through.  */
6016                 case 4:
6017                   if (!operand_type_match (overlap3, i.types[3])
6018                       || ((check_register & 0xa) == 0xa
6019                           && !operand_type_register_match (i.types[1],
6020                                                             operand_types[1],
6021                                                             i.types[3],
6022                                                             operand_types[3]))
6023                       || ((check_register & 0xc) == 0xc
6024                           && !operand_type_register_match (i.types[2],
6025                                                             operand_types[2],
6026                                                             i.types[3],
6027                                                             operand_types[3])))
6028                     continue;
6029                   /* Fall through.  */
6030                 case 3:
6031                   /* Here we make use of the fact that there are no
6032                      reverse match 3 operand instructions.  */
6033                   if (!operand_type_match (overlap2, i.types[2])
6034                       || ((check_register & 5) == 5
6035                           && !operand_type_register_match (i.types[0],
6036                                                             operand_types[0],
6037                                                             i.types[2],
6038                                                             operand_types[2]))
6039                       || ((check_register & 6) == 6
6040                           && !operand_type_register_match (i.types[1],
6041                                                             operand_types[1],
6042                                                             i.types[2],
6043                                                             operand_types[2])))
6044                     continue;
6045                   break;
6046                 }
6047             }
6048           /* Found either forward/reverse 2, 3 or 4 operand match here:
6049              slip through to break.  */
6050         }
6051       if (!found_cpu_match)
6052         continue;
6053
6054       /* Check if vector and VEX operands are valid.  */
6055       if (check_VecOperands (t) || VEX_check_operands (t))
6056         {
6057           specific_error = i.error;
6058           continue;
6059         }
6060
6061       /* We've found a match; break out of loop.  */
6062       break;
6063     }
6064
6065   if (t == current_templates->end)
6066     {
6067       /* We found no match.  */
6068       const char *err_msg;
6069       switch (specific_error ? specific_error : i.error)
6070         {
6071         default:
6072           abort ();
6073         case operand_size_mismatch:
6074           err_msg = _("operand size mismatch");
6075           break;
6076         case operand_type_mismatch:
6077           err_msg = _("operand type mismatch");
6078           break;
6079         case register_type_mismatch:
6080           err_msg = _("register type mismatch");
6081           break;
6082         case number_of_operands_mismatch:
6083           err_msg = _("number of operands mismatch");
6084           break;
6085         case invalid_instruction_suffix:
6086           err_msg = _("invalid instruction suffix");
6087           break;
6088         case bad_imm4:
6089           err_msg = _("constant doesn't fit in 4 bits");
6090           break;
6091         case unsupported_with_intel_mnemonic:
6092           err_msg = _("unsupported with Intel mnemonic");
6093           break;
6094         case unsupported_syntax:
6095           err_msg = _("unsupported syntax");
6096           break;
6097         case unsupported:
6098           as_bad (_("unsupported instruction `%s'"),
6099                   current_templates->start->name);
6100           return NULL;
6101         case invalid_vsib_address:
6102           err_msg = _("invalid VSIB address");
6103           break;
6104         case invalid_vector_register_set:
6105           err_msg = _("mask, index, and destination registers must be distinct");
6106           break;
6107         case unsupported_vector_index_register:
6108           err_msg = _("unsupported vector index register");
6109           break;
6110         case unsupported_broadcast:
6111           err_msg = _("unsupported broadcast");
6112           break;
6113         case broadcast_needed:
6114           err_msg = _("broadcast is needed for operand of such type");
6115           break;
6116         case unsupported_masking:
6117           err_msg = _("unsupported masking");
6118           break;
6119         case mask_not_on_destination:
6120           err_msg = _("mask not on destination operand");
6121           break;
6122         case no_default_mask:
6123           err_msg = _("default mask isn't allowed");
6124           break;
6125         case unsupported_rc_sae:
6126           err_msg = _("unsupported static rounding/sae");
6127           break;
6128         case rc_sae_operand_not_last_imm:
6129           if (intel_syntax)
6130             err_msg = _("RC/SAE operand must precede immediate operands");
6131           else
6132             err_msg = _("RC/SAE operand must follow immediate operands");
6133           break;
6134         case invalid_register_operand:
6135           err_msg = _("invalid register operand");
6136           break;
6137         }
6138       as_bad (_("%s for `%s'"), err_msg,
6139               current_templates->start->name);
6140       return NULL;
6141     }
6142
6143   if (!quiet_warnings)
6144     {
6145       if (!intel_syntax
6146           && (i.types[0].bitfield.jumpabsolute
6147               != operand_types[0].bitfield.jumpabsolute))
6148         {
6149           as_warn (_("indirect %s without `*'"), t->name);
6150         }
6151
6152       if (t->opcode_modifier.isprefix
6153           && t->opcode_modifier.ignoresize)
6154         {
6155           /* Warn them that a data or address size prefix doesn't
6156              affect assembly of the next line of code.  */
6157           as_warn (_("stand-alone `%s' prefix"), t->name);
6158         }
6159     }
6160
6161   /* Copy the template we found.  */
6162   i.tm = *t;
6163
6164   if (addr_prefix_disp != -1)
6165     i.tm.operand_types[addr_prefix_disp]
6166       = operand_types[addr_prefix_disp];
6167
6168   if (found_reverse_match)
6169     {
6170       /* If we found a reverse match we must alter the opcode direction
6171          bit and clear/flip the regmem modifier one.  found_reverse_match
6172          holds bits to change (different for int & float insns).  */
6173
6174       i.tm.base_opcode ^= found_reverse_match;
6175
6176       i.tm.operand_types[0] = operand_types[i.operands - 1];
6177       i.tm.operand_types[i.operands - 1] = operand_types[0];
6178
6179       /* Certain SIMD insns have their load forms specified in the opcode
6180          table, and hence we need to _set_ RegMem instead of clearing it.
6181          We need to avoid setting the bit though on insns like KMOVW.  */
6182       i.tm.opcode_modifier.regmem
6183         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6184           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6185           && !i.tm.opcode_modifier.regmem;
6186     }
6187
6188   return t;
6189 }
6190
6191 static int
6192 check_string (void)
6193 {
6194   unsigned int mem_op = i.flags[0] & Operand_Mem ? 0 : 1;
6195
6196   if (i.tm.operand_types[mem_op].bitfield.esseg)
6197     {
6198       if (i.seg[0] != NULL && i.seg[0] != &es)
6199         {
6200           as_bad (_("`%s' operand %d must use `%ses' segment"),
6201                   i.tm.name,
6202                   intel_syntax ? i.tm.operands - mem_op : mem_op + 1,
6203                   register_prefix);
6204           return 0;
6205         }
6206       /* There's only ever one segment override allowed per instruction.
6207          This instruction possibly has a legal segment override on the
6208          second operand, so copy the segment to where non-string
6209          instructions store it, allowing common code.  */
6210       i.seg[0] = i.seg[1];
6211     }
6212   else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
6213     {
6214       if (i.seg[1] != NULL && i.seg[1] != &es)
6215         {
6216           as_bad (_("`%s' operand %d must use `%ses' segment"),
6217                   i.tm.name,
6218                   intel_syntax ? i.tm.operands - mem_op - 1 : mem_op + 2,
6219                   register_prefix);
6220           return 0;
6221         }
6222     }
6223   return 1;
6224 }
6225
/* Settle the operand size suffix (i.suffix) of the matched template
   i.tm and apply its consequences.

   The suffix is taken, in order of preference, from the template's
   explicit size modifier, from the register operands (or, when a
   suffix was given, validated against them), from stackop_size for
   DefaultSize templates, or from the current code size for certain
   Intel syntax branch and descriptor table insns.  Afterwards the
   base opcode is adjusted and operand size / address size prefixes
   and REX.W are added as required.

   Returns 1 on success, 0 after an error has been reported.  */

static int
process_suffix (void)
{
  /* If matched instruction specifies an explicit instruction mnemonic
     suffix, use it.  */
  if (i.tm.opcode_modifier.size == SIZE16)
    i.suffix = WORD_MNEM_SUFFIX;
  else if (i.tm.opcode_modifier.size == SIZE32)
    i.suffix = LONG_MNEM_SUFFIX;
  else if (i.tm.opcode_modifier.size == SIZE64)
    i.suffix = QWORD_MNEM_SUFFIX;
  else if (i.reg_operands)
    {
      /* If there's no instruction mnemonic suffix we try to invent one
         based on register operands.  */
      if (!i.suffix)
        {
          /* We take i.suffix from the last register operand specified,
             Destination register type is more significant than source
             register type.  crc32 in SSE4.2 prefers source register
             type. */
          if (i.tm.base_opcode == 0xf20f38f0 && i.types[0].bitfield.reg)
            {
              if (i.types[0].bitfield.byte)
                i.suffix = BYTE_MNEM_SUFFIX;
              else if (i.types[0].bitfield.word)
                i.suffix = WORD_MNEM_SUFFIX;
              else if (i.types[0].bitfield.dword)
                i.suffix = LONG_MNEM_SUFFIX;
              else if (i.types[0].bitfield.qword)
                i.suffix = QWORD_MNEM_SUFFIX;
            }

          if (!i.suffix)
            {
              int op;

              if (i.tm.base_opcode == 0xf20f38f0)
                {
                  /* We have to know the operand size for crc32.  */
                  as_bad (_("ambiguous memory operand size for `%s`"),
                          i.tm.name);
                  return 0;
                }

              /* Walk the operands from last to first and stop at the
                 first general register of a known size.  Operands the
                 template marks as I/O port register or shift count do
                 not take part.  */
              for (op = i.operands; --op >= 0;)
                if (!i.tm.operand_types[op].bitfield.inoutportreg
                    && !i.tm.operand_types[op].bitfield.shiftcount)
                  {
                    if (!i.types[op].bitfield.reg)
                      continue;
                    if (i.types[op].bitfield.byte)
                      i.suffix = BYTE_MNEM_SUFFIX;
                    else if (i.types[op].bitfield.word)
                      i.suffix = WORD_MNEM_SUFFIX;
                    else if (i.types[op].bitfield.dword)
                      i.suffix = LONG_MNEM_SUFFIX;
                    else if (i.types[op].bitfield.qword)
                      i.suffix = QWORD_MNEM_SUFFIX;
                    else
                      continue;
                    break;
                  }
            }
        }
      /* A suffix was given: in Intel syntax drop it when the template
         ignores the size and does not accept that suffix, otherwise
         check the register operands against it.  */
      else if (i.suffix == BYTE_MNEM_SUFFIX)
        {
          if (intel_syntax
              && i.tm.opcode_modifier.ignoresize
              && i.tm.opcode_modifier.no_bsuf)
            i.suffix = 0;
          else if (!check_byte_reg ())
            return 0;
        }
      else if (i.suffix == LONG_MNEM_SUFFIX)
        {
          if (intel_syntax
              && i.tm.opcode_modifier.ignoresize
              && i.tm.opcode_modifier.no_lsuf
              && !i.tm.opcode_modifier.todword
              && !i.tm.opcode_modifier.toqword)
            i.suffix = 0;
          else if (!check_long_reg ())
            return 0;
        }
      else if (i.suffix == QWORD_MNEM_SUFFIX)
        {
          if (intel_syntax
              && i.tm.opcode_modifier.ignoresize
              && i.tm.opcode_modifier.no_qsuf
              && !i.tm.opcode_modifier.todword
              && !i.tm.opcode_modifier.toqword)
            i.suffix = 0;
          else if (!check_qword_reg ())
            return 0;
        }
      else if (i.suffix == WORD_MNEM_SUFFIX)
        {
          if (intel_syntax
              && i.tm.opcode_modifier.ignoresize
              && i.tm.opcode_modifier.no_wsuf)
            i.suffix = 0;
          else if (!check_word_reg ())
            return 0;
        }
      else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
        /* Do nothing if the instruction is going to ignore the prefix.  */
        ;
      else
        abort ();
    }
  else if (i.tm.opcode_modifier.defaultsize
           && !i.suffix
           /* exclude fldenv/frstor/fsave/fstenv */
           && i.tm.opcode_modifier.no_ssuf)
    {
      if (stackop_size == LONG_MNEM_SUFFIX
          && i.tm.base_opcode == 0xcf)
        {
          /* stackop_size is set to LONG_MNEM_SUFFIX for the
             .code16gcc directive to support 16-bit mode with
             32-bit address.  For IRET without a suffix, generate
             16-bit IRET (opcode 0xcf) to return from an interrupt
             handler.  */
          i.suffix = WORD_MNEM_SUFFIX;
          as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
        }
      else
        i.suffix = stackop_size;
    }
  else if (intel_syntax
           && !i.suffix
           && (i.tm.operand_types[0].bitfield.jumpabsolute
               || i.tm.opcode_modifier.jumpbyte
               || i.tm.opcode_modifier.jumpintersegment
               || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
                   && i.tm.extension_opcode <= 3)))
    {
      /* Default to the widest suffix the template accepts for the
         current code size; 64-bit code falls back to `l' when `q'
         is not accepted.  */
      switch (flag_code)
        {
        case CODE_64BIT:
          if (!i.tm.opcode_modifier.no_qsuf)
            {
              i.suffix = QWORD_MNEM_SUFFIX;
              break;
            }
          /* Fall through.  */
        case CODE_32BIT:
          if (!i.tm.opcode_modifier.no_lsuf)
            i.suffix = LONG_MNEM_SUFFIX;
          break;
        case CODE_16BIT:
          if (!i.tm.opcode_modifier.no_wsuf)
            i.suffix = WORD_MNEM_SUFFIX;
          break;
        }
    }

  /* Still no suffix: diagnose instructions whose size cannot be
     determined.  */
  if (!i.suffix)
    {
      if (!intel_syntax)
        {
          if (i.tm.opcode_modifier.w)
            {
              as_bad (_("no instruction mnemonic suffix given and "
                        "no register operands; can't size instruction"));
              return 0;
            }
        }
      else
        {
          /* Bit mask of the suffixes the template accepts, one bit
             per suffix kind (`q' only counts in 64-bit code).  */
          unsigned int suffixes;

          suffixes = !i.tm.opcode_modifier.no_bsuf;
          if (!i.tm.opcode_modifier.no_wsuf)
            suffixes |= 1 << 1;
          if (!i.tm.opcode_modifier.no_lsuf)
            suffixes |= 1 << 2;
          if (!i.tm.opcode_modifier.no_ldsuf)
            suffixes |= 1 << 3;
          if (!i.tm.opcode_modifier.no_ssuf)
            suffixes |= 1 << 4;
          if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
            suffixes |= 1 << 5;

          /* There is more than one suffix match: suffixes
             & (suffixes - 1) is nonzero exactly when more than one
             bit is set.  */
          if (i.tm.opcode_modifier.w
              || ((suffixes & (suffixes - 1))
                  && !i.tm.opcode_modifier.defaultsize
                  && !i.tm.opcode_modifier.ignoresize))
            {
              as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
              return 0;
            }
        }
    }

  /* Change the opcode based on the operand size given by i.suffix.
     The cases below deliberately fall through into one another; any
     suffix value without a case label leaves the opcode and prefixes
     untouched.  */
  switch (i.suffix)
    {
    /* Size floating point instruction.  */
    case LONG_MNEM_SUFFIX:
      if (i.tm.opcode_modifier.floatmf)
        {
          i.tm.base_opcode ^= 4;
          break;
        }
    /* fall through */
    case WORD_MNEM_SUFFIX:
    case QWORD_MNEM_SUFFIX:
      /* It's not a byte, select word/dword operation.  */
      if (i.tm.opcode_modifier.w)
        {
          if (i.tm.opcode_modifier.shortform)
            i.tm.base_opcode |= 8;
          else
            i.tm.base_opcode |= 1;
        }
    /* fall through */
    case SHORT_MNEM_SUFFIX:
      /* Now select between word & dword operations via the operand
         size prefix, except for instructions that will ignore this
         prefix anyway.  */
      if (i.reg_operands > 0
          && i.types[0].bitfield.reg
          && i.tm.opcode_modifier.addrprefixopreg
          && (i.tm.opcode_modifier.immext
              || i.operands == 1))
        {
          /* The address size override prefix changes the size of the
             first operand.  */
          if ((flag_code == CODE_32BIT
               && i.op[0].regs->reg_type.bitfield.word)
              || (flag_code != CODE_32BIT
                  && i.op[0].regs->reg_type.bitfield.dword))
            if (!add_prefix (ADDR_PREFIX_OPCODE))
              return 0;
        }
      /* The equality test below holds when the suffix asks for the
         size that is not the default of the current mode: `l' in
         16-bit code, or a suffix other than `l' (and, per the first
         condition, other than `q') elsewhere.  */
      else if (i.suffix != QWORD_MNEM_SUFFIX
               && !i.tm.opcode_modifier.ignoresize
               && !i.tm.opcode_modifier.floatmf
               && !is_any_vex_encoding (&i.tm)
               && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
                   || (flag_code == CODE_64BIT
                       && i.tm.opcode_modifier.jumpbyte)))
        {
          unsigned int prefix = DATA_PREFIX_OPCODE;

          if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
            prefix = ADDR_PREFIX_OPCODE;

          if (!add_prefix (prefix))
            return 0;
        }

      /* Set mode64 for an operand.  */
      if (i.suffix == QWORD_MNEM_SUFFIX
          && flag_code == CODE_64BIT
          && !i.tm.opcode_modifier.norex64
          /* Special case for xchg %rax,%rax.  It is NOP and doesn't
             need rex64. */
          && ! (i.operands == 2
                && i.tm.base_opcode == 0x90
                && i.tm.extension_opcode == None
                && i.types[0].bitfield.acc && i.types[0].bitfield.qword
                && i.types[1].bitfield.acc && i.types[1].bitfield.qword))
        i.rex |= REX_W;

      break;
    }

  if (i.reg_operands != 0
      && i.operands > 1
      && i.tm.opcode_modifier.addrprefixopreg
      && !i.tm.opcode_modifier.immext)
    {
      /* Check invalid register operand when the address size override
         prefix changes the size of register operands.  */
      unsigned int op;
      enum { need_word, need_dword, need_qword } need;

      /* The required register width is the address size in effect:
         the mode's default, or the alternate one when an address
         size prefix is present.  */
      if (flag_code == CODE_32BIT)
        need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
      else
        {
          if (i.prefix[ADDR_PREFIX])
            need = need_dword;
          else
            need = flag_code == CODE_64BIT ? need_qword : need_word;
        }

      for (op = 0; op < i.operands; op++)
        if (i.types[op].bitfield.reg
            && ((need == need_word
                 && !i.op[op].regs->reg_type.bitfield.word)
                || (need == need_dword
                    && !i.op[op].regs->reg_type.bitfield.dword)
                || (need == need_qword
                    && !i.op[op].regs->reg_type.bitfield.qword)))
          {
            as_bad (_("invalid register operand size for `%s'"),
                    i.tm.name);
            return 0;
          }
    }

  return 1;
}
6534
6535 static int
6536 check_byte_reg (void)
6537 {
6538   int op;
6539
6540   for (op = i.operands; --op >= 0;)
6541     {
6542       /* Skip non-register operands. */
6543       if (!i.types[op].bitfield.reg)
6544         continue;
6545
6546       /* If this is an eight bit register, it's OK.  If it's the 16 or
6547          32 bit version of an eight bit register, we will just use the
6548          low portion, and that's OK too.  */
6549       if (i.types[op].bitfield.byte)
6550         continue;
6551
6552       /* I/O port address operands are OK too.  */
6553       if (i.tm.operand_types[op].bitfield.inoutportreg)
6554         continue;
6555
6556       /* crc32 doesn't generate this warning.  */
6557       if (i.tm.base_opcode == 0xf20f38f0)
6558         continue;
6559
6560       if ((i.types[op].bitfield.word
6561            || i.types[op].bitfield.dword
6562            || i.types[op].bitfield.qword)
6563           && i.op[op].regs->reg_num < 4
6564           /* Prohibit these changes in 64bit mode, since the lowering
6565              would be more complicated.  */
6566           && flag_code != CODE_64BIT)
6567         {
6568 #if REGISTER_WARNINGS
6569           if (!quiet_warnings)
6570             as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6571                      register_prefix,
6572                      (i.op[op].regs + (i.types[op].bitfield.word
6573                                        ? REGNAM_AL - REGNAM_AX
6574                                        : REGNAM_AL - REGNAM_EAX))->reg_name,
6575                      register_prefix,
6576                      i.op[op].regs->reg_name,
6577                      i.suffix);
6578 #endif
6579           continue;
6580         }
6581       /* Any other register is bad.  */
6582       if (i.types[op].bitfield.reg
6583           || i.types[op].bitfield.regmmx
6584           || i.types[op].bitfield.regsimd
6585           || i.types[op].bitfield.sreg
6586           || i.types[op].bitfield.control
6587           || i.types[op].bitfield.debug
6588           || i.types[op].bitfield.test)
6589         {
6590           as_bad (_("`%s%s' not allowed with `%s%c'"),
6591                   register_prefix,
6592                   i.op[op].regs->reg_name,
6593                   i.tm.name,
6594                   i.suffix);
6595           return 0;
6596         }
6597     }
6598   return 1;
6599 }
6600
6601 static int
6602 check_long_reg (void)
6603 {
6604   int op;
6605
6606   for (op = i.operands; --op >= 0;)
6607     /* Skip non-register operands. */
6608     if (!i.types[op].bitfield.reg)
6609       continue;
6610     /* Reject eight bit registers, except where the template requires
6611        them. (eg. movzb)  */
6612     else if (i.types[op].bitfield.byte
6613              && (i.tm.operand_types[op].bitfield.reg
6614                  || i.tm.operand_types[op].bitfield.acc)
6615              && (i.tm.operand_types[op].bitfield.word
6616                  || i.tm.operand_types[op].bitfield.dword))
6617       {
6618         as_bad (_("`%s%s' not allowed with `%s%c'"),
6619                 register_prefix,
6620                 i.op[op].regs->reg_name,
6621                 i.tm.name,
6622                 i.suffix);
6623         return 0;
6624       }
6625     /* Warn if the e prefix on a general reg is missing.  */
6626     else if ((!quiet_warnings || flag_code == CODE_64BIT)
6627              && i.types[op].bitfield.word
6628              && (i.tm.operand_types[op].bitfield.reg
6629                  || i.tm.operand_types[op].bitfield.acc)
6630              && i.tm.operand_types[op].bitfield.dword)
6631       {
6632         /* Prohibit these changes in the 64bit mode, since the
6633            lowering is more complicated.  */
6634         if (flag_code == CODE_64BIT)
6635           {
6636             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6637                     register_prefix, i.op[op].regs->reg_name,
6638                     i.suffix);
6639             return 0;
6640           }
6641 #if REGISTER_WARNINGS
6642         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6643                  register_prefix,
6644                  (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6645                  register_prefix, i.op[op].regs->reg_name, i.suffix);
6646 #endif
6647       }
6648     /* Warn if the r prefix on a general reg is present.  */
6649     else if (i.types[op].bitfield.qword
6650              && (i.tm.operand_types[op].bitfield.reg
6651                  || i.tm.operand_types[op].bitfield.acc)
6652              && i.tm.operand_types[op].bitfield.dword)
6653       {
6654         if (intel_syntax
6655             && i.tm.opcode_modifier.toqword
6656             && !i.types[0].bitfield.regsimd)
6657           {
6658             /* Convert to QWORD.  We want REX byte. */
6659             i.suffix = QWORD_MNEM_SUFFIX;
6660           }
6661         else
6662           {
6663             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6664                     register_prefix, i.op[op].regs->reg_name,
6665                     i.suffix);
6666             return 0;
6667           }
6668       }
6669   return 1;
6670 }
6671
6672 static int
6673 check_qword_reg (void)
6674 {
6675   int op;
6676
6677   for (op = i.operands; --op >= 0; )
6678     /* Skip non-register operands. */
6679     if (!i.types[op].bitfield.reg)
6680       continue;
6681     /* Reject eight bit registers, except where the template requires
6682        them. (eg. movzb)  */
6683     else if (i.types[op].bitfield.byte
6684              && (i.tm.operand_types[op].bitfield.reg
6685                  || i.tm.operand_types[op].bitfield.acc)
6686              && (i.tm.operand_types[op].bitfield.word
6687                  || i.tm.operand_types[op].bitfield.dword))
6688       {
6689         as_bad (_("`%s%s' not allowed with `%s%c'"),
6690                 register_prefix,
6691                 i.op[op].regs->reg_name,
6692                 i.tm.name,
6693                 i.suffix);
6694         return 0;
6695       }
6696     /* Warn if the r prefix on a general reg is missing.  */
6697     else if ((i.types[op].bitfield.word
6698               || i.types[op].bitfield.dword)
6699              && (i.tm.operand_types[op].bitfield.reg
6700                  || i.tm.operand_types[op].bitfield.acc)
6701              && i.tm.operand_types[op].bitfield.qword)
6702       {
6703         /* Prohibit these changes in the 64bit mode, since the
6704            lowering is more complicated.  */
6705         if (intel_syntax
6706             && i.tm.opcode_modifier.todword
6707             && !i.types[0].bitfield.regsimd)
6708           {
6709             /* Convert to DWORD.  We don't want REX byte. */
6710             i.suffix = LONG_MNEM_SUFFIX;
6711           }
6712         else
6713           {
6714             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6715                     register_prefix, i.op[op].regs->reg_name,
6716                     i.suffix);
6717             return 0;
6718           }
6719       }
6720   return 1;
6721 }
6722
6723 static int
6724 check_word_reg (void)
6725 {
6726   int op;
6727   for (op = i.operands; --op >= 0;)
6728     /* Skip non-register operands. */
6729     if (!i.types[op].bitfield.reg)
6730       continue;
6731     /* Reject eight bit registers, except where the template requires
6732        them. (eg. movzb)  */
6733     else if (i.types[op].bitfield.byte
6734              && (i.tm.operand_types[op].bitfield.reg
6735                  || i.tm.operand_types[op].bitfield.acc)
6736              && (i.tm.operand_types[op].bitfield.word
6737                  || i.tm.operand_types[op].bitfield.dword))
6738       {
6739         as_bad (_("`%s%s' not allowed with `%s%c'"),
6740                 register_prefix,
6741                 i.op[op].regs->reg_name,
6742                 i.tm.name,
6743                 i.suffix);
6744         return 0;
6745       }
6746     /* Warn if the e or r prefix on a general reg is present.  */
6747     else if ((!quiet_warnings || flag_code == CODE_64BIT)
6748              && (i.types[op].bitfield.dword
6749                  || i.types[op].bitfield.qword)
6750              && (i.tm.operand_types[op].bitfield.reg
6751                  || i.tm.operand_types[op].bitfield.acc)
6752              && i.tm.operand_types[op].bitfield.word)
6753       {
6754         /* Prohibit these changes in the 64bit mode, since the
6755            lowering is more complicated.  */
6756         if (flag_code == CODE_64BIT)
6757           {
6758             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6759                     register_prefix, i.op[op].regs->reg_name,
6760                     i.suffix);
6761             return 0;
6762           }
6763 #if REGISTER_WARNINGS
6764         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6765                  register_prefix,
6766                  (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6767                  register_prefix, i.op[op].regs->reg_name, i.suffix);
6768 #endif
6769       }
6770   return 1;
6771 }
6772
6773 static int
6774 update_imm (unsigned int j)
6775 {
6776   i386_operand_type overlap = i.types[j];
6777   if ((overlap.bitfield.imm8
6778        || overlap.bitfield.imm8s
6779        || overlap.bitfield.imm16
6780        || overlap.bitfield.imm32
6781        || overlap.bitfield.imm32s
6782        || overlap.bitfield.imm64)
6783       && !operand_type_equal (&overlap, &imm8)
6784       && !operand_type_equal (&overlap, &imm8s)
6785       && !operand_type_equal (&overlap, &imm16)
6786       && !operand_type_equal (&overlap, &imm32)
6787       && !operand_type_equal (&overlap, &imm32s)
6788       && !operand_type_equal (&overlap, &imm64))
6789     {
6790       if (i.suffix)
6791         {
6792           i386_operand_type temp;
6793
6794           operand_type_set (&temp, 0);
6795           if (i.suffix == BYTE_MNEM_SUFFIX)
6796             {
6797               temp.bitfield.imm8 = overlap.bitfield.imm8;
6798               temp.bitfield.imm8s = overlap.bitfield.imm8s;
6799             }
6800           else if (i.suffix == WORD_MNEM_SUFFIX)
6801             temp.bitfield.imm16 = overlap.bitfield.imm16;
6802           else if (i.suffix == QWORD_MNEM_SUFFIX)
6803             {
6804               temp.bitfield.imm64 = overlap.bitfield.imm64;
6805               temp.bitfield.imm32s = overlap.bitfield.imm32s;
6806             }
6807           else
6808             temp.bitfield.imm32 = overlap.bitfield.imm32;
6809           overlap = temp;
6810         }
6811       else if (operand_type_equal (&overlap, &imm16_32_32s)
6812                || operand_type_equal (&overlap, &imm16_32)
6813                || operand_type_equal (&overlap, &imm16_32s))
6814         {
6815           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6816             overlap = imm16;
6817           else
6818             overlap = imm32s;
6819         }
6820       if (!operand_type_equal (&overlap, &imm8)
6821           && !operand_type_equal (&overlap, &imm8s)
6822           && !operand_type_equal (&overlap, &imm16)
6823           && !operand_type_equal (&overlap, &imm32)
6824           && !operand_type_equal (&overlap, &imm32s)
6825           && !operand_type_equal (&overlap, &imm64))
6826         {
6827           as_bad (_("no instruction mnemonic suffix given; "
6828                     "can't determine immediate size"));
6829           return 0;
6830         }
6831     }
6832   i.types[j] = overlap;
6833
6834   return 1;
6835 }
6836
6837 static int
6838 finalize_imm (void)
6839 {
6840   unsigned int j, n;
6841
6842   /* Update the first 2 immediate operands.  */
6843   n = i.operands > 2 ? 2 : i.operands;
6844   if (n)
6845     {
6846       for (j = 0; j < n; j++)
6847         if (update_imm (j) == 0)
6848           return 0;
6849
6850       /* The 3rd operand can't be immediate operand.  */
6851       gas_assert (operand_type_check (i.types[2], imm) == 0);
6852     }
6853
6854   return 1;
6855 }
6856
/* Bring the operands of the matched template i.tm into their final
   shape and encode them.

   First the operand arrays (i.op, i.types, i.flags and
   i.tm.operand_types) are adjusted for templates with implicit or
   duplicated operands.  Then the register is merged into a short form
   opcode, or the ModRM byte is built.  Finally a segment override
   prefix is added if an explicitly specified segment differs from the
   default one.

   Returns 1 on success, 0 after an error has been reported or a
   prefix could not be added.  */

static int
process_operands (void)
{
  /* Default segment register this instruction will use for memory
     accesses.  0 means unknown.  This is only for optimizing out
     unnecessary segment overrides.  */
  const seg_entry *default_seg = 0;

  if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
    {
      /* DUPL is the slot receiving a copy of the destination operand,
         DEST the slot currently holding the destination.  */
      unsigned int dupl = i.operands;
      unsigned int dest = dupl - 1;
      unsigned int j;

      /* The destination must be an xmm register.  */
      gas_assert (i.reg_operands
                  && MAX_OPERANDS > dupl
                  && operand_type_equal (&i.types[dest], &regxmm));

      if (i.tm.operand_types[0].bitfield.acc
          && i.tm.operand_types[0].bitfield.xmmword)
        {
          if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
            {
              /* Keep xmm0 for instructions with VEX prefix and 3
                 sources.  */
              i.tm.operand_types[0].bitfield.acc = 0;
              i.tm.operand_types[0].bitfield.regsimd = 1;
              goto duplicate;
            }
          else
            {
              /* We remove the first xmm0 and keep the number of
                 operands unchanged, which in fact duplicates the
                 destination.  */
              for (j = 1; j < i.operands; j++)
                {
                  i.op[j - 1] = i.op[j];
                  i.types[j - 1] = i.types[j];
                  i.tm.operand_types[j - 1] = i.tm.operand_types[j];
                  i.flags[j - 1] = i.flags[j];
                }
            }
        }
      else if (i.tm.opcode_modifier.implicit1stxmm0)
        {
          gas_assert ((MAX_OPERANDS - 1) > dupl
                      && (i.tm.opcode_modifier.vexsources
                          == VEX3SOURCES));

          /* Add the implicit xmm0 for instructions with VEX prefix
             and 3 sources.  */
          for (j = i.operands; j > 0; j--)
            {
              i.op[j] = i.op[j - 1];
              i.types[j] = i.types[j - 1];
              i.tm.operand_types[j] = i.tm.operand_types[j - 1];
              i.flags[j] = i.flags[j - 1];
            }
          i.op[0].regs
            = (const reg_entry *) hash_find (reg_hash, "xmm0");
          i.types[0] = regxmm;
          i.tm.operand_types[0] = regxmm;

          /* Two operands are gained: the xmm0 inserted above and the
             copy of the destination made below.  */
          i.operands += 2;
          i.reg_operands += 2;
          i.tm.operands += 2;

          /* Everything moved up by one slot.  */
          dupl++;
          dest++;
          i.op[dupl] = i.op[dest];
          i.types[dupl] = i.types[dest];
          i.tm.operand_types[dupl] = i.tm.operand_types[dest];
          i.flags[dupl] = i.flags[dest];
        }
      else
        {
duplicate:
          /* Append a copy of the destination operand.  */
          i.operands++;
          i.reg_operands++;
          i.tm.operands++;

          i.op[dupl] = i.op[dest];
          i.types[dupl] = i.types[dest];
          i.tm.operand_types[dupl] = i.tm.operand_types[dest];
          i.flags[dupl] = i.flags[dest];
        }

       if (i.tm.opcode_modifier.immext)
         process_immext ();
    }
  else if (i.tm.operand_types[0].bitfield.acc
           && i.tm.operand_types[0].bitfield.xmmword)
    {
      unsigned int j;

      /* Drop the first operand by shifting all the others down one
         slot.  */
      for (j = 1; j < i.operands; j++)
        {
          i.op[j - 1] = i.op[j];
          i.types[j - 1] = i.types[j];

          /* We need to adjust fields in i.tm since they are used by
             build_modrm_byte.  */
          i.tm.operand_types [j - 1] = i.tm.operand_types [j];

          i.flags[j - 1] = i.flags[j];
        }

      i.operands--;
      i.reg_operands--;
      i.tm.operands--;
    }
  else if (i.tm.opcode_modifier.implicitquadgroup)
    {
      unsigned int regnum, first_reg_in_group, last_reg_in_group;

      /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
      gas_assert (i.operands >= 2 && i.types[1].bitfield.regsimd);
      regnum = register_number (i.op[1].regs);
      /* The group consists of the four registers starting at REGNUM
         rounded down to a multiple of 4.  */
      first_reg_in_group = regnum & ~3;
      last_reg_in_group = first_reg_in_group + 3;
      if (regnum != first_reg_in_group)
        as_warn (_("source register `%s%s' implicitly denotes"
                   " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
                 register_prefix, i.op[1].regs->reg_name,
                 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
                 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
                 i.tm.name);
    }
  else if (i.tm.opcode_modifier.regkludge)
    {
      /* The imul $imm, %reg instruction is converted into
         imul $imm, %reg, %reg, and the clr %reg instruction
         is converted into xor %reg, %reg.  */

      unsigned int first_reg_op;

      if (operand_type_check (i.types[0], reg))
        first_reg_op = 0;
      else
        first_reg_op = 1;
      /* Pretend we saw the extra register operand.  */
      gas_assert (i.reg_operands == 1
                  && i.op[first_reg_op + 1].regs == 0);
      i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
      i.types[first_reg_op + 1] = i.types[first_reg_op];
      i.operands++;
      i.reg_operands++;
    }

  if (i.tm.opcode_modifier.shortform)
    {
      if (i.types[0].bitfield.sreg)
        {
          /* Reject popping into segment register 1 outside of 64-bit
             mode, and the short form with segment registers 0 to 3
             in 64-bit mode.  */
          if (flag_code != CODE_64BIT
              ? i.tm.base_opcode == POP_SEG_SHORT
                && i.op[0].regs->reg_num == 1
              : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
                && i.op[0].regs->reg_num < 4)
            {
              as_bad (_("you can't `%s %s%s'"),
                      i.tm.name, register_prefix, i.op[0].regs->reg_name);
              return 0;
            }
          /* Segment registers numbered above 3 turn a one byte opcode
             into its two byte counterpart.  */
          if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
            {
              i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
              i.tm.opcode_length = 2;
            }
          /* The segment register number is merged into the opcode,
             shifted left by 3.  */
          i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
        }
      else
        {
          /* The register or float register operand is in operand
             0 or 1.  */
          unsigned int op;

          if ((i.types[0].bitfield.reg && i.types[0].bitfield.tbyte)
              || operand_type_check (i.types[0], reg))
            op = 0;
          else
            op = 1;
          /* Register goes in low 3 bits of opcode.  */
          i.tm.base_opcode |= i.op[op].regs->reg_num;
          if ((i.op[op].regs->reg_flags & RegRex) != 0)
            i.rex |= REX_B;
          if (!quiet_warnings && i.tm.opcode_modifier.ugh)
            {
              /* Warn about some common errors, but press on regardless.
                 The first case can be generated by gcc (<= 2.8.1).  */
              if (i.operands == 2)
                {
                  /* Reversed arguments on faddp, fsubp, etc.  */
                  as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
                           register_prefix, i.op[!intel_syntax].regs->reg_name,
                           register_prefix, i.op[intel_syntax].regs->reg_name);
                }
              else
                {
                  /* Extraneous `l' suffix on fp insn.  */
                  as_warn (_("translating to `%s %s%s'"), i.tm.name,
                           register_prefix, i.op[0].regs->reg_name);
                }
            }
        }
    }
  else if (i.tm.opcode_modifier.modrm)
    {
      /* The opcode is completed (modulo i.tm.extension_opcode which
         must be put into the modrm byte).  Now, we make the modrm and
         index base bytes based on all the info we've collected.  */

      default_seg = build_modrm_byte ();
    }
  else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
    {
      default_seg = &ds;
    }
  else if (i.tm.opcode_modifier.isstring)
    {
      /* For the string instructions that allow a segment override
         on one of their operands, the default segment is ds.  */
      default_seg = &ds;
    }

  if (i.tm.base_opcode == 0x8d /* lea */
      && i.seg[0]
      && !quiet_warnings)
    as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);

  /* If a segment was explicitly specified, and the specified segment
     is not the default, use an opcode prefix to select it.  If we
     never figured out what the default segment is, then default_seg
     will be zero at this point, and the specified segment prefix will
     always be used.  */
  if ((i.seg[0]) && (i.seg[0] != default_seg))
    {
      if (!add_prefix (i.seg[0]->seg_prefix))
        return 0;
    }
  return 1;
}
7099
/* Fill in the ModRM (i.rm), SIB (i.sib), REX (i.rex / i.vrex) and
   VEX.vvvv (i.vex.register_specifier) state of the current instruction
   `i' from the matched template i.tm and the parsed operands.  As side
   effects it may append a synthesized imm8 or zero displacement
   operand, adjust the displacement type bits of the memory operand,
   set the i.has_reg* usage flags and add a LOCK prefix.

   Returns the default segment implied by the memory operand: &ds for
   most memory references, &ss for (%bp)-based 16-bit addressing and
   for a non-REX base register numbered EBP_REG_NUM or ESP_REG_NUM,
   and 0 when the instruction has no memory operand.  */
7100 static const seg_entry *
7101 build_modrm_byte (void)
7102 {
7103   const seg_entry *default_seg = 0;
7104   unsigned int source, dest;
7105   int vex_3_sources;
7106
7107   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7108   if (vex_3_sources)
7109     {
7110       unsigned int nds, reg_slot;
7111       expressionS *exp;
7112
           /* The destination is the last operand; the operand just before
              it is the one that ends up in i.vex.register_specifier at the
              end of this branch.  */
7113       dest = i.operands - 1;
7114       nds = dest - 1;
7115
7116       /* There are 2 kinds of instructions:
7117          1. 5 operands: 4 register operands or 3 register operands
7118          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7119          VexW0 or VexW1.  The destination must be either XMM, YMM or
7120          ZMM register.
7121          2. 4 operands: 4 register operands or 3 register operands
7122          plus 1 memory operand, with VexXDS.  */
7123       gas_assert ((i.reg_operands == 4
7124                    || (i.reg_operands == 3 && i.mem_operands == 1))
7125                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7126                   && i.tm.opcode_modifier.vexw
7127                   && i.tm.operand_types[dest].bitfield.regsimd);
7128
7129       /* If VexW1 is set, the first non-immediate operand is the source and
7130          the second non-immediate one is encoded in the immediate operand.  */
7131       if (i.tm.opcode_modifier.vexw == VEXW1)
7132         {
7133           source = i.imm_operands;
7134           reg_slot = i.imm_operands + 1;
7135         }
7136       else
7137         {
7138           source = i.imm_operands + 1;
7139           reg_slot = i.imm_operands;
7140         }
7141
7142       if (i.imm_operands == 0)
7143         {
7144           /* When there is no immediate operand, generate an 8bit
7145              immediate operand to encode the first operand.  */
7146           exp = &im_expressions[i.imm_operands++];
7147           i.op[i.operands].imms = exp;
7148           i.types[i.operands] = imm8;
7149           i.operands++;
7150
7151           gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
7152           exp->X_op = O_constant;
               /* The register number is placed in bits 4-7 of the new
                  immediate.  */
7153           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7154           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7155         }
7156       else
7157         {
7158           gas_assert (i.imm_operands == 1);
7159           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7160           gas_assert (!i.tm.opcode_modifier.immext);
7161
7162           /* Turn on Imm8 again so that output_imm will generate it.  */
7163           i.types[0].bitfield.imm8 = 1;
7164
7165           gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
               /* Merge the register number into bits 4-7 of the user's
                  immediate, which passed the fits_in_imm4 assertion
                  above.  */
7166           i.op[0].imms->X_add_number
7167               |= register_number (i.op[reg_slot].regs) << 4;
7168           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7169         }
7170
7171       gas_assert (i.tm.operand_types[nds].bitfield.regsimd);
7172       i.vex.register_specifier = i.op[nds].regs;
7173     }
7174   else
7175     source = dest = 0;
7176
7177   /* i.reg_operands MUST be the number of real register operands;
7178      implicit registers do not count.  If there are 3 register
7179      operands, it must be an instruction with VexNDS.  For an
7180      instruction with VexNDD, the destination register is encoded
7181      in VEX prefix.  If there are 4 register operands, it must be
7182      an instruction with VEX prefix and 3 sources.  */
7183   if (i.mem_operands == 0
7184       && ((i.reg_operands == 2
7185            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7186           || (i.reg_operands == 3
7187               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7188           || (i.reg_operands == 4 && vex_3_sources)))
7189     {
           /* Register-only form.  First pick the operand index of the
              ModRM source, skipping leading immediates or a shift count
              register.  */
7190       switch (i.operands)
7191         {
7192         case 2:
7193           source = 0;
7194           break;
7195         case 3:
7196           /* When there are 3 operands, one of them may be immediate,
7197              which may be the first or the last operand.  Otherwise,
7198              the first operand must be shift count register (cl) or it
7199              is an instruction with VexNDS. */
7200           gas_assert (i.imm_operands == 1
7201                       || (i.imm_operands == 0
7202                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7203                               || i.types[0].bitfield.shiftcount)));
7204           if (operand_type_check (i.types[0], imm)
7205               || i.types[0].bitfield.shiftcount)
7206             source = 1;
7207           else
7208             source = 0;
7209           break;
7210         case 4:
7211           /* When there are 4 operands, the first two must be 8bit
7212              immediate operands. The source operand will be the 3rd
7213              one.
7214
7215              For instructions with VexNDS, if the first operand
7216              is an imm8, the source operand is the 2nd one.  If the last
7217              operand is imm8, the source operand is the first one.  */
7218           gas_assert ((i.imm_operands == 2
7219                        && i.types[0].bitfield.imm8
7220                        && i.types[1].bitfield.imm8)
7221                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7222                           && i.imm_operands == 1
7223                           && (i.types[0].bitfield.imm8
7224                               || i.types[i.operands - 1].bitfield.imm8
7225                               || i.rounding)));
7226           if (i.imm_operands == 2)
7227             source = 2;
7228           else
7229             {
7230               if (i.types[0].bitfield.imm8)
7231                 source = 1;
7232               else
7233                 source = 0;
7234             }
7235           break;
7236         case 5:
               /* Non-EVEX 5-operand forms leave SOURCE as it was set
                  before the switch.  */
7237           if (is_evex_encoding (&i.tm))
7238             {
7239               /* For EVEX instructions, when there are 5 operands, the
7240                  first one must be immediate operand.  If the second one
7241                  is immediate operand, the source operand is the 3rd
7242                  one.  If the last one is immediate operand, the source
7243                  operand is the 2nd one.  */
7244               gas_assert (i.imm_operands == 2
7245                           && i.tm.opcode_modifier.sae
7246                           && operand_type_check (i.types[0], imm));
7247               if (operand_type_check (i.types[1], imm))
7248                 source = 2;
7249               else if (operand_type_check (i.types[4], imm))
7250                 source = 1;
7251               else
7252                 abort ();
7253             }
7254           break;
7255         default:
7256           abort ();
7257         }
7258
           /* With 3 sources DEST was already fixed at the top of the
              function; otherwise it is derived from SOURCE here.  */
7259       if (!vex_3_sources)
7260         {
7261           dest = source + 1;
7262
7263           /* RC/SAE operand could be between DEST and SRC.  That happens
7264              when one operand is GPR and the other one is XMM/YMM/ZMM
7265              register.  */
7266           if (i.rounding && i.rounding->operand == (int) dest)
7267             dest++;
7268
7269           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7270             {
7271               /* For instructions with VexNDS, the register-only source
7272                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7273                  register.  It is encoded in VEX prefix.  */
7274
7275               i386_operand_type op;
7276               unsigned int vvvv;
7277
7278               /* Check register-only source operand when two source
7279                  operands are swapped.  */
7280               if (!i.tm.operand_types[source].bitfield.baseindex
7281                   && i.tm.operand_types[dest].bitfield.baseindex)
7282                 {
7283                   vvvv = source;
7284                   source = dest;
7285                 }
7286               else
7287                 vvvv = dest;
7288
                   /* There must be a further operand after DEST (it
                      becomes the real destination below), and the template
                      type of the VEX.vvvv operand must be one of the
                      register kinds listed above.  */
7289               op = i.tm.operand_types[vvvv];
7290               if ((dest + 1) >= i.operands
7291                   || ((!op.bitfield.reg
7292                        || (!op.bitfield.dword && !op.bitfield.qword))
7293                       && !op.bitfield.regsimd
7294                       && !operand_type_equal (&op, &regmask)))
7295                 abort ();
7296               i.vex.register_specifier = i.op[vvvv].regs;
7297               dest++;
7298             }
7299         }
7300
7301       i.rm.mode = 3;
7302       /* One of the register operands will be encoded in the i.rm.reg
7303          field, the other in the combined i.rm.mode and i.rm.regmem
7304          fields.  If no form of this instruction supports a memory
7305          destination operand, then we assume the source operand may
7306          sometimes be a memory operand and so we need to store the
7307          destination in the i.rm.reg field.  */
7308       if (!i.tm.opcode_modifier.regmem
7309           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7310         {
7311           i.rm.reg = i.op[dest].regs->reg_num;
7312           i.rm.regmem = i.op[source].regs->reg_num;
               /* Record which MMX/SIMD register class this instruction
                  uses; the widest SIMD operand size wins.  */
7313           if (i.op[dest].regs->reg_type.bitfield.regmmx
7314                || i.op[source].regs->reg_type.bitfield.regmmx)
7315             i.has_regmmx = TRUE;
7316           else if (i.op[dest].regs->reg_type.bitfield.regsimd
7317                    || i.op[source].regs->reg_type.bitfield.regsimd)
7318             {
7319               if (i.types[dest].bitfield.zmmword
7320                   || i.types[source].bitfield.zmmword)
7321                 i.has_regzmm = TRUE;
7322               else if (i.types[dest].bitfield.ymmword
7323                        || i.types[source].bitfield.ymmword)
7324                 i.has_regymm = TRUE;
7325               else
7326                 i.has_regxmm = TRUE;
7327             }
7328           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7329             i.rex |= REX_R;
7330           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7331             i.vrex |= REX_R;
7332           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7333             i.rex |= REX_B;
7334           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7335             i.vrex |= REX_B;
7336         }
7337       else
7338         {
               /* Roles reversed: the source goes in ModRM.reg and the
                  destination in ModRM.rm, so the R/B extension bits swap
                  accordingly.  */
7339           i.rm.reg = i.op[source].regs->reg_num;
7340           i.rm.regmem = i.op[dest].regs->reg_num;
7341           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7342             i.rex |= REX_B;
7343           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7344             i.vrex |= REX_B;
7345           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7346             i.rex |= REX_R;
7347           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7348             i.vrex |= REX_R;
7349         }
           /* REX.R was requested outside 64-bit mode.  This is accepted
              only when the checked operand (index 1, or 0 for regmem
              templates) is a control register; anything else aborts.  The
              REX bit is dropped and a LOCK prefix is added in its place.
              NOTE(review): presumably the LOCK-prefixed encoding used to
              reach %cr8 -- confirm.  The add_prefix result is ignored.  */
7350       if (flag_code != CODE_64BIT && (i.rex & REX_R))
7351         {
7352           if (!i.types[!i.tm.opcode_modifier.regmem].bitfield.control)
7353             abort ();
7354           i.rex &= ~REX_R;
7355           add_prefix (LOCK_PREFIX_OPCODE);
7356         }
7357     }
7358   else
7359     {                   /* If it's not 2 reg operands...  */
7360       unsigned int mem;
7361
7362       if (i.mem_operands)
7363         {
7364           unsigned int fake_zero_displacement = 0;
7365           unsigned int op;
7366
               /* Locate the first operand flagged as a memory operand.  */
7367           for (op = 0; op < i.operands; op++)
7368             if (i.flags[op] & Operand_Mem)
7369               break;
7370           gas_assert (op < i.operands);
7371
               /* Templates flagged vecsib always go through the SIB byte
                  and take their SIB index from i.index_reg here; the RegIZ
                  pseudo index is not acceptable for them.  The non-vecsib
                  code below leaves these fields alone for such
                  templates.  */
7372           if (i.tm.opcode_modifier.vecsib)
7373             {
7374               if (i.index_reg->reg_num == RegIZ)
7375                 abort ();
7376
7377               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7378               if (!i.base_reg)
7379                 {
7380                   i.sib.base = NO_BASE_REGISTER;
7381                   i.sib.scale = i.log2_scale_factor;
7382                   i.types[op].bitfield.disp8 = 0;
7383                   i.types[op].bitfield.disp16 = 0;
7384                   i.types[op].bitfield.disp64 = 0;
7385                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7386                     {
7387                       /* Must be 32 bit */
7388                       i.types[op].bitfield.disp32 = 1;
7389                       i.types[op].bitfield.disp32s = 0;
7390                     }
7391                   else
7392                     {
7393                       i.types[op].bitfield.disp32 = 0;
7394                       i.types[op].bitfield.disp32s = 1;
7395                     }
7396                 }
7397               i.sib.index = i.index_reg->reg_num;
7398               if ((i.index_reg->reg_flags & RegRex) != 0)
7399                 i.rex |= REX_X;
7400               if ((i.index_reg->reg_flags & RegVRex) != 0)
7401                 i.vrex |= REX_X;
7402             }
7403
               /* Memory references default to ds; the (%bp) and
                  EBP/ESP-based cases below switch this to ss.  */
7404           default_seg = &ds;
7405
7406           if (i.base_reg == 0)
7407             {
                   /* No base register: either a bare displacement or a
                      (scaled) index plus displacement.  If no displacement
                      was written, a zero one is synthesized at the end of
                      the memory operand handling.  */
7408               i.rm.mode = 0;
7409               if (!i.disp_operands)
7410                 fake_zero_displacement = 1;
7411               if (i.index_reg == 0)
7412                 {
7413                   i386_operand_type newdisp;
7414
7415                   gas_assert (!i.tm.opcode_modifier.vecsib);
7416                   /* Operand is just <disp>  */
7417                   if (flag_code == CODE_64BIT)
7418                     {
7419                       /* 64bit mode overwrites the 32bit absolute
7420                          addressing by RIP relative addressing and
7421                          absolute addressing is encoded by one of the
7422                          redundant SIB forms.  */
7423                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7424                       i.sib.base = NO_BASE_REGISTER;
7425                       i.sib.index = NO_INDEX_REGISTER;
7426                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7427                     }
                       /* 16-bit addressing is in effect when exactly one of
                          "16-bit code" and "address size prefix present"
                          holds.  */
7428                   else if ((flag_code == CODE_16BIT)
7429                            ^ (i.prefix[ADDR_PREFIX] != 0))
7430                     {
7431                       i.rm.regmem = NO_BASE_REGISTER_16;
7432                       newdisp = disp16;
7433                     }
7434                   else
7435                     {
7436                       i.rm.regmem = NO_BASE_REGISTER;
7437                       newdisp = disp32;
7438                     }
                       /* Replace whatever displacement sizes were recorded
                          with the single size chosen above.  */
7439                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
7440                   i.types[op] = operand_type_or (i.types[op], newdisp);
7441                 }
7442               else if (!i.tm.opcode_modifier.vecsib)
7443                 {
7444                   /* !i.base_reg && i.index_reg  */
7445                   if (i.index_reg->reg_num == RegIZ)
7446                     i.sib.index = NO_INDEX_REGISTER;
7447                   else
7448                     i.sib.index = i.index_reg->reg_num;
7449                   i.sib.base = NO_BASE_REGISTER;
7450                   i.sib.scale = i.log2_scale_factor;
7451                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7452                   i.types[op].bitfield.disp8 = 0;
7453                   i.types[op].bitfield.disp16 = 0;
7454                   i.types[op].bitfield.disp64 = 0;
7455                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7456                     {
7457                       /* Must be 32 bit */
7458                       i.types[op].bitfield.disp32 = 1;
7459                       i.types[op].bitfield.disp32s = 0;
7460                     }
7461                   else
7462                     {
7463                       i.types[op].bitfield.disp32 = 0;
7464                       i.types[op].bitfield.disp32s = 1;
7465                     }
7466                   if ((i.index_reg->reg_flags & RegRex) != 0)
7467                     i.rex |= REX_X;
7468                 }
7469             }
7470           /* RIP addressing for 64bit mode.  */
7471           else if (i.base_reg->reg_num == RegIP)
7472             {
7473               gas_assert (!i.tm.opcode_modifier.vecsib);
7474               i.rm.regmem = NO_BASE_REGISTER;
7475               i.types[op].bitfield.disp8 = 0;
7476               i.types[op].bitfield.disp16 = 0;
7477               i.types[op].bitfield.disp32 = 0;
7478               i.types[op].bitfield.disp32s = 1;
7479               i.types[op].bitfield.disp64 = 0;
7480               i.flags[op] |= Operand_PCrel;
7481               if (! i.disp_operands)
7482                 fake_zero_displacement = 1;
7483             }
               /* 16-bit base register: the regmem value is picked from the
                  base/index combination as noted on each case.  */
7484           else if (i.base_reg->reg_type.bitfield.word)
7485             {
7486               gas_assert (!i.tm.opcode_modifier.vecsib);
7487               switch (i.base_reg->reg_num)
7488                 {
7489                 case 3: /* (%bx)  */
7490                   if (i.index_reg == 0)
7491                     i.rm.regmem = 7;
7492                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
7493                     i.rm.regmem = i.index_reg->reg_num - 6;
7494                   break;
7495                 case 5: /* (%bp)  */
7496                   default_seg = &ss;
7497                   if (i.index_reg == 0)
7498                     {
7499                       i.rm.regmem = 6;
7500                       if (operand_type_check (i.types[op], disp) == 0)
7501                         {
7502                           /* fake (%bp) into 0(%bp)  */
7503                           i.types[op].bitfield.disp8 = 1;
7504                           fake_zero_displacement = 1;
7505                         }
7506                     }
7507                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
7508                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7509                   break;
7510                 default: /* (%si) -> 4 or (%di) -> 5  */
7511                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7512                 }
7513               i.rm.mode = mode_from_disp_size (i.types[op]);
7514             }
7515           else /* i.base_reg and 32/64 bit mode  */
7516             {
                   /* In 64-bit mode narrow any displacement to a single
                      32-bit flavour: disp32s normally, disp32 when an
                      address size prefix is present.  */
7517               if (flag_code == CODE_64BIT
7518                   && operand_type_check (i.types[op], disp))
7519                 {
7520                   i.types[op].bitfield.disp16 = 0;
7521                   i.types[op].bitfield.disp64 = 0;
7522                   if (i.prefix[ADDR_PREFIX] == 0)
7523                     {
7524                       i.types[op].bitfield.disp32 = 0;
7525                       i.types[op].bitfield.disp32s = 1;
7526                     }
7527                   else
7528                     {
7529                       i.types[op].bitfield.disp32 = 1;
7530                       i.types[op].bitfield.disp32s = 0;
7531                     }
7532                 }
7533
7534               if (!i.tm.opcode_modifier.vecsib)
7535                 i.rm.regmem = i.base_reg->reg_num;
7536               if ((i.base_reg->reg_flags & RegRex) != 0)
7537                 i.rex |= REX_B;
7538               i.sib.base = i.base_reg->reg_num;
7539               /* x86-64 ignores REX prefix bit here to avoid decoder
7540                  complications.  */
7541               if (!(i.base_reg->reg_flags & RegRex)
7542                   && (i.base_reg->reg_num == EBP_REG_NUM
7543                    || i.base_reg->reg_num == ESP_REG_NUM))
7544                   default_seg = &ss;
                   /* Base register number 5 without a displacement gets a
                      fake zero disp8.  Unlike the segment check above this
                      test ignores RegRex.  NOTE(review): presumably because
                      mode 0 with this register number is the "no base"
                      encoding -- confirm.  */
7545               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7546                 {
7547                   fake_zero_displacement = 1;
7548                   i.types[op].bitfield.disp8 = 1;
7549                 }
7550               i.sib.scale = i.log2_scale_factor;
7551               if (i.index_reg == 0)
7552                 {
7553                   gas_assert (!i.tm.opcode_modifier.vecsib);
7554                   /* <disp>(%esp) becomes two byte modrm with no index
7555                      register.  We've already stored the code for esp
7556                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7557                      Any base register besides %esp will not use the
7558                      extra modrm byte.  */
7559                   i.sib.index = NO_INDEX_REGISTER;
7560                 }
7561               else if (!i.tm.opcode_modifier.vecsib)
7562                 {
7563                   if (i.index_reg->reg_num == RegIZ)
7564                     i.sib.index = NO_INDEX_REGISTER;
7565                   else
7566                     i.sib.index = i.index_reg->reg_num;
7567                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7568                   if ((i.index_reg->reg_flags & RegRex) != 0)
7569                     i.rex |= REX_X;
7570                 }
7571
                   /* For TLS descriptor call relocations the mode is forced
                      to 0 regardless of the displacement type.  */
7572               if (i.disp_operands
7573                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7574                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7575                 i.rm.mode = 0;
7576               else
7577                 {
                       /* A displacement encoding was requested
                          (i.disp_encoding is set) but no displacement was
                          given: fake a zero one, 8 bits wide for
                          disp_encoding_8bit and 32 bits otherwise.  */
7578                   if (!fake_zero_displacement
7579                       && !i.disp_operands
7580                       && i.disp_encoding)
7581                     {
7582                       fake_zero_displacement = 1;
7583                       if (i.disp_encoding == disp_encoding_8bit)
7584                         i.types[op].bitfield.disp8 = 1;
7585                       else
7586                         i.types[op].bitfield.disp32 = 1;
7587                     }
7588                   i.rm.mode = mode_from_disp_size (i.types[op]);
7589                 }
7590             }
7591
7592           if (fake_zero_displacement)
7593             {
7594               /* Fakes a zero displacement assuming that i.types[op]
7595                  holds the correct displacement size.  */
7596               expressionS *exp;
7597
7598               gas_assert (i.op[op].disps == 0);
7599               exp = &disp_expressions[i.disp_operands++];
7600               i.op[op].disps = exp;
7601               exp->X_op = O_constant;
7602               exp->X_add_number = 0;
7603               exp->X_add_symbol = (symbolS *) 0;
7604               exp->X_op_symbol = (symbolS *) 0;
7605             }
7606
7607           mem = op;
7608         }
7609       else
             /* No memory operand: all-ones serves as the "none" marker that
                is tested further down.  */
7610         mem = ~0;
7611
7612       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7613         {
7614           if (operand_type_check (i.types[0], imm))
7615             i.vex.register_specifier = NULL;
7616           else
7617             {
7618               /* VEX.vvvv encodes one of the sources when the first
7619                  operand is not an immediate.  */
7620               if (i.tm.opcode_modifier.vexw == VEXW0)
7621                 i.vex.register_specifier = i.op[0].regs;
7622               else
7623                 i.vex.register_specifier = i.op[1].regs;
7624             }
7625
7626           /* Destination is a XMM register encoded in the ModRM.reg
7627              and VEX.R bit.  */
7628           i.rm.reg = i.op[2].regs->reg_num;
7629           if ((i.op[2].regs->reg_flags & RegRex) != 0)
7630             i.rex |= REX_R;
7631
7632           /* ModRM.rm and VEX.B encodes the other source.  */
7633           if (!i.mem_operands)
7634             {
7635               i.rm.mode = 3;
7636
7637               if (i.tm.opcode_modifier.vexw == VEXW0)
7638                 i.rm.regmem = i.op[1].regs->reg_num;
7639               else
7640                 i.rm.regmem = i.op[0].regs->reg_num;
7641
                   /* NOTE(review): REX_B is always derived from operand 1,
                      even when the non-VEXW0 branch above took regmem from
                      operand 0 -- confirm whether a register-only match of
                      such a template can reach this point.  */
7642               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7643                 i.rex |= REX_B;
7644             }
7645         }
7646       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7647         {
               /* Here the third operand goes in VEX.vvvv and, when there
                  is no memory operand, the second one in ModRM.rm.  */
7648           i.vex.register_specifier = i.op[2].regs;
7649           if (!i.mem_operands)
7650             {
7651               i.rm.mode = 3;
7652               i.rm.regmem = i.op[1].regs->reg_num;
7653               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7654                 i.rex |= REX_B;
7655             }
7656         }
7657       /* Fill in i.rm.reg or i.rm.regmem field with register operand
7658          (if any) based on i.tm.extension_opcode.  Again, we must be
7659          careful to make sure that segment/control/debug/test/MMX
7660          registers are coded into the i.rm.reg field.  */
7661       else if (i.reg_operands)
7662         {
7663           unsigned int op;
7664           unsigned int vex_reg = ~0;
7665
               /* Find the first register-like operand; for SIMD and MMX
                  registers also record which register class is used.  */
7666           for (op = 0; op < i.operands; op++)
7667             {
7668               if (i.types[op].bitfield.reg
7669                   || i.types[op].bitfield.regbnd
7670                   || i.types[op].bitfield.regmask
7671                   || i.types[op].bitfield.sreg
7672                   || i.types[op].bitfield.control
7673                   || i.types[op].bitfield.debug
7674                   || i.types[op].bitfield.test)
7675                 break;
7676               if (i.types[op].bitfield.regsimd)
7677                 {
7678                   if (i.types[op].bitfield.zmmword)
7679                     i.has_regzmm = TRUE;
7680                   else if (i.types[op].bitfield.ymmword)
7681                     i.has_regymm = TRUE;
7682                   else
7683                     i.has_regxmm = TRUE;
7684                   break;
7685                 }
7686               if (i.types[op].bitfield.regmmx)
7687                 {
7688                   i.has_regmmx = TRUE;
7689                   break;
7690                 }
7691             }
7692
               /* With 3 sources the operand encoded in ModRM is the
                  destination computed at the top of the function.  */
7693           if (vex_3_sources)
7694             op = dest;
7695           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7696             {
7697               /* For instructions with VexNDS, the register-only
7698                  source operand is encoded in VEX prefix. */
7699               gas_assert (mem != (unsigned int) ~0);
7700
                   /* If the first register follows the memory operand, it
                      is the VEX.vvvv operand and the next operand is the
                      ModRM register.  */
7701               if (op > mem)
7702                 {
7703                   vex_reg = op++;
7704                   gas_assert (op < i.operands);
7705                 }
7706               else
7707                 {
7708                   /* Check register-only source operand when two source
7709                      operands are swapped.  */
7710                   if (!i.tm.operand_types[op].bitfield.baseindex
7711                       && i.tm.operand_types[op + 1].bitfield.baseindex)
7712                     {
7713                       vex_reg = op;
7714                       op += 2;
7715                       gas_assert (mem == (vex_reg + 1)
7716                                   && op < i.operands);
7717                     }
7718                   else
7719                     {
7720                       vex_reg = op + 1;
7721                       gas_assert (vex_reg < i.operands);
7722                     }
7723                 }
7724             }
7725           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7726             {
7727               /* For instructions with VexNDD, the register destination
7728                  is encoded in VEX prefix.  */
7729               if (i.mem_operands == 0)
7730                 {
7731                   /* There is no memory operand.  */
7732                   gas_assert ((op + 2) == i.operands);
7733                   vex_reg = op + 1;
7734                 }
7735               else
7736                 {
7737                   /* There are only 2 non-immediate operands.  */
7738                   gas_assert (op < i.imm_operands + 2
7739                               && i.operands == i.imm_operands + 2);
7740                   vex_reg = i.imm_operands + 1;
7741                 }
7742             }
7743           else
7744             gas_assert (op < i.operands);
7745
               /* If a VEX.vvvv operand was selected, its template type must
                  be a 32/64-bit general register, a SIMD register or
                  exactly a mask register; anything else aborts.  */
7746           if (vex_reg != (unsigned int) ~0)
7747             {
7748               i386_operand_type *type = &i.tm.operand_types[vex_reg];
7749
7750               if ((!type->bitfield.reg
7751                    || (!type->bitfield.dword && !type->bitfield.qword))
7752                   && !type->bitfield.regsimd
7753                   && !operand_type_equal (type, &regmask))
7754                 abort ();
7755
7756               i.vex.register_specifier = i.op[vex_reg].regs;
7757             }
7758
7759           /* Don't set OP operand twice.  */
7760           if (vex_reg != op)
7761             {
7762               /* If there is an extension opcode to put here, the
7763                  register number must be put into the regmem field.  */
7764               if (i.tm.extension_opcode != None)
7765                 {
7766                   i.rm.regmem = i.op[op].regs->reg_num;
7767                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7768                     i.rex |= REX_B;
7769                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7770                     i.vrex |= REX_B;
7771                 }
7772               else
7773                 {
7774                   i.rm.reg = i.op[op].regs->reg_num;
7775                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7776                     i.rex |= REX_R;
7777                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7778                     i.vrex |= REX_R;
7779                 }
7780             }
7781
7782           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7783              must set it to 3 to indicate this is a register operand
7784              in the regmem field.  */
7785           if (!i.mem_operands)
7786             i.rm.mode = 3;
7787         }
7788
7789       /* Fill in i.rm.reg field with extension opcode (if any).  */
7790       if (i.tm.extension_opcode != None)
7791         i.rm.reg = i.tm.extension_opcode;
7792     }
7793   return default_seg;
7794 }
7795
7796 static void
7797 output_branch (void)
7798 {
7799   char *p;
7800   int size;
7801   int code16;
7802   int prefix;
7803   relax_substateT subtype;
7804   symbolS *sym;
7805   offsetT off;
7806
7807   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7808   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7809
7810   prefix = 0;
7811   if (i.prefix[DATA_PREFIX] != 0)
7812     {
7813       prefix = 1;
7814       i.prefixes -= 1;
7815       code16 ^= CODE16;
7816     }
7817   /* Pentium4 branch hints.  */
7818   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7819       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7820     {
7821       prefix++;
7822       i.prefixes--;
7823     }
7824   if (i.prefix[REX_PREFIX] != 0)
7825     {
7826       prefix++;
7827       i.prefixes--;
7828     }
7829
7830   /* BND prefixed jump.  */
7831   if (i.prefix[BND_PREFIX] != 0)
7832     {
7833       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7834       i.prefixes -= 1;
7835     }
7836
7837   if (i.prefixes != 0 && !intel_syntax)
7838     as_warn (_("skipping prefixes on this instruction"));
7839
7840   /* It's always a symbol;  End frag & setup for relax.
7841      Make sure there is enough room in this frag for the largest
7842      instruction we may generate in md_convert_frag.  This is 2
7843      bytes for the opcode and room for the prefix and largest
7844      displacement.  */
7845   frag_grow (prefix + 2 + 4);
7846   /* Prefix and 1 opcode byte go in fr_fix.  */
7847   p = frag_more (prefix + 1);
7848   if (i.prefix[DATA_PREFIX] != 0)
7849     *p++ = DATA_PREFIX_OPCODE;
7850   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7851       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7852     *p++ = i.prefix[SEG_PREFIX];
7853   if (i.prefix[REX_PREFIX] != 0)
7854     *p++ = i.prefix[REX_PREFIX];
7855   *p = i.tm.base_opcode;
7856
7857   if ((unsigned char) *p == JUMP_PC_RELATIVE)
7858     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7859   else if (cpu_arch_flags.bitfield.cpui386)
7860     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7861   else
7862     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7863   subtype |= code16;
7864
7865   sym = i.op[0].disps->X_add_symbol;
7866   off = i.op[0].disps->X_add_number;
7867
7868   if (i.op[0].disps->X_op != O_constant
7869       && i.op[0].disps->X_op != O_symbol)
7870     {
7871       /* Handle complex expressions.  */
7872       sym = make_expr_symbol (i.op[0].disps);
7873       off = 0;
7874     }
7875
7876   /* 1 possible extra opcode + 4 byte displacement go in var part.
7877      Pass reloc in fr_var.  */
7878   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7879 }
7880
7881 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7882 /* Return TRUE iff PLT32 relocation should be used for branching to
7883    symbol S.  */
7884
7885 static bfd_boolean
7886 need_plt32_p (symbolS *s)
7887 {
7888   /* PLT32 relocation is ELF only.  */
7889   if (!IS_ELF)
7890     return FALSE;
7891
7892 #ifdef TE_SOLARIS
7893   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7894      krtld support it.  */
7895   return FALSE;
7896 #endif
7897
7898   /* Since there is no need to prepare for PLT branch on x86-64, we
7899      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7900      be used as a marker for 32-bit PC-relative branches.  */
7901   if (!object_64bit)
7902     return FALSE;
7903
7904   /* Weak or undefined symbol need PLT32 relocation.  */
7905   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7906     return TRUE;
7907
7908   /* Non-global symbol doesn't need PLT32 relocation.  */
7909   if (! S_IS_EXTERNAL (s))
7910     return FALSE;
7911
7912   /* Other global symbols need PLT32 relocation.  NB: Symbol with
7913      non-default visibilities are treated as normal global symbol
7914      so that PLT32 relocation can be used as a marker for 32-bit
7915      PC-relative branches.  It is useful for linker relaxation.  */
7916   return TRUE;
7917 }
7918 #endif
7919
7920 static void
7921 output_jump (void)
7922 {
7923   char *p;
7924   int size;
7925   fixS *fixP;
7926   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7927
7928   if (i.tm.opcode_modifier.jumpbyte)
7929     {
7930       /* This is a loop or jecxz type instruction.  */
7931       size = 1;
7932       if (i.prefix[ADDR_PREFIX] != 0)
7933         {
7934           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7935           i.prefixes -= 1;
7936         }
7937       /* Pentium4 branch hints.  */
7938       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7939           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7940         {
7941           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7942           i.prefixes--;
7943         }
7944     }
7945   else
7946     {
7947       int code16;
7948
7949       code16 = 0;
7950       if (flag_code == CODE_16BIT)
7951         code16 = CODE16;
7952
7953       if (i.prefix[DATA_PREFIX] != 0)
7954         {
7955           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7956           i.prefixes -= 1;
7957           code16 ^= CODE16;
7958         }
7959
7960       size = 4;
7961       if (code16)
7962         size = 2;
7963     }
7964
7965   if (i.prefix[REX_PREFIX] != 0)
7966     {
7967       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7968       i.prefixes -= 1;
7969     }
7970
7971   /* BND prefixed jump.  */
7972   if (i.prefix[BND_PREFIX] != 0)
7973     {
7974       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7975       i.prefixes -= 1;
7976     }
7977
7978   if (i.prefixes != 0 && !intel_syntax)
7979     as_warn (_("skipping prefixes on this instruction"));
7980
7981   p = frag_more (i.tm.opcode_length + size);
7982   switch (i.tm.opcode_length)
7983     {
7984     case 2:
7985       *p++ = i.tm.base_opcode >> 8;
7986       /* Fall through.  */
7987     case 1:
7988       *p++ = i.tm.base_opcode;
7989       break;
7990     default:
7991       abort ();
7992     }
7993
7994 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7995   if (size == 4
7996       && jump_reloc == NO_RELOC
7997       && need_plt32_p (i.op[0].disps->X_add_symbol))
7998     jump_reloc = BFD_RELOC_X86_64_PLT32;
7999 #endif
8000
8001   jump_reloc = reloc (size, 1, 1, jump_reloc);
8002
8003   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8004                       i.op[0].disps, 1, jump_reloc);
8005
8006   /* All jumps handled here are signed, but don't use a signed limit
8007      check for 32 and 16 bit jumps as we want to allow wrap around at
8008      4G and 64k respectively.  */
8009   if (size == 1)
8010     fixP->fx_signed = 1;
8011 }
8012
8013 static void
8014 output_interseg_jump (void)
8015 {
8016   char *p;
8017   int size;
8018   int prefix;
8019   int code16;
8020
8021   code16 = 0;
8022   if (flag_code == CODE_16BIT)
8023     code16 = CODE16;
8024
8025   prefix = 0;
8026   if (i.prefix[DATA_PREFIX] != 0)
8027     {
8028       prefix = 1;
8029       i.prefixes -= 1;
8030       code16 ^= CODE16;
8031     }
8032   if (i.prefix[REX_PREFIX] != 0)
8033     {
8034       prefix++;
8035       i.prefixes -= 1;
8036     }
8037
8038   size = 4;
8039   if (code16)
8040     size = 2;
8041
8042   if (i.prefixes != 0 && !intel_syntax)
8043     as_warn (_("skipping prefixes on this instruction"));
8044
8045   /* 1 opcode; 2 segment; offset  */
8046   p = frag_more (prefix + 1 + 2 + size);
8047
8048   if (i.prefix[DATA_PREFIX] != 0)
8049     *p++ = DATA_PREFIX_OPCODE;
8050
8051   if (i.prefix[REX_PREFIX] != 0)
8052     *p++ = i.prefix[REX_PREFIX];
8053
8054   *p++ = i.tm.base_opcode;
8055   if (i.op[1].imms->X_op == O_constant)
8056     {
8057       offsetT n = i.op[1].imms->X_add_number;
8058
8059       if (size == 2
8060           && !fits_in_unsigned_word (n)
8061           && !fits_in_signed_word (n))
8062         {
8063           as_bad (_("16-bit jump out of range"));
8064           return;
8065         }
8066       md_number_to_chars (p, n, size);
8067     }
8068   else
8069     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8070                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8071   if (i.op[0].imms->X_op != O_constant)
8072     as_bad (_("can't handle non absolute segment in `%s'"),
8073             i.tm.name);
8074   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8075 }
8076
8077 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8078 void
8079 x86_cleanup (void)
8080 {
8081   char *p;
8082   asection *seg = now_seg;
8083   subsegT subseg = now_subseg;
8084   asection *sec;
8085   unsigned int alignment, align_size_1;
8086   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8087   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8088   unsigned int padding;
8089
8090   if (!IS_ELF || !x86_used_note)
8091     return;
8092
8093   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8094
8095   /* The .note.gnu.property section layout:
8096
8097      Field      Length          Contents
8098      ----       ----            ----
8099      n_namsz    4               4
8100      n_descsz   4               The note descriptor size
8101      n_type     4               NT_GNU_PROPERTY_TYPE_0
8102      n_name     4               "GNU"
8103      n_desc     n_descsz        The program property array
8104      ....       ....            ....
8105    */
8106
8107   /* Create the .note.gnu.property section.  */
8108   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8109   bfd_set_section_flags (sec,
8110                          (SEC_ALLOC
8111                           | SEC_LOAD
8112                           | SEC_DATA
8113                           | SEC_HAS_CONTENTS
8114                           | SEC_READONLY));
8115
8116   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8117     {
8118       align_size_1 = 7;
8119       alignment = 3;
8120     }
8121   else
8122     {
8123       align_size_1 = 3;
8124       alignment = 2;
8125     }
8126
8127   bfd_set_section_alignment (sec, alignment);
8128   elf_section_type (sec) = SHT_NOTE;
8129
8130   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8131                                   + 4-byte data  */
8132   isa_1_descsz_raw = 4 + 4 + 4;
8133   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8134   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8135
8136   feature_2_descsz_raw = isa_1_descsz;
8137   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8138                                       + 4-byte data  */
8139   feature_2_descsz_raw += 4 + 4 + 4;
8140   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8141   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8142                       & ~align_size_1);
8143
8144   descsz = feature_2_descsz;
8145   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8146   p = frag_more (4 + 4 + 4 + 4 + descsz);
8147
8148   /* Write n_namsz.  */
8149   md_number_to_chars (p, (valueT) 4, 4);
8150
8151   /* Write n_descsz.  */
8152   md_number_to_chars (p + 4, (valueT) descsz, 4);
8153
8154   /* Write n_type.  */
8155   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8156
8157   /* Write n_name.  */
8158   memcpy (p + 4 * 3, "GNU", 4);
8159
8160   /* Write 4-byte type.  */
8161   md_number_to_chars (p + 4 * 4,
8162                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8163
8164   /* Write 4-byte data size.  */
8165   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8166
8167   /* Write 4-byte data.  */
8168   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8169
8170   /* Zero out paddings.  */
8171   padding = isa_1_descsz - isa_1_descsz_raw;
8172   if (padding)
8173     memset (p + 4 * 7, 0, padding);
8174
8175   /* Write 4-byte type.  */
8176   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8177                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8178
8179   /* Write 4-byte data size.  */
8180   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8181
8182   /* Write 4-byte data.  */
8183   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8184                       (valueT) x86_feature_2_used, 4);
8185
8186   /* Zero out paddings.  */
8187   padding = feature_2_descsz - feature_2_descsz_raw;
8188   if (padding)
8189     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8190
8191   /* We probably can't restore the current segment, for there likely
8192      isn't one yet...  */
8193   if (seg && subseg)
8194     subseg_set (seg, subseg);
8195 }
8196 #endif
8197
8198 static unsigned int
8199 encoding_length (const fragS *start_frag, offsetT start_off,
8200                  const char *frag_now_ptr)
8201 {
8202   unsigned int len = 0;
8203
8204   if (start_frag != frag_now)
8205     {
8206       const fragS *fr = start_frag;
8207
8208       do {
8209         len += fr->fr_fix;
8210         fr = fr->fr_next;
8211       } while (fr && fr != frag_now);
8212     }
8213
8214   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8215 }
8216
/* Emit the encoding of the instruction described by the file-level
   state `i'.

   When ELF output with x86_used_note is in effect, the ISA and feature
   bits implied by the matched template and by the register classes
   used are first accumulated into x86_isa_1_used and
   x86_feature_2_used.  Jumps are then handed to output_branch,
   output_jump or output_interseg_jump according to the template's
   opcode modifier.  Every other instruction is written here: prefix
   bytes (or the VEX/EVEX prefix), the opcode bytes, the ModRM and SIB
   bytes, and finally displacements and immediates through output_disp
   and output_imm.  */
static void
output_insn (void)
{
  fragS *insn_start_frag;
  offsetT insn_start_off;

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  if (IS_ELF && x86_used_note)
    {
      /* One GNU_PROPERTY_X86_ISA_1_* bit per CPU feature flag of the
         matched template.  */
      if (i.tm.cpu_flags.bitfield.cpucmov)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
      if (i.tm.cpu_flags.bitfield.cpusse)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
      if (i.tm.cpu_flags.bitfield.cpusse2)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
      if (i.tm.cpu_flags.bitfield.cpusse3)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
      if (i.tm.cpu_flags.bitfield.cpussse3)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
      if (i.tm.cpu_flags.bitfield.cpusse4_1)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
      if (i.tm.cpu_flags.bitfield.cpusse4_2)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
      if (i.tm.cpu_flags.bitfield.cpuavx)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
      if (i.tm.cpu_flags.bitfield.cpuavx2)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
      if (i.tm.cpu_flags.bitfield.cpufma)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
      if (i.tm.cpu_flags.bitfield.cpuavx512f)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
      if (i.tm.cpu_flags.bitfield.cpuavx512cd)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
      if (i.tm.cpu_flags.bitfield.cpuavx512er)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
      if (i.tm.cpu_flags.bitfield.cpuavx512pf)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
      if (i.tm.cpu_flags.bitfield.cpuavx512vl)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
      if (i.tm.cpu_flags.bitfield.cpuavx512dq)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
      if (i.tm.cpu_flags.bitfield.cpuavx512bw)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
      if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
      if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
      if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
      if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
      if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
      if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
      if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
      if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
        x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;

      /* Any of the x87-family flags counts as x87 usage.  */
      if (i.tm.cpu_flags.bitfield.cpu8087
          || i.tm.cpu_flags.bitfield.cpu287
          || i.tm.cpu_flags.bitfield.cpu387
          || i.tm.cpu_flags.bitfield.cpu687
          || i.tm.cpu_flags.bitfield.cpufisttp)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
      /* Don't set GNU_PROPERTY_X86_FEATURE_2_MMX for prefetchtXXX nor
         Xfence instructions.  */
      if (i.tm.base_opcode != 0xf18
          && i.tm.base_opcode != 0xf0d
          && i.tm.base_opcode != 0xfaef8
          && (i.has_regmmx
              || i.tm.cpu_flags.bitfield.cpummx
              || i.tm.cpu_flags.bitfield.cpua3dnow
              || i.tm.cpu_flags.bitfield.cpua3dnowa))
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
      /* The vector register bits follow the register classes seen in
         the operands rather than the template's CPU flags.  */
      if (i.has_regxmm)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
      if (i.has_regymm)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
      if (i.has_regzmm)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
      if (i.tm.cpu_flags.bitfield.cpufxsr)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
      if (i.tm.cpu_flags.bitfield.cpuxsave)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
      if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
      if (i.tm.cpu_flags.bitfield.cpuxsavec)
        x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
    }
#endif

  /* Tie dwarf2 debug info to the address at the start of the insn.
     We can't do this after the insn has been output as the current
     frag may have been closed off.  eg. by frag_var.  */
  dwarf2_emit_insn (0);

  /* Remember where the instruction starts; this is handed to
     output_disp / output_imm and used for the length check below.  */
  insn_start_frag = frag_now;
  insn_start_off = frag_now_fix ();

  /* Output jumps.  */
  if (i.tm.opcode_modifier.jump)
    output_branch ();
  else if (i.tm.opcode_modifier.jumpbyte
           || i.tm.opcode_modifier.jumpdword)
    output_jump ();
  else if (i.tm.opcode_modifier.jumpintersegment)
    output_interseg_jump ();
  else
    {
      /* Output normal instructions here.  */
      char *p;
      unsigned char *q;
      unsigned int j;
      unsigned int prefix;

      if (avoid_fence
          && (i.tm.base_opcode == 0xfaee8
              || i.tm.base_opcode == 0xfaef0
              || i.tm.base_opcode == 0xfaef8))
        {
          /* Encode lfence, mfence, and sfence as
             f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
          offsetT val = 0x240483f0ULL;
          p = frag_more (5);
          md_number_to_chars (p, val, 5);
          return;
        }

      /* Some processors fail on LOCK prefix.  This option makes the
         assembler ignore LOCK prefix and serves as a workaround.  */
      if (omit_lock_prefix)
        {
          /* A template whose opcode is the LOCK prefix itself emits
             nothing at all.  */
          if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
            return;
          i.prefix[LOCK_PREFIX] = 0;
        }

      /* Since the VEX/EVEX prefix contains the implicit prefix, we
         don't need the explicit prefix.  */
      if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
        {
          /* A non-zero byte above the opcode bytes in base_opcode is a
             mandatory prefix; register it through add_prefix.  */
          switch (i.tm.opcode_length)
            {
            case 3:
              if (i.tm.base_opcode & 0xff000000)
                {
                  prefix = (i.tm.base_opcode >> 24) & 0xff;
                  /* For a PadLock template, skip REPE when the same
                     prefix is already recorded in i.prefix.  */
                  if (!i.tm.cpu_flags.bitfield.cpupadlock
                      || prefix != REPE_PREFIX_OPCODE
                      || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
                    add_prefix (prefix);
                }
              break;
            case 2:
              if ((i.tm.base_opcode & 0xff0000) != 0)
                {
                  prefix = (i.tm.base_opcode >> 16) & 0xff;
                  add_prefix (prefix);
                }
              break;
            case 1:
              break;
            case 0:
              /* Check for pseudo prefixes.  */
              as_bad_where (insn_start_frag->fr_file,
                            insn_start_frag->fr_line,
                             _("pseudo prefix without instruction"));
              return;
            default:
              abort ();
            }

#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
          /* For x32, add a dummy REX_OPCODE prefix for mov/add with
             R_X86_64_GOTTPOFF relocation so that linker can safely
             perform IE->LE optimization.  */
          if (x86_elf_abi == X86_64_X32_ABI
              && i.operands == 2
              && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
              && i.prefix[REX_PREFIX] == 0)
            add_prefix (REX_OPCODE);
#endif

          /* The prefix bytes.  */
          for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
            if (*q)
              FRAG_APPEND_1_CHAR (*q);
        }
      else
        {
          /* With a VEX/EVEX prefix only segment and address size
             prefixes are written as separate bytes.  */
          for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
            if (*q)
              switch (j)
                {
                case REX_PREFIX:
                  /* REX byte is encoded in VEX prefix.  */
                  break;
                case SEG_PREFIX:
                case ADDR_PREFIX:
                  FRAG_APPEND_1_CHAR (*q);
                  break;
                default:
                  /* There should be no other prefixes for instructions
                     with VEX prefix.  */
                  abort ();
                }

          /* For EVEX instructions i.vrex should become 0 after
             build_evex_prefix.  For VEX instructions upper 16 registers
             aren't available, so VREX should be 0.  */
          if (i.vrex)
            abort ();
          /* Now the VEX prefix.  */
          p = frag_more (i.vex.length);
          for (j = 0; j < i.vex.length; j++)
            p[j] = i.vex.bytes[j];
        }

      /* Now the opcode; be careful about word order here!  */
      if (i.tm.opcode_length == 1)
        {
          FRAG_APPEND_1_CHAR (i.tm.base_opcode);
        }
      else
        {
          /* Each case writes the leading opcode bytes and leaves P at
             the last two, which are stored after the switch.  */
          switch (i.tm.opcode_length)
            {
            case 4:
              p = frag_more (4);
              *p++ = (i.tm.base_opcode >> 24) & 0xff;
              *p++ = (i.tm.base_opcode >> 16) & 0xff;
              break;
            case 3:
              p = frag_more (3);
              *p++ = (i.tm.base_opcode >> 16) & 0xff;
              break;
            case 2:
              p = frag_more (2);
              break;
            default:
              abort ();
              break;
            }

          /* Put out high byte first: can't use md_number_to_chars!  */
          *p++ = (i.tm.base_opcode >> 8) & 0xff;
          *p = i.tm.base_opcode & 0xff;
        }

      /* Now the modrm byte and sib byte (if present).  */
      if (i.tm.opcode_modifier.modrm)
        {
          FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
                               | i.rm.reg << 3
                               | i.rm.mode << 6));
          /* If i.rm.regmem == ESP (4)
             && i.rm.mode != (Register mode)
             && not 16 bit
             ==> need second modrm byte.  */
          if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
              && i.rm.mode != 3
              && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
            FRAG_APPEND_1_CHAR ((i.sib.base << 0
                                 | i.sib.index << 3
                                 | i.sib.scale << 6));
        }

      if (i.disp_operands)
        output_disp (insn_start_frag, insn_start_off);

      if (i.imm_operands)
        output_imm (insn_start_frag, insn_start_off);

      /*
       * frag_now_fix () returning plain abs_section_offset when we're in the
       * absolute section, and abs_section_offset not getting updated as data
       * gets added to the frag breaks the logic below.
       */
      if (now_seg != absolute_section)
        {
          /* Warn, but don't fail, when more than 15 bytes were
             emitted for this instruction.  */
          j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
          if (j > 15)
            as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
                     j);
        }
    }

#ifdef DEBUG386
  if (flag_debug)
    {
      pi ("" /*line*/, &i);
    }
#endif /* DEBUG386  */
}
8513
8514 /* Return the size of the displacement operand N.  */
8515
8516 static int
8517 disp_size (unsigned int n)
8518 {
8519   int size = 4;
8520
8521   if (i.types[n].bitfield.disp64)
8522     size = 8;
8523   else if (i.types[n].bitfield.disp8)
8524     size = 1;
8525   else if (i.types[n].bitfield.disp16)
8526     size = 2;
8527   return size;
8528 }
8529
8530 /* Return the size of the immediate operand N.  */
8531
8532 static int
8533 imm_size (unsigned int n)
8534 {
8535   int size = 4;
8536   if (i.types[n].bitfield.imm64)
8537     size = 8;
8538   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8539     size = 1;
8540   else if (i.types[n].bitfield.imm16)
8541     size = 2;
8542   return size;
8543 }
8544
8545 static void
8546 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8547 {
8548   char *p;
8549   unsigned int n;
8550
8551   for (n = 0; n < i.operands; n++)
8552     {
8553       if (operand_type_check (i.types[n], disp))
8554         {
8555           if (i.op[n].disps->X_op == O_constant)
8556             {
8557               int size = disp_size (n);
8558               offsetT val = i.op[n].disps->X_add_number;
8559
8560               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8561                                      size);
8562               p = frag_more (size);
8563               md_number_to_chars (p, val, size);
8564             }
8565           else
8566             {
8567               enum bfd_reloc_code_real reloc_type;
8568               int size = disp_size (n);
8569               int sign = i.types[n].bitfield.disp32s;
8570               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8571               fixS *fixP;
8572
8573               /* We can't have 8 bit displacement here.  */
8574               gas_assert (!i.types[n].bitfield.disp8);
8575
8576               /* The PC relative address is computed relative
8577                  to the instruction boundary, so in case immediate
8578                  fields follows, we need to adjust the value.  */
8579               if (pcrel && i.imm_operands)
8580                 {
8581                   unsigned int n1;
8582                   int sz = 0;
8583
8584                   for (n1 = 0; n1 < i.operands; n1++)
8585                     if (operand_type_check (i.types[n1], imm))
8586                       {
8587                         /* Only one immediate is allowed for PC
8588                            relative address.  */
8589                         gas_assert (sz == 0);
8590                         sz = imm_size (n1);
8591                         i.op[n].disps->X_add_number -= sz;
8592                       }
8593                   /* We should find the immediate.  */
8594                   gas_assert (sz != 0);
8595                 }
8596
8597               p = frag_more (size);
8598               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
8599               if (GOT_symbol
8600                   && GOT_symbol == i.op[n].disps->X_add_symbol
8601                   && (((reloc_type == BFD_RELOC_32
8602                         || reloc_type == BFD_RELOC_X86_64_32S
8603                         || (reloc_type == BFD_RELOC_64
8604                             && object_64bit))
8605                        && (i.op[n].disps->X_op == O_symbol
8606                            || (i.op[n].disps->X_op == O_add
8607                                && ((symbol_get_value_expression
8608                                     (i.op[n].disps->X_op_symbol)->X_op)
8609                                    == O_subtract))))
8610                       || reloc_type == BFD_RELOC_32_PCREL))
8611                 {
8612                   if (!object_64bit)
8613                     {
8614                       reloc_type = BFD_RELOC_386_GOTPC;
8615                       i.op[n].imms->X_add_number +=
8616                         encoding_length (insn_start_frag, insn_start_off, p);
8617                     }
8618                   else if (reloc_type == BFD_RELOC_64)
8619                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
8620                   else
8621                     /* Don't do the adjustment for x86-64, as there
8622                        the pcrel addressing is relative to the _next_
8623                        insn, and that is taken care of in other code.  */
8624                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
8625                 }
8626               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
8627                                   size, i.op[n].disps, pcrel,
8628                                   reloc_type);
8629               /* Check for "call/jmp *mem", "mov mem, %reg",
8630                  "test %reg, mem" and "binop mem, %reg" where binop
8631                  is one of adc, add, and, cmp, or, sbb, sub, xor
8632                  instructions without data prefix.  Always generate
8633                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
8634               if (i.prefix[DATA_PREFIX] == 0
8635                   && (generate_relax_relocations
8636                       || (!object_64bit
8637                           && i.rm.mode == 0
8638                           && i.rm.regmem == 5))
8639                   && (i.rm.mode == 2
8640                       || (i.rm.mode == 0 && i.rm.regmem == 5))
8641                   && ((i.operands == 1
8642                        && i.tm.base_opcode == 0xff
8643                        && (i.rm.reg == 2 || i.rm.reg == 4))
8644                       || (i.operands == 2
8645                           && (i.tm.base_opcode == 0x8b
8646                               || i.tm.base_opcode == 0x85
8647                               || (i.tm.base_opcode & 0xc7) == 0x03))))
8648                 {
8649                   if (object_64bit)
8650                     {
8651                       fixP->fx_tcbit = i.rex != 0;
8652                       if (i.base_reg
8653                           && (i.base_reg->reg_num == RegIP))
8654                       fixP->fx_tcbit2 = 1;
8655                     }
8656                   else
8657                     fixP->fx_tcbit2 = 1;
8658                 }
8659             }
8660         }
8661     }
8662 }
8663
8664 static void
8665 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8666 {
8667   char *p;
8668   unsigned int n;
8669
8670   for (n = 0; n < i.operands; n++)
8671     {
8672       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
8673       if (i.rounding && (int) n == i.rounding->operand)
8674         continue;
8675
8676       if (operand_type_check (i.types[n], imm))
8677         {
8678           if (i.op[n].imms->X_op == O_constant)
8679             {
8680               int size = imm_size (n);
8681               offsetT val;
8682
8683               val = offset_in_range (i.op[n].imms->X_add_number,
8684                                      size);
8685               p = frag_more (size);
8686               md_number_to_chars (p, val, size);
8687             }
8688           else
8689             {
8690               /* Not absolute_section.
8691                  Need a 32-bit fixup (don't support 8bit
8692                  non-absolute imms).  Try to support other
8693                  sizes ...  */
8694               enum bfd_reloc_code_real reloc_type;
8695               int size = imm_size (n);
8696               int sign;
8697
8698               if (i.types[n].bitfield.imm32s
8699                   && (i.suffix == QWORD_MNEM_SUFFIX
8700                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8701                 sign = 1;
8702               else
8703                 sign = 0;
8704
8705               p = frag_more (size);
8706               reloc_type = reloc (size, 0, sign, i.reloc[n]);
8707
8708               /*   This is tough to explain.  We end up with this one if we
8709                * have operands that look like
8710                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
8711                * obtain the absolute address of the GOT, and it is strongly
8712                * preferable from a performance point of view to avoid using
8713                * a runtime relocation for this.  The actual sequence of
8714                * instructions often look something like:
8715                *
8716                *        call    .L66
8717                * .L66:
8718                *        popl    %ebx
8719                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8720                *
8721                *   The call and pop essentially return the absolute address
8722                * of the label .L66 and store it in %ebx.  The linker itself
8723                * will ultimately change the first operand of the addl so
8724                * that %ebx points to the GOT, but to keep things simple, the
8725                * .o file must have this operand set so that it generates not
8726                * the absolute address of .L66, but the absolute address of
8727                * itself.  This allows the linker itself simply treat a GOTPC
8728                * relocation as asking for a pcrel offset to the GOT to be
8729                * added in, and the addend of the relocation is stored in the
8730                * operand field for the instruction itself.
8731                *
8732                *   Our job here is to fix the operand so that it would add
8733                * the correct offset so that %ebx would point to itself.  The
8734                * thing that is tricky is that .-.L66 will point to the
8735                * beginning of the instruction, so we need to further modify
8736                * the operand so that it will point to itself.  There are
8737                * other cases where you have something like:
8738                *
8739                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8740                *
8741                * and here no correction would be required.  Internally in
8742                * the assembler we treat operands of this form as not being
8743                * pcrel since the '.' is explicitly mentioned, and I wonder
8744                * whether it would simplify matters to do it this way.  Who
8745                * knows.  In earlier versions of the PIC patches, the
8746                * pcrel_adjust field was used to store the correction, but
8747                * since the expression is not pcrel, I felt it would be
8748                * confusing to do it this way.  */
8749
8750               if ((reloc_type == BFD_RELOC_32
8751                    || reloc_type == BFD_RELOC_X86_64_32S
8752                    || reloc_type == BFD_RELOC_64)
8753                   && GOT_symbol
8754                   && GOT_symbol == i.op[n].imms->X_add_symbol
8755                   && (i.op[n].imms->X_op == O_symbol
8756                       || (i.op[n].imms->X_op == O_add
8757                           && ((symbol_get_value_expression
8758                                (i.op[n].imms->X_op_symbol)->X_op)
8759                               == O_subtract))))
8760                 {
8761                   if (!object_64bit)
8762                     reloc_type = BFD_RELOC_386_GOTPC;
8763                   else if (size == 4)
8764                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
8765                   else if (size == 8)
8766                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
8767                   i.op[n].imms->X_add_number +=
8768                     encoding_length (insn_start_frag, insn_start_off, p);
8769                 }
8770               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8771                            i.op[n].imms, 0, reloc_type);
8772             }
8773         }
8774     }
8775 }
8776 \f
8777 /* x86_cons_fix_new is called via the expression parsing code when a
8778    reloc is needed.  We use this hook to get the correct .got reloc.  */
8779 static int cons_sign = -1;
8780
8781 void
8782 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8783                   expressionS *exp, bfd_reloc_code_real_type r)
8784 {
8785   r = reloc (len, 0, cons_sign, r);
8786
8787 #ifdef TE_PE
8788   if (exp->X_op == O_secrel)
8789     {
8790       exp->X_op = O_symbol;
8791       r = BFD_RELOC_32_SECREL;
8792     }
8793 #endif
8794
8795   fix_new_exp (frag, off, len, exp, 0, r);
8796 }
8797
8798 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8799    purpose of the `.dc.a' internal pseudo-op.  */
8800
8801 int
8802 x86_address_bytes (void)
8803 {
8804   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8805     return 4;
8806   return stdoutput->arch_info->bits_per_address / 8;
8807 }
8808
8809 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
8810     || defined (LEX_AT)
8811 # define lex_got(reloc, adjust, types) NULL
8812 #else
8813 /* Parse operands of the form
8814    <symbol>@GOTOFF+<nnn>
8815    and similar .plt or .got references.
8816
8817    If we find one, set up the correct relocation in RELOC and copy the
8818    input string, minus the `@GOTOFF' into a malloc'd buffer for
8819    parsing by the calling routine.  Return this buffer, and if ADJUST
8820    is non-null set it to the length of the string we removed from the
8821    input line.  Otherwise return NULL.  */
8822 static char *
8823 lex_got (enum bfd_reloc_code_real *rel,
8824          int *adjust,
8825          i386_operand_type *types)
8826 {
8827   /* Some of the relocations depend on the size of what field is to
8828      be relocated.  But in our callers i386_immediate and i386_displacement
8829      we don't yet know the operand size (this will be set by insn
8830      matching).  Hence we record the word32 relocation here,
8831      and adjust the reloc according to the real size in reloc().  */
8832   static const struct {
8833     const char *str;
8834     int len;
8835     const enum bfd_reloc_code_real rel[2];
8836     const i386_operand_type types64;
8837   } gotrel[] = {
8838 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8839     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
8840                                         BFD_RELOC_SIZE32 },
8841       OPERAND_TYPE_IMM32_64 },
8842 #endif
8843     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
8844                                        BFD_RELOC_X86_64_PLTOFF64 },
8845       OPERAND_TYPE_IMM64 },
8846     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
8847                                        BFD_RELOC_X86_64_PLT32    },
8848       OPERAND_TYPE_IMM32_32S_DISP32 },
8849     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
8850                                        BFD_RELOC_X86_64_GOTPLT64 },
8851       OPERAND_TYPE_IMM64_DISP64 },
8852     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
8853                                        BFD_RELOC_X86_64_GOTOFF64 },
8854       OPERAND_TYPE_IMM64_DISP64 },
8855     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
8856                                        BFD_RELOC_X86_64_GOTPCREL },
8857       OPERAND_TYPE_IMM32_32S_DISP32 },
8858     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
8859                                        BFD_RELOC_X86_64_TLSGD    },
8860       OPERAND_TYPE_IMM32_32S_DISP32 },
8861     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
8862                                        _dummy_first_bfd_reloc_code_real },
8863       OPERAND_TYPE_NONE },
8864     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
8865                                        BFD_RELOC_X86_64_TLSLD    },
8866       OPERAND_TYPE_IMM32_32S_DISP32 },
8867     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
8868                                        BFD_RELOC_X86_64_GOTTPOFF },
8869       OPERAND_TYPE_IMM32_32S_DISP32 },
8870     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
8871                                        BFD_RELOC_X86_64_TPOFF32  },
8872       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8873     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
8874                                        _dummy_first_bfd_reloc_code_real },
8875       OPERAND_TYPE_NONE },
8876     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
8877                                        BFD_RELOC_X86_64_DTPOFF32 },
8878       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8879     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
8880                                        _dummy_first_bfd_reloc_code_real },
8881       OPERAND_TYPE_NONE },
8882     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
8883                                        _dummy_first_bfd_reloc_code_real },
8884       OPERAND_TYPE_NONE },
8885     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
8886                                        BFD_RELOC_X86_64_GOT32    },
8887       OPERAND_TYPE_IMM32_32S_64_DISP32 },
8888     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
8889                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
8890       OPERAND_TYPE_IMM32_32S_DISP32 },
8891     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
8892                                        BFD_RELOC_X86_64_TLSDESC_CALL },
8893       OPERAND_TYPE_IMM32_32S_DISP32 },
8894   };
8895   char *cp;
8896   unsigned int j;
8897
8898 #if defined (OBJ_MAYBE_ELF)
8899   if (!IS_ELF)
8900     return NULL;
8901 #endif
8902
8903   for (cp = input_line_pointer; *cp != '@'; cp++)
8904     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8905       return NULL;
8906
8907   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8908     {
8909       int len = gotrel[j].len;
8910       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8911         {
8912           if (gotrel[j].rel[object_64bit] != 0)
8913             {
8914               int first, second;
8915               char *tmpbuf, *past_reloc;
8916
8917               *rel = gotrel[j].rel[object_64bit];
8918
8919               if (types)
8920                 {
8921                   if (flag_code != CODE_64BIT)
8922                     {
8923                       types->bitfield.imm32 = 1;
8924                       types->bitfield.disp32 = 1;
8925                     }
8926                   else
8927                     *types = gotrel[j].types64;
8928                 }
8929
8930               if (j != 0 && GOT_symbol == NULL)
8931                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
8932
8933               /* The length of the first part of our input line.  */
8934               first = cp - input_line_pointer;
8935
8936               /* The second part goes from after the reloc token until
8937                  (and including) an end_of_line char or comma.  */
8938               past_reloc = cp + 1 + len;
8939               cp = past_reloc;
8940               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8941                 ++cp;
8942               second = cp + 1 - past_reloc;
8943
8944               /* Allocate and copy string.  The trailing NUL shouldn't
8945                  be necessary, but be safe.  */
8946               tmpbuf = XNEWVEC (char, first + second + 2);
8947               memcpy (tmpbuf, input_line_pointer, first);
8948               if (second != 0 && *past_reloc != ' ')
8949                 /* Replace the relocation token with ' ', so that
8950                    errors like foo@GOTOFF1 will be detected.  */
8951                 tmpbuf[first++] = ' ';
8952               else
8953                 /* Increment length by 1 if the relocation token is
8954                    removed.  */
8955                 len++;
8956               if (adjust)
8957                 *adjust = len;
8958               memcpy (tmpbuf + first, past_reloc, second);
8959               tmpbuf[first + second] = '\0';
8960               return tmpbuf;
8961             }
8962
8963           as_bad (_("@%s reloc is not supported with %d-bit output format"),
8964                   gotrel[j].str, 1 << (5 + object_64bit));
8965           return NULL;
8966         }
8967     }
8968
8969   /* Might be a symbol version string.  Don't as_bad here.  */
8970   return NULL;
8971 }
8972 #endif
8973
8974 #ifdef TE_PE
8975 #ifdef lex_got
8976 #undef lex_got
8977 #endif
8978 /* Parse operands of the form
8979    <symbol>@SECREL32+<nnn>
8980
8981    If we find one, set up the correct relocation in RELOC and copy the
8982    input string, minus the `@SECREL32' into a malloc'd buffer for
8983    parsing by the calling routine.  Return this buffer, and if ADJUST
8984    is non-null set it to the length of the string we removed from the
8985    input line.  Otherwise return NULL.
8986
8987    This function is copied from the ELF version above adjusted for PE targets.  */
8988
8989 static char *
8990 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
8991          int *adjust ATTRIBUTE_UNUSED,
8992          i386_operand_type *types)
8993 {
8994   static const struct
8995   {
8996     const char *str;
8997     int len;
8998     const enum bfd_reloc_code_real rel[2];
8999     const i386_operand_type types64;
9000   }
9001   gotrel[] =
9002   {
9003     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
9004                                           BFD_RELOC_32_SECREL },
9005       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9006   };
9007
9008   char *cp;
9009   unsigned j;
9010
9011   for (cp = input_line_pointer; *cp != '@'; cp++)
9012     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9013       return NULL;
9014
9015   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9016     {
9017       int len = gotrel[j].len;
9018
9019       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9020         {
9021           if (gotrel[j].rel[object_64bit] != 0)
9022             {
9023               int first, second;
9024               char *tmpbuf, *past_reloc;
9025
9026               *rel = gotrel[j].rel[object_64bit];
9027               if (adjust)
9028                 *adjust = len;
9029
9030               if (types)
9031                 {
9032                   if (flag_code != CODE_64BIT)
9033                     {
9034                       types->bitfield.imm32 = 1;
9035                       types->bitfield.disp32 = 1;
9036                     }
9037                   else
9038                     *types = gotrel[j].types64;
9039                 }
9040
9041               /* The length of the first part of our input line.  */
9042               first = cp - input_line_pointer;
9043
9044               /* The second part goes from after the reloc token until
9045                  (and including) an end_of_line char or comma.  */
9046               past_reloc = cp + 1 + len;
9047               cp = past_reloc;
9048               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9049                 ++cp;
9050               second = cp + 1 - past_reloc;
9051
9052               /* Allocate and copy string.  The trailing NUL shouldn't
9053                  be necessary, but be safe.  */
9054               tmpbuf = XNEWVEC (char, first + second + 2);
9055               memcpy (tmpbuf, input_line_pointer, first);
9056               if (second != 0 && *past_reloc != ' ')
9057                 /* Replace the relocation token with ' ', so that
9058                    errors like foo@SECLREL321 will be detected.  */
9059                 tmpbuf[first++] = ' ';
9060               memcpy (tmpbuf + first, past_reloc, second);
9061               tmpbuf[first + second] = '\0';
9062               return tmpbuf;
9063             }
9064
9065           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9066                   gotrel[j].str, 1 << (5 + object_64bit));
9067           return NULL;
9068         }
9069     }
9070
9071   /* Might be a symbol version string.  Don't as_bad here.  */
9072   return NULL;
9073 }
9074
9075 #endif /* TE_PE */
9076
9077 bfd_reloc_code_real_type
9078 x86_cons (expressionS *exp, int size)
9079 {
9080   bfd_reloc_code_real_type got_reloc = NO_RELOC;
9081
9082   intel_syntax = -intel_syntax;
9083
9084   exp->X_md = 0;
9085   if (size == 4 || (object_64bit && size == 8))
9086     {
9087       /* Handle @GOTOFF and the like in an expression.  */
9088       char *save;
9089       char *gotfree_input_line;
9090       int adjust = 0;
9091
9092       save = input_line_pointer;
9093       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9094       if (gotfree_input_line)
9095         input_line_pointer = gotfree_input_line;
9096
9097       expression (exp);
9098
9099       if (gotfree_input_line)
9100         {
9101           /* expression () has merrily parsed up to the end of line,
9102              or a comma - in the wrong buffer.  Transfer how far
9103              input_line_pointer has moved to the right buffer.  */
9104           input_line_pointer = (save
9105                                 + (input_line_pointer - gotfree_input_line)
9106                                 + adjust);
9107           free (gotfree_input_line);
9108           if (exp->X_op == O_constant
9109               || exp->X_op == O_absent
9110               || exp->X_op == O_illegal
9111               || exp->X_op == O_register
9112               || exp->X_op == O_big)
9113             {
9114               char c = *input_line_pointer;
9115               *input_line_pointer = 0;
9116               as_bad (_("missing or invalid expression `%s'"), save);
9117               *input_line_pointer = c;
9118             }
9119           else if ((got_reloc == BFD_RELOC_386_PLT32
9120                     || got_reloc == BFD_RELOC_X86_64_PLT32)
9121                    && exp->X_op != O_symbol)
9122             {
9123               char c = *input_line_pointer;
9124               *input_line_pointer = 0;
9125               as_bad (_("invalid PLT expression `%s'"), save);
9126               *input_line_pointer = c;
9127             }
9128         }
9129     }
9130   else
9131     expression (exp);
9132
9133   intel_syntax = -intel_syntax;
9134
9135   if (intel_syntax)
9136     i386_intel_simplify (exp);
9137
9138   return got_reloc;
9139 }
9140
9141 static void
9142 signed_cons (int size)
9143 {
9144   if (flag_code == CODE_64BIT)
9145     cons_sign = 1;
9146   cons (size);
9147   cons_sign = -1;
9148 }
9149
9150 #ifdef TE_PE
9151 static void
9152 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9153 {
9154   expressionS exp;
9155
9156   do
9157     {
9158       expression (&exp);
9159       if (exp.X_op == O_symbol)
9160         exp.X_op = O_secrel;
9161
9162       emit_expr (&exp, 4);
9163     }
9164   while (*input_line_pointer++ == ',');
9165
9166   input_line_pointer--;
9167   demand_empty_rest_of_line ();
9168 }
9169 #endif
9170
9171 /* Handle Vector operations.  */
9172
9173 static char *
9174 check_VecOperations (char *op_string, char *op_end)
9175 {
9176   const reg_entry *mask;
9177   const char *saved;
9178   char *end_op;
9179
9180   while (*op_string
9181          && (op_end == NULL || op_string < op_end))
9182     {
9183       saved = op_string;
9184       if (*op_string == '{')
9185         {
9186           op_string++;
9187
9188           /* Check broadcasts.  */
9189           if (strncmp (op_string, "1to", 3) == 0)
9190             {
9191               int bcst_type;
9192
9193               if (i.broadcast)
9194                 goto duplicated_vec_op;
9195
9196               op_string += 3;
9197               if (*op_string == '8')
9198                 bcst_type = 8;
9199               else if (*op_string == '4')
9200                 bcst_type = 4;
9201               else if (*op_string == '2')
9202                 bcst_type = 2;
9203               else if (*op_string == '1'
9204                        && *(op_string+1) == '6')
9205                 {
9206                   bcst_type = 16;
9207                   op_string++;
9208                 }
9209               else
9210                 {
9211                   as_bad (_("Unsupported broadcast: `%s'"), saved);
9212                   return NULL;
9213                 }
9214               op_string++;
9215
9216               broadcast_op.type = bcst_type;
9217               broadcast_op.operand = this_operand;
9218               broadcast_op.bytes = 0;
9219               i.broadcast = &broadcast_op;
9220             }
9221           /* Check masking operation.  */
9222           else if ((mask = parse_register (op_string, &end_op)) != NULL)
9223             {
9224               /* k0 can't be used for write mask.  */
9225               if (!mask->reg_type.bitfield.regmask || mask->reg_num == 0)
9226                 {
9227                   as_bad (_("`%s%s' can't be used for write mask"),
9228                           register_prefix, mask->reg_name);
9229                   return NULL;
9230                 }
9231
9232               if (!i.mask)
9233                 {
9234                   mask_op.mask = mask;
9235                   mask_op.zeroing = 0;
9236                   mask_op.operand = this_operand;
9237                   i.mask = &mask_op;
9238                 }
9239               else
9240                 {
9241                   if (i.mask->mask)
9242                     goto duplicated_vec_op;
9243
9244                   i.mask->mask = mask;
9245
9246                   /* Only "{z}" is allowed here.  No need to check
9247                      zeroing mask explicitly.  */
9248                   if (i.mask->operand != this_operand)
9249                     {
9250                       as_bad (_("invalid write mask `%s'"), saved);
9251                       return NULL;
9252                     }
9253                 }
9254
9255               op_string = end_op;
9256             }
9257           /* Check zeroing-flag for masking operation.  */
9258           else if (*op_string == 'z')
9259             {
9260               if (!i.mask)
9261                 {
9262                   mask_op.mask = NULL;
9263                   mask_op.zeroing = 1;
9264                   mask_op.operand = this_operand;
9265                   i.mask = &mask_op;
9266                 }
9267               else
9268                 {
9269                   if (i.mask->zeroing)
9270                     {
9271                     duplicated_vec_op:
9272                       as_bad (_("duplicated `%s'"), saved);
9273                       return NULL;
9274                     }
9275
9276                   i.mask->zeroing = 1;
9277
9278                   /* Only "{%k}" is allowed here.  No need to check mask
9279                      register explicitly.  */
9280                   if (i.mask->operand != this_operand)
9281                     {
9282                       as_bad (_("invalid zeroing-masking `%s'"),
9283                               saved);
9284                       return NULL;
9285                     }
9286                 }
9287
9288               op_string++;
9289             }
9290           else
9291             goto unknown_vec_op;
9292
9293           if (*op_string != '}')
9294             {
9295               as_bad (_("missing `}' in `%s'"), saved);
9296               return NULL;
9297             }
9298           op_string++;
9299
9300           /* Strip whitespace since the addition of pseudo prefixes
9301              changed how the scrubber treats '{'.  */
9302           if (is_space_char (*op_string))
9303             ++op_string;
9304
9305           continue;
9306         }
9307     unknown_vec_op:
9308       /* We don't know this one.  */
9309       as_bad (_("unknown vector operation: `%s'"), saved);
9310       return NULL;
9311     }
9312
9313   if (i.mask && i.mask->zeroing && !i.mask->mask)
9314     {
9315       as_bad (_("zeroing-masking only allowed with write mask"));
9316       return NULL;
9317     }
9318
9319   return op_string;
9320 }
9321
9322 static int
9323 i386_immediate (char *imm_start)
9324 {
9325   char *save_input_line_pointer;
9326   char *gotfree_input_line;
9327   segT exp_seg = 0;
9328   expressionS *exp;
9329   i386_operand_type types;
9330
9331   operand_type_set (&types, ~0);
9332
9333   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9334     {
9335       as_bad (_("at most %d immediate operands are allowed"),
9336               MAX_IMMEDIATE_OPERANDS);
9337       return 0;
9338     }
9339
9340   exp = &im_expressions[i.imm_operands++];
9341   i.op[this_operand].imms = exp;
9342
9343   if (is_space_char (*imm_start))
9344     ++imm_start;
9345
9346   save_input_line_pointer = input_line_pointer;
9347   input_line_pointer = imm_start;
9348
9349   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9350   if (gotfree_input_line)
9351     input_line_pointer = gotfree_input_line;
9352
9353   exp_seg = expression (exp);
9354
9355   SKIP_WHITESPACE ();
9356
9357   /* Handle vector operations.  */
9358   if (*input_line_pointer == '{')
9359     {
9360       input_line_pointer = check_VecOperations (input_line_pointer,
9361                                                 NULL);
9362       if (input_line_pointer == NULL)
9363         return 0;
9364     }
9365
9366   if (*input_line_pointer)
9367     as_bad (_("junk `%s' after expression"), input_line_pointer);
9368
9369   input_line_pointer = save_input_line_pointer;
9370   if (gotfree_input_line)
9371     {
9372       free (gotfree_input_line);
9373
9374       if (exp->X_op == O_constant || exp->X_op == O_register)
9375         exp->X_op = O_illegal;
9376     }
9377
9378   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9379 }
9380
9381 static int
9382 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9383                          i386_operand_type types, const char *imm_start)
9384 {
9385   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9386     {
9387       if (imm_start)
9388         as_bad (_("missing or invalid immediate expression `%s'"),
9389                 imm_start);
9390       return 0;
9391     }
9392   else if (exp->X_op == O_constant)
9393     {
9394       /* Size it properly later.  */
9395       i.types[this_operand].bitfield.imm64 = 1;
9396       /* If not 64bit, sign extend val.  */
9397       if (flag_code != CODE_64BIT
9398           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9399         exp->X_add_number
9400           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9401     }
9402 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9403   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9404            && exp_seg != absolute_section
9405            && exp_seg != text_section
9406            && exp_seg != data_section
9407            && exp_seg != bss_section
9408            && exp_seg != undefined_section
9409            && !bfd_is_com_section (exp_seg))
9410     {
9411       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9412       return 0;
9413     }
9414 #endif
9415   else if (!intel_syntax && exp_seg == reg_section)
9416     {
9417       if (imm_start)
9418         as_bad (_("illegal immediate register operand %s"), imm_start);
9419       return 0;
9420     }
9421   else
9422     {
9423       /* This is an address.  The size of the address will be
9424          determined later, depending on destination register,
9425          suffix, or the default for the section.  */
9426       i.types[this_operand].bitfield.imm8 = 1;
9427       i.types[this_operand].bitfield.imm16 = 1;
9428       i.types[this_operand].bitfield.imm32 = 1;
9429       i.types[this_operand].bitfield.imm32s = 1;
9430       i.types[this_operand].bitfield.imm64 = 1;
9431       i.types[this_operand] = operand_type_and (i.types[this_operand],
9432                                                 types);
9433     }
9434
9435   return 1;
9436 }
9437
9438 static char *
9439 i386_scale (char *scale)
9440 {
9441   offsetT val;
9442   char *save = input_line_pointer;
9443
9444   input_line_pointer = scale;
9445   val = get_absolute_expression ();
9446
9447   switch (val)
9448     {
9449     case 1:
9450       i.log2_scale_factor = 0;
9451       break;
9452     case 2:
9453       i.log2_scale_factor = 1;
9454       break;
9455     case 4:
9456       i.log2_scale_factor = 2;
9457       break;
9458     case 8:
9459       i.log2_scale_factor = 3;
9460       break;
9461     default:
9462       {
9463         char sep = *input_line_pointer;
9464
9465         *input_line_pointer = '\0';
9466         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9467                 scale);
9468         *input_line_pointer = sep;
9469         input_line_pointer = save;
9470         return NULL;
9471       }
9472     }
9473   if (i.log2_scale_factor != 0 && i.index_reg == 0)
9474     {
9475       as_warn (_("scale factor of %d without an index register"),
9476                1 << i.log2_scale_factor);
9477       i.log2_scale_factor = 0;
9478     }
9479   scale = input_line_pointer;
9480   input_line_pointer = save;
9481   return scale;
9482 }
9483
9484 static int
9485 i386_displacement (char *disp_start, char *disp_end)
9486 {
9487   expressionS *exp;
9488   segT exp_seg = 0;
9489   char *save_input_line_pointer;
9490   char *gotfree_input_line;
9491   int override;
9492   i386_operand_type bigdisp, types = anydisp;
9493   int ret;
9494
9495   if (i.disp_operands == MAX_MEMORY_OPERANDS)
9496     {
9497       as_bad (_("at most %d displacement operands are allowed"),
9498               MAX_MEMORY_OPERANDS);
9499       return 0;
9500     }
9501
9502   operand_type_set (&bigdisp, 0);
9503   if ((i.types[this_operand].bitfield.jumpabsolute)
9504       || (!current_templates->start->opcode_modifier.jump
9505           && !current_templates->start->opcode_modifier.jumpdword))
9506     {
9507       bigdisp.bitfield.disp32 = 1;
9508       override = (i.prefix[ADDR_PREFIX] != 0);
9509       if (flag_code == CODE_64BIT)
9510         {
9511           if (!override)
9512             {
9513               bigdisp.bitfield.disp32s = 1;
9514               bigdisp.bitfield.disp64 = 1;
9515             }
9516         }
9517       else if ((flag_code == CODE_16BIT) ^ override)
9518         {
9519           bigdisp.bitfield.disp32 = 0;
9520           bigdisp.bitfield.disp16 = 1;
9521         }
9522     }
9523   else
9524     {
9525       /* For PC-relative branches, the width of the displacement
9526          is dependent upon data size, not address size.  */
9527       override = (i.prefix[DATA_PREFIX] != 0);
9528       if (flag_code == CODE_64BIT)
9529         {
9530           if (override || i.suffix == WORD_MNEM_SUFFIX)
9531             bigdisp.bitfield.disp16 = 1;
9532           else
9533             {
9534               bigdisp.bitfield.disp32 = 1;
9535               bigdisp.bitfield.disp32s = 1;
9536             }
9537         }
9538       else
9539         {
9540           if (!override)
9541             override = (i.suffix == (flag_code != CODE_16BIT
9542                                      ? WORD_MNEM_SUFFIX
9543                                      : LONG_MNEM_SUFFIX));
9544           bigdisp.bitfield.disp32 = 1;
9545           if ((flag_code == CODE_16BIT) ^ override)
9546             {
9547               bigdisp.bitfield.disp32 = 0;
9548               bigdisp.bitfield.disp16 = 1;
9549             }
9550         }
9551     }
9552   i.types[this_operand] = operand_type_or (i.types[this_operand],
9553                                            bigdisp);
9554
9555   exp = &disp_expressions[i.disp_operands];
9556   i.op[this_operand].disps = exp;
9557   i.disp_operands++;
9558   save_input_line_pointer = input_line_pointer;
9559   input_line_pointer = disp_start;
9560   END_STRING_AND_SAVE (disp_end);
9561
9562 #ifndef GCC_ASM_O_HACK
9563 #define GCC_ASM_O_HACK 0
9564 #endif
9565 #if GCC_ASM_O_HACK
9566   END_STRING_AND_SAVE (disp_end + 1);
9567   if (i.types[this_operand].bitfield.baseIndex
9568       && displacement_string_end[-1] == '+')
9569     {
9570       /* This hack is to avoid a warning when using the "o"
9571          constraint within gcc asm statements.
9572          For instance:
9573
9574          #define _set_tssldt_desc(n,addr,limit,type) \
9575          __asm__ __volatile__ ( \
9576          "movw %w2,%0\n\t" \
9577          "movw %w1,2+%0\n\t" \
9578          "rorl $16,%1\n\t" \
9579          "movb %b1,4+%0\n\t" \
9580          "movb %4,5+%0\n\t" \
9581          "movb $0,6+%0\n\t" \
9582          "movb %h1,7+%0\n\t" \
9583          "rorl $16,%1" \
9584          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
9585
9586          This works great except that the output assembler ends
9587          up looking a bit weird if it turns out that there is
9588          no offset.  You end up producing code that looks like:
9589
9590          #APP
9591          movw $235,(%eax)
9592          movw %dx,2+(%eax)
9593          rorl $16,%edx
9594          movb %dl,4+(%eax)
9595          movb $137,5+(%eax)
9596          movb $0,6+(%eax)
9597          movb %dh,7+(%eax)
9598          rorl $16,%edx
9599          #NO_APP
9600
9601          So here we provide the missing zero.  */
9602
9603       *displacement_string_end = '0';
9604     }
9605 #endif
9606   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9607   if (gotfree_input_line)
9608     input_line_pointer = gotfree_input_line;
9609
9610   exp_seg = expression (exp);
9611
9612   SKIP_WHITESPACE ();
9613   if (*input_line_pointer)
9614     as_bad (_("junk `%s' after expression"), input_line_pointer);
9615 #if GCC_ASM_O_HACK
9616   RESTORE_END_STRING (disp_end + 1);
9617 #endif
9618   input_line_pointer = save_input_line_pointer;
9619   if (gotfree_input_line)
9620     {
9621       free (gotfree_input_line);
9622
9623       if (exp->X_op == O_constant || exp->X_op == O_register)
9624         exp->X_op = O_illegal;
9625     }
9626
9627   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
9628
9629   RESTORE_END_STRING (disp_end);
9630
9631   return ret;
9632 }
9633
9634 static int
9635 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9636                             i386_operand_type types, const char *disp_start)
9637 {
9638   i386_operand_type bigdisp;
9639   int ret = 1;
9640
9641   /* We do this to make sure that the section symbol is in
9642      the symbol table.  We will ultimately change the relocation
9643      to be relative to the beginning of the section.  */
9644   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9645       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9646       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9647     {
9648       if (exp->X_op != O_symbol)
9649         goto inv_disp;
9650
9651       if (S_IS_LOCAL (exp->X_add_symbol)
9652           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9653           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9654         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9655       exp->X_op = O_subtract;
9656       exp->X_op_symbol = GOT_symbol;
9657       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9658         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9659       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9660         i.reloc[this_operand] = BFD_RELOC_64;
9661       else
9662         i.reloc[this_operand] = BFD_RELOC_32;
9663     }
9664
9665   else if (exp->X_op == O_absent
9666            || exp->X_op == O_illegal
9667            || exp->X_op == O_big)
9668     {
9669     inv_disp:
9670       as_bad (_("missing or invalid displacement expression `%s'"),
9671               disp_start);
9672       ret = 0;
9673     }
9674
9675   else if (flag_code == CODE_64BIT
9676            && !i.prefix[ADDR_PREFIX]
9677            && exp->X_op == O_constant)
9678     {
9679       /* Since displacement is signed extended to 64bit, don't allow
9680          disp32 and turn off disp32s if they are out of range.  */
9681       i.types[this_operand].bitfield.disp32 = 0;
9682       if (!fits_in_signed_long (exp->X_add_number))
9683         {
9684           i.types[this_operand].bitfield.disp32s = 0;
9685           if (i.types[this_operand].bitfield.baseindex)
9686             {
9687               as_bad (_("0x%lx out range of signed 32bit displacement"),
9688                       (long) exp->X_add_number);
9689               ret = 0;
9690             }
9691         }
9692     }
9693
9694 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9695   else if (exp->X_op != O_constant
9696            && OUTPUT_FLAVOR == bfd_target_aout_flavour
9697            && exp_seg != absolute_section
9698            && exp_seg != text_section
9699            && exp_seg != data_section
9700            && exp_seg != bss_section
9701            && exp_seg != undefined_section
9702            && !bfd_is_com_section (exp_seg))
9703     {
9704       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9705       ret = 0;
9706     }
9707 #endif
9708
9709   /* Check if this is a displacement only operand.  */
9710   bigdisp = i.types[this_operand];
9711   bigdisp.bitfield.disp8 = 0;
9712   bigdisp.bitfield.disp16 = 0;
9713   bigdisp.bitfield.disp32 = 0;
9714   bigdisp.bitfield.disp32s = 0;
9715   bigdisp.bitfield.disp64 = 0;
9716   if (operand_type_all_zero (&bigdisp))
9717     i.types[this_operand] = operand_type_and (i.types[this_operand],
9718                                               types);
9719
9720   return ret;
9721 }
9722
9723 /* Return the active addressing mode, taking address override and
9724    registers forming the address into consideration.  Update the
9725    address override prefix if necessary.  */
9726
9727 static enum flag_code
9728 i386_addressing_mode (void)
9729 {
9730   enum flag_code addr_mode;
9731
9732   if (i.prefix[ADDR_PREFIX])
9733     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9734   else
9735     {
9736       addr_mode = flag_code;
9737
9738 #if INFER_ADDR_PREFIX
9739       if (i.mem_operands == 0)
9740         {
9741           /* Infer address prefix from the first memory operand.  */
9742           const reg_entry *addr_reg = i.base_reg;
9743
9744           if (addr_reg == NULL)
9745             addr_reg = i.index_reg;
9746
9747           if (addr_reg)
9748             {
9749               if (addr_reg->reg_type.bitfield.dword)
9750                 addr_mode = CODE_32BIT;
9751               else if (flag_code != CODE_64BIT
9752                        && addr_reg->reg_type.bitfield.word)
9753                 addr_mode = CODE_16BIT;
9754
9755               if (addr_mode != flag_code)
9756                 {
9757                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9758                   i.prefixes += 1;
9759                   /* Change the size of any displacement too.  At most one
9760                      of Disp16 or Disp32 is set.
9761                      FIXME.  There doesn't seem to be any real need for
9762                      separate Disp16 and Disp32 flags.  The same goes for
9763                      Imm16 and Imm32.  Removing them would probably clean
9764                      up the code quite a lot.  */
9765                   if (flag_code != CODE_64BIT
9766                       && (i.types[this_operand].bitfield.disp16
9767                           || i.types[this_operand].bitfield.disp32))
9768                     i.types[this_operand]
9769                       = operand_type_xor (i.types[this_operand], disp16_32);
9770                 }
9771             }
9772         }
9773 #endif
9774     }
9775
9776   return addr_mode;
9777 }
9778
9779 /* Make sure the memory operand we've been dealt is valid.
9780    Return 1 on success, 0 on a failure.

        OPERAND_STRING is the operand text; it is only used in the
        diagnostics.  The address size checked against comes from
        i386_addressing_mode (), which may itself record an address size
        prefix.

        String insns (PadLock ones excepted) are checked against the one
        register they are expected to address through; a mismatch there
        is normally only warned about.  Every other operand goes through
        the generic 32/64-bit or 16-bit base/index rules.  */
9781
9782 static int
9783 i386_index_check (const char *operand_string)
9784 {
9785   const char *kind = "base/index";
9786   enum flag_code addr_mode = i386_addressing_mode ();
9787
       /* Take the string insn path when the first template is a
          non-PadLock string insn and either the last template is a string
          insn too or a memory operand has already been counted.  */
9788   if (current_templates->start->opcode_modifier.isstring
9789       && !current_templates->start->cpu_flags.bitfield.cpupadlock
9790       && (current_templates->end[-1].opcode_modifier.isstring
9791           || i.mem_operands))
9792     {
9793       /* Memory operands of string insns are special in that they only allow
9794          a single register (rDI, rSI, or rBX) as their memory address.  */
9795       const reg_entry *expected_reg;
           /* Both tables are indexed by ADDR_MODE, so their row order
              presumably mirrors enum flag_code (32-bit, 16-bit, 64-bit) --
              confirm against its definition.  The second index of di_si is
              the EsSeg bit of the template operand: 0 selects rSI, 1 rDI.  */
9796       static const char *di_si[][2] =
9797         {
9798           { "esi", "edi" },
9799           { "si", "di" },
9800           { "rsi", "rdi" }
9801         };
9802       static const char *bx[] = { "ebx", "bx", "rbx" };
9803
9804       kind = "string address";
9805
           /* Templates allowing a rep prefix address through rSI/rDI; the
              remaining string insns handled here are expected to use rBX.  */
9806       if (current_templates->start->opcode_modifier.repprefixok)
9807         {
9808           i386_operand_type type = current_templates->end[-1].operand_types[0];
9809
               /* Use template operand 1 instead when operand 0 is not a
                  memory (BaseIndex) operand, or when both are and this is
                  the second memory operand in AT&T syntax / the first one
                  in Intel syntax.  */
9810           if (!type.bitfield.baseindex
9811               || ((!i.mem_operands != !intel_syntax)
9812                   && current_templates->end[-1].operand_types[1]
9813                      .bitfield.baseindex))
9814             type = current_templates->end[-1].operand_types[1];
9815           expected_reg = hash_find (reg_hash,
9816                                     di_si[addr_mode][type.bitfield.esseg]);
9817
9818         }
9819       else
9820         expected_reg = hash_find (reg_hash, bx[addr_mode]);
9821
           /* Anything but the bare expected register (another base, an
              index, or a displacement) is suspicious.  */
9822       if (i.base_reg != expected_reg
9823           || i.index_reg
9824           || operand_type_check (i.types[this_operand], disp))
9825         {
9826           /* The second memory operand must have the same size as
9827              the first one.  */
9828           if (i.mem_operands
9829               && i.base_reg
9830               && !((addr_mode == CODE_64BIT
9831                     && i.base_reg->reg_type.bitfield.qword)
9832                    || (addr_mode == CODE_32BIT
9833                        ? i.base_reg->reg_type.bitfield.dword
9834                        : i.base_reg->reg_type.bitfield.word)))
9835             goto bad_address;
9836
               /* Otherwise the operand is accepted with a warning naming
                  the register that was expected.  */
9837           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9838                    operand_string,
9839                    intel_syntax ? '[' : '(',
9840                    register_prefix,
9841                    expected_reg->reg_name,
9842                    intel_syntax ? ']' : ')');
9843           return 1;
9844         }
9845       else
9846         return 1;
9847
           /* Shared failure exit; also the target of the gotos in the
              generic checks of the else branch below.  */
9848 bad_address:
9849       as_bad (_("`%s' is not a valid %s expression"),
9850               operand_string, kind);
9851       return 0;
9852     }
9853   else
9854     {
9855       if (addr_mode != CODE_16BIT)
9856         {
9857           /* 32-bit/64-bit checks.  */
               /* Reject a base register that is not of the address size,
                  is RegIP combined with an index, or is RegIZ.  Reject an
                  index register that is not an xmm/ymm/zmm register and
                  either is not of the address size or lacks the BaseIndex
                  capability.  */
9858           if ((i.base_reg
9859                && ((addr_mode == CODE_64BIT
9860                     ? !i.base_reg->reg_type.bitfield.qword
9861                     : !i.base_reg->reg_type.bitfield.dword)
9862                    || (i.index_reg && i.base_reg->reg_num == RegIP)
9863                    || i.base_reg->reg_num == RegIZ))
9864               || (i.index_reg
9865                   && !i.index_reg->reg_type.bitfield.xmmword
9866                   && !i.index_reg->reg_type.bitfield.ymmword
9867                   && !i.index_reg->reg_type.bitfield.zmmword
9868                   && ((addr_mode == CODE_64BIT
9869                        ? !i.index_reg->reg_type.bitfield.qword
9870                        : !i.index_reg->reg_type.bitfield.dword)
9871                       || !i.index_reg->reg_type.bitfield.baseindex)))
9872             goto bad_address;
9873
9874           /* bndmk, bndldx, and bndstx have special restrictions. */
               /* Base opcode 0xf30f1b is singled out below as the one whose
                  scale factor is honoured; 0x0f1a and 0x0f1b are matched by
                  masking off the low bit.  */
9875           if (current_templates->start->base_opcode == 0xf30f1b
9876               || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9877             {
9878               /* They cannot use RIP-relative addressing. */
9879               if (i.base_reg && i.base_reg->reg_num == RegIP)
9880                 {
9881                   as_bad (_("`%s' cannot be used here"), operand_string);
9882                   return 0;
9883                 }
9884
9885               /* bndldx and bndstx ignore their scale factor. */
9886               if (current_templates->start->base_opcode != 0xf30f1b
9887                   && i.log2_scale_factor)
9888                 as_warn (_("register scaling is being ignored here"));
9889             }
9890         }
9891       else
9892         {
9893           /* 16-bit checks.  */
               /* A base must be a word register with the BaseIndex
                  capability.  An index must be one as well, and in addition
                  needs a base with reg_num < 6, a reg_num >= 6 of its own
                  and no scale factor (presumably the bx/bp + si/di forms --
                  confirm against the register table).  */
9894           if ((i.base_reg
9895                && (!i.base_reg->reg_type.bitfield.word
9896                    || !i.base_reg->reg_type.bitfield.baseindex))
9897               || (i.index_reg
9898                   && (!i.index_reg->reg_type.bitfield.word
9899                       || !i.index_reg->reg_type.bitfield.baseindex
9900                       || !(i.base_reg
9901                            && i.base_reg->reg_num < 6
9902                            && i.index_reg->reg_num >= 6
9903                            && i.log2_scale_factor == 0))))
9904             goto bad_address;
9905         }
9906     }
9907   return 1;
9908 }
9909
9910 /* Handle vector immediates.  */
9911
9912 static int
9913 RC_SAE_immediate (const char *imm_start)
9914 {
9915   unsigned int match_found, j;
9916   const char *pstr = imm_start;
9917   expressionS *exp;
9918
9919   if (*pstr != '{')
9920     return 0;
9921
9922   pstr++;
9923   match_found = 0;
9924   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9925     {
9926       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9927         {
9928           if (!i.rounding)
9929             {
9930               rc_op.type = RC_NamesTable[j].type;
9931               rc_op.operand = this_operand;
9932               i.rounding = &rc_op;
9933             }
9934           else
9935             {
9936               as_bad (_("duplicated `%s'"), imm_start);
9937               return 0;
9938             }
9939           pstr += RC_NamesTable[j].len;
9940           match_found = 1;
9941           break;
9942         }
9943     }
9944   if (!match_found)
9945     return 0;
9946
9947   if (*pstr++ != '}')
9948     {
9949       as_bad (_("Missing '}': '%s'"), imm_start);
9950       return 0;
9951     }
9952   /* RC/SAE immediate string should contain nothing more.  */;
9953   if (*pstr != 0)
9954     {
9955       as_bad (_("Junk after '}': '%s'"), imm_start);
9956       return 0;
9957     }
9958
9959   exp = &im_expressions[i.imm_operands++];
9960   i.op[this_operand].imms = exp;
9961
9962   exp->X_op = O_constant;
9963   exp->X_add_number = 0;
9964   exp->X_add_symbol = (symbolS *) 0;
9965   exp->X_op_symbol = (symbolS *) 0;
9966
9967   i.types[this_operand].bitfield.imm8 = 1;
9968   return 1;
9969 }
9970
9971 /* Only string instructions can have a second memory operand, so
9972    reduce current_templates to just those if it contains any.  */
9973 static int
9974 maybe_adjust_templates (void)
9975 {
9976   const insn_template *t;
9977
9978   gas_assert (i.mem_operands == 1);
9979
9980   for (t = current_templates->start; t < current_templates->end; ++t)
9981     if (t->opcode_modifier.isstring)
9982       break;
9983
9984   if (t < current_templates->end)
9985     {
9986       static templates aux_templates;
9987       bfd_boolean recheck;
9988
9989       aux_templates.start = t;
9990       for (; t < current_templates->end; ++t)
9991         if (!t->opcode_modifier.isstring)
9992           break;
9993       aux_templates.end = t;
9994
9995       /* Determine whether to re-check the first memory operand.  */
9996       recheck = (aux_templates.start != current_templates->start
9997                  || t != current_templates->end);
9998
9999       current_templates = &aux_templates;
10000
10001       if (recheck)
10002         {
10003           i.mem_operands = 0;
10004           if (i.memop1_string != NULL
10005               && i386_index_check (i.memop1_string) == 0)
10006             return 0;
10007           i.mem_operands = 1;
10008         }
10009     }
10010
10011   return 1;
10012 }
10013
10014 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
10015    on error.

         After an optional ABSOLUTE_PREFIX the operand is classified as
         one of:
           - a register, optionally followed by vector operations; a
             segment register followed by ':' instead introduces a memory
             reference with a segment override;
           - an immediate introduced by IMMEDIATE_PREFIX;
           - an RC/SAE pseudo immediate (see RC_SAE_immediate ());
           - a memory reference, i.e. an optional displacement expression
             followed by an optional "(base,index,scale)" part.
         Anything else is reported as an error.

         OPERAND_STRING is writable: some error paths truncate it in place
         before printing a diagnostic.  */
10016
10017 static int
10018 i386_att_operand (char *operand_string)
10019 {
10020   const reg_entry *r;
10021   char *end_op;
10022   char *op_string = operand_string;
10023
10024   if (is_space_char (*op_string))
10025     ++op_string;
10026
10027   /* We check for an absolute prefix (differentiating,
10028      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
10029   if (*op_string == ABSOLUTE_PREFIX)
10030     {
10031       ++op_string;
10032       if (is_space_char (*op_string))
10033         ++op_string;
10034       i.types[this_operand].bitfield.jumpabsolute = 1;
10035     }
10036
10037   /* Check if operand is a register.  */
10038   if ((r = parse_register (op_string, &end_op)) != NULL)
10039     {
10040       i386_operand_type temp;
10041
10042       /* Check for a segment override by searching for ':' after a
10043          segment register.  */
10044       op_string = end_op;
10045       if (is_space_char (*op_string))
10046         ++op_string;
10047       if (*op_string == ':' && r->reg_type.bitfield.sreg)
10048         {
                /* Register numbers 0..5 select es, cs, ss, ds, fs and gs
                   respectively; any other number leaves the override slot
                   for this memory operand untouched.  */
10049           switch (r->reg_num)
10050             {
10051             case 0:
10052               i.seg[i.mem_operands] = &es;
10053               break;
10054             case 1:
10055               i.seg[i.mem_operands] = &cs;
10056               break;
10057             case 2:
10058               i.seg[i.mem_operands] = &ss;
10059               break;
10060             case 3:
10061               i.seg[i.mem_operands] = &ds;
10062               break;
10063             case 4:
10064               i.seg[i.mem_operands] = &fs;
10065               break;
10066             case 5:
10067               i.seg[i.mem_operands] = &gs;
10068               break;
10069             }
10070
10071           /* Skip the ':' and whitespace.  */
10072           ++op_string;
10073           if (is_space_char (*op_string))
10074             ++op_string;
10075
                /* What follows the override must look like the start of a
                   memory reference (or an absolute prefix).  */
10076           if (!is_digit_char (*op_string)
10077               && !is_identifier_char (*op_string)
10078               && *op_string != '('
10079               && *op_string != ABSOLUTE_PREFIX)
10080             {
10081               as_bad (_("bad memory operand `%s'"), op_string);
10082               return 0;
10083             }
10084           /* Handle case of %es:*foo.  */
10085           if (*op_string == ABSOLUTE_PREFIX)
10086             {
10087               ++op_string;
10088               if (is_space_char (*op_string))
10089                 ++op_string;
10090               i.types[this_operand].bitfield.jumpabsolute = 1;
10091             }
                /* Continue in the memory reference branch further down,
                   with OP_STRING positioned after the override.  */
10092           goto do_memory_reference;
10093         }
10094
10095       /* Handle vector operations.  */
10096       if (*op_string == '{')
10097         {
10098           op_string = check_VecOperations (op_string, NULL);
10099           if (op_string == NULL)
10100             return 0;
10101         }
10102
10103       if (*op_string)
10104         {
10105           as_bad (_("junk `%s' after register"), op_string);
10106           return 0;
10107         }
            /* Merge the register's type, minus its BaseIndex bit, into the
               operand type and record the register itself.  */
10108       temp = r->reg_type;
10109       temp.bitfield.baseindex = 0;
10110       i.types[this_operand] = operand_type_or (i.types[this_operand],
10111                                                temp);
10112       i.types[this_operand].bitfield.unspecified = 0;
10113       i.op[this_operand].regs = r;
10114       i.reg_operands++;
10115     }
10116   else if (*op_string == REGISTER_PREFIX)
10117     {
10118       as_bad (_("bad register name `%s'"), op_string);
10119       return 0;
10120     }
10121   else if (*op_string == IMMEDIATE_PREFIX)
10122     {
10123       ++op_string;
10124       if (i.types[this_operand].bitfield.jumpabsolute)
10125         {
10126           as_bad (_("immediate operand illegal with absolute jump"));
10127           return 0;
10128         }
10129       if (!i386_immediate (op_string))
10130         return 0;
10131     }
10132   else if (RC_SAE_immediate (operand_string))
10133     {
10134       /* If it is a RC or SAE immediate, do nothing.  */
10135       ;
10136     }
10137   else if (is_digit_char (*op_string)
10138            || is_identifier_char (*op_string)
10139            || *op_string == '"'
10140            || *op_string == '(')
10141     {
10142       /* This is a memory reference of some sort.  */
10143       char *base_string;
10144
10145       /* Start and end of displacement string expression (if found).  */
10146       char *displacement_string_start;
10147       char *displacement_string_end;
10148       char *vop_start;
10149
            /* Also entered by goto from the segment override case above.  */
10150     do_memory_reference:
            /* A second memory operand is only possible for string insns;
               narrow the templates first, then enforce the limit.  */
10151       if (i.mem_operands == 1 && !maybe_adjust_templates ())
10152         return 0;
10153       if ((i.mem_operands == 1
10154            && !current_templates->start->opcode_modifier.isstring)
10155           || i.mem_operands == 2)
10156         {
10157           as_bad (_("too many memory references for `%s'"),
10158                   current_templates->start->name);
10159           return 0;
10160         }
10161
10162       /* Check for base index form.  We detect the base index form by
10163          looking for an ')' at the end of the operand, searching
10164          for the '(' matching it, and finding a REGISTER_PREFIX or ','
10165          after the '('.  */
10166       base_string = op_string + strlen (op_string);
10167
10168       /* Handle vector operations.  */
10169       vop_start = strchr (op_string, '{');
10170       if (vop_start && vop_start < base_string)
10171         {
10172           if (check_VecOperations (vop_start, base_string) == NULL)
10173             return 0;
                /* The address part ends where the vector operations
                   begin.  */
10174           base_string = vop_start;
10175         }
10176
            /* Step back onto the last character of the address part,
               skipping one trailing blank.  */
10177       --base_string;
10178       if (is_space_char (*base_string))
10179         --base_string;
10180
10181       /* If we only have a displacement, set-up for it to be parsed later.  */
10182       displacement_string_start = op_string;
10183       displacement_string_end = base_string + 1;
10184
10185       if (*base_string == ')')
10186         {
10187           char *temp_string;
10188           unsigned int parens_balanced = 1;
10189           /* We've already checked that the number of left & right ()'s are
10190              equal, so this loop will not be infinite.  */
                /* Walk backwards to the '(' matching the final ')'.  */
10191           do
10192             {
10193               base_string--;
10194               if (*base_string == ')')
10195                 parens_balanced++;
10196               if (*base_string == '(')
10197                 parens_balanced--;
10198             }
10199           while (parens_balanced);
10200
                /* Remember the '(': it ends the displacement if this turns
                   out to be base index form.  */
10201           temp_string = base_string;
10202
10203           /* Skip past '(' and whitespace.  */
10204           ++base_string;
10205           if (is_space_char (*base_string))
10206             ++base_string;
10207
                /* Either an empty base ("(,index...") or a base register
                   makes this base index form.  Otherwise, unless a bad
                   register name is diagnosed below, the parentheses are left
                   as part of the displacement expression.  */
10208           if (*base_string == ','
10209               || ((i.base_reg = parse_register (base_string, &end_op))
10210                   != NULL))
10211             {
10212               displacement_string_end = temp_string;
10213
10214               i.types[this_operand].bitfield.baseindex = 1;
10215
10216               if (i.base_reg)
10217                 {
10218                   base_string = end_op;
10219                   if (is_space_char (*base_string))
10220                     ++base_string;
10221                 }
10222
10223               /* There may be an index reg or scale factor here.  */
10224               if (*base_string == ',')
10225                 {
10226                   ++base_string;
10227                   if (is_space_char (*base_string))
10228                     ++base_string;
10229
10230                   if ((i.index_reg = parse_register (base_string, &end_op))
10231                       != NULL)
10232                     {
10233                       base_string = end_op;
10234                       if (is_space_char (*base_string))
10235                         ++base_string;
10236                       if (*base_string == ',')
10237                         {
10238                           ++base_string;
10239                           if (is_space_char (*base_string))
10240                             ++base_string;
10241                         }
10242                       else if (*base_string != ')')
10243                         {
10244                           as_bad (_("expecting `,' or `)' "
10245                                     "after index register in `%s'"),
10246                                   operand_string);
10247                           return 0;
10248                         }
10249                     }
10250                   else if (*base_string == REGISTER_PREFIX)
10251                     {
                            /* Cut the operand at the next ',' so that only the
                               offending register name is printed.  */
10252                       end_op = strchr (base_string, ',');
10253                       if (end_op)
10254                         *end_op = '\0';
10255                       as_bad (_("bad register name `%s'"), base_string);
10256                       return 0;
10257                     }
10258
10259                   /* Check for scale factor.  */
10260                   if (*base_string != ')')
10261                     {
10262                       char *end_scale = i386_scale (base_string);
10263
10264                       if (!end_scale)
10265                         return 0;
10266
10267                       base_string = end_scale;
10268                       if (is_space_char (*base_string))
10269                         ++base_string;
10270                       if (*base_string != ')')
10271                         {
10272                           as_bad (_("expecting `)' "
10273                                     "after scale factor in `%s'"),
10274                                   operand_string);
10275                           return 0;
10276                         }
10277                     }
10278                   else if (!i.index_reg)
10279                     {
10280                       as_bad (_("expecting index register or scale factor "
10281                                 "after `,'; got '%c'"),
10282                               *base_string);
10283                       return 0;
10284                     }
10285                 }
10286               else if (*base_string != ')')
10287                 {
10288                   as_bad (_("expecting `,' or `)' "
10289                             "after base register in `%s'"),
10290                           operand_string);
10291                   return 0;
10292                 }
10293             }
10294           else if (*base_string == REGISTER_PREFIX)
10295             {
                    /* Cut the operand at the next ',' so that only the
                       offending register name is printed.  */
10296               end_op = strchr (base_string, ',');
10297               if (end_op)
10298                 *end_op = '\0';
10299               as_bad (_("bad register name `%s'"), base_string);
10300               return 0;
10301             }
10302         }
10303
10304       /* If there's an expression beginning the operand, parse it,
10305          assuming displacement_string_start and
10306          displacement_string_end are meaningful.  */
10307       if (displacement_string_start != displacement_string_end)
10308         {
10309           if (!i386_displacement (displacement_string_start,
10310                                   displacement_string_end))
10311             return 0;
10312         }
10313
10314       /* Special case for (%dx) while doing input/output op.  */
            /* The operand simply takes the register's type and is not
               counted as a memory operand.  */
10315       if (i.base_reg
10316           && i.base_reg->reg_type.bitfield.inoutportreg
10317           && i.index_reg == 0
10318           && i.log2_scale_factor == 0
10319           && i.seg[i.mem_operands] == 0
10320           && !operand_type_check (i.types[this_operand], disp))
10321         {
10322           i.types[this_operand] = i.base_reg->reg_type;
10323           return 1;
10324         }
10325
10326       if (i386_index_check (operand_string) == 0)
10327         return 0;
10328       i.flags[this_operand] |= Operand_Mem;
            /* Keep a copy of the first memory operand's text;
               maybe_adjust_templates () re-checks it when a second memory
               operand narrows the template list.  */
10329       if (i.mem_operands == 0)
10330         i.memop1_string = xstrdup (operand_string);
10331       i.mem_operands++;
10332     }
10333   else
10334     {
10335       /* It's not a memory operand; argh!  */
10336       as_bad (_("invalid char %s beginning operand %d `%s'"),
10337               output_invalid (*op_string),
10338               this_operand + 1,
10339               op_string);
10340       return 0;
10341     }
10342   return 1;                     /* Normal return.  */
10343 }
10344 \f
10345 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10346    that an rs_machine_dependent frag may reach.  */
10347
10348 unsigned int
10349 i386_frag_max_var (fragS *frag)
10350 {
10351   /* The only relaxable frags are for jumps.
10352      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
10353   gas_assert (frag->fr_type == rs_machine_dependent);
10354   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10355 }
10356
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* Return non-zero if a reference to FR_SYMBOL can be resolved by the
   assembler, zero if it has to be left to a relocation.  FR_VAR is the
   relocation requested for the reference, or NO_RELOC; any value other
   than NO_RELOC and the two PLT32 relocations aborts once the symbol is
   known to be a default-visibility external one.  */
static int
elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
{
  int is_ifunc = (symbol_get_bfdsym (fr_symbol)->flags
                  & BSF_GNU_INDIRECT_FUNCTION) != 0;

  /* STT_GNU_IFUNC symbol must go through PLT.  */
  if (is_ifunc)
    return 0;

  /* Symbol may be weak or local.  */
  if (!S_IS_EXTERNAL (fr_symbol))
    return !S_IS_WEAK (fr_symbol);

  /* Global symbols with non-default visibility can't be preempted. */
  if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
    return 1;

  if (fr_var != NO_RELOC)
    {
      enum bfd_reloc_code_real reloc = (enum bfd_reloc_code_real) fr_var;

      /* Symbol with PLT relocation may be preempted. */
      if (reloc == BFD_RELOC_386_PLT32 || reloc == BFD_RELOC_X86_64_PLT32)
        return 0;

      abort ();
    }

  /* Global symbols with default visibility in a shared library may be
     preempted by another definition.  */
  return !shared;
}
#endif
10390
/* md_estimate_size_before_relax()

   Called just before relax() for rs_machine_dependent frags.  The x86
   assembler uses these frags to handle variable size jump
   instructions.

   Any symbol that is now undefined will not become defined.
   Return the correct fr_subtype in the frag.
   Return the initial "guess for variable size of frag" to caller.
   The guess is actually the growth beyond the fixed part.  Whatever
   we do to grow the fixed or variable part contributes to our
   returned value.

   FRAGP is the jump frag and SEGMENT the segment being relaxed.  If
   the jump target cannot be resolved within SEGMENT, the jump is
   rewritten here, a fixup is attached, the frag is passed to
   frag_wane and the number of bytes added to fr_fix is returned.
   Otherwise the rlx_length that md_relax_table records for the
   current fr_subtype is returned.  */

int
md_estimate_size_before_relax (fragS *fragP, segT segment)
{
  /* We've already got fragP->fr_subtype right;  all we have to do is
     check for un-relaxable symbols.  On an ELF system, we can't relax
     an externally visible symbol, because it may be overridden by a
     shared library.  */
  if (S_GET_SEGMENT (fragP->fr_symbol) != segment
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
      || (IS_ELF
          && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
                                                fragP->fr_var))
#endif
#if defined (OBJ_COFF) && defined (TE_PE)
      || (OUTPUT_FLAVOR == bfd_target_coff_flavour
          && S_IS_WEAK (fragP->fr_symbol))
#endif
      )
    {
      /* Symbol is undefined in this segment, or we need to keep a
         reloc so that weak symbols can be overridden.  */
      /* Displacement width in bytes: 2 when the CODE16 bit is set in
         the subtype, 4 otherwise.  */
      int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
      enum bfd_reloc_code_real reloc_type;
      unsigned char *opcode;
      int old_fr_fix;

      /* Pick the relocation for the long forms: an explicitly
         requested one (held in fr_var) wins, then the 16-bit
         pc-relative one for 2-byte displacements, then PLT32 when
         need_plt32_p says so, and finally plain 32-bit pc-relative.  */
      if (fragP->fr_var != NO_RELOC)
        reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
      else if (size == 2)
        reloc_type = BFD_RELOC_16_PCREL;
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
      else if (need_plt32_p (fragP->fr_symbol))
        reloc_type = BFD_RELOC_X86_64_PLT32;
#endif
      else
        reloc_type = BFD_RELOC_32_PCREL;

      /* Remember the fixed size on entry; the return value is the
         growth relative to it.  */
      old_fr_fix = fragP->fr_fix;
      opcode = (unsigned char *) fragP->fr_opcode;

      switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
        {
        case UNCOND_JUMP:
          /* Make jmp (0xeb) a (d)word displacement jump.  */
          opcode[0] = 0xe9;
          fragP->fr_fix += size;
          fix_new (fragP, old_fr_fix, size,
                   fragP->fr_symbol,
                   fragP->fr_offset, 1,
                   reloc_type);
          break;

        case COND_JUMP86:
          if (size == 2
              && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
            {
              /* Negate the condition, and branch past an
                 unconditional jump.  */
              opcode[0] ^= 1;
              /* Displacement 3 skips the jump inserted below: one
                 opcode byte plus its two byte offset.  */
              opcode[1] = 3;
              /* Insert an unconditional jump.  */
              opcode[2] = 0xe9;
              /* We added two extra opcode bytes, and have a two byte
                 offset.  */
              fragP->fr_fix += 2 + 2;
              fix_new (fragP, old_fr_fix + 2, 2,
                       fragP->fr_symbol,
                       fragP->fr_offset, 1,
                       reloc_type);
              break;
            }
          /* Fall through.  */

        case COND_JUMP:
          /* With promotion of conditional jumps disabled and no
             explicit relocation requested, keep the short form and
             attach a signed 8-bit pc-relative fixup instead.  */
          if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
            {
              fixS *fixP;

              fragP->fr_fix += 1;
              fixP = fix_new (fragP, old_fr_fix, 1,
                              fragP->fr_symbol,
                              fragP->fr_offset, 1,
                              BFD_RELOC_8_PCREL);
              fixP->fx_signed = 1;
              break;
            }

          /* This changes the byte-displacement jump 0x7N
             to the (d)word-displacement jump 0x0f,0x8N.  */
          opcode[1] = opcode[0] + 0x10;
          opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
          /* We've added an opcode byte.  */
          fragP->fr_fix += 1 + size;
          fix_new (fragP, old_fr_fix + 1, size,
                   fragP->fr_symbol,
                   fragP->fr_offset, 1,
                   reloc_type);
          break;

        default:
          BAD_CASE (fragP->fr_subtype);
          break;
        }
      /* The frag now has its final contents; hand it to frag_wane and
         report how much the fixed part grew.  */
      frag_wane (fragP);
      return fragP->fr_fix - old_fr_fix;
    }

  /* Guess size depending on current relax state.  Initially the relax
     state will correspond to a short jump and we return 1, because
     the variable part of the frag (the branch offset) is one byte
     long.  However, we can relax a section more than once and in that
     case we must either set fr_subtype back to the unrelaxed state,
     or return the value for the appropriate branch.  */
  return md_relax_table[fragP->fr_subtype].rlx_length;
}
10519
10520 /* Called after relax() is finished.
10521
10522    In:  Address of frag.
10523         fr_type == rs_machine_dependent.
10524         fr_subtype is what the address relaxed to.
10525
10526    Out: Any fixSs and constants are set up.
10527         Caller will turn frag into a ".space 0".  */
10528
10529 void
10530 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
10531                  fragS *fragP)
10532 {
10533   unsigned char *opcode;
10534   unsigned char *where_to_put_displacement = NULL;
10535   offsetT target_address;
10536   offsetT opcode_address;
10537   unsigned int extension = 0;
10538   offsetT displacement_from_opcode_start;
10539
10540   opcode = (unsigned char *) fragP->fr_opcode;
10541
10542   /* Address we want to reach in file space.  */
10543   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
10544
10545   /* Address opcode resides at in file space.  */
10546   opcode_address = fragP->fr_address + fragP->fr_fix;
10547
10548   /* Displacement from opcode start to fill into instruction.  */
10549   displacement_from_opcode_start = target_address - opcode_address;
10550
10551   if ((fragP->fr_subtype & BIG) == 0)
10552     {
10553       /* Don't have to change opcode.  */
10554       extension = 1;            /* 1 opcode + 1 displacement  */
10555       where_to_put_displacement = &opcode[1];
10556     }
10557   else
10558     {
10559       if (no_cond_jump_promotion
10560           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
10561         as_warn_where (fragP->fr_file, fragP->fr_line,
10562                        _("long jump required"));
10563
10564       switch (fragP->fr_subtype)
10565         {
10566         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
10567           extension = 4;                /* 1 opcode + 4 displacement  */
10568           opcode[0] = 0xe9;
10569           where_to_put_displacement = &opcode[1];
10570           break;
10571
10572         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
10573           extension = 2;                /* 1 opcode + 2 displacement  */
10574           opcode[0] = 0xe9;
10575           where_to_put_displacement = &opcode[1];
10576           break;
10577
10578         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
10579         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
10580           extension = 5;                /* 2 opcode + 4 displacement  */
10581           opcode[1] = opcode[0] + 0x10;
10582           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10583           where_to_put_displacement = &opcode[2];
10584           break;
10585
10586         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
10587           extension = 3;                /* 2 opcode + 2 displacement  */
10588           opcode[1] = opcode[0] + 0x10;
10589           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10590           where_to_put_displacement = &opcode[2];
10591           break;
10592
10593         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
10594           extension = 4;
10595           opcode[0] ^= 1;
10596           opcode[1] = 3;
10597           opcode[2] = 0xe9;
10598           where_to_put_displacement = &opcode[3];
10599           break;
10600
10601         default:
10602           BAD_CASE (fragP->fr_subtype);
10603           break;
10604         }
10605     }
10606
10607   /* If size if less then four we are sure that the operand fits,
10608      but if it's 4, then it could be that the displacement is larger
10609      then -/+ 2GB.  */
10610   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
10611       && object_64bit
10612       && ((addressT) (displacement_from_opcode_start - extension
10613                       + ((addressT) 1 << 31))
10614           > (((addressT) 2 << 31) - 1)))
10615     {
10616       as_bad_where (fragP->fr_file, fragP->fr_line,
10617                     _("jump target out of range"));
10618       /* Make us emit 0.  */
10619       displacement_from_opcode_start = extension;
10620     }
10621   /* Now put displacement after opcode.  */
10622   md_number_to_chars ((char *) where_to_put_displacement,
10623                       (valueT) (displacement_from_opcode_start - extension),
10624                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
10625   fragP->fr_fix += extension;
10626 }
10627 \f
/* Apply a fixup (fixP) to segment data, once it has been determined
   by our caller that we have all the info we need to fix it up.

   Parameter valP is the pointer to the value of the bits.

   On the 386, immediates, displacements, and data pointers are all in
   the same (little-endian) format, so we don't need to care about which
   we are handling.

   Unless TE_Mach is defined, the value is first adjusted for
   pc-relative and target specific conventions and written back
   through valP.  Finally fx_size bytes are stored into the frag at
   fx_where; a zero is stored instead, with the value saved in
   fx_addnumber, when the fixup has a symbol and RELA relocations are
   in use (or, for PE, when the symbol is weak).  */

void
md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
{
  /* Location inside the frag that receives the value.  */
  char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
  valueT value = *valP;

#if !defined (TE_Mach)
  /* A pc-relative fixup still carrying an absolute relocation type is
     switched to the pc-relative type of the same width.  */
  if (fixP->fx_pcrel)
    {
      switch (fixP->fx_r_type)
        {
        default:
          break;

        case BFD_RELOC_64:
          fixP->fx_r_type = BFD_RELOC_64_PCREL;
          break;
        case BFD_RELOC_32:
        case BFD_RELOC_X86_64_32S:
          fixP->fx_r_type = BFD_RELOC_32_PCREL;
          break;
        case BFD_RELOC_16:
          fixP->fx_r_type = BFD_RELOC_16_PCREL;
          break;
        case BFD_RELOC_8:
          fixP->fx_r_type = BFD_RELOC_8_PCREL;
          break;
        }
    }

  /* The adjustments below only concern pc-relative relocations
     against a symbol when RELA relocations are not in use.  */
  if (fixP->fx_addsy != NULL
      && (fixP->fx_r_type == BFD_RELOC_32_PCREL
          || fixP->fx_r_type == BFD_RELOC_64_PCREL
          || fixP->fx_r_type == BFD_RELOC_16_PCREL
          || fixP->fx_r_type == BFD_RELOC_8_PCREL)
      && !use_rela_relocations)
    {
      /* This is a hack.  There should be a better way to handle this.
         This covers for the fact that bfd_install_relocation will
         subtract the current location (for partial_inplace, PC relative
         relocations); see more below.  */
#ifndef OBJ_AOUT
      if (IS_ELF
#ifdef TE_PE
          || OUTPUT_FLAVOR == bfd_target_coff_flavour
#endif
          )
        value += fixP->fx_where + fixP->fx_frag->fr_address;
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
      if (IS_ELF)
        {
          segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);

          if ((sym_seg == seg
               || (symbol_section_p (fixP->fx_addsy)
                   && sym_seg != absolute_section))
              && !generic_force_reloc (fixP))
            {
              /* Yes, we add the values in twice.  This is because
                 bfd_install_relocation subtracts them out again.  I think
                 bfd_install_relocation is broken, but I don't dare change
                 it.  FIXME.  */
              value += fixP->fx_where + fixP->fx_frag->fr_address;
            }
        }
#endif
#if defined (OBJ_COFF) && defined (TE_PE)
      /* For some reason, the PE format does not store a
         section address offset for a PC relative symbol.  */
      if (S_GET_SEGMENT (fixP->fx_addsy) != seg
          || S_IS_WEAK (fixP->fx_addsy))
        value += md_pcrel_from (fixP);
#endif
    }
#if defined (OBJ_COFF) && defined (TE_PE)
  if (fixP->fx_addsy != NULL
      && S_IS_WEAK (fixP->fx_addsy)
      /* PR 16858: Do not modify weak function references.  */
      && ! fixP->fx_pcrel)
    {
#if !defined (TE_PEP)
      /* For x86 PE weak function symbols are neither PC-relative
         nor do they set S_IS_FUNCTION.  So the only reliable way
         to detect them is to check the flags of their containing
         section.  */
      if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
          && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
        ;
      else
#endif
      /* Any other weak symbol has its own value taken out again.  */
      value -= S_GET_VALUE (fixP->fx_addsy);
    }
#endif

  /* Fix a few things - the dynamic linker expects certain values here,
     and we must not disappoint it.  */
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  if (IS_ELF && fixP->fx_addsy)
    switch (fixP->fx_r_type)
      {
      case BFD_RELOC_386_PLT32:
      case BFD_RELOC_X86_64_PLT32:
        /* Make the jump instruction point to the address of the operand.
           At runtime we merely add the offset to the actual PLT entry.
           NB: Subtract the offset size only for jump instructions.  */
        if (fixP->fx_pcrel)
          value = -4;
        break;

      case BFD_RELOC_386_TLS_GD:
      case BFD_RELOC_386_TLS_LDM:
      case BFD_RELOC_386_TLS_IE_32:
      case BFD_RELOC_386_TLS_IE:
      case BFD_RELOC_386_TLS_GOTIE:
      case BFD_RELOC_386_TLS_GOTDESC:
      case BFD_RELOC_X86_64_TLSGD:
      case BFD_RELOC_X86_64_TLSLD:
      case BFD_RELOC_X86_64_GOTTPOFF:
      case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
        value = 0; /* Fully resolved at runtime.  No addend.  */
        /* Fallthrough */
      case BFD_RELOC_386_TLS_LE:
      case BFD_RELOC_386_TLS_LDO_32:
      case BFD_RELOC_386_TLS_LE_32:
      case BFD_RELOC_X86_64_DTPOFF32:
      case BFD_RELOC_X86_64_DTPOFF64:
      case BFD_RELOC_X86_64_TPOFF32:
      case BFD_RELOC_X86_64_TPOFF64:
        /* Every TLS relocation marks its symbol as thread local.  */
        S_SET_THREAD_LOCAL (fixP->fx_addsy);
        break;

      case BFD_RELOC_386_TLS_DESC_CALL:
      case BFD_RELOC_X86_64_TLSDESC_CALL:
        value = 0; /* Fully resolved at runtime.  No addend.  */
        S_SET_THREAD_LOCAL (fixP->fx_addsy);
        /* Keep the relocation and return without storing anything
           into the frag or through valP.  */
        fixP->fx_done = 0;
        return;

      case BFD_RELOC_VTABLE_INHERIT:
      case BFD_RELOC_VTABLE_ENTRY:
        /* Likewise kept as relocations; nothing is stored.  */
        fixP->fx_done = 0;
        return;

      default:
        break;
      }
#endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
  /* Hand the adjusted value back to the caller.  */
  *valP = value;
#endif /* !defined (TE_Mach)  */

  /* Are we finished with this relocation now?  */
  if (fixP->fx_addsy == NULL)
    fixP->fx_done = 1;
#if defined (OBJ_COFF) && defined (TE_PE)
  else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
    {
      fixP->fx_done = 0;
      /* Remember value for tc_gen_reloc.  */
      fixP->fx_addnumber = value;
      /* Clear out the frag for now.  */
      value = 0;
    }
#endif
  else if (use_rela_relocations)
    {
      fixP->fx_no_overflow = 1;
      /* Remember value for tc_gen_reloc.  */
      fixP->fx_addnumber = value;
      /* Zero is stored in the frag itself.  */
      value = 0;
    }

  /* Store the (possibly zeroed) value into the frag.  */
  md_number_to_chars (p, value, fixP->fx_size);
}
10811 \f
10812 const char *
10813 md_atof (int type, char *litP, int *sizeP)
10814 {
10815   /* This outputs the LITTLENUMs in REVERSE order;
10816      in accord with the bigendian 386.  */
10817   return ieee_md_atof (type, litP, sizeP, FALSE);
10818 }
10819 \f
/* Scratch buffer holding the text produced by output_invalid.  */
static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];

/* Render character C for use in a diagnostic: in single quotes when
   ISPRINT accepts it, otherwise as a parenthesized hex byte.  The
   returned string lives in a static buffer that the next call
   overwrites.  */

static char *
output_invalid (int c)
{
  if (!ISPRINT (c))
    {
      snprintf (output_invalid_buf, sizeof (output_invalid_buf),
                "(0x%x)", (unsigned char) c);
      return output_invalid_buf;
    }

  snprintf (output_invalid_buf, sizeof (output_invalid_buf),
            "'%c'", c);
  return output_invalid_buf;
}
10833
10834 /* REG_STRING starts *before* REGISTER_PREFIX.  */
10835
10836 static const reg_entry *
10837 parse_real_register (char *reg_string, char **end_op)
10838 {
10839   char *s = reg_string;
10840   char *p;
10841   char reg_name_given[MAX_REG_NAME_SIZE + 1];
10842   const reg_entry *r;
10843
10844   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
10845   if (*s == REGISTER_PREFIX)
10846     ++s;
10847
10848   if (is_space_char (*s))
10849     ++s;
10850
10851   p = reg_name_given;
10852   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10853     {
10854       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10855         return (const reg_entry *) NULL;
10856       s++;
10857     }
10858
10859   /* For naked regs, make sure that we are not dealing with an identifier.
10860      This prevents confusing an identifier like `eax_var' with register
10861      `eax'.  */
10862   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10863     return (const reg_entry *) NULL;
10864
10865   *end_op = s;
10866
10867   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10868
10869   /* Handle floating point regs, allowing spaces in the (i) part.  */
10870   if (r == i386_regtab /* %st is first entry of table  */)
10871     {
10872       if (!cpu_arch_flags.bitfield.cpu8087
10873           && !cpu_arch_flags.bitfield.cpu287
10874           && !cpu_arch_flags.bitfield.cpu387)
10875         return (const reg_entry *) NULL;
10876
10877       if (is_space_char (*s))
10878         ++s;
10879       if (*s == '(')
10880         {
10881           ++s;
10882           if (is_space_char (*s))
10883             ++s;
10884           if (*s >= '0' && *s <= '7')
10885             {
10886               int fpr = *s - '0';
10887               ++s;
10888               if (is_space_char (*s))
10889                 ++s;
10890               if (*s == ')')
10891                 {
10892                   *end_op = s + 1;
10893                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10894                   know (r);
10895                   return r + fpr;
10896                 }
10897             }
10898           /* We have "%st(" then garbage.  */
10899           return (const reg_entry *) NULL;
10900         }
10901     }
10902
10903   if (r == NULL || allow_pseudo_reg)
10904     return r;
10905
10906   if (operand_type_all_zero (&r->reg_type))
10907     return (const reg_entry *) NULL;
10908
10909   if ((r->reg_type.bitfield.dword
10910        || (r->reg_type.bitfield.sreg && r->reg_num > 3)
10911        || r->reg_type.bitfield.control
10912        || r->reg_type.bitfield.debug
10913        || r->reg_type.bitfield.test)
10914       && !cpu_arch_flags.bitfield.cpui386)
10915     return (const reg_entry *) NULL;
10916
10917   if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
10918     return (const reg_entry *) NULL;
10919
10920   if (!cpu_arch_flags.bitfield.cpuavx512f)
10921     {
10922       if (r->reg_type.bitfield.zmmword || r->reg_type.bitfield.regmask)
10923         return (const reg_entry *) NULL;
10924
10925       if (!cpu_arch_flags.bitfield.cpuavx)
10926         {
10927           if (r->reg_type.bitfield.ymmword)
10928             return (const reg_entry *) NULL;
10929
10930           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10931             return (const reg_entry *) NULL;
10932         }
10933     }
10934
10935   if (r->reg_type.bitfield.regbnd && !cpu_arch_flags.bitfield.cpumpx)
10936     return (const reg_entry *) NULL;
10937
10938   /* Don't allow fake index register unless allow_index_reg isn't 0. */
10939   if (!allow_index_reg && r->reg_num == RegIZ)
10940     return (const reg_entry *) NULL;
10941
10942   /* Upper 16 vector registers are only available with VREX in 64bit
10943      mode, and require EVEX encoding.  */
10944   if (r->reg_flags & RegVRex)
10945     {
10946       if (!cpu_arch_flags.bitfield.cpuavx512f
10947           || flag_code != CODE_64BIT)
10948         return (const reg_entry *) NULL;
10949
10950       i.vec_encoding = vex_encoding_evex;
10951     }
10952
10953   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10954       && (!cpu_arch_flags.bitfield.cpulm || !r->reg_type.bitfield.control)
10955       && flag_code != CODE_64BIT)
10956     return (const reg_entry *) NULL;
10957
10958   if (r->reg_type.bitfield.sreg && r->reg_num == RegFlat && !intel_syntax)
10959     return (const reg_entry *) NULL;
10960
10961   return r;
10962 }
10963
10964 /* REG_STRING starts *before* REGISTER_PREFIX.  */
10965
10966 static const reg_entry *
10967 parse_register (char *reg_string, char **end_op)
10968 {
10969   const reg_entry *r;
10970
10971   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10972     r = parse_real_register (reg_string, end_op);
10973   else
10974     r = NULL;
10975   if (!r)
10976     {
10977       char *save = input_line_pointer;
10978       char c;
10979       symbolS *symbolP;
10980
10981       input_line_pointer = reg_string;
10982       c = get_symbol_name (&reg_string);
10983       symbolP = symbol_find (reg_string);
10984       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10985         {
10986           const expressionS *e = symbol_get_value_expression (symbolP);
10987
10988           know (e->X_op == O_register);
10989           know (e->X_add_number >= 0
10990                 && (valueT) e->X_add_number < i386_regtab_size);
10991           r = i386_regtab + e->X_add_number;
10992           if ((r->reg_flags & RegVRex))
10993             i.vec_encoding = vex_encoding_evex;
10994           *end_op = input_line_pointer;
10995         }
10996       *input_line_pointer = c;
10997       input_line_pointer = save;
10998     }
10999   return r;
11000 }
11001
11002 int
11003 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11004 {
11005   const reg_entry *r;
11006   char *end = input_line_pointer;
11007
11008   *end = *nextcharP;
11009   r = parse_register (name, &input_line_pointer);
11010   if (r && end <= input_line_pointer)
11011     {
11012       *nextcharP = *input_line_pointer;
11013       *input_line_pointer = 0;
11014       e->X_op = O_register;
11015       e->X_add_number = r - i386_regtab;
11016       return 1;
11017     }
11018   input_line_pointer = end;
11019   *end = 0;
11020   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11021 }
11022
11023 void
11024 md_operand (expressionS *e)
11025 {
11026   char *end;
11027   const reg_entry *r;
11028
11029   switch (*input_line_pointer)
11030     {
11031     case REGISTER_PREFIX:
11032       r = parse_real_register (input_line_pointer, &end);
11033       if (r)
11034         {
11035           e->X_op = O_register;
11036           e->X_add_number = r - i386_regtab;
11037           input_line_pointer = end;
11038         }
11039       break;
11040
11041     case '[':
11042       gas_assert (intel_syntax);
11043       end = input_line_pointer++;
11044       expression (e);
11045       if (*input_line_pointer == ']')
11046         {
11047           ++input_line_pointer;
11048           e->X_op_symbol = make_expr_symbol (e);
11049           e->X_add_symbol = NULL;
11050           e->X_add_number = 0;
11051           e->X_op = O_index;
11052         }
11053       else
11054         {
11055           e->X_op = O_absent;
11056           input_line_pointer = end;
11057         }
11058       break;
11059     }
11060 }
11061
11062 \f
/* Short options of this target.  ELF-capable builds additionally list
   k, V, Q (which takes an argument) and s; md_parse_option has cases
   for those letters only under the same condition.  */
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
const char *md_shortopts = "kVQ:sqnO::";
#else
const char *md_shortopts = "qnO::";
#endif

/* Codes for the long options below, numbered upwards from
   OPTION_MD_BASE.  These are the values md_parse_option switches
   on.  */
#define OPTION_32 (OPTION_MD_BASE + 0)
#define OPTION_64 (OPTION_MD_BASE + 1)
#define OPTION_DIVIDE (OPTION_MD_BASE + 2)
#define OPTION_MARCH (OPTION_MD_BASE + 3)
#define OPTION_MTUNE (OPTION_MD_BASE + 4)
#define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
#define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
#define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
#define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
#define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
#define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
#define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
#define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
#define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
#define OPTION_X32 (OPTION_MD_BASE + 14)
#define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
#define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
#define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
#define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
#define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
#define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
#define OPTION_MSHARED (OPTION_MD_BASE + 21)
#define OPTION_MAMD64 (OPTION_MD_BASE + 22)
#define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
#define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
#define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
#define OPTION_MVEXWIG (OPTION_MD_BASE + 26)

/* Long options of this target: name, whether an argument is taken, and
   the OPTION_* code of the entry.  Entries inside #if blocks exist
   only for the object formats and targets named there.  The all-NULL
   entry terminates the table.  */
struct option md_longopts[] =
{
  {"32", no_argument, NULL, OPTION_32},
#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
  {"64", no_argument, NULL, OPTION_64},
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  {"x32", no_argument, NULL, OPTION_X32},
  {"mshared", no_argument, NULL, OPTION_MSHARED},
  {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
#endif
  {"divide", no_argument, NULL, OPTION_DIVIDE},
  {"march", required_argument, NULL, OPTION_MARCH},
  {"mtune", required_argument, NULL, OPTION_MTUNE},
  {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
  {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
  {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
  {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
  {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
  {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
  {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
  {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
  {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
  {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
  {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
  {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
# if defined (TE_PE) || defined (TE_PEP)
  {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
#endif
  {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
  {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
  {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
  {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
  {"mamd64", no_argument, NULL, OPTION_MAMD64},
  {"mintel64", no_argument, NULL, OPTION_MINTEL64},
  {NULL, no_argument, NULL, 0}
};
/* Size of the whole table in bytes (not the number of entries).  */
size_t md_longopts_size = sizeof (md_longopts);
11136
11137 int
11138 md_parse_option (int c, const char *arg)
11139 {
11140   unsigned int j;
11141   char *arch, *next, *saved;
11142
11143   switch (c)
11144     {
11145     case 'n':
11146       optimize_align_code = 0;
11147       break;
11148
11149     case 'q':
11150       quiet_warnings = 1;
11151       break;
11152
11153 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11154       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
11155          should be emitted or not.  FIXME: Not implemented.  */
11156     case 'Q':
11157       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
11158         return 0;
11159       break;
11160
11161       /* -V: SVR4 argument to print version ID.  */
11162     case 'V':
11163       print_version_id ();
11164       break;
11165
11166       /* -k: Ignore for FreeBSD compatibility.  */
11167     case 'k':
11168       break;
11169
11170     case 's':
11171       /* -s: On i386 Solaris, this tells the native assembler to use
11172          .stab instead of .stab.excl.  We always use .stab anyhow.  */
11173       break;
11174
11175     case OPTION_MSHARED:
11176       shared = 1;
11177       break;
11178
11179     case OPTION_X86_USED_NOTE:
11180       if (strcasecmp (arg, "yes") == 0)
11181         x86_used_note = 1;
11182       else if (strcasecmp (arg, "no") == 0)
11183         x86_used_note = 0;
11184       else
11185         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
11186       break;
11187
11188
11189 #endif
11190 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11191      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11192     case OPTION_64:
11193       {
11194         const char **list, **l;
11195
11196         list = bfd_target_list ();
11197         for (l = list; *l != NULL; l++)
11198           if (CONST_STRNEQ (*l, "elf64-x86-64")
11199               || strcmp (*l, "coff-x86-64") == 0
11200               || strcmp (*l, "pe-x86-64") == 0
11201               || strcmp (*l, "pei-x86-64") == 0
11202               || strcmp (*l, "mach-o-x86-64") == 0)
11203             {
11204               default_arch = "x86_64";
11205               break;
11206             }
11207         if (*l == NULL)
11208           as_fatal (_("no compiled in support for x86_64"));
11209         free (list);
11210       }
11211       break;
11212 #endif
11213
11214 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11215     case OPTION_X32:
11216       if (IS_ELF)
11217         {
11218           const char **list, **l;
11219
11220           list = bfd_target_list ();
11221           for (l = list; *l != NULL; l++)
11222             if (CONST_STRNEQ (*l, "elf32-x86-64"))
11223               {
11224                 default_arch = "x86_64:32";
11225                 break;
11226               }
11227           if (*l == NULL)
11228             as_fatal (_("no compiled in support for 32bit x86_64"));
11229           free (list);
11230         }
11231       else
11232         as_fatal (_("32bit x86_64 is only supported for ELF"));
11233       break;
11234 #endif
11235
11236     case OPTION_32:
11237       default_arch = "i386";
11238       break;
11239
11240     case OPTION_DIVIDE:
11241 #ifdef SVR4_COMMENT_CHARS
11242       {
11243         char *n, *t;
11244         const char *s;
11245
11246         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
11247         t = n;
11248         for (s = i386_comment_chars; *s != '\0'; s++)
11249           if (*s != '/')
11250             *t++ = *s;
11251         *t = '\0';
11252         i386_comment_chars = n;
11253       }
11254 #endif
11255       break;
11256
11257     case OPTION_MARCH:
11258       saved = xstrdup (arg);
11259       arch = saved;
11260       /* Allow -march=+nosse.  */
11261       if (*arch == '+')
11262         arch++;
11263       do
11264         {
11265           if (*arch == '.')
11266             as_fatal (_("invalid -march= option: `%s'"), arg);
11267           next = strchr (arch, '+');
11268           if (next)
11269             *next++ = '\0';
11270           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11271             {
11272               if (strcmp (arch, cpu_arch [j].name) == 0)
11273                 {
11274                   /* Processor.  */
11275                   if (! cpu_arch[j].flags.bitfield.cpui386)
11276                     continue;
11277
11278                   cpu_arch_name = cpu_arch[j].name;
11279                   cpu_sub_arch_name = NULL;
11280                   cpu_arch_flags = cpu_arch[j].flags;
11281                   cpu_arch_isa = cpu_arch[j].type;
11282                   cpu_arch_isa_flags = cpu_arch[j].flags;
11283                   if (!cpu_arch_tune_set)
11284                     {
11285                       cpu_arch_tune = cpu_arch_isa;
11286                       cpu_arch_tune_flags = cpu_arch_isa_flags;
11287                     }
11288                   break;
11289                 }
11290               else if (*cpu_arch [j].name == '.'
11291                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
11292                 {
11293                   /* ISA extension.  */
11294                   i386_cpu_flags flags;
11295
11296                   flags = cpu_flags_or (cpu_arch_flags,
11297                                         cpu_arch[j].flags);
11298
11299                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11300                     {
11301                       if (cpu_sub_arch_name)
11302                         {
11303                           char *name = cpu_sub_arch_name;
11304                           cpu_sub_arch_name = concat (name,
11305                                                       cpu_arch[j].name,
11306                                                       (const char *) NULL);
11307                           free (name);
11308                         }
11309                       else
11310                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
11311                       cpu_arch_flags = flags;
11312                       cpu_arch_isa_flags = flags;
11313                     }
11314                   else
11315                     cpu_arch_isa_flags
11316                       = cpu_flags_or (cpu_arch_isa_flags,
11317                                       cpu_arch[j].flags);
11318                   break;
11319                 }
11320             }
11321
11322           if (j >= ARRAY_SIZE (cpu_arch))
11323             {
11324               /* Disable an ISA extension.  */
11325               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11326                 if (strcmp (arch, cpu_noarch [j].name) == 0)
11327                   {
11328                     i386_cpu_flags flags;
11329
11330                     flags = cpu_flags_and_not (cpu_arch_flags,
11331                                                cpu_noarch[j].flags);
11332                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11333                       {
11334                         if (cpu_sub_arch_name)
11335                           {
11336                             char *name = cpu_sub_arch_name;
11337                             cpu_sub_arch_name = concat (arch,
11338                                                         (const char *) NULL);
11339                             free (name);
11340                           }
11341                         else
11342                           cpu_sub_arch_name = xstrdup (arch);
11343                         cpu_arch_flags = flags;
11344                         cpu_arch_isa_flags = flags;
11345                       }
11346                     break;
11347                   }
11348
11349               if (j >= ARRAY_SIZE (cpu_noarch))
11350                 j = ARRAY_SIZE (cpu_arch);
11351             }
11352
11353           if (j >= ARRAY_SIZE (cpu_arch))
11354             as_fatal (_("invalid -march= option: `%s'"), arg);
11355
11356           arch = next;
11357         }
11358       while (next != NULL);
11359       free (saved);
11360       break;
11361
11362     case OPTION_MTUNE:
11363       if (*arg == '.')
11364         as_fatal (_("invalid -mtune= option: `%s'"), arg);
11365       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11366         {
11367           if (strcmp (arg, cpu_arch [j].name) == 0)
11368             {
11369               cpu_arch_tune_set = 1;
11370               cpu_arch_tune = cpu_arch [j].type;
11371               cpu_arch_tune_flags = cpu_arch[j].flags;
11372               break;
11373             }
11374         }
11375       if (j >= ARRAY_SIZE (cpu_arch))
11376         as_fatal (_("invalid -mtune= option: `%s'"), arg);
11377       break;
11378
11379     case OPTION_MMNEMONIC:
11380       if (strcasecmp (arg, "att") == 0)
11381         intel_mnemonic = 0;
11382       else if (strcasecmp (arg, "intel") == 0)
11383         intel_mnemonic = 1;
11384       else
11385         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
11386       break;
11387
11388     case OPTION_MSYNTAX:
11389       if (strcasecmp (arg, "att") == 0)
11390         intel_syntax = 0;
11391       else if (strcasecmp (arg, "intel") == 0)
11392         intel_syntax = 1;
11393       else
11394         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
11395       break;
11396
11397     case OPTION_MINDEX_REG:
11398       allow_index_reg = 1;
11399       break;
11400
11401     case OPTION_MNAKED_REG:
11402       allow_naked_reg = 1;
11403       break;
11404
11405     case OPTION_MSSE2AVX:
11406       sse2avx = 1;
11407       break;
11408
11409     case OPTION_MSSE_CHECK:
11410       if (strcasecmp (arg, "error") == 0)
11411         sse_check = check_error;
11412       else if (strcasecmp (arg, "warning") == 0)
11413         sse_check = check_warning;
11414       else if (strcasecmp (arg, "none") == 0)
11415         sse_check = check_none;
11416       else
11417         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
11418       break;
11419
11420     case OPTION_MOPERAND_CHECK:
11421       if (strcasecmp (arg, "error") == 0)
11422         operand_check = check_error;
11423       else if (strcasecmp (arg, "warning") == 0)
11424         operand_check = check_warning;
11425       else if (strcasecmp (arg, "none") == 0)
11426         operand_check = check_none;
11427       else
11428         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
11429       break;
11430
11431     case OPTION_MAVXSCALAR:
11432       if (strcasecmp (arg, "128") == 0)
11433         avxscalar = vex128;
11434       else if (strcasecmp (arg, "256") == 0)
11435         avxscalar = vex256;
11436       else
11437         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
11438       break;
11439
11440     case OPTION_MVEXWIG:
11441       if (strcmp (arg, "0") == 0)
11442         vexwig = vexw0;
11443       else if (strcmp (arg, "1") == 0)
11444         vexwig = vexw1;
11445       else
11446         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
11447       break;
11448
11449     case OPTION_MADD_BND_PREFIX:
11450       add_bnd_prefix = 1;
11451       break;
11452
11453     case OPTION_MEVEXLIG:
11454       if (strcmp (arg, "128") == 0)
11455         evexlig = evexl128;
11456       else if (strcmp (arg, "256") == 0)
11457         evexlig = evexl256;
11458       else  if (strcmp (arg, "512") == 0)
11459         evexlig = evexl512;
11460       else
11461         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
11462       break;
11463
11464     case OPTION_MEVEXRCIG:
11465       if (strcmp (arg, "rne") == 0)
11466         evexrcig = rne;
11467       else if (strcmp (arg, "rd") == 0)
11468         evexrcig = rd;
11469       else if (strcmp (arg, "ru") == 0)
11470         evexrcig = ru;
11471       else if (strcmp (arg, "rz") == 0)
11472         evexrcig = rz;
11473       else
11474         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
11475       break;
11476
11477     case OPTION_MEVEXWIG:
11478       if (strcmp (arg, "0") == 0)
11479         evexwig = evexw0;
11480       else if (strcmp (arg, "1") == 0)
11481         evexwig = evexw1;
11482       else
11483         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
11484       break;
11485
11486 # if defined (TE_PE) || defined (TE_PEP)
11487     case OPTION_MBIG_OBJ:
11488       use_big_obj = 1;
11489       break;
11490 #endif
11491
11492     case OPTION_MOMIT_LOCK_PREFIX:
11493       if (strcasecmp (arg, "yes") == 0)
11494         omit_lock_prefix = 1;
11495       else if (strcasecmp (arg, "no") == 0)
11496         omit_lock_prefix = 0;
11497       else
11498         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
11499       break;
11500
11501     case OPTION_MFENCE_AS_LOCK_ADD:
11502       if (strcasecmp (arg, "yes") == 0)
11503         avoid_fence = 1;
11504       else if (strcasecmp (arg, "no") == 0)
11505         avoid_fence = 0;
11506       else
11507         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
11508       break;
11509
11510     case OPTION_MRELAX_RELOCATIONS:
11511       if (strcasecmp (arg, "yes") == 0)
11512         generate_relax_relocations = 1;
11513       else if (strcasecmp (arg, "no") == 0)
11514         generate_relax_relocations = 0;
11515       else
11516         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
11517       break;
11518
11519     case OPTION_MAMD64:
11520       intel64 = 0;
11521       break;
11522
11523     case OPTION_MINTEL64:
11524       intel64 = 1;
11525       break;
11526
11527     case 'O':
11528       if (arg == NULL)
11529         {
11530           optimize = 1;
11531           /* Turn off -Os.  */
11532           optimize_for_space = 0;
11533         }
11534       else if (*arg == 's')
11535         {
11536           optimize_for_space = 1;
11537           /* Turn on all encoding optimizations.  */
11538           optimize = INT_MAX;
11539         }
11540       else
11541         {
11542           optimize = atoi (arg);
11543           /* Turn off -Os.  */
11544           optimize_for_space = 0;
11545         }
11546       break;
11547
11548     default:
11549       return 0;
11550     }
11551   return 1;
11552 }
11553
/* Blank line used as the formatting buffer for the CPU/extension lists
   printed by the usage message.  */
#define MESSAGE_TEMPLATE \
"                                                                                "

/* Append the LEN-byte string NAME to the line being assembled in MESSAGE.

   P is the current write position, START the position at which list text
   begins on every line, and *LEFT_P the remaining byte budget of the
   current line.  When NAME does not fit, the pending line is terminated
   with a trailing comma, printed to STREAM, and a new line is begun at
   START.  Returns the write position just past the copied name and
   stores the updated budget in *LEFT_P.  */

static char *
output_message (FILE *stream, char *p, char *message, char *start,
                int *left_p, const char *name, int len)
{
  /* Each entry is charged its own length plus 2 bytes for ", " or
     ",\0".  */
  const int needed = len + 2;
  int remaining = *left_p - needed;

  if (remaining < 0)
    {
      /* No room: emit what has been collected and restart the line.  */
      *p++ = ',';
      *p = '\0';
      fprintf (stream, "%s\n", message);

      p = start;
      remaining = (int) sizeof (MESSAGE_TEMPLATE) - (start - message) - needed;

      gas_assert (remaining >= 0);
    }
  else if (p != start)
    {
      /* Not the first entry on this line: separate it from its
         predecessor.  */
      *p++ = ',';
      *p++ = ' ';
    }

  memcpy (p, name, len);

  *left_p = remaining;
  return p + len;
}
11594
11595 static void
11596 show_arch (FILE *stream, int ext, int check)
11597 {
11598   static char message[] = MESSAGE_TEMPLATE;
11599   char *start = message + 27;
11600   char *p;
11601   int size = sizeof (MESSAGE_TEMPLATE);
11602   int left;
11603   const char *name;
11604   int len;
11605   unsigned int j;
11606
11607   p = start;
11608   left = size - (start - message);
11609   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11610     {
11611       /* Should it be skipped?  */
11612       if (cpu_arch [j].skip)
11613         continue;
11614
11615       name = cpu_arch [j].name;
11616       len = cpu_arch [j].len;
11617       if (*name == '.')
11618         {
11619           /* It is an extension.  Skip if we aren't asked to show it.  */
11620           if (ext)
11621             {
11622               name++;
11623               len--;
11624             }
11625           else
11626             continue;
11627         }
11628       else if (ext)
11629         {
11630           /* It is an processor.  Skip if we show only extension.  */
11631           continue;
11632         }
11633       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
11634         {
11635           /* It is an impossible processor - skip.  */
11636           continue;
11637         }
11638
11639       p = output_message (stream, p, message, start, &left, name, len);
11640     }
11641
11642   /* Display disabled extensions.  */
11643   if (ext)
11644     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11645       {
11646         name = cpu_noarch [j].name;
11647         len = cpu_noarch [j].len;
11648         p = output_message (stream, p, message, start, &left, name,
11649                             len);
11650       }
11651
11652   *p = '\0';
11653   fprintf (stream, "%s\n", message);
11654 }
11655
11656 void
11657 md_show_usage (FILE *stream)
11658 {
11659 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11660   fprintf (stream, _("\
11661   -Qy, -Qn                ignored\n\
11662   -V                      print assembler version number\n\
11663   -k                      ignored\n"));
11664 #endif
11665   fprintf (stream, _("\
11666   -n                      Do not optimize code alignment\n\
11667   -q                      quieten some warnings\n"));
11668 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11669   fprintf (stream, _("\
11670   -s                      ignored\n"));
11671 #endif
11672 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11673                       || defined (TE_PE) || defined (TE_PEP))
11674   fprintf (stream, _("\
11675   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
11676 #endif
11677 #ifdef SVR4_COMMENT_CHARS
11678   fprintf (stream, _("\
11679   --divide                do not treat `/' as a comment character\n"));
11680 #else
11681   fprintf (stream, _("\
11682   --divide                ignored\n"));
11683 #endif
11684   fprintf (stream, _("\
11685   -march=CPU[,+EXTENSION...]\n\
11686                           generate code for CPU and EXTENSION, CPU is one of:\n"));
11687   show_arch (stream, 0, 1);
11688   fprintf (stream, _("\
11689                           EXTENSION is combination of:\n"));
11690   show_arch (stream, 1, 0);
11691   fprintf (stream, _("\
11692   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
11693   show_arch (stream, 0, 0);
11694   fprintf (stream, _("\
11695   -msse2avx               encode SSE instructions with VEX prefix\n"));
11696   fprintf (stream, _("\
11697   -msse-check=[none|error|warning] (default: warning)\n\
11698                           check SSE instructions\n"));
11699   fprintf (stream, _("\
11700   -moperand-check=[none|error|warning] (default: warning)\n\
11701                           check operand combinations for validity\n"));
11702   fprintf (stream, _("\
11703   -mavxscalar=[128|256] (default: 128)\n\
11704                           encode scalar AVX instructions with specific vector\n\
11705                            length\n"));
11706   fprintf (stream, _("\
11707   -mvexwig=[0|1] (default: 0)\n\
11708                           encode VEX instructions with specific VEX.W value\n\
11709                            for VEX.W bit ignored instructions\n"));
11710   fprintf (stream, _("\
11711   -mevexlig=[128|256|512] (default: 128)\n\
11712                           encode scalar EVEX instructions with specific vector\n\
11713                            length\n"));
11714   fprintf (stream, _("\
11715   -mevexwig=[0|1] (default: 0)\n\
11716                           encode EVEX instructions with specific EVEX.W value\n\
11717                            for EVEX.W bit ignored instructions\n"));
11718   fprintf (stream, _("\
11719   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
11720                           encode EVEX instructions with specific EVEX.RC value\n\
11721                            for SAE-only ignored instructions\n"));
11722   fprintf (stream, _("\
11723   -mmnemonic=[att|intel] "));
11724   if (SYSV386_COMPAT)
11725     fprintf (stream, _("(default: att)\n"));
11726   else
11727     fprintf (stream, _("(default: intel)\n"));
11728   fprintf (stream, _("\
11729                           use AT&T/Intel mnemonic\n"));
11730   fprintf (stream, _("\
11731   -msyntax=[att|intel] (default: att)\n\
11732                           use AT&T/Intel syntax\n"));
11733   fprintf (stream, _("\
11734   -mindex-reg             support pseudo index registers\n"));
11735   fprintf (stream, _("\
11736   -mnaked-reg             don't require `%%' prefix for registers\n"));
11737   fprintf (stream, _("\
11738   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
11739 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11740   fprintf (stream, _("\
11741   -mshared                disable branch optimization for shared code\n"));
11742   fprintf (stream, _("\
11743   -mx86-used-note=[no|yes] "));
11744   if (DEFAULT_X86_USED_NOTE)
11745     fprintf (stream, _("(default: yes)\n"));
11746   else
11747     fprintf (stream, _("(default: no)\n"));
11748   fprintf (stream, _("\
11749                           generate x86 used ISA and feature properties\n"));
11750 #endif
11751 #if defined (TE_PE) || defined (TE_PEP)
11752   fprintf (stream, _("\
11753   -mbig-obj               generate big object files\n"));
11754 #endif
11755   fprintf (stream, _("\
11756   -momit-lock-prefix=[no|yes] (default: no)\n\
11757                           strip all lock prefixes\n"));
11758   fprintf (stream, _("\
11759   -mfence-as-lock-add=[no|yes] (default: no)\n\
11760                           encode lfence, mfence and sfence as\n\
11761                            lock addl $0x0, (%%{re}sp)\n"));
11762   fprintf (stream, _("\
11763   -mrelax-relocations=[no|yes] "));
11764   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
11765     fprintf (stream, _("(default: yes)\n"));
11766   else
11767     fprintf (stream, _("(default: no)\n"));
11768   fprintf (stream, _("\
11769                           generate relax relocations\n"));
11770   fprintf (stream, _("\
11771   -mamd64                 accept only AMD64 ISA [default]\n"));
11772   fprintf (stream, _("\
11773   -mintel64               accept only Intel64 ISA\n"));
11774 }
11775
#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* Choose the name of the BFD target to emit.

   The choice is driven by default_arch ("x86_64", "x86_64" with a
   suffix for x32, "i386" or "iamcu"), the selected processor and
   OUTPUT_FLAVOR.  Along the way the code-size flag, the ELF ABI, the
   fallback ISA/tune flags and the relocation-style globals are set up.
   An unknown or inconsistent combination is reported via as_fatal.  */

const char *
i386_target_format (void)
{
  if (strncmp (default_arch, "x86_64", 6) == 0)
    {
      update_code_flag (CODE_64BIT, 1);
      /* A bare "x86_64" is the 64-bit ABI; any suffix (the option
         parser stores "x86_64:32") selects x32.  */
      x86_elf_abi = default_arch[6] != '\0' ? X86_64_X32_ABI : X86_64_ABI;
    }
  else if (strcmp (default_arch, "i386") == 0)
    update_code_flag (CODE_32BIT, 1);
  else if (strcmp (default_arch, "iamcu") == 0)
    {
      update_code_flag (CODE_32BIT, 1);
      if (cpu_arch_isa != PROCESSOR_UNKNOWN)
        {
          /* A processor was already chosen; it has to be IAMCU.  */
          if (cpu_arch_isa != PROCESSOR_IAMCU)
            as_fatal (_("Intel MCU doesn't support `%s' architecture"),
                      cpu_arch_name);
        }
      else
        {
          /* No processor chosen yet: default everything to IAMCU.  */
          static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;

          cpu_arch_name = "iamcu";
          cpu_sub_arch_name = NULL;
          cpu_arch_flags = iamcu_flags;
          cpu_arch_isa = PROCESSOR_IAMCU;
          cpu_arch_isa_flags = iamcu_flags;
          if (!cpu_arch_tune_set)
            {
              cpu_arch_tune = cpu_arch_isa;
              cpu_arch_tune_flags = cpu_arch_isa_flags;
            }
        }
    }
  else
    as_fatal (_("unknown architecture"));

  /* Flag sets that are still empty fall back to cpu_arch entry 0 for
     32-bit code and entry 1 for 64-bit code.  */
  if (cpu_flags_all_zero (&cpu_arch_isa_flags))
    cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
  if (cpu_flags_all_zero (&cpu_arch_tune_flags))
    cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;

  switch (OUTPUT_FLAVOR)
    {
#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
    case bfd_target_aout_flavour:
      return AOUT_TARGET_FORMAT;
#endif
#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
# if defined (TE_PE) || defined (TE_PEP)
    case bfd_target_coff_flavour:
      if (flag_code != CODE_64BIT)
        return "pe-i386";
      return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
# elif defined (TE_GO32)
    case bfd_target_coff_flavour:
      return "coff-go32";
# else
    case bfd_target_coff_flavour:
      return "coff-i386";
# endif
#endif
#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
    case bfd_target_elf_flavour:
      {
        const char *elf_name;

        /* Both 64-bit ABIs use RELA relocations and 64-bit objects; x32
           additionally rejects 64-bit relocations.  */
        if (x86_elf_abi == X86_64_ABI)
          {
            use_rela_relocations = 1;
            object_64bit = 1;
            elf_name = ELF_TARGET_FORMAT64;
          }
        else if (x86_elf_abi == X86_64_X32_ABI)
          {
            use_rela_relocations = 1;
            object_64bit = 1;
            disallow_64bit_reloc = 1;
            elf_name = ELF_TARGET_FORMAT32;
          }
        else
          elf_name = ELF_TARGET_FORMAT;

        /* Some processors have a dedicated target and are tied to one
           ABI.  */
        if (cpu_arch_isa == PROCESSOR_L1OM)
          {
            if (x86_elf_abi != X86_64_ABI)
              as_fatal (_("Intel L1OM is 64bit only"));
            return ELF_TARGET_L1OM_FORMAT;
          }
        if (cpu_arch_isa == PROCESSOR_K1OM)
          {
            if (x86_elf_abi != X86_64_ABI)
              as_fatal (_("Intel K1OM is 64bit only"));
            return ELF_TARGET_K1OM_FORMAT;
          }
        if (cpu_arch_isa == PROCESSOR_IAMCU)
          {
            if (x86_elf_abi != I386_ABI)
              as_fatal (_("Intel MCU is 32bit only"));
            return ELF_TARGET_IAMCU_FORMAT;
          }
        return elf_name;
      }
#endif
#if defined (OBJ_MACH_O)
    case bfd_target_mach_o_flavour:
      if (flag_code != CODE_64BIT)
        return "mach-o-i386";
      use_rela_relocations = 1;
      object_64bit = 1;
      return "mach-o-x86-64";
#endif
    default:
      abort ();
      return NULL;
    }
}

#endif /* OBJ_MAYBE_ more than one  */
11907 \f
11908 symbolS *
11909 md_undefined_symbol (char *name)
11910 {
11911   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11912       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11913       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11914       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11915     {
11916       if (!GOT_symbol)
11917         {
11918           if (symbol_find (name))
11919             as_bad (_("GOT already in symbol table"));
11920           GOT_symbol = symbol_new (name, undefined_section,
11921                                    (valueT) 0, &zero_address_frag);
11922         };
11923       return GOT_symbol;
11924     }
11925   return 0;
11926 }
11927
11928 /* Round up a section size to the appropriate boundary.  */
11929
11930 valueT
11931 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11932 {
11933 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11934   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11935     {
11936       /* For a.out, force the section size to be aligned.  If we don't do
11937          this, BFD will align it for us, but it will not write out the
11938          final bytes of the section.  This may be a bug in BFD, but it is
11939          easier to fix it here since that is how the other a.out targets
11940          work.  */
11941       int align;
11942
11943       align = bfd_section_alignment (segment);
11944       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11945     }
11946 #endif
11947
11948   return size;
11949 }
11950
11951 /* On the i386, PC-relative offsets are relative to the start of the
11952    next instruction.  That is, the address of the offset, plus its
11953    size, since the offset is always the last part of the insn.  */
11954
11955 long
11956 md_pcrel_from (fixS *fixP)
11957 {
11958   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11959 }
11960
11961 #ifndef I386COFF
11962
11963 static void
11964 s_bss (int ignore ATTRIBUTE_UNUSED)
11965 {
11966   int temp;
11967
11968 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11969   if (IS_ELF)
11970     obj_elf_section_change_hook ();
11971 #endif
11972   temp = get_absolute_expression ();
11973   subseg_set (bss_section, (subsegT) temp);
11974   demand_empty_rest_of_line ();
11975 }
11976
11977 #endif
11978
11979 void
11980 i386_validate_fix (fixS *fixp)
11981 {
11982   if (fixp->fx_subsy)
11983     {
11984       if (fixp->fx_subsy == GOT_symbol)
11985         {
11986           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11987             {
11988               if (!object_64bit)
11989                 abort ();
11990 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11991               if (fixp->fx_tcbit2)
11992                 fixp->fx_r_type = (fixp->fx_tcbit
11993                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
11994                                    : BFD_RELOC_X86_64_GOTPCRELX);
11995               else
11996 #endif
11997                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
11998             }
11999           else
12000             {
12001               if (!object_64bit)
12002                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
12003               else
12004                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
12005             }
12006           fixp->fx_subsy = 0;
12007         }
12008     }
12009 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12010   else if (!object_64bit)
12011     {
12012       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
12013           && fixp->fx_tcbit2)
12014         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
12015     }
12016 #endif
12017 }
12018
12019 arelent *
12020 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
12021 {
12022   arelent *rel;
12023   bfd_reloc_code_real_type code;
12024
12025   switch (fixp->fx_r_type)
12026     {
12027 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12028     case BFD_RELOC_SIZE32:
12029     case BFD_RELOC_SIZE64:
12030       if (S_IS_DEFINED (fixp->fx_addsy)
12031           && !S_IS_EXTERNAL (fixp->fx_addsy))
12032         {
12033           /* Resolve size relocation against local symbol to size of
12034              the symbol plus addend.  */
12035           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
12036           if (fixp->fx_r_type == BFD_RELOC_SIZE32
12037               && !fits_in_unsigned_long (value))
12038             as_bad_where (fixp->fx_file, fixp->fx_line,
12039                           _("symbol size computation overflow"));
12040           fixp->fx_addsy = NULL;
12041           fixp->fx_subsy = NULL;
12042           md_apply_fix (fixp, (valueT *) &value, NULL);
12043           return NULL;
12044         }
12045 #endif
12046       /* Fall through.  */
12047
12048     case BFD_RELOC_X86_64_PLT32:
12049     case BFD_RELOC_X86_64_GOT32:
12050     case BFD_RELOC_X86_64_GOTPCREL:
12051     case BFD_RELOC_X86_64_GOTPCRELX:
12052     case BFD_RELOC_X86_64_REX_GOTPCRELX:
12053     case BFD_RELOC_386_PLT32:
12054     case BFD_RELOC_386_GOT32:
12055     case BFD_RELOC_386_GOT32X:
12056     case BFD_RELOC_386_GOTOFF:
12057     case BFD_RELOC_386_GOTPC:
12058     case BFD_RELOC_386_TLS_GD:
12059     case BFD_RELOC_386_TLS_LDM:
12060     case BFD_RELOC_386_TLS_LDO_32:
12061     case BFD_RELOC_386_TLS_IE_32:
12062     case BFD_RELOC_386_TLS_IE:
12063     case BFD_RELOC_386_TLS_GOTIE:
12064     case BFD_RELOC_386_TLS_LE_32:
12065     case BFD_RELOC_386_TLS_LE:
12066     case BFD_RELOC_386_TLS_GOTDESC:
12067     case BFD_RELOC_386_TLS_DESC_CALL:
12068     case BFD_RELOC_X86_64_TLSGD:
12069     case BFD_RELOC_X86_64_TLSLD:
12070     case BFD_RELOC_X86_64_DTPOFF32:
12071     case BFD_RELOC_X86_64_DTPOFF64:
12072     case BFD_RELOC_X86_64_GOTTPOFF:
12073     case BFD_RELOC_X86_64_TPOFF32:
12074     case BFD_RELOC_X86_64_TPOFF64:
12075     case BFD_RELOC_X86_64_GOTOFF64:
12076     case BFD_RELOC_X86_64_GOTPC32:
12077     case BFD_RELOC_X86_64_GOT64:
12078     case BFD_RELOC_X86_64_GOTPCREL64:
12079     case BFD_RELOC_X86_64_GOTPC64:
12080     case BFD_RELOC_X86_64_GOTPLT64:
12081     case BFD_RELOC_X86_64_PLTOFF64:
12082     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12083     case BFD_RELOC_X86_64_TLSDESC_CALL:
12084     case BFD_RELOC_RVA:
12085     case BFD_RELOC_VTABLE_ENTRY:
12086     case BFD_RELOC_VTABLE_INHERIT:
12087 #ifdef TE_PE
12088     case BFD_RELOC_32_SECREL:
12089 #endif
12090       code = fixp->fx_r_type;
12091       break;
12092     case BFD_RELOC_X86_64_32S:
12093       if (!fixp->fx_pcrel)
12094         {
12095           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
12096           code = fixp->fx_r_type;
12097           break;
12098         }
12099       /* Fall through.  */
12100     default:
12101       if (fixp->fx_pcrel)
12102         {
12103           switch (fixp->fx_size)
12104             {
12105             default:
12106               as_bad_where (fixp->fx_file, fixp->fx_line,
12107                             _("can not do %d byte pc-relative relocation"),
12108                             fixp->fx_size);
12109               code = BFD_RELOC_32_PCREL;
12110               break;
12111             case 1: code = BFD_RELOC_8_PCREL;  break;
12112             case 2: code = BFD_RELOC_16_PCREL; break;
12113             case 4: code = BFD_RELOC_32_PCREL; break;
12114 #ifdef BFD64
12115             case 8: code = BFD_RELOC_64_PCREL; break;
12116 #endif
12117             }
12118         }
12119       else
12120         {
12121           switch (fixp->fx_size)
12122             {
12123             default:
12124               as_bad_where (fixp->fx_file, fixp->fx_line,
12125                             _("can not do %d byte relocation"),
12126                             fixp->fx_size);
12127               code = BFD_RELOC_32;
12128               break;
12129             case 1: code = BFD_RELOC_8;  break;
12130             case 2: code = BFD_RELOC_16; break;
12131             case 4: code = BFD_RELOC_32; break;
12132 #ifdef BFD64
12133             case 8: code = BFD_RELOC_64; break;
12134 #endif
12135             }
12136         }
12137       break;
12138     }
12139
12140   if ((code == BFD_RELOC_32
12141        || code == BFD_RELOC_32_PCREL
12142        || code == BFD_RELOC_X86_64_32S)
12143       && GOT_symbol
12144       && fixp->fx_addsy == GOT_symbol)
12145     {
12146       if (!object_64bit)
12147         code = BFD_RELOC_386_GOTPC;
12148       else
12149         code = BFD_RELOC_X86_64_GOTPC32;
12150     }
12151   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
12152       && GOT_symbol
12153       && fixp->fx_addsy == GOT_symbol)
12154     {
12155       code = BFD_RELOC_X86_64_GOTPC64;
12156     }
12157
12158   rel = XNEW (arelent);
12159   rel->sym_ptr_ptr = XNEW (asymbol *);
12160   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
12161
12162   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
12163
12164   if (!use_rela_relocations)
12165     {
12166       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
12167          vtable entry to be used in the relocation's section offset.  */
12168       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
12169         rel->address = fixp->fx_offset;
12170 #if defined (OBJ_COFF) && defined (TE_PE)
12171       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
12172         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
12173       else
12174 #endif
12175       rel->addend = 0;
12176     }
12177   /* Use the rela in 64bit mode.  */
12178   else
12179     {
12180       if (disallow_64bit_reloc)
12181         switch (code)
12182           {
12183           case BFD_RELOC_X86_64_DTPOFF64:
12184           case BFD_RELOC_X86_64_TPOFF64:
12185           case BFD_RELOC_64_PCREL:
12186           case BFD_RELOC_X86_64_GOTOFF64:
12187           case BFD_RELOC_X86_64_GOT64:
12188           case BFD_RELOC_X86_64_GOTPCREL64:
12189           case BFD_RELOC_X86_64_GOTPC64:
12190           case BFD_RELOC_X86_64_GOTPLT64:
12191           case BFD_RELOC_X86_64_PLTOFF64:
12192             as_bad_where (fixp->fx_file, fixp->fx_line,
12193                           _("cannot represent relocation type %s in x32 mode"),
12194                           bfd_get_reloc_code_name (code));
12195             break;
12196           default:
12197             break;
12198           }
12199
12200       if (!fixp->fx_pcrel)
12201         rel->addend = fixp->fx_offset;
12202       else
12203         switch (code)
12204           {
12205           case BFD_RELOC_X86_64_PLT32:
12206           case BFD_RELOC_X86_64_GOT32:
12207           case BFD_RELOC_X86_64_GOTPCREL:
12208           case BFD_RELOC_X86_64_GOTPCRELX:
12209           case BFD_RELOC_X86_64_REX_GOTPCRELX:
12210           case BFD_RELOC_X86_64_TLSGD:
12211           case BFD_RELOC_X86_64_TLSLD:
12212           case BFD_RELOC_X86_64_GOTTPOFF:
12213           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12214           case BFD_RELOC_X86_64_TLSDESC_CALL:
12215             rel->addend = fixp->fx_offset - fixp->fx_size;
12216             break;
12217           default:
12218             rel->addend = (section->vma
12219                            - fixp->fx_size
12220                            + fixp->fx_addnumber
12221                            + md_pcrel_from (fixp));
12222             break;
12223           }
12224     }
12225
12226   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
12227   if (rel->howto == NULL)
12228     {
12229       as_bad_where (fixp->fx_file, fixp->fx_line,
12230                     _("cannot represent relocation type %s"),
12231                     bfd_get_reloc_code_name (code));
12232       /* Set howto to a garbage value so that we can keep going.  */
12233       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
12234       gas_assert (rel->howto != NULL);
12235     }
12236
12237   return rel;
12238 }
12239
12240 #include "tc-i386-intel.c"
12241
12242 void
12243 tc_x86_parse_to_dw2regnum (expressionS *exp)
12244 {
12245   int saved_naked_reg;
12246   char saved_register_dot;
12247
12248   saved_naked_reg = allow_naked_reg;
12249   allow_naked_reg = 1;
12250   saved_register_dot = register_chars['.'];
12251   register_chars['.'] = '.';
12252   allow_pseudo_reg = 1;
12253   expression_and_evaluate (exp);
12254   allow_pseudo_reg = 0;
12255   register_chars['.'] = saved_register_dot;
12256   allow_naked_reg = saved_naked_reg;
12257
12258   if (exp->X_op == O_register && exp->X_add_number >= 0)
12259     {
12260       if ((addressT) exp->X_add_number < i386_regtab_size)
12261         {
12262           exp->X_op = O_constant;
12263           exp->X_add_number = i386_regtab[exp->X_add_number]
12264                               .dw2_regnum[flag_code >> 1];
12265         }
12266       else
12267         exp->X_op = O_illegal;
12268     }
12269 }
12270
12271 void
12272 tc_x86_frame_initial_instructions (void)
12273 {
12274   static unsigned int sp_regno[2];
12275
12276   if (!sp_regno[flag_code >> 1])
12277     {
12278       char *saved_input = input_line_pointer;
12279       char sp[][4] = {"esp", "rsp"};
12280       expressionS exp;
12281
12282       input_line_pointer = sp[flag_code >> 1];
12283       tc_x86_parse_to_dw2regnum (&exp);
12284       gas_assert (exp.X_op == O_constant);
12285       sp_regno[flag_code >> 1] = exp.X_add_number;
12286       input_line_pointer = saved_input;
12287     }
12288
12289   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
12290   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
12291 }
12292
12293 int
12294 x86_dwarf2_addr_size (void)
12295 {
12296 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12297   if (x86_elf_abi == X86_64_X32_ABI)
12298     return 4;
12299 #endif
12300   return bfd_arch_bits_per_address (stdoutput) / 8;
12301 }
12302
12303 int
12304 i386_elf_section_type (const char *str, size_t len)
12305 {
12306   if (flag_code == CODE_64BIT
12307       && len == sizeof ("unwind") - 1
12308       && strncmp (str, "unwind", 6) == 0)
12309     return SHT_X86_64_UNWIND;
12310
12311   return -1;
12312 }
12313
12314 #ifdef TE_SOLARIS
12315 void
12316 i386_solaris_fix_up_eh_frame (segT sec)
12317 {
12318   if (flag_code == CODE_64BIT)
12319     elf_section_type (sec) = SHT_X86_64_UNWIND;
12320 }
12321 #endif
12322
12323 #ifdef TE_PE
12324 void
12325 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
12326 {
12327   expressionS exp;
12328
12329   exp.X_op = O_secrel;
12330   exp.X_add_symbol = symbol;
12331   exp.X_add_number = 0;
12332   emit_expr (&exp, size);
12333 }
12334 #endif
12335
12336 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12337 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
12338
12339 bfd_vma
12340 x86_64_section_letter (int letter, const char **ptr_msg)
12341 {
12342   if (flag_code == CODE_64BIT)
12343     {
12344       if (letter == 'l')
12345         return SHF_X86_64_LARGE;
12346
12347       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
12348     }
12349   else
12350     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
12351   return -1;
12352 }
12353
12354 bfd_vma
12355 x86_64_section_word (char *str, size_t len)
12356 {
12357   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
12358     return SHF_X86_64_LARGE;
12359
12360   return -1;
12361 }
12362
12363 static void
12364 handle_large_common (int small ATTRIBUTE_UNUSED)
12365 {
12366   if (flag_code != CODE_64BIT)
12367     {
12368       s_comm_internal (0, elf_common_parse);
12369       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
12370     }
12371   else
12372     {
12373       static segT lbss_section;
12374       asection *saved_com_section_ptr = elf_com_section_ptr;
12375       asection *saved_bss_section = bss_section;
12376
12377       if (lbss_section == NULL)
12378         {
12379           flagword applicable;
12380           segT seg = now_seg;
12381           subsegT subseg = now_subseg;
12382
12383           /* The .lbss section is for local .largecomm symbols.  */
12384           lbss_section = subseg_new (".lbss", 0);
12385           applicable = bfd_applicable_section_flags (stdoutput);
12386           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
12387           seg_info (lbss_section)->bss = 1;
12388
12389           subseg_set (seg, subseg);
12390         }
12391
12392       elf_com_section_ptr = &_bfd_elf_large_com_section;
12393       bss_section = lbss_section;
12394
12395       s_comm_internal (0, elf_common_parse);
12396
12397       elf_com_section_ptr = saved_com_section_ptr;
12398       bss_section = saved_bss_section;
12399     }
12400 }
12401 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */