gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2020 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef REGISTER_WARNINGS
  48 #define REGISTER_WARNINGS 1
  49 #endif
  50
  51 #ifndef INFER_ADDR_PREFIX
  52 #define INFER_ADDR_PREFIX 1
  53 #endif
  54
  55 #ifndef DEFAULT_ARCH
  56 #define DEFAULT_ARCH "i386"
  57 #endif
  58
  59 #ifndef INLINE
  60 #if __GNUC__ >= 2
  61 #define INLINE __inline__
  62 #else
  63 #define INLINE
  64 #endif
  65 #endif
  66
  67 /* Prefixes will be emitted in the order defined below.
  68    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  69    instruction, and so must come before any prefixes.
  70    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  71    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  72 #define WAIT_PREFIX     0
  73 #define SEG_PREFIX      1
  74 #define ADDR_PREFIX     2
  75 #define DATA_PREFIX     3
  76 #define REP_PREFIX      4
  77 #define HLE_PREFIX      REP_PREFIX
  78 #define BND_PREFIX      REP_PREFIX
  79 #define LOCK_PREFIX     5
  80 #define REX_PREFIX      6       /* must come last.  */
  81 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  82
  83 /* we define the syntax here (modulo base,index,scale syntax) */
  84 #define REGISTER_PREFIX '%'
  85 #define IMMEDIATE_PREFIX '$'
  86 #define ABSOLUTE_PREFIX '*'
  87
  88 /* these are the instruction mnemonic suffixes in AT&T syntax or
  89    memory operand size in Intel syntax.  */
  90 #define WORD_MNEM_SUFFIX  'w'
  91 #define BYTE_MNEM_SUFFIX  'b'
  92 #define SHORT_MNEM_SUFFIX 's'
  93 #define LONG_MNEM_SUFFIX  'l'
  94 #define QWORD_MNEM_SUFFIX  'q'
  95 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  96    in instructions.  */
  97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  98
  99 #define END_OF_INSN '\0'
 100
 101 /* This matches the C -> StaticRounding alias in the opcode table.  */
 102 #define commutative staticrounding
 103
 104 /*
 105   'templates' is for grouping together 'template' structures for opcodes
 106   of the same name.  This is only used for storing the insns in the grand
 107   ole hash table of insns.
 108   The templates themselves start at START and range up to (but not including)
 109   END.
 110   */
 111 typedef struct
 112 {
 113   const insn_template *start;
 114   const insn_template *end;
 115 }
 116 templates;
 117
 118 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 119 typedef struct
 120 {
 121   unsigned int regmem;  /* codes register or memory operand */
 122   unsigned int reg;     /* codes register operand (or extended opcode) */
 123   unsigned int mode;    /* how to interpret regmem & reg */
 124 }
 125 modrm_byte;
 126
 127 /* x86-64 extension prefix.  */
 128 typedef int rex_byte;
 129
 130 /* 386 opcode byte to code indirect addressing.  */
 131 typedef struct
 132 {
 133   unsigned base;
 134   unsigned index;
 135   unsigned scale;
 136 }
 137 sib_byte;
 138
 139 /* x86 arch names, types and features */
 140 typedef struct
 141 {
 142   const char *name;             /* arch name */
 143   unsigned int len;             /* arch string length */
 144   enum processor_type type;     /* arch type */
 145   i386_cpu_flags flags;         /* cpu feature flags */
 146   unsigned int skip;            /* show_arch should skip this. */
 147 }
 148 arch_entry;
 149
 150 /* Used to turn off indicated flags.  */
 151 typedef struct
 152 {
 153   const char *name;             /* arch name */
 154   unsigned int len;             /* arch string length */
 155   i386_cpu_flags flags;         /* cpu feature flags */
 156 }
 157 noarch_entry;
 158
 159 static void update_code_flag (int, int);
 160 static void set_code_flag (int);
 161 static void set_16bit_gcc_code_flag (int);
 162 static void set_intel_syntax (int);
 163 static void set_intel_mnemonic (int);
 164 static void set_allow_index_reg (int);
 165 static void set_check (int);
 166 static void set_cpu_arch (int);
 167 #ifdef TE_PE
 168 static void pe_directive_secrel (int);
 169 #endif
 170 static void signed_cons (int);
 171 static char *output_invalid (int c);
 172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 173                                     const char *);
 174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 175                                        const char *);
 176 static int i386_att_operand (char *);
 177 static int i386_intel_operand (char *, int);
 178 static int i386_intel_simplify (expressionS *);
 179 static int i386_intel_parse_name (const char *, expressionS *);
 180 static const reg_entry *parse_register (char *, char **);
 181 static char *parse_insn (char *, char *);
 182 static char *parse_operands (char *, const char *);
 183 static void swap_operands (void);
 184 static void swap_2_operands (int, int);
 185 static enum flag_code i386_addressing_mode (void);
 186 static void optimize_imm (void);
 187 static void optimize_disp (void);
 188 static const insn_template *match_template (char);
 189 static int check_string (void);
 190 static int process_suffix (void);
 191 static int check_byte_reg (void);
 192 static int check_long_reg (void);
 193 static int check_qword_reg (void);
 194 static int check_word_reg (void);
 195 static int finalize_imm (void);
 196 static int process_operands (void);
 197 static const seg_entry *build_modrm_byte (void);
 198 static void output_insn (void);
 199 static void output_imm (fragS *, offsetT);
 200 static void output_disp (fragS *, offsetT);
 201 #ifndef I386COFF
 202 static void s_bss (int);
 203 #endif
 204 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 205 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 206
 207 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 208 static unsigned int x86_isa_1_used;
 209 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 210 static unsigned int x86_feature_2_used;
 211 /* Generate x86 used ISA and feature properties.  */
 212 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 213 #endif
 214
 215 static const char *default_arch = DEFAULT_ARCH;
 216
 217 /* This struct describes rounding control and SAE in the instruction.  */
 218 struct RC_Operation
 219 {
 220   enum rc_type
 221     {
 222       rne = 0,
 223       rd,
 224       ru,
 225       rz,
 226       saeonly
 227     } type;
 228   int operand;
 229 };
 230
 231 static struct RC_Operation rc_op;
 232
 233 /* The struct describes masking, applied to OPERAND in the instruction.
 234    MASK is a pointer to the corresponding mask register.  ZEROING tells
 235    whether merging or zeroing mask is used.  */
 236 struct Mask_Operation
 237 {
 238   const reg_entry *mask;
 239   unsigned int zeroing;
 240   /* The operand where this operation is associated.  */
 241   int operand;
 242 };
 243
 244 static struct Mask_Operation mask_op;
 245
 246 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 247    broadcast factor.  */
 248 struct Broadcast_Operation
 249 {
 250   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 251   int type;
 252
 253   /* Index of broadcasted operand.  */
 254   int operand;
 255
 256   /* Number of bytes to broadcast.  */
 257   int bytes;
 258 };
 259
 260 static struct Broadcast_Operation broadcast_op;
 261
 262 /* VEX prefix.  */
 263 typedef struct
 264 {
 265   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 266   unsigned char bytes[4];
 267   unsigned int length;
 268   /* Destination or source register specifier.  */
 269   const reg_entry *register_specifier;
 270 } vex_prefix;
 271
 272 /* 'md_assemble ()' gathers together information and puts it into a
 273    i386_insn.  */
 274
 275 union i386_op
 276   {
 277     expressionS *disps;
 278     expressionS *imms;
 279     const reg_entry *regs;
 280   };
 281
 282 enum i386_error
 283   {
 284     operand_size_mismatch,
 285     operand_type_mismatch,
 286     register_type_mismatch,
 287     number_of_operands_mismatch,
 288     invalid_instruction_suffix,
 289     bad_imm4,
 290     unsupported_with_intel_mnemonic,
 291     unsupported_syntax,
 292     unsupported,
 293     invalid_vsib_address,
 294     invalid_vector_register_set,
 295     unsupported_vector_index_register,
 296     unsupported_broadcast,
 297     broadcast_needed,
 298     unsupported_masking,
 299     mask_not_on_destination,
 300     no_default_mask,
 301     unsupported_rc_sae,
 302     rc_sae_operand_not_last_imm,
 303     invalid_register_operand,
 304   };
 305
 306 struct _i386_insn
 307   {
 308     /* TM holds the template for the insn were currently assembling.  */
 309     insn_template tm;
 310
 311     /* SUFFIX holds the instruction size suffix for byte, word, dword
 312        or qword, if given.  */
 313     char suffix;
 314
 315     /* OPERANDS gives the number of given operands.  */
 316     unsigned int operands;
 317
 318     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 319        of given register, displacement, memory operands and immediate
 320        operands.  */
 321     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 322
 323     /* TYPES [i] is the type (see above #defines) which tells us how to
 324        use OP[i] for the corresponding operand.  */
 325     i386_operand_type types[MAX_OPERANDS];
 326
 327     /* Displacement expression, immediate expression, or register for each
 328        operand.  */
 329     union i386_op op[MAX_OPERANDS];
 330
 331     /* Flags for operands.  */
 332     unsigned int flags[MAX_OPERANDS];
 333 #define Operand_PCrel 1
 334 #define Operand_Mem   2
 335
 336     /* Relocation type for operand */
 337     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 338
 339     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 340        the base index byte below.  */
 341     const reg_entry *base_reg;
 342     const reg_entry *index_reg;
 343     unsigned int log2_scale_factor;
 344
 345     /* SEG gives the seg_entries of this insn.  They are zero unless
 346        explicit segment overrides are given.  */
 347     const seg_entry *seg[2];
 348
 349     /* Copied first memory operand string, for re-checking.  */
 350     char *memop1_string;
 351
 352     /* PREFIX holds all the given prefix opcodes (usually null).
 353        PREFIXES is the number of prefix opcodes.  */
 354     unsigned int prefixes;
 355     unsigned char prefix[MAX_PREFIXES];
 356
 357     /* The operand to a branch insn indicates an absolute branch.  */
 358     bfd_boolean jumpabsolute;
 359
 360     /* Has MMX register operands.  */
 361     bfd_boolean has_regmmx;
 362
 363     /* Has XMM register operands.  */
 364     bfd_boolean has_regxmm;
 365
 366     /* Has YMM register operands.  */
 367     bfd_boolean has_regymm;
 368
 369     /* Has ZMM register operands.  */
 370     bfd_boolean has_regzmm;
 371
 372     /* Has GOTPC or TLS relocation.  */
 373     bfd_boolean has_gotpc_tls_reloc;
 374
 375     /* RM and SIB are the modrm byte and the sib byte where the
 376        addressing modes of this insn are encoded.  */
 377     modrm_byte rm;
 378     rex_byte rex;
 379     rex_byte vrex;
 380     sib_byte sib;
 381     vex_prefix vex;
 382
 383     /* Masking attributes.  */
 384     struct Mask_Operation *mask;
 385
 386     /* Rounding control and SAE attributes.  */
 387     struct RC_Operation *rounding;
 388
 389     /* Broadcasting attributes.  */
 390     struct Broadcast_Operation *broadcast;
 391
 392     /* Compressed disp8*N attribute.  */
 393     unsigned int memshift;
 394
 395     /* Prefer load or store in encoding.  */
 396     enum
 397       {
 398         dir_encoding_default = 0,
 399         dir_encoding_load,
 400         dir_encoding_store,
 401         dir_encoding_swap
 402       } dir_encoding;
 403
 404     /* Prefer 8bit or 32bit displacement in encoding.  */
 405     enum
 406       {
 407         disp_encoding_default = 0,
 408         disp_encoding_8bit,
 409         disp_encoding_32bit
 410       } disp_encoding;
 411
 412     /* Prefer the REX byte in encoding.  */
 413     bfd_boolean rex_encoding;
 414
 415     /* Disable instruction size optimization.  */
 416     bfd_boolean no_optimize;
 417
 418     /* How to encode vector instructions.  */
 419     enum
 420       {
 421         vex_encoding_default = 0,
 422         vex_encoding_vex2,
 423         vex_encoding_vex3,
 424         vex_encoding_evex
 425       } vec_encoding;
 426
 427     /* REP prefix.  */
 428     const char *rep_prefix;
 429
 430     /* HLE prefix.  */
 431     const char *hle_prefix;
 432
 433     /* Have BND prefix.  */
 434     const char *bnd_prefix;
 435
 436     /* Have NOTRACK prefix.  */
 437     const char *notrack_prefix;
 438
 439     /* Error message.  */
 440     enum i386_error error;
 441   };
 442
 443 typedef struct _i386_insn i386_insn;
 444
 445 /* Link RC type with corresponding string, that'll be looked for in
 446    asm.  */
 447 struct RC_name
 448 {
 449   enum rc_type type;
 450   const char *name;
 451   unsigned int len;
 452 };
 453
 454 static const struct RC_name RC_NamesTable[] =
 455 {
 456   {  rne, STRING_COMMA_LEN ("rn-sae") },
 457   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 458   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 459   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 460   {  saeonly,  STRING_COMMA_LEN ("sae") },
 461 };
 462
 463 /* List of chars besides those in app.c:symbol_chars that can start an
 464    operand.  Used to prevent the scrubber eating vital white-space.  */
 465 const char extra_symbol_chars[] = "*%-([{}"
 466 #ifdef LEX_AT
 467         "@"
 468 #endif
 469 #ifdef LEX_QM
 470         "?"
 471 #endif
 472         ;
 473
 474 #if (defined (TE_I386AIX)                               \
 475      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 476          && !defined (TE_GNU)                           \
 477          && !defined (TE_LINUX)                         \
 478          && !defined (TE_NACL)                          \
 479          && !defined (TE_FreeBSD)                       \
 480          && !defined (TE_DragonFly)                     \
 481          && !defined (TE_NetBSD)))
 482 /* This array holds the chars that always start a comment.  If the
 483    pre-processor is disabled, these aren't very useful.  The option
 484    --divide will remove '/' from this list.  */
 485 const char *i386_comment_chars = "#/";
 486 #define SVR4_COMMENT_CHARS 1
 487 #define PREFIX_SEPARATOR '\\'
 488
 489 #else
 490 const char *i386_comment_chars = "#";
 491 #define PREFIX_SEPARATOR '/'
 492 #endif
 493
 494 /* This array holds the chars that only start a comment at the beginning of
 495    a line.  If the line seems to have the form '# 123 filename'
 496    .line and .file directives will appear in the pre-processed output.
 497    Note that input_file.c hand checks for '#' at the beginning of the
 498    first line of the input file.  This is because the compiler outputs
 499    #NO_APP at the beginning of its output.
 500    Also note that comments started like this one will always work if
 501    '/' isn't otherwise defined.  */
 502 const char line_comment_chars[] = "#/";
 503
 504 const char line_separator_chars[] = ";";
 505
 506 /* Chars that can be used to separate mant from exp in floating point
 507    nums.  */
 508 const char EXP_CHARS[] = "eE";
 509
 510 /* Chars that mean this number is a floating point constant
 511    As in 0f12.456
 512    or    0d1.2345e12.  */
 513 const char FLT_CHARS[] = "fFdDxX";
 514
 515 /* Tables for lexical analysis.  */
 516 static char mnemonic_chars[256];
 517 static char register_chars[256];
 518 static char operand_chars[256];
 519 static char identifier_chars[256];
 520 static char digit_chars[256];
 521
 522 /* Lexical macros.  */
 523 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 524 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 525 #define is_register_char(x) (register_chars[(unsigned char) x])
 526 #define is_space_char(x) ((x) == ' ')
 527 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 528 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 529
 530 /* All non-digit non-letter characters that may occur in an operand.  */
 531 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 532
 533 /* md_assemble() always leaves the strings it's passed unaltered.  To
 534    effect this we maintain a stack of saved characters that we've smashed
 535    with '\0's (indicating end of strings for various sub-fields of the
 536    assembler instruction).  */
 537 static char save_stack[32];
 538 static char *save_stack_p;
 539 #define END_STRING_AND_SAVE(s) \
 540         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 541 #define RESTORE_END_STRING(s) \
 542         do { *(s) = *--save_stack_p; } while (0)
 543
 544 /* The instruction we're assembling.  */
 545 static i386_insn i;
 546
 547 /* Possible templates for current insn.  */
 548 static const templates *current_templates;
 549
 550 /* Per instruction expressionS buffers: max displacements & immediates.  */
 551 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 552 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 553
 554 /* Current operand we are working on.  */
 555 static int this_operand = -1;
 556
 557 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 558    these.  */
 559
 560 enum flag_code {
 561         CODE_32BIT,
 562         CODE_16BIT,
 563         CODE_64BIT };
 564
 565 static enum flag_code flag_code;
 566 static unsigned int object_64bit;
 567 static unsigned int disallow_64bit_reloc;
 568 static int use_rela_relocations = 0;
 569 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 570 static const char *tls_get_addr;
 571
 572 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 573      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 574      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 575
 576 /* The ELF ABI to use.  */
 577 enum x86_elf_abi
 578 {
 579   I386_ABI,
 580   X86_64_ABI,
 581   X86_64_X32_ABI
 582 };
 583
 584 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 585 #endif
 586
 587 #if defined (TE_PE) || defined (TE_PEP)
 588 /* Use big object file format.  */
 589 static int use_big_obj = 0;
 590 #endif
 591
 592 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 593 /* 1 if generating code for a shared library.  */
 594 static int shared = 0;
 595 #endif
 596
 597 /* 1 for intel syntax,
 598    0 if att syntax.  */
 599 static int intel_syntax = 0;
 600
 601 /* 1 for Intel64 ISA,
 602    0 if AMD64 ISA.  */
 603 static int intel64;
 604
 605 /* 1 for intel mnemonic,
 606    0 if att mnemonic.  */
 607 static int intel_mnemonic = !SYSV386_COMPAT;
 608
 609 /* 1 if pseudo registers are permitted.  */
 610 static int allow_pseudo_reg = 0;
 611
 612 /* 1 if register prefix % not required.  */
 613 static int allow_naked_reg = 0;
 614
 615 /* 1 if the assembler should add BND prefix for all control-transferring
 616    instructions supporting it, even if this prefix wasn't specified
 617    explicitly.  */
 618 static int add_bnd_prefix = 0;
 619
 620 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 621 static int allow_index_reg = 0;
 622
 623 /* 1 if the assembler should ignore LOCK prefix, even if it was
 624    specified explicitly.  */
 625 static int omit_lock_prefix = 0;
 626
 627 /* 1 if the assembler should encode lfence, mfence, and sfence as
 628    "lock addl $0, (%{re}sp)".  */
 629 static int avoid_fence = 0;
 630
 631 /* Type of the previous instruction.  */
 632 static struct
 633   {
 634     segT seg;
 635     const char *file;
 636     const char *name;
 637     unsigned int line;
 638     enum last_insn_kind
 639       {
 640         last_insn_other = 0,
 641         last_insn_directive,
 642         last_insn_prefix
 643       } kind;
 644   } last_insn;
 645
 646 /* 1 if the assembler should generate relax relocations.  */
 647
 648 static int generate_relax_relocations
 649   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 650
 651 static enum check_kind
 652   {
 653     check_none = 0,
 654     check_warning,
 655     check_error
 656   }
 657 sse_check, operand_check = check_warning;
 658
 659 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 660 static int align_branch_power = 0;
 661
 662 /* Types of branches to align.  */
 663 enum align_branch_kind
 664   {
 665     align_branch_none = 0,
 666     align_branch_jcc = 1,
 667     align_branch_fused = 2,
 668     align_branch_jmp = 3,
 669     align_branch_call = 4,
 670     align_branch_indirect = 5,
 671     align_branch_ret = 6
 672   };
 673
 674 /* Type bits of branches to align.  */
 675 enum align_branch_bit
 676   {
 677     align_branch_jcc_bit = 1 << align_branch_jcc,
 678     align_branch_fused_bit = 1 << align_branch_fused,
 679     align_branch_jmp_bit = 1 << align_branch_jmp,
 680     align_branch_call_bit = 1 << align_branch_call,
 681     align_branch_indirect_bit = 1 << align_branch_indirect,
 682     align_branch_ret_bit = 1 << align_branch_ret
 683   };
 684
 685 static unsigned int align_branch = (align_branch_jcc_bit
 686                                     | align_branch_fused_bit
 687                                     | align_branch_jmp_bit);
 688
 689 /* The maximum padding size for fused jcc.  CMP like instruction can
 690    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 691    prefixes.   */
 692 #define MAX_FUSED_JCC_PADDING_SIZE 20
 693
 694 /* The maximum number of prefixes added for an instruction.  */
 695 static unsigned int align_branch_prefix_size = 5;
 696
 697 /* Optimization:
 698    1. Clear the REX_W bit with register operand if possible.
 699    2. Above plus use 128bit vector instruction to clear the full vector
 700       register.
 701  */
 702 static int optimize = 0;
 703
 704 /* Optimization:
 705    1. Clear the REX_W bit with register operand if possible.
 706    2. Above plus use 128bit vector instruction to clear the full vector
 707       register.
 708    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 709       "testb $imm7,%r8".
 710  */
 711 static int optimize_for_space = 0;
 712
 713 /* Register prefix used for error message.  */
 714 static const char *register_prefix = "%";
 715
 716 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 717    leave, push, and pop instructions so that gcc has the same stack
 718    frame as in 32 bit mode.  */
 719 static char stackop_size = '\0';
 720
 721 /* Non-zero to optimize code alignment.  */
 722 int optimize_align_code = 1;
 723
 724 /* Non-zero to quieten some warnings.  */
 725 static int quiet_warnings = 0;
 726
 727 /* CPU name.  */
 728 static const char *cpu_arch_name = NULL;
 729 static char *cpu_sub_arch_name = NULL;
 730
 731 /* CPU feature flags.  */
 732 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 733
 734 /* If we have selected a cpu we are generating instructions for.  */
 735 static int cpu_arch_tune_set = 0;
 736
 737 /* Cpu we are generating instructions for.  */
 738 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 739
 740 /* CPU feature flags of cpu we are generating instructions for.  */
 741 static i386_cpu_flags cpu_arch_tune_flags;
 742
 743 /* CPU instruction set architecture used.  */
 744 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 745
 746 /* CPU feature flags of instruction set architecture used.  */
 747 i386_cpu_flags cpu_arch_isa_flags;
 748
 749 /* If set, conditional jumps are not automatically promoted to handle
 750    larger than a byte offset.  */
 751 static unsigned int no_cond_jump_promotion = 0;
 752
 753 /* Encode SSE instructions with VEX prefix.  */
 754 static unsigned int sse2avx;
 755
 756 /* Encode scalar AVX instructions with specific vector length.  */
 757 static enum
 758   {
 759     vex128 = 0,
 760     vex256
 761   } avxscalar;
 762
 763 /* Encode VEX WIG instructions with specific vex.w.  */
 764 static enum
 765   {
 766     vexw0 = 0,
 767     vexw1
 768   } vexwig;
 769
 770 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 771 static enum
 772   {
 773     evexl128 = 0,
 774     evexl256,
 775     evexl512
 776   } evexlig;
 777
 778 /* Encode EVEX WIG instructions with specific evex.w.  */
 779 static enum
 780   {
 781     evexw0 = 0,
 782     evexw1
 783   } evexwig;
 784
 785 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 786 static enum rc_type evexrcig = rne;
 787
 788 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 789 static symbolS *GOT_symbol;
 790
 791 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 792 unsigned int x86_dwarf2_return_column;
 793
 794 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 795 int x86_cie_data_alignment;
 796
 797 /* Interface to relax_segment.
 798    There are 3 major relax states for 386 jump insns because the
 799    different types of jumps add different sizes to frags when we're
 800    figuring out what sort of jump to choose to reach a given label.
 801
 802    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 803    branches which are handled by md_estimate_size_before_relax() and
 804    i386_generic_table_relax_frag().  */
 805
 806 /* Types.  */
 807 #define UNCOND_JUMP 0
 808 #define COND_JUMP 1
 809 #define COND_JUMP86 2
 810 #define BRANCH_PADDING 3
 811 #define BRANCH_PREFIX 4
 812 #define FUSED_JCC_PADDING 5
 813
 814 /* Sizes.  */
 815 #define CODE16  1
 816 #define SMALL   0
 817 #define SMALL16 (SMALL | CODE16)
 818 #define BIG     2
 819 #define BIG16   (BIG | CODE16)
 820
 821 #ifndef INLINE
 822 #ifdef __GNUC__
 823 #define INLINE __inline__
 824 #else
 825 #define INLINE
 826 #endif
 827 #endif
 828
 829 #define ENCODE_RELAX_STATE(type, size) \
 830   ((relax_substateT) (((type) << 2) | (size)))
 831 #define TYPE_FROM_RELAX_STATE(s) \
 832   ((s) >> 2)
 833 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 834     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 835
 836 /* This table is used by relax_frag to promote short jumps to long
 837    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 838    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 839    don't allow a short jump in a 32 bit code segment to be promoted to
 840    a 16 bit offset jump because it's slower (requires data size
 841    prefix), and doesn't work, unless the destination is in the bottom
 842    64k of the code segment (The top 16 bits of eip are zeroed).  */
 843
 844 const relax_typeS md_relax_table[] =
 845 {
 846   /* The fields are:
 847      1) most positive reach of this state,
 848      2) most negative reach of this state,
 849      3) how many bytes this mode will have in the variable part of the frag
 850      4) which index into the table to try if we can't fit into this one.  */
 851
 852   /* UNCOND_JUMP states.  */
 853   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 854   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 855   /* dword jmp adds 4 bytes to frag:
 856      0 extra opcode bytes, 4 displacement bytes.  */
 857   {0, 0, 4, 0},
 858   /* word jmp adds 2 byte2 to frag:
 859      0 extra opcode bytes, 2 displacement bytes.  */
 860   {0, 0, 2, 0},
 861
 862   /* COND_JUMP states.  */
 863   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 864   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 865   /* dword conditionals adds 5 bytes to frag:
 866      1 extra opcode byte, 4 displacement bytes.  */
 867   {0, 0, 5, 0},
 868   /* word conditionals add 3 bytes to frag:
 869      1 extra opcode byte, 2 displacement bytes.  */
 870   {0, 0, 3, 0},
 871
 872   /* COND_JUMP86 states.  */
 873   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 874   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 875   /* dword conditionals adds 5 bytes to frag:
 876      1 extra opcode byte, 4 displacement bytes.  */
 877   {0, 0, 5, 0},
 878   /* word conditionals add 4 bytes to frag:
 879      1 displacement byte and a 3 byte long branch insn.  */
 880   {0, 0, 4, 0}
 881 };
 882
 883 static const arch_entry cpu_arch[] =
 884 {
 885   /* Do not replace the first two entries - i386_target_format()
 886      relies on them being there in this order.  */
 887   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 888     CPU_GENERIC32_FLAGS, 0 },
 889   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 890     CPU_GENERIC64_FLAGS, 0 },
 891   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 892     CPU_NONE_FLAGS, 0 },
 893   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 894     CPU_I186_FLAGS, 0 },
 895   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 896     CPU_I286_FLAGS, 0 },
 897   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 898     CPU_I386_FLAGS, 0 },
 899   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 900     CPU_I486_FLAGS, 0 },
 901   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 902     CPU_I586_FLAGS, 0 },
 903   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 904     CPU_I686_FLAGS, 0 },
 905   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 906     CPU_I586_FLAGS, 0 },
 907   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 908     CPU_PENTIUMPRO_FLAGS, 0 },
 909   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 910     CPU_P2_FLAGS, 0 },
 911   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 912     CPU_P3_FLAGS, 0 },
 913   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 914     CPU_P4_FLAGS, 0 },
 915   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 916     CPU_CORE_FLAGS, 0 },
 917   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 918     CPU_NOCONA_FLAGS, 0 },
 919   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 920     CPU_CORE_FLAGS, 1 },
 921   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 922     CPU_CORE_FLAGS, 0 },
 923   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 924     CPU_CORE2_FLAGS, 1 },
 925   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 926     CPU_CORE2_FLAGS, 0 },
 927   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 928     CPU_COREI7_FLAGS, 0 },
 929   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 930     CPU_L1OM_FLAGS, 0 },
 931   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 932     CPU_K1OM_FLAGS, 0 },
 933   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 934     CPU_IAMCU_FLAGS, 0 },
 935   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 936     CPU_K6_FLAGS, 0 },
 937   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 938     CPU_K6_2_FLAGS, 0 },
 939   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 940     CPU_ATHLON_FLAGS, 0 },
 941   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 942     CPU_K8_FLAGS, 1 },
 943   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 944     CPU_K8_FLAGS, 0 },
 945   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 946     CPU_K8_FLAGS, 0 },
 947   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 948     CPU_AMDFAM10_FLAGS, 0 },
 949   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 950     CPU_BDVER1_FLAGS, 0 },
 951   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 952     CPU_BDVER2_FLAGS, 0 },
 953   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 954     CPU_BDVER3_FLAGS, 0 },
 955   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 956     CPU_BDVER4_FLAGS, 0 },
 957   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
 958     CPU_ZNVER1_FLAGS, 0 },
 959   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
 960     CPU_ZNVER2_FLAGS, 0 },
 961   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 962     CPU_BTVER1_FLAGS, 0 },
 963   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 964     CPU_BTVER2_FLAGS, 0 },
 965   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 966     CPU_8087_FLAGS, 0 },
 967   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 968     CPU_287_FLAGS, 0 },
 969   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 970     CPU_387_FLAGS, 0 },
 971   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
 972     CPU_687_FLAGS, 0 },
 973   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
 974     CPU_CMOV_FLAGS, 0 },
 975   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
 976     CPU_FXSR_FLAGS, 0 },
 977   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 978     CPU_MMX_FLAGS, 0 },
 979   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 980     CPU_SSE_FLAGS, 0 },
 981   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 982     CPU_SSE2_FLAGS, 0 },
 983   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 984     CPU_SSE3_FLAGS, 0 },
 985   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 986     CPU_SSSE3_FLAGS, 0 },
 987   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 988     CPU_SSE4_1_FLAGS, 0 },
 989   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 990     CPU_SSE4_2_FLAGS, 0 },
 991   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 992     CPU_SSE4_2_FLAGS, 0 },
 993   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 994     CPU_AVX_FLAGS, 0 },
 995   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 996     CPU_AVX2_FLAGS, 0 },
 997   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 998     CPU_AVX512F_FLAGS, 0 },
 999   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1000     CPU_AVX512CD_FLAGS, 0 },
1001   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1002     CPU_AVX512ER_FLAGS, 0 },
1003   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1004     CPU_AVX512PF_FLAGS, 0 },
1005   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1006     CPU_AVX512DQ_FLAGS, 0 },
1007   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1008     CPU_AVX512BW_FLAGS, 0 },
1009   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1010     CPU_AVX512VL_FLAGS, 0 },
1011   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1012     CPU_VMX_FLAGS, 0 },
1013   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1014     CPU_VMFUNC_FLAGS, 0 },
1015   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1016     CPU_SMX_FLAGS, 0 },
1017   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1018     CPU_XSAVE_FLAGS, 0 },
1019   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1020     CPU_XSAVEOPT_FLAGS, 0 },
1021   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1022     CPU_XSAVEC_FLAGS, 0 },
1023   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1024     CPU_XSAVES_FLAGS, 0 },
1025   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1026     CPU_AES_FLAGS, 0 },
1027   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1028     CPU_PCLMUL_FLAGS, 0 },
1029   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1030     CPU_PCLMUL_FLAGS, 1 },
1031   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1032     CPU_FSGSBASE_FLAGS, 0 },
1033   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1034     CPU_RDRND_FLAGS, 0 },
1035   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1036     CPU_F16C_FLAGS, 0 },
1037   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1038     CPU_BMI2_FLAGS, 0 },
1039   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1040     CPU_FMA_FLAGS, 0 },
1041   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1042     CPU_FMA4_FLAGS, 0 },
1043   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1044     CPU_XOP_FLAGS, 0 },
1045   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1046     CPU_LWP_FLAGS, 0 },
1047   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1048     CPU_MOVBE_FLAGS, 0 },
1049   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1050     CPU_CX16_FLAGS, 0 },
1051   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1052     CPU_EPT_FLAGS, 0 },
1053   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1054     CPU_LZCNT_FLAGS, 0 },
1055   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1056     CPU_HLE_FLAGS, 0 },
1057   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1058     CPU_RTM_FLAGS, 0 },
1059   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1060     CPU_INVPCID_FLAGS, 0 },
1061   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1062     CPU_CLFLUSH_FLAGS, 0 },
1063   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1064     CPU_NOP_FLAGS, 0 },
1065   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1066     CPU_SYSCALL_FLAGS, 0 },
1067   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1068     CPU_RDTSCP_FLAGS, 0 },
1069   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1070     CPU_3DNOW_FLAGS, 0 },
1071   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1072     CPU_3DNOWA_FLAGS, 0 },
1073   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1074     CPU_PADLOCK_FLAGS, 0 },
1075   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1076     CPU_SVME_FLAGS, 1 },
1077   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1078     CPU_SVME_FLAGS, 0 },
1079   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1080     CPU_SSE4A_FLAGS, 0 },
1081   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1082     CPU_ABM_FLAGS, 0 },
1083   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1084     CPU_BMI_FLAGS, 0 },
1085   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1086     CPU_TBM_FLAGS, 0 },
1087   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1088     CPU_ADX_FLAGS, 0 },
1089   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1090     CPU_RDSEED_FLAGS, 0 },
1091   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1092     CPU_PRFCHW_FLAGS, 0 },
1093   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1094     CPU_SMAP_FLAGS, 0 },
1095   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1096     CPU_MPX_FLAGS, 0 },
1097   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1098     CPU_SHA_FLAGS, 0 },
1099   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1100     CPU_CLFLUSHOPT_FLAGS, 0 },
1101   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1102     CPU_PREFETCHWT1_FLAGS, 0 },
1103   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1104     CPU_SE1_FLAGS, 0 },
1105   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1106     CPU_CLWB_FLAGS, 0 },
1107   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1108     CPU_AVX512IFMA_FLAGS, 0 },
1109   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1110     CPU_AVX512VBMI_FLAGS, 0 },
1111   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1112     CPU_AVX512_4FMAPS_FLAGS, 0 },
1113   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1114     CPU_AVX512_4VNNIW_FLAGS, 0 },
1115   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1116     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1117   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1118     CPU_AVX512_VBMI2_FLAGS, 0 },
1119   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1120     CPU_AVX512_VNNI_FLAGS, 0 },
1121   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1122     CPU_AVX512_BITALG_FLAGS, 0 },
1123   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1124     CPU_CLZERO_FLAGS, 0 },
1125   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1126     CPU_MWAITX_FLAGS, 0 },
1127   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1128     CPU_OSPKE_FLAGS, 0 },
1129   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1130     CPU_RDPID_FLAGS, 0 },
1131   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1132     CPU_PTWRITE_FLAGS, 0 },
1133   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1134     CPU_IBT_FLAGS, 0 },
1135   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1136     CPU_SHSTK_FLAGS, 0 },
1137   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1138     CPU_GFNI_FLAGS, 0 },
1139   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1140     CPU_VAES_FLAGS, 0 },
1141   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1142     CPU_VPCLMULQDQ_FLAGS, 0 },
1143   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1144     CPU_WBNOINVD_FLAGS, 0 },
1145   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1146     CPU_PCONFIG_FLAGS, 0 },
1147   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1148     CPU_WAITPKG_FLAGS, 0 },
1149   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1150     CPU_CLDEMOTE_FLAGS, 0 },
1151   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1152     CPU_MOVDIRI_FLAGS, 0 },
1153   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1154     CPU_MOVDIR64B_FLAGS, 0 },
1155   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1156     CPU_AVX512_BF16_FLAGS, 0 },
1157   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1158     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1159   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1160     CPU_ENQCMD_FLAGS, 0 },
1161   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1162     CPU_RDPRU_FLAGS, 0 },
1163   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1164     CPU_MCOMMIT_FLAGS, 0 },
1165 };
1166
1167 static const noarch_entry cpu_noarch[] =
1168 {
1169   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1170   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1171   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1172   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1173   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1174   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1175   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1176   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1177   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1178   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1179   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1180   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1181   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1182   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1183   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1184   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1185   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1186   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1187   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1188   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1189   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1190   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1191   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1192   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1193   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1194   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1195   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1196   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1197   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1198   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1199   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1200   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1201   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1202   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1203   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1204   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1205   { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1206   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1207 };
1208
1209 #ifdef I386COFF
1210 /* Like s_lcomm_internal in gas/read.c but the alignment string
1211    is allowed to be optional.  */
1212
1213 static symbolS *
1214 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1215 {
1216   addressT align = 0;
1217
1218   SKIP_WHITESPACE ();
1219
1220   if (needs_align
1221       && *input_line_pointer == ',')
1222     {
1223       align = parse_align (needs_align - 1);
1224
1225       if (align == (addressT) -1)
1226         return NULL;
1227     }
1228   else
1229     {
1230       if (size >= 8)
1231         align = 3;
1232       else if (size >= 4)
1233         align = 2;
1234       else if (size >= 2)
1235         align = 1;
1236       else
1237         align = 0;
1238     }
1239
1240   bss_alloc (symbolP, size, align);
1241   return symbolP;
1242 }
1243
1244 static void
1245 pe_lcomm (int needs_align)
1246 {
1247   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1248 }
1249 #endif
1250
1251 const pseudo_typeS md_pseudo_table[] =
1252 {
1253 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1254   {"align", s_align_bytes, 0},
1255 #else
1256   {"align", s_align_ptwo, 0},
1257 #endif
1258   {"arch", set_cpu_arch, 0},
1259 #ifndef I386COFF
1260   {"bss", s_bss, 0},
1261 #else
1262   {"lcomm", pe_lcomm, 1},
1263 #endif
1264   {"ffloat", float_cons, 'f'},
1265   {"dfloat", float_cons, 'd'},
1266   {"tfloat", float_cons, 'x'},
1267   {"value", cons, 2},
1268   {"slong", signed_cons, 4},
1269   {"noopt", s_ignore, 0},
1270   {"optim", s_ignore, 0},
1271   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1272   {"code16", set_code_flag, CODE_16BIT},
1273   {"code32", set_code_flag, CODE_32BIT},
1274 #ifdef BFD64
1275   {"code64", set_code_flag, CODE_64BIT},
1276 #endif
1277   {"intel_syntax", set_intel_syntax, 1},
1278   {"att_syntax", set_intel_syntax, 0},
1279   {"intel_mnemonic", set_intel_mnemonic, 1},
1280   {"att_mnemonic", set_intel_mnemonic, 0},
1281   {"allow_index_reg", set_allow_index_reg, 1},
1282   {"disallow_index_reg", set_allow_index_reg, 0},
1283   {"sse_check", set_check, 0},
1284   {"operand_check", set_check, 1},
1285 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1286   {"largecomm", handle_large_common, 0},
1287 #else
1288   {"file", dwarf2_directive_file, 0},
1289   {"loc", dwarf2_directive_loc, 0},
1290   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1291 #endif
1292 #ifdef TE_PE
1293   {"secrel32", pe_directive_secrel, 0},
1294 #endif
1295   {0, 0, 0}
1296 };
1297
1298 /* For interface with expression ().  */
1299 extern char *input_line_pointer;
1300
1301 /* Hash table for instruction mnemonic lookup.  */
1302 static struct hash_control *op_hash;
1303
1304 /* Hash table for register lookup.  */
1305 static struct hash_control *reg_hash;
1306 \f
1307   /* Various efficient no-op patterns for aligning code labels.
1308      Note: Don't try to assemble the instructions in the comments.
1309      0L and 0w are not legal.  */
1310 static const unsigned char f32_1[] =
1311   {0x90};                               /* nop                  */
1312 static const unsigned char f32_2[] =
1313   {0x66,0x90};                          /* xchg %ax,%ax         */
1314 static const unsigned char f32_3[] =
1315   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1316 static const unsigned char f32_4[] =
1317   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1318 static const unsigned char f32_6[] =
1319   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1320 static const unsigned char f32_7[] =
1321   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1322 static const unsigned char f16_3[] =
1323   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1324 static const unsigned char f16_4[] =
1325   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1326 static const unsigned char jump_disp8[] =
1327   {0xeb};                               /* jmp disp8           */
1328 static const unsigned char jump32_disp32[] =
1329   {0xe9};                               /* jmp disp32          */
1330 static const unsigned char jump16_disp32[] =
1331   {0x66,0xe9};                          /* jmp disp32          */
1332 /* 32-bit NOPs patterns.  */
1333 static const unsigned char *const f32_patt[] = {
1334   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1335 };
1336 /* 16-bit NOPs patterns.  */
1337 static const unsigned char *const f16_patt[] = {
1338   f32_1, f32_2, f16_3, f16_4
1339 };
1340 /* nopl (%[re]ax) */
1341 static const unsigned char alt_3[] =
1342   {0x0f,0x1f,0x00};
1343 /* nopl 0(%[re]ax) */
1344 static const unsigned char alt_4[] =
1345   {0x0f,0x1f,0x40,0x00};
1346 /* nopl 0(%[re]ax,%[re]ax,1) */
1347 static const unsigned char alt_5[] =
1348   {0x0f,0x1f,0x44,0x00,0x00};
1349 /* nopw 0(%[re]ax,%[re]ax,1) */
1350 static const unsigned char alt_6[] =
1351   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1352 /* nopl 0L(%[re]ax) */
1353 static const unsigned char alt_7[] =
1354   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1355 /* nopl 0L(%[re]ax,%[re]ax,1) */
1356 static const unsigned char alt_8[] =
1357   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1358 /* nopw 0L(%[re]ax,%[re]ax,1) */
1359 static const unsigned char alt_9[] =
1360   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1361 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1362 static const unsigned char alt_10[] =
1363   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1364 /* data16 nopw %cs:0L(%eax,%eax,1) */
1365 static const unsigned char alt_11[] =
1366   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1367 /* 32-bit and 64-bit NOPs patterns.  */
1368 static const unsigned char *const alt_patt[] = {
1369   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1370   alt_9, alt_10, alt_11
1371 };
1372
1373 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1374    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1375
1376 static void
1377 i386_output_nops (char *where, const unsigned char *const *patt,
1378                   int count, int max_single_nop_size)
1379
1380 {
1381   /* Place the longer NOP first.  */
1382   int last;
1383   int offset;
1384   const unsigned char *nops;
1385
1386   if (max_single_nop_size < 1)
1387     {
1388       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1389                 max_single_nop_size);
1390       return;
1391     }
1392
1393   nops = patt[max_single_nop_size - 1];
1394
1395   /* Use the smaller one if the requsted one isn't available.  */
1396   if (nops == NULL)
1397     {
1398       max_single_nop_size--;
1399       nops = patt[max_single_nop_size - 1];
1400     }
1401
1402   last = count % max_single_nop_size;
1403
1404   count -= last;
1405   for (offset = 0; offset < count; offset += max_single_nop_size)
1406     memcpy (where + offset, nops, max_single_nop_size);
1407
1408   if (last)
1409     {
1410       nops = patt[last - 1];
1411       if (nops == NULL)
1412         {
1413           /* Use the smaller one plus one-byte NOP if the needed one
1414              isn't available.  */
1415           last--;
1416           nops = patt[last - 1];
1417           memcpy (where + offset, nops, last);
1418           where[offset + last] = *patt[0];
1419         }
1420       else
1421         memcpy (where + offset, nops, last);
1422     }
1423 }
1424
1425 static INLINE int
1426 fits_in_imm7 (offsetT num)
1427 {
1428   return (num & 0x7f) == num;
1429 }
1430
1431 static INLINE int
1432 fits_in_imm31 (offsetT num)
1433 {
1434   return (num & 0x7fffffff) == num;
1435 }
1436
1437 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1438    single NOP instruction LIMIT.  */
1439
1440 void
1441 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1442 {
1443   const unsigned char *const *patt = NULL;
1444   int max_single_nop_size;
1445   /* Maximum number of NOPs before switching to jump over NOPs.  */
1446   int max_number_of_nops;
1447
1448   switch (fragP->fr_type)
1449     {
1450     case rs_fill_nop:
1451     case rs_align_code:
1452       break;
1453     case rs_machine_dependent:
1454       /* Allow NOP padding for jumps and calls.  */
1455       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1456           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1457         break;
1458       /* Fall through.  */
1459     default:
1460       return;
1461     }
1462
1463   /* We need to decide which NOP sequence to use for 32bit and
1464      64bit. When -mtune= is used:
1465
1466      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1467      PROCESSOR_GENERIC32, f32_patt will be used.
1468      2. For the rest, alt_patt will be used.
1469
1470      When -mtune= isn't used, alt_patt will be used if
1471      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1472      be used.
1473
1474      When -march= or .arch is used, we can't use anything beyond
1475      cpu_arch_isa_flags.   */
1476
1477   if (flag_code == CODE_16BIT)
1478     {
1479       patt = f16_patt;
1480       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1481       /* Limit number of NOPs to 2 in 16-bit mode.  */
1482       max_number_of_nops = 2;
1483     }
1484   else
1485     {
1486       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1487         {
1488           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1489           switch (cpu_arch_tune)
1490             {
1491             case PROCESSOR_UNKNOWN:
1492               /* We use cpu_arch_isa_flags to check if we SHOULD
1493                  optimize with nops.  */
1494               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1495                 patt = alt_patt;
1496               else
1497                 patt = f32_patt;
1498               break;
1499             case PROCESSOR_PENTIUM4:
1500             case PROCESSOR_NOCONA:
1501             case PROCESSOR_CORE:
1502             case PROCESSOR_CORE2:
1503             case PROCESSOR_COREI7:
1504             case PROCESSOR_L1OM:
1505             case PROCESSOR_K1OM:
1506             case PROCESSOR_GENERIC64:
1507             case PROCESSOR_K6:
1508             case PROCESSOR_ATHLON:
1509             case PROCESSOR_K8:
1510             case PROCESSOR_AMDFAM10:
1511             case PROCESSOR_BD:
1512             case PROCESSOR_ZNVER:
1513             case PROCESSOR_BT:
1514               patt = alt_patt;
1515               break;
1516             case PROCESSOR_I386:
1517             case PROCESSOR_I486:
1518             case PROCESSOR_PENTIUM:
1519             case PROCESSOR_PENTIUMPRO:
1520             case PROCESSOR_IAMCU:
1521             case PROCESSOR_GENERIC32:
1522               patt = f32_patt;
1523               break;
1524             }
1525         }
1526       else
1527         {
1528           switch (fragP->tc_frag_data.tune)
1529             {
1530             case PROCESSOR_UNKNOWN:
1531               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1532                  PROCESSOR_UNKNOWN.  */
1533               abort ();
1534               break;
1535
1536             case PROCESSOR_I386:
1537             case PROCESSOR_I486:
1538             case PROCESSOR_PENTIUM:
1539             case PROCESSOR_IAMCU:
1540             case PROCESSOR_K6:
1541             case PROCESSOR_ATHLON:
1542             case PROCESSOR_K8:
1543             case PROCESSOR_AMDFAM10:
1544             case PROCESSOR_BD:
1545             case PROCESSOR_ZNVER:
1546             case PROCESSOR_BT:
1547             case PROCESSOR_GENERIC32:
1548               /* We use cpu_arch_isa_flags to check if we CAN optimize
1549                  with nops.  */
1550               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1551                 patt = alt_patt;
1552               else
1553                 patt = f32_patt;
1554               break;
1555             case PROCESSOR_PENTIUMPRO:
1556             case PROCESSOR_PENTIUM4:
1557             case PROCESSOR_NOCONA:
1558             case PROCESSOR_CORE:
1559             case PROCESSOR_CORE2:
1560             case PROCESSOR_COREI7:
1561             case PROCESSOR_L1OM:
1562             case PROCESSOR_K1OM:
1563               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1564                 patt = alt_patt;
1565               else
1566                 patt = f32_patt;
1567               break;
1568             case PROCESSOR_GENERIC64:
1569               patt = alt_patt;
1570               break;
1571             }
1572         }
1573
1574       if (patt == f32_patt)
1575         {
1576           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1577           /* Limit number of NOPs to 2 for older processors.  */
1578           max_number_of_nops = 2;
1579         }
1580       else
1581         {
1582           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1583           /* Limit number of NOPs to 7 for newer processors.  */
1584           max_number_of_nops = 7;
1585         }
1586     }
1587
1588   if (limit == 0)
1589     limit = max_single_nop_size;
1590
1591   if (fragP->fr_type == rs_fill_nop)
1592     {
1593       /* Output NOPs for .nop directive.  */
1594       if (limit > max_single_nop_size)
1595         {
1596           as_bad_where (fragP->fr_file, fragP->fr_line,
1597                         _("invalid single nop size: %d "
1598                           "(expect within [0, %d])"),
1599                         limit, max_single_nop_size);
1600           return;
1601         }
1602     }
1603   else if (fragP->fr_type != rs_machine_dependent)
1604     fragP->fr_var = count;
1605
1606   if ((count / max_single_nop_size) > max_number_of_nops)
1607     {
1608       /* Generate jump over NOPs.  */
1609       offsetT disp = count - 2;
1610       if (fits_in_imm7 (disp))
1611         {
1612           /* Use "jmp disp8" if possible.  */
1613           count = disp;
1614           where[0] = jump_disp8[0];
1615           where[1] = count;
1616           where += 2;
1617         }
1618       else
1619         {
1620           unsigned int size_of_jump;
1621
1622           if (flag_code == CODE_16BIT)
1623             {
1624               where[0] = jump16_disp32[0];
1625               where[1] = jump16_disp32[1];
1626               size_of_jump = 2;
1627             }
1628           else
1629             {
1630               where[0] = jump32_disp32[0];
1631               size_of_jump = 1;
1632             }
1633
1634           count -= size_of_jump + 4;
1635           if (!fits_in_imm31 (count))
1636             {
1637               as_bad_where (fragP->fr_file, fragP->fr_line,
1638                             _("jump over nop padding out of range"));
1639               return;
1640             }
1641
1642           md_number_to_chars (where + size_of_jump, count, 4);
1643           where += size_of_jump + 4;
1644         }
1645     }
1646
1647   /* Generate multiple NOPs.  */
1648   i386_output_nops (where, patt, count, limit);
1649 }
1650
1651 static INLINE int
1652 operand_type_all_zero (const union i386_operand_type *x)
1653 {
1654   switch (ARRAY_SIZE(x->array))
1655     {
1656     case 3:
1657       if (x->array[2])
1658         return 0;
1659       /* Fall through.  */
1660     case 2:
1661       if (x->array[1])
1662         return 0;
1663       /* Fall through.  */
1664     case 1:
1665       return !x->array[0];
1666     default:
1667       abort ();
1668     }
1669 }
1670
1671 static INLINE void
1672 operand_type_set (union i386_operand_type *x, unsigned int v)
1673 {
1674   switch (ARRAY_SIZE(x->array))
1675     {
1676     case 3:
1677       x->array[2] = v;
1678       /* Fall through.  */
1679     case 2:
1680       x->array[1] = v;
1681       /* Fall through.  */
1682     case 1:
1683       x->array[0] = v;
1684       /* Fall through.  */
1685       break;
1686     default:
1687       abort ();
1688     }
1689
1690   x->bitfield.class = ClassNone;
1691   x->bitfield.instance = InstanceNone;
1692 }
1693
1694 static INLINE int
1695 operand_type_equal (const union i386_operand_type *x,
1696                     const union i386_operand_type *y)
1697 {
1698   switch (ARRAY_SIZE(x->array))
1699     {
1700     case 3:
1701       if (x->array[2] != y->array[2])
1702         return 0;
1703       /* Fall through.  */
1704     case 2:
1705       if (x->array[1] != y->array[1])
1706         return 0;
1707       /* Fall through.  */
1708     case 1:
1709       return x->array[0] == y->array[0];
1710       break;
1711     default:
1712       abort ();
1713     }
1714 }
1715
1716 static INLINE int
1717 cpu_flags_all_zero (const union i386_cpu_flags *x)
1718 {
1719   switch (ARRAY_SIZE(x->array))
1720     {
1721     case 4:
1722       if (x->array[3])
1723         return 0;
1724       /* Fall through.  */
1725     case 3:
1726       if (x->array[2])
1727         return 0;
1728       /* Fall through.  */
1729     case 2:
1730       if (x->array[1])
1731         return 0;
1732       /* Fall through.  */
1733     case 1:
1734       return !x->array[0];
1735     default:
1736       abort ();
1737     }
1738 }
1739
1740 static INLINE int
1741 cpu_flags_equal (const union i386_cpu_flags *x,
1742                  const union i386_cpu_flags *y)
1743 {
1744   switch (ARRAY_SIZE(x->array))
1745     {
1746     case 4:
1747       if (x->array[3] != y->array[3])
1748         return 0;
1749       /* Fall through.  */
1750     case 3:
1751       if (x->array[2] != y->array[2])
1752         return 0;
1753       /* Fall through.  */
1754     case 2:
1755       if (x->array[1] != y->array[1])
1756         return 0;
1757       /* Fall through.  */
1758     case 1:
1759       return x->array[0] == y->array[0];
1760       break;
1761     default:
1762       abort ();
1763     }
1764 }
1765
1766 static INLINE int
1767 cpu_flags_check_cpu64 (i386_cpu_flags f)
1768 {
1769   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1770            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1771 }
1772
1773 static INLINE i386_cpu_flags
1774 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1775 {
1776   switch (ARRAY_SIZE (x.array))
1777     {
1778     case 4:
1779       x.array [3] &= y.array [3];
1780       /* Fall through.  */
1781     case 3:
1782       x.array [2] &= y.array [2];
1783       /* Fall through.  */
1784     case 2:
1785       x.array [1] &= y.array [1];
1786       /* Fall through.  */
1787     case 1:
1788       x.array [0] &= y.array [0];
1789       break;
1790     default:
1791       abort ();
1792     }
1793   return x;
1794 }
1795
1796 static INLINE i386_cpu_flags
1797 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1798 {
1799   switch (ARRAY_SIZE (x.array))
1800     {
1801     case 4:
1802       x.array [3] |= y.array [3];
1803       /* Fall through.  */
1804     case 3:
1805       x.array [2] |= y.array [2];
1806       /* Fall through.  */
1807     case 2:
1808       x.array [1] |= y.array [1];
1809       /* Fall through.  */
1810     case 1:
1811       x.array [0] |= y.array [0];
1812       break;
1813     default:
1814       abort ();
1815     }
1816   return x;
1817 }
1818
1819 static INLINE i386_cpu_flags
1820 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1821 {
1822   switch (ARRAY_SIZE (x.array))
1823     {
1824     case 4:
1825       x.array [3] &= ~y.array [3];
1826       /* Fall through.  */
1827     case 3:
1828       x.array [2] &= ~y.array [2];
1829       /* Fall through.  */
1830     case 2:
1831       x.array [1] &= ~y.array [1];
1832       /* Fall through.  */
1833     case 1:
1834       x.array [0] &= ~y.array [0];
1835       break;
1836     default:
1837       abort ();
1838     }
1839   return x;
1840 }
1841
1842 #define CPU_FLAGS_ARCH_MATCH            0x1
1843 #define CPU_FLAGS_64BIT_MATCH           0x2
1844
1845 #define CPU_FLAGS_PERFECT_MATCH \
1846   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1847
1848 /* Return CPU flags match bits. */
1849
1850 static int
1851 cpu_flags_match (const insn_template *t)
1852 {
1853   i386_cpu_flags x = t->cpu_flags;
1854   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1855
1856   x.bitfield.cpu64 = 0;
1857   x.bitfield.cpuno64 = 0;
1858
1859   if (cpu_flags_all_zero (&x))
1860     {
1861       /* This instruction is available on all archs.  */
1862       match |= CPU_FLAGS_ARCH_MATCH;
1863     }
1864   else
1865     {
1866       /* This instruction is available only on some archs.  */
1867       i386_cpu_flags cpu = cpu_arch_flags;
1868
1869       /* AVX512VL is no standalone feature - match it and then strip it.  */
1870       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1871         return match;
1872       x.bitfield.cpuavx512vl = 0;
1873
1874       cpu = cpu_flags_and (x, cpu);
1875       if (!cpu_flags_all_zero (&cpu))
1876         {
1877           if (x.bitfield.cpuavx)
1878             {
1879               /* We need to check a few extra flags with AVX.  */
1880               if (cpu.bitfield.cpuavx
1881                   && (!t->opcode_modifier.sse2avx || sse2avx)
1882                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1883                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1884                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1885                 match |= CPU_FLAGS_ARCH_MATCH;
1886             }
1887           else if (x.bitfield.cpuavx512f)
1888             {
1889               /* We need to check a few extra flags with AVX512F.  */
1890               if (cpu.bitfield.cpuavx512f
1891                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1892                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1893                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1894                 match |= CPU_FLAGS_ARCH_MATCH;
1895             }
1896           else
1897             match |= CPU_FLAGS_ARCH_MATCH;
1898         }
1899     }
1900   return match;
1901 }
1902
1903 static INLINE i386_operand_type
1904 operand_type_and (i386_operand_type x, i386_operand_type y)
1905 {
1906   if (x.bitfield.class != y.bitfield.class)
1907     x.bitfield.class = ClassNone;
1908   if (x.bitfield.instance != y.bitfield.instance)
1909     x.bitfield.instance = InstanceNone;
1910
1911   switch (ARRAY_SIZE (x.array))
1912     {
1913     case 3:
1914       x.array [2] &= y.array [2];
1915       /* Fall through.  */
1916     case 2:
1917       x.array [1] &= y.array [1];
1918       /* Fall through.  */
1919     case 1:
1920       x.array [0] &= y.array [0];
1921       break;
1922     default:
1923       abort ();
1924     }
1925   return x;
1926 }
1927
1928 static INLINE i386_operand_type
1929 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1930 {
1931   gas_assert (y.bitfield.class == ClassNone);
1932   gas_assert (y.bitfield.instance == InstanceNone);
1933
1934   switch (ARRAY_SIZE (x.array))
1935     {
1936     case 3:
1937       x.array [2] &= ~y.array [2];
1938       /* Fall through.  */
1939     case 2:
1940       x.array [1] &= ~y.array [1];
1941       /* Fall through.  */
1942     case 1:
1943       x.array [0] &= ~y.array [0];
1944       break;
1945     default:
1946       abort ();
1947     }
1948   return x;
1949 }
1950
1951 static INLINE i386_operand_type
1952 operand_type_or (i386_operand_type x, i386_operand_type y)
1953 {
1954   gas_assert (x.bitfield.class == ClassNone ||
1955               y.bitfield.class == ClassNone ||
1956               x.bitfield.class == y.bitfield.class);
1957   gas_assert (x.bitfield.instance == InstanceNone ||
1958               y.bitfield.instance == InstanceNone ||
1959               x.bitfield.instance == y.bitfield.instance);
1960
1961   switch (ARRAY_SIZE (x.array))
1962     {
1963     case 3:
1964       x.array [2] |= y.array [2];
1965       /* Fall through.  */
1966     case 2:
1967       x.array [1] |= y.array [1];
1968       /* Fall through.  */
1969     case 1:
1970       x.array [0] |= y.array [0];
1971       break;
1972     default:
1973       abort ();
1974     }
1975   return x;
1976 }
1977
1978 static INLINE i386_operand_type
1979 operand_type_xor (i386_operand_type x, i386_operand_type y)
1980 {
1981   gas_assert (y.bitfield.class == ClassNone);
1982   gas_assert (y.bitfield.instance == InstanceNone);
1983
1984   switch (ARRAY_SIZE (x.array))
1985     {
1986     case 3:
1987       x.array [2] ^= y.array [2];
1988       /* Fall through.  */
1989     case 2:
1990       x.array [1] ^= y.array [1];
1991       /* Fall through.  */
1992     case 1:
1993       x.array [0] ^= y.array [0];
1994       break;
1995     default:
1996       abort ();
1997     }
1998   return x;
1999 }
2000
2001 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2002 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2003 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2004 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2005 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2006 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2007 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2008 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2009 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2010 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2011 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2012 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2013 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2014 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2015 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2016 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2017 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2018
2019 enum operand_type
2020 {
2021   reg,
2022   imm,
2023   disp,
2024   anymem
2025 };
2026
2027 static INLINE int
2028 operand_type_check (i386_operand_type t, enum operand_type c)
2029 {
2030   switch (c)
2031     {
2032     case reg:
2033       return t.bitfield.class == Reg;
2034
2035     case imm:
2036       return (t.bitfield.imm8
2037               || t.bitfield.imm8s
2038               || t.bitfield.imm16
2039               || t.bitfield.imm32
2040               || t.bitfield.imm32s
2041               || t.bitfield.imm64);
2042
2043     case disp:
2044       return (t.bitfield.disp8
2045               || t.bitfield.disp16
2046               || t.bitfield.disp32
2047               || t.bitfield.disp32s
2048               || t.bitfield.disp64);
2049
2050     case anymem:
2051       return (t.bitfield.disp8
2052               || t.bitfield.disp16
2053               || t.bitfield.disp32
2054               || t.bitfield.disp32s
2055               || t.bitfield.disp64
2056               || t.bitfield.baseindex);
2057
2058     default:
2059       abort ();
2060     }
2061
2062   return 0;
2063 }
2064
2065 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2066    between operand GIVEN and opeand WANTED for instruction template T.  */
2067
2068 static INLINE int
2069 match_operand_size (const insn_template *t, unsigned int wanted,
2070                     unsigned int given)
2071 {
2072   return !((i.types[given].bitfield.byte
2073             && !t->operand_types[wanted].bitfield.byte)
2074            || (i.types[given].bitfield.word
2075                && !t->operand_types[wanted].bitfield.word)
2076            || (i.types[given].bitfield.dword
2077                && !t->operand_types[wanted].bitfield.dword)
2078            || (i.types[given].bitfield.qword
2079                && !t->operand_types[wanted].bitfield.qword)
2080            || (i.types[given].bitfield.tbyte
2081                && !t->operand_types[wanted].bitfield.tbyte));
2082 }
2083
2084 /* Return 1 if there is no conflict in SIMD register between operand
2085    GIVEN and opeand WANTED for instruction template T.  */
2086
2087 static INLINE int
2088 match_simd_size (const insn_template *t, unsigned int wanted,
2089                  unsigned int given)
2090 {
2091   return !((i.types[given].bitfield.xmmword
2092             && !t->operand_types[wanted].bitfield.xmmword)
2093            || (i.types[given].bitfield.ymmword
2094                && !t->operand_types[wanted].bitfield.ymmword)
2095            || (i.types[given].bitfield.zmmword
2096                && !t->operand_types[wanted].bitfield.zmmword));
2097 }
2098
2099 /* Return 1 if there is no conflict in any size between operand GIVEN
2100    and opeand WANTED for instruction template T.  */
2101
2102 static INLINE int
2103 match_mem_size (const insn_template *t, unsigned int wanted,
2104                 unsigned int given)
2105 {
2106   return (match_operand_size (t, wanted, given)
2107           && !((i.types[given].bitfield.unspecified
2108                 && !i.broadcast
2109                 && !t->operand_types[wanted].bitfield.unspecified)
2110                || (i.types[given].bitfield.fword
2111                    && !t->operand_types[wanted].bitfield.fword)
2112                /* For scalar opcode templates to allow register and memory
2113                   operands at the same time, some special casing is needed
2114                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2115                   down-conversion vpmov*.  */
2116                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2117                     && !t->opcode_modifier.broadcast
2118                     && (t->operand_types[wanted].bitfield.byte
2119                         || t->operand_types[wanted].bitfield.word
2120                         || t->operand_types[wanted].bitfield.dword
2121                         || t->operand_types[wanted].bitfield.qword))
2122                    ? (i.types[given].bitfield.xmmword
2123                       || i.types[given].bitfield.ymmword
2124                       || i.types[given].bitfield.zmmword)
2125                    : !match_simd_size(t, wanted, given))));
2126 }
2127
2128 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2129    operands for instruction template T, and it has MATCH_REVERSE set if there
2130    is no size conflict on any operands for the template with operands reversed
2131    (and the template allows for reversing in the first place).  */
2132
2133 #define MATCH_STRAIGHT 1
2134 #define MATCH_REVERSE  2
2135
2136 static INLINE unsigned int
2137 operand_size_match (const insn_template *t)
2138 {
2139   unsigned int j, match = MATCH_STRAIGHT;
2140
2141   /* Don't check non-absolute jump instructions.  */
2142   if (t->opcode_modifier.jump
2143       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2144     return match;
2145
2146   /* Check memory and accumulator operand size.  */
2147   for (j = 0; j < i.operands; j++)
2148     {
2149       if (i.types[j].bitfield.class != Reg
2150           && i.types[j].bitfield.class != RegSIMD
2151           && t->opcode_modifier.anysize)
2152         continue;
2153
2154       if (t->operand_types[j].bitfield.class == Reg
2155           && !match_operand_size (t, j, j))
2156         {
2157           match = 0;
2158           break;
2159         }
2160
2161       if (t->operand_types[j].bitfield.class == RegSIMD
2162           && !match_simd_size (t, j, j))
2163         {
2164           match = 0;
2165           break;
2166         }
2167
2168       if (t->operand_types[j].bitfield.instance == Accum
2169           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2170         {
2171           match = 0;
2172           break;
2173         }
2174
2175       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2176         {
2177           match = 0;
2178           break;
2179         }
2180     }
2181
2182   if (!t->opcode_modifier.d)
2183     {
2184 mismatch:
2185       if (!match)
2186         i.error = operand_size_mismatch;
2187       return match;
2188     }
2189
2190   /* Check reverse.  */
2191   gas_assert (i.operands >= 2 && i.operands <= 3);
2192
2193   for (j = 0; j < i.operands; j++)
2194     {
2195       unsigned int given = i.operands - j - 1;
2196
2197       if (t->operand_types[j].bitfield.class == Reg
2198           && !match_operand_size (t, j, given))
2199         goto mismatch;
2200
2201       if (t->operand_types[j].bitfield.class == RegSIMD
2202           && !match_simd_size (t, j, given))
2203         goto mismatch;
2204
2205       if (t->operand_types[j].bitfield.instance == Accum
2206           && (!match_operand_size (t, j, given)
2207               || !match_simd_size (t, j, given)))
2208         goto mismatch;
2209
2210       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2211         goto mismatch;
2212     }
2213
2214   return match | MATCH_REVERSE;
2215 }
2216
2217 static INLINE int
2218 operand_type_match (i386_operand_type overlap,
2219                     i386_operand_type given)
2220 {
2221   i386_operand_type temp = overlap;
2222
2223   temp.bitfield.unspecified = 0;
2224   temp.bitfield.byte = 0;
2225   temp.bitfield.word = 0;
2226   temp.bitfield.dword = 0;
2227   temp.bitfield.fword = 0;
2228   temp.bitfield.qword = 0;
2229   temp.bitfield.tbyte = 0;
2230   temp.bitfield.xmmword = 0;
2231   temp.bitfield.ymmword = 0;
2232   temp.bitfield.zmmword = 0;
2233   if (operand_type_all_zero (&temp))
2234     goto mismatch;
2235
2236   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2237     return 1;
2238
2239 mismatch:
2240   i.error = operand_type_mismatch;
2241   return 0;
2242 }
2243
2244 /* If given types g0 and g1 are registers they must be of the same type
2245    unless the expected operand type register overlap is null.
2246    Memory operand size of certain SIMD instructions is also being checked
2247    here.  */
2248
2249 static INLINE int
2250 operand_type_register_match (i386_operand_type g0,
2251                              i386_operand_type t0,
2252                              i386_operand_type g1,
2253                              i386_operand_type t1)
2254 {
2255   if (g0.bitfield.class != Reg
2256       && g0.bitfield.class != RegSIMD
2257       && (!operand_type_check (g0, anymem)
2258           || g0.bitfield.unspecified
2259           || t0.bitfield.class != RegSIMD))
2260     return 1;
2261
2262   if (g1.bitfield.class != Reg
2263       && g1.bitfield.class != RegSIMD
2264       && (!operand_type_check (g1, anymem)
2265           || g1.bitfield.unspecified
2266           || t1.bitfield.class != RegSIMD))
2267     return 1;
2268
2269   if (g0.bitfield.byte == g1.bitfield.byte
2270       && g0.bitfield.word == g1.bitfield.word
2271       && g0.bitfield.dword == g1.bitfield.dword
2272       && g0.bitfield.qword == g1.bitfield.qword
2273       && g0.bitfield.xmmword == g1.bitfield.xmmword
2274       && g0.bitfield.ymmword == g1.bitfield.ymmword
2275       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2276     return 1;
2277
2278   if (!(t0.bitfield.byte & t1.bitfield.byte)
2279       && !(t0.bitfield.word & t1.bitfield.word)
2280       && !(t0.bitfield.dword & t1.bitfield.dword)
2281       && !(t0.bitfield.qword & t1.bitfield.qword)
2282       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2283       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2284       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2285     return 1;
2286
2287   i.error = register_type_mismatch;
2288
2289   return 0;
2290 }
2291
2292 static INLINE unsigned int
2293 register_number (const reg_entry *r)
2294 {
2295   unsigned int nr = r->reg_num;
2296
2297   if (r->reg_flags & RegRex)
2298     nr += 8;
2299
2300   if (r->reg_flags & RegVRex)
2301     nr += 16;
2302
2303   return nr;
2304 }
2305
2306 static INLINE unsigned int
2307 mode_from_disp_size (i386_operand_type t)
2308 {
2309   if (t.bitfield.disp8)
2310     return 1;
2311   else if (t.bitfield.disp16
2312            || t.bitfield.disp32
2313            || t.bitfield.disp32s)
2314     return 2;
2315   else
2316     return 0;
2317 }
2318
2319 static INLINE int
2320 fits_in_signed_byte (addressT num)
2321 {
2322   return num + 0x80 <= 0xff;
2323 }
2324
2325 static INLINE int
2326 fits_in_unsigned_byte (addressT num)
2327 {
2328   return num <= 0xff;
2329 }
2330
2331 static INLINE int
2332 fits_in_unsigned_word (addressT num)
2333 {
2334   return num <= 0xffff;
2335 }
2336
2337 static INLINE int
2338 fits_in_signed_word (addressT num)
2339 {
2340   return num + 0x8000 <= 0xffff;
2341 }
2342
2343 static INLINE int
2344 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2345 {
2346 #ifndef BFD64
2347   return 1;
2348 #else
2349   return num + 0x80000000 <= 0xffffffff;
2350 #endif
2351 }                               /* fits_in_signed_long() */
2352
2353 static INLINE int
2354 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2355 {
2356 #ifndef BFD64
2357   return 1;
2358 #else
2359   return num <= 0xffffffff;
2360 #endif
2361 }                               /* fits_in_unsigned_long() */
2362
2363 static INLINE int
2364 fits_in_disp8 (offsetT num)
2365 {
2366   int shift = i.memshift;
2367   unsigned int mask;
2368
2369   if (shift == -1)
2370     abort ();
2371
2372   mask = (1 << shift) - 1;
2373
2374   /* Return 0 if NUM isn't properly aligned.  */
2375   if ((num & mask))
2376     return 0;
2377
2378   /* Check if NUM will fit in 8bit after shift.  */
2379   return fits_in_signed_byte (num >> shift);
2380 }
2381
2382 static INLINE int
2383 fits_in_imm4 (offsetT num)
2384 {
2385   return (num & 0xf) == num;
2386 }
2387
2388 static i386_operand_type
2389 smallest_imm_type (offsetT num)
2390 {
2391   i386_operand_type t;
2392
2393   operand_type_set (&t, 0);
2394   t.bitfield.imm64 = 1;
2395
2396   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2397     {
2398       /* This code is disabled on the 486 because all the Imm1 forms
2399          in the opcode table are slower on the i486.  They're the
2400          versions with the implicitly specified single-position
2401          displacement, which has another syntax if you really want to
2402          use that form.  */
2403       t.bitfield.imm1 = 1;
2404       t.bitfield.imm8 = 1;
2405       t.bitfield.imm8s = 1;
2406       t.bitfield.imm16 = 1;
2407       t.bitfield.imm32 = 1;
2408       t.bitfield.imm32s = 1;
2409     }
2410   else if (fits_in_signed_byte (num))
2411     {
2412       t.bitfield.imm8 = 1;
2413       t.bitfield.imm8s = 1;
2414       t.bitfield.imm16 = 1;
2415       t.bitfield.imm32 = 1;
2416       t.bitfield.imm32s = 1;
2417     }
2418   else if (fits_in_unsigned_byte (num))
2419     {
2420       t.bitfield.imm8 = 1;
2421       t.bitfield.imm16 = 1;
2422       t.bitfield.imm32 = 1;
2423       t.bitfield.imm32s = 1;
2424     }
2425   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2426     {
2427       t.bitfield.imm16 = 1;
2428       t.bitfield.imm32 = 1;
2429       t.bitfield.imm32s = 1;
2430     }
2431   else if (fits_in_signed_long (num))
2432     {
2433       t.bitfield.imm32 = 1;
2434       t.bitfield.imm32s = 1;
2435     }
2436   else if (fits_in_unsigned_long (num))
2437     t.bitfield.imm32 = 1;
2438
2439   return t;
2440 }
2441
2442 static offsetT
2443 offset_in_range (offsetT val, int size)
2444 {
2445   addressT mask;
2446
2447   switch (size)
2448     {
2449     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2450     case 2: mask = ((addressT) 1 << 16) - 1; break;
2451     case 4: mask = ((addressT) 2 << 31) - 1; break;
2452 #ifdef BFD64
2453     case 8: mask = ((addressT) 2 << 63) - 1; break;
2454 #endif
2455     default: abort ();
2456     }
2457
2458 #ifdef BFD64
2459   /* If BFD64, sign extend val for 32bit address mode.  */
2460   if (flag_code != CODE_64BIT
2461       || i.prefix[ADDR_PREFIX])
2462     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2463       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2464 #endif
2465
2466   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2467     {
2468       char buf1[40], buf2[40];
2469
2470       sprint_value (buf1, val);
2471       sprint_value (buf2, val & mask);
2472       as_warn (_("%s shortened to %s"), buf1, buf2);
2473     }
2474   return val & mask;
2475 }
2476
2477 enum PREFIX_GROUP
2478 {
2479   PREFIX_EXIST = 0,
2480   PREFIX_LOCK,
2481   PREFIX_REP,
2482   PREFIX_DS,
2483   PREFIX_OTHER
2484 };
2485
2486 /* Returns
2487    a. PREFIX_EXIST if attempting to add a prefix where one from the
2488    same class already exists.
2489    b. PREFIX_LOCK if lock prefix is added.
2490    c. PREFIX_REP if rep/repne prefix is added.
2491    d. PREFIX_DS if ds prefix is added.
2492    e. PREFIX_OTHER if other prefix is added.
2493  */
2494
2495 static enum PREFIX_GROUP
2496 add_prefix (unsigned int prefix)
2497 {
2498   enum PREFIX_GROUP ret = PREFIX_OTHER;
2499   unsigned int q;
2500
2501   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2502       && flag_code == CODE_64BIT)
2503     {
2504       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2505           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2506           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2507           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2508         ret = PREFIX_EXIST;
2509       q = REX_PREFIX;
2510     }
2511   else
2512     {
2513       switch (prefix)
2514         {
2515         default:
2516           abort ();
2517
2518         case DS_PREFIX_OPCODE:
2519           ret = PREFIX_DS;
2520           /* Fall through.  */
2521         case CS_PREFIX_OPCODE:
2522         case ES_PREFIX_OPCODE:
2523         case FS_PREFIX_OPCODE:
2524         case GS_PREFIX_OPCODE:
2525         case SS_PREFIX_OPCODE:
2526           q = SEG_PREFIX;
2527           break;
2528
2529         case REPNE_PREFIX_OPCODE:
2530         case REPE_PREFIX_OPCODE:
2531           q = REP_PREFIX;
2532           ret = PREFIX_REP;
2533           break;
2534
2535         case LOCK_PREFIX_OPCODE:
2536           q = LOCK_PREFIX;
2537           ret = PREFIX_LOCK;
2538           break;
2539
2540         case FWAIT_OPCODE:
2541           q = WAIT_PREFIX;
2542           break;
2543
2544         case ADDR_PREFIX_OPCODE:
2545           q = ADDR_PREFIX;
2546           break;
2547
2548         case DATA_PREFIX_OPCODE:
2549           q = DATA_PREFIX;
2550           break;
2551         }
2552       if (i.prefix[q] != 0)
2553         ret = PREFIX_EXIST;
2554     }
2555
2556   if (ret)
2557     {
2558       if (!i.prefix[q])
2559         ++i.prefixes;
2560       i.prefix[q] |= prefix;
2561     }
2562   else
2563     as_bad (_("same type of prefix used twice"));
2564
2565   return ret;
2566 }
2567
2568 static void
2569 update_code_flag (int value, int check)
2570 {
2571   PRINTF_LIKE ((*as_error));
2572
2573   flag_code = (enum flag_code) value;
2574   if (flag_code == CODE_64BIT)
2575     {
2576       cpu_arch_flags.bitfield.cpu64 = 1;
2577       cpu_arch_flags.bitfield.cpuno64 = 0;
2578     }
2579   else
2580     {
2581       cpu_arch_flags.bitfield.cpu64 = 0;
2582       cpu_arch_flags.bitfield.cpuno64 = 1;
2583     }
2584   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2585     {
2586       if (check)
2587         as_error = as_fatal;
2588       else
2589         as_error = as_bad;
2590       (*as_error) (_("64bit mode not supported on `%s'."),
2591                    cpu_arch_name ? cpu_arch_name : default_arch);
2592     }
2593   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2594     {
2595       if (check)
2596         as_error = as_fatal;
2597       else
2598         as_error = as_bad;
2599       (*as_error) (_("32bit mode not supported on `%s'."),
2600                    cpu_arch_name ? cpu_arch_name : default_arch);
2601     }
2602   stackop_size = '\0';
2603 }
2604
2605 static void
2606 set_code_flag (int value)
2607 {
2608   update_code_flag (value, 0);
2609 }
2610
2611 static void
2612 set_16bit_gcc_code_flag (int new_code_flag)
2613 {
2614   flag_code = (enum flag_code) new_code_flag;
2615   if (flag_code != CODE_16BIT)
2616     abort ();
2617   cpu_arch_flags.bitfield.cpu64 = 0;
2618   cpu_arch_flags.bitfield.cpuno64 = 1;
2619   stackop_size = LONG_MNEM_SUFFIX;
2620 }
2621
2622 static void
2623 set_intel_syntax (int syntax_flag)
2624 {
2625   /* Find out if register prefixing is specified.  */
2626   int ask_naked_reg = 0;
2627
2628   SKIP_WHITESPACE ();
2629   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2630     {
2631       char *string;
2632       int e = get_symbol_name (&string);
2633
2634       if (strcmp (string, "prefix") == 0)
2635         ask_naked_reg = 1;
2636       else if (strcmp (string, "noprefix") == 0)
2637         ask_naked_reg = -1;
2638       else
2639         as_bad (_("bad argument to syntax directive."));
2640       (void) restore_line_pointer (e);
2641     }
2642   demand_empty_rest_of_line ();
2643
2644   intel_syntax = syntax_flag;
2645
2646   if (ask_naked_reg == 0)
2647     allow_naked_reg = (intel_syntax
2648                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2649   else
2650     allow_naked_reg = (ask_naked_reg < 0);
2651
2652   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2653
2654   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2655   identifier_chars['$'] = intel_syntax ? '$' : 0;
2656   register_prefix = allow_naked_reg ? "" : "%";
2657 }
2658
2659 static void
2660 set_intel_mnemonic (int mnemonic_flag)
2661 {
2662   intel_mnemonic = mnemonic_flag;
2663 }
2664
2665 static void
2666 set_allow_index_reg (int flag)
2667 {
2668   allow_index_reg = flag;
2669 }
2670
2671 static void
2672 set_check (int what)
2673 {
2674   enum check_kind *kind;
2675   const char *str;
2676
2677   if (what)
2678     {
2679       kind = &operand_check;
2680       str = "operand";
2681     }
2682   else
2683     {
2684       kind = &sse_check;
2685       str = "sse";
2686     }
2687
2688   SKIP_WHITESPACE ();
2689
2690   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2691     {
2692       char *string;
2693       int e = get_symbol_name (&string);
2694
2695       if (strcmp (string, "none") == 0)
2696         *kind = check_none;
2697       else if (strcmp (string, "warning") == 0)
2698         *kind = check_warning;
2699       else if (strcmp (string, "error") == 0)
2700         *kind = check_error;
2701       else
2702         as_bad (_("bad argument to %s_check directive."), str);
2703       (void) restore_line_pointer (e);
2704     }
2705   else
2706     as_bad (_("missing argument for %s_check directive"), str);
2707
2708   demand_empty_rest_of_line ();
2709 }
2710
2711 static void
2712 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2713                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2714 {
2715 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2716   static const char *arch;
2717
2718   /* Intel LIOM is only supported on ELF.  */
2719   if (!IS_ELF)
2720     return;
2721
2722   if (!arch)
2723     {
2724       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2725          use default_arch.  */
2726       arch = cpu_arch_name;
2727       if (!arch)
2728         arch = default_arch;
2729     }
2730
2731   /* If we are targeting Intel MCU, we must enable it.  */
2732   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2733       || new_flag.bitfield.cpuiamcu)
2734     return;
2735
2736   /* If we are targeting Intel L1OM, we must enable it.  */
2737   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2738       || new_flag.bitfield.cpul1om)
2739     return;
2740
2741   /* If we are targeting Intel K1OM, we must enable it.  */
2742   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2743       || new_flag.bitfield.cpuk1om)
2744     return;
2745
2746   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2747 #endif
2748 }
2749
2750 static void
2751 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2752 {
2753   SKIP_WHITESPACE ();
2754
2755   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2756     {
2757       char *string;
2758       int e = get_symbol_name (&string);
2759       unsigned int j;
2760       i386_cpu_flags flags;
2761
2762       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2763         {
2764           if (strcmp (string, cpu_arch[j].name) == 0)
2765             {
2766               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2767
2768               if (*string != '.')
2769                 {
2770                   cpu_arch_name = cpu_arch[j].name;
2771                   cpu_sub_arch_name = NULL;
2772                   cpu_arch_flags = cpu_arch[j].flags;
2773                   if (flag_code == CODE_64BIT)
2774                     {
2775                       cpu_arch_flags.bitfield.cpu64 = 1;
2776                       cpu_arch_flags.bitfield.cpuno64 = 0;
2777                     }
2778                   else
2779                     {
2780                       cpu_arch_flags.bitfield.cpu64 = 0;
2781                       cpu_arch_flags.bitfield.cpuno64 = 1;
2782                     }
2783                   cpu_arch_isa = cpu_arch[j].type;
2784                   cpu_arch_isa_flags = cpu_arch[j].flags;
2785                   if (!cpu_arch_tune_set)
2786                     {
2787                       cpu_arch_tune = cpu_arch_isa;
2788                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2789                     }
2790                   break;
2791                 }
2792
2793               flags = cpu_flags_or (cpu_arch_flags,
2794                                     cpu_arch[j].flags);
2795
2796               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2797                 {
2798                   if (cpu_sub_arch_name)
2799                     {
2800                       char *name = cpu_sub_arch_name;
2801                       cpu_sub_arch_name = concat (name,
2802                                                   cpu_arch[j].name,
2803                                                   (const char *) NULL);
2804                       free (name);
2805                     }
2806                   else
2807                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2808                   cpu_arch_flags = flags;
2809                   cpu_arch_isa_flags = flags;
2810                 }
2811               else
2812                 cpu_arch_isa_flags
2813                   = cpu_flags_or (cpu_arch_isa_flags,
2814                                   cpu_arch[j].flags);
2815               (void) restore_line_pointer (e);
2816               demand_empty_rest_of_line ();
2817               return;
2818             }
2819         }
2820
2821       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2822         {
2823           /* Disable an ISA extension.  */
2824           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2825             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2826               {
2827                 flags = cpu_flags_and_not (cpu_arch_flags,
2828                                            cpu_noarch[j].flags);
2829                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2830                   {
2831                     if (cpu_sub_arch_name)
2832                       {
2833                         char *name = cpu_sub_arch_name;
2834                         cpu_sub_arch_name = concat (name, string,
2835                                                     (const char *) NULL);
2836                         free (name);
2837                       }
2838                     else
2839                       cpu_sub_arch_name = xstrdup (string);
2840                     cpu_arch_flags = flags;
2841                     cpu_arch_isa_flags = flags;
2842                   }
2843                 (void) restore_line_pointer (e);
2844                 demand_empty_rest_of_line ();
2845                 return;
2846               }
2847
2848           j = ARRAY_SIZE (cpu_arch);
2849         }
2850
2851       if (j >= ARRAY_SIZE (cpu_arch))
2852         as_bad (_("no such architecture: `%s'"), string);
2853
2854       *input_line_pointer = e;
2855     }
2856   else
2857     as_bad (_("missing cpu architecture"));
2858
2859   no_cond_jump_promotion = 0;
2860   if (*input_line_pointer == ','
2861       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2862     {
2863       char *string;
2864       char e;
2865
2866       ++input_line_pointer;
2867       e = get_symbol_name (&string);
2868
2869       if (strcmp (string, "nojumps") == 0)
2870         no_cond_jump_promotion = 1;
2871       else if (strcmp (string, "jumps") == 0)
2872         ;
2873       else
2874         as_bad (_("no such architecture modifier: `%s'"), string);
2875
2876       (void) restore_line_pointer (e);
2877     }
2878
2879   demand_empty_rest_of_line ();
2880 }
2881
2882 enum bfd_architecture
2883 i386_arch (void)
2884 {
2885   if (cpu_arch_isa == PROCESSOR_L1OM)
2886     {
2887       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2888           || flag_code != CODE_64BIT)
2889         as_fatal (_("Intel L1OM is 64bit ELF only"));
2890       return bfd_arch_l1om;
2891     }
2892   else if (cpu_arch_isa == PROCESSOR_K1OM)
2893     {
2894       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2895           || flag_code != CODE_64BIT)
2896         as_fatal (_("Intel K1OM is 64bit ELF only"));
2897       return bfd_arch_k1om;
2898     }
2899   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2900     {
2901       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2902           || flag_code == CODE_64BIT)
2903         as_fatal (_("Intel MCU is 32bit ELF only"));
2904       return bfd_arch_iamcu;
2905     }
2906   else
2907     return bfd_arch_i386;
2908 }
2909
2910 unsigned long
2911 i386_mach (void)
2912 {
2913   if (!strncmp (default_arch, "x86_64", 6))
2914     {
2915       if (cpu_arch_isa == PROCESSOR_L1OM)
2916         {
2917           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2918               || default_arch[6] != '\0')
2919             as_fatal (_("Intel L1OM is 64bit ELF only"));
2920           return bfd_mach_l1om;
2921         }
2922       else if (cpu_arch_isa == PROCESSOR_K1OM)
2923         {
2924           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2925               || default_arch[6] != '\0')
2926             as_fatal (_("Intel K1OM is 64bit ELF only"));
2927           return bfd_mach_k1om;
2928         }
2929       else if (default_arch[6] == '\0')
2930         return bfd_mach_x86_64;
2931       else
2932         return bfd_mach_x64_32;
2933     }
2934   else if (!strcmp (default_arch, "i386")
2935            || !strcmp (default_arch, "iamcu"))
2936     {
2937       if (cpu_arch_isa == PROCESSOR_IAMCU)
2938         {
2939           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2940             as_fatal (_("Intel MCU is 32bit ELF only"));
2941           return bfd_mach_i386_iamcu;
2942         }
2943       else
2944         return bfd_mach_i386_i386;
2945     }
2946   else
2947     as_fatal (_("unknown architecture"));
2948 }
2949 \f
2950 void
2951 md_begin (void)
2952 {
2953   const char *hash_err;
2954
2955   /* Support pseudo prefixes like {disp32}.  */
2956   lex_type ['{'] = LEX_BEGIN_NAME;
2957
2958   /* Initialize op_hash hash table.  */
2959   op_hash = hash_new ();
2960
2961   {
2962     const insn_template *optab;
2963     templates *core_optab;
2964
2965     /* Setup for loop.  */
2966     optab = i386_optab;
2967     core_optab = XNEW (templates);
2968     core_optab->start = optab;
2969
2970     while (1)
2971       {
2972         ++optab;
2973         if (optab->name == NULL
2974             || strcmp (optab->name, (optab - 1)->name) != 0)
2975           {
2976             /* different name --> ship out current template list;
2977                add to hash table; & begin anew.  */
2978             core_optab->end = optab;
2979             hash_err = hash_insert (op_hash,
2980                                     (optab - 1)->name,
2981                                     (void *) core_optab);
2982             if (hash_err)
2983               {
2984                 as_fatal (_("can't hash %s: %s"),
2985                           (optab - 1)->name,
2986                           hash_err);
2987               }
2988             if (optab->name == NULL)
2989               break;
2990             core_optab = XNEW (templates);
2991             core_optab->start = optab;
2992           }
2993       }
2994   }
2995
2996   /* Initialize reg_hash hash table.  */
2997   reg_hash = hash_new ();
2998   {
2999     const reg_entry *regtab;
3000     unsigned int regtab_size = i386_regtab_size;
3001
3002     for (regtab = i386_regtab; regtab_size--; regtab++)
3003       {
3004         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3005         if (hash_err)
3006           as_fatal (_("can't hash %s: %s"),
3007                     regtab->reg_name,
3008                     hash_err);
3009       }
3010   }
3011
3012   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3013   {
3014     int c;
3015     char *p;
3016
3017     for (c = 0; c < 256; c++)
3018       {
3019         if (ISDIGIT (c))
3020           {
3021             digit_chars[c] = c;
3022             mnemonic_chars[c] = c;
3023             register_chars[c] = c;
3024             operand_chars[c] = c;
3025           }
3026         else if (ISLOWER (c))
3027           {
3028             mnemonic_chars[c] = c;
3029             register_chars[c] = c;
3030             operand_chars[c] = c;
3031           }
3032         else if (ISUPPER (c))
3033           {
3034             mnemonic_chars[c] = TOLOWER (c);
3035             register_chars[c] = mnemonic_chars[c];
3036             operand_chars[c] = c;
3037           }
3038         else if (c == '{' || c == '}')
3039           {
3040             mnemonic_chars[c] = c;
3041             operand_chars[c] = c;
3042           }
3043
3044         if (ISALPHA (c) || ISDIGIT (c))
3045           identifier_chars[c] = c;
3046         else if (c >= 128)
3047           {
3048             identifier_chars[c] = c;
3049             operand_chars[c] = c;
3050           }
3051       }
3052
3053 #ifdef LEX_AT
3054     identifier_chars['@'] = '@';
3055 #endif
3056 #ifdef LEX_QM
3057     identifier_chars['?'] = '?';
3058     operand_chars['?'] = '?';
3059 #endif
3060     digit_chars['-'] = '-';
3061     mnemonic_chars['_'] = '_';
3062     mnemonic_chars['-'] = '-';
3063     mnemonic_chars['.'] = '.';
3064     identifier_chars['_'] = '_';
3065     identifier_chars['.'] = '.';
3066
3067     for (p = operand_special_chars; *p != '\0'; p++)
3068       operand_chars[(unsigned char) *p] = *p;
3069   }
3070
3071   if (flag_code == CODE_64BIT)
3072     {
3073 #if defined (OBJ_COFF) && defined (TE_PE)
3074       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3075                                   ? 32 : 16);
3076 #else
3077       x86_dwarf2_return_column = 16;
3078 #endif
3079       x86_cie_data_alignment = -8;
3080     }
3081   else
3082     {
3083       x86_dwarf2_return_column = 8;
3084       x86_cie_data_alignment = -4;
3085     }
3086
3087   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3088      can be turned into BRANCH_PREFIX frag.  */
3089   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3090     abort ();
3091 }
3092
3093 void
3094 i386_print_statistics (FILE *file)
3095 {
3096   hash_print_statistics (file, "i386 opcode", op_hash);
3097   hash_print_statistics (file, "i386 register", reg_hash);
3098 }
3099 \f
3100 #ifdef DEBUG386
3101
3102 /* Debugging routines for md_assemble.  */
3103 static void pte (insn_template *);
3104 static void pt (i386_operand_type);
3105 static void pe (expressionS *);
3106 static void ps (symbolS *);
3107
3108 static void
3109 pi (const char *line, i386_insn *x)
3110 {
3111   unsigned int j;
3112
3113   fprintf (stdout, "%s: template ", line);
3114   pte (&x->tm);
3115   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3116            x->base_reg ? x->base_reg->reg_name : "none",
3117            x->index_reg ? x->index_reg->reg_name : "none",
3118            x->log2_scale_factor);
3119   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3120            x->rm.mode, x->rm.reg, x->rm.regmem);
3121   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3122            x->sib.base, x->sib.index, x->sib.scale);
3123   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3124            (x->rex & REX_W) != 0,
3125            (x->rex & REX_R) != 0,
3126            (x->rex & REX_X) != 0,
3127            (x->rex & REX_B) != 0);
3128   for (j = 0; j < x->operands; j++)
3129     {
3130       fprintf (stdout, "    #%d:  ", j + 1);
3131       pt (x->types[j]);
3132       fprintf (stdout, "\n");
3133       if (x->types[j].bitfield.class == Reg
3134           || x->types[j].bitfield.class == RegMMX
3135           || x->types[j].bitfield.class == RegSIMD
3136           || x->types[j].bitfield.class == SReg
3137           || x->types[j].bitfield.class == RegCR
3138           || x->types[j].bitfield.class == RegDR
3139           || x->types[j].bitfield.class == RegTR)
3140         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3141       if (operand_type_check (x->types[j], imm))
3142         pe (x->op[j].imms);
3143       if (operand_type_check (x->types[j], disp))
3144         pe (x->op[j].disps);
3145     }
3146 }
3147
3148 static void
3149 pte (insn_template *t)
3150 {
3151   unsigned int j;
3152   fprintf (stdout, " %d operands ", t->operands);
3153   fprintf (stdout, "opcode %x ", t->base_opcode);
3154   if (t->extension_opcode != None)
3155     fprintf (stdout, "ext %x ", t->extension_opcode);
3156   if (t->opcode_modifier.d)
3157     fprintf (stdout, "D");
3158   if (t->opcode_modifier.w)
3159     fprintf (stdout, "W");
3160   fprintf (stdout, "\n");
3161   for (j = 0; j < t->operands; j++)
3162     {
3163       fprintf (stdout, "    #%d type ", j + 1);
3164       pt (t->operand_types[j]);
3165       fprintf (stdout, "\n");
3166     }
3167 }
3168
3169 static void
3170 pe (expressionS *e)
3171 {
3172   fprintf (stdout, "    operation     %d\n", e->X_op);
3173   fprintf (stdout, "    add_number    %ld (%lx)\n",
3174            (long) e->X_add_number, (long) e->X_add_number);
3175   if (e->X_add_symbol)
3176     {
3177       fprintf (stdout, "    add_symbol    ");
3178       ps (e->X_add_symbol);
3179       fprintf (stdout, "\n");
3180     }
3181   if (e->X_op_symbol)
3182     {
3183       fprintf (stdout, "    op_symbol    ");
3184       ps (e->X_op_symbol);
3185       fprintf (stdout, "\n");
3186     }
3187 }
3188
3189 static void
3190 ps (symbolS *s)
3191 {
3192   fprintf (stdout, "%s type %s%s",
3193            S_GET_NAME (s),
3194            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3195            segment_name (S_GET_SEGMENT (s)));
3196 }
3197
3198 static struct type_name
3199   {
3200     i386_operand_type mask;
3201     const char *name;
3202   }
3203 const type_names[] =
3204 {
3205   { OPERAND_TYPE_REG8, "r8" },
3206   { OPERAND_TYPE_REG16, "r16" },
3207   { OPERAND_TYPE_REG32, "r32" },
3208   { OPERAND_TYPE_REG64, "r64" },
3209   { OPERAND_TYPE_ACC8, "acc8" },
3210   { OPERAND_TYPE_ACC16, "acc16" },
3211   { OPERAND_TYPE_ACC32, "acc32" },
3212   { OPERAND_TYPE_ACC64, "acc64" },
3213   { OPERAND_TYPE_IMM8, "i8" },
3214   { OPERAND_TYPE_IMM8, "i8s" },
3215   { OPERAND_TYPE_IMM16, "i16" },
3216   { OPERAND_TYPE_IMM32, "i32" },
3217   { OPERAND_TYPE_IMM32S, "i32s" },
3218   { OPERAND_TYPE_IMM64, "i64" },
3219   { OPERAND_TYPE_IMM1, "i1" },
3220   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3221   { OPERAND_TYPE_DISP8, "d8" },
3222   { OPERAND_TYPE_DISP16, "d16" },
3223   { OPERAND_TYPE_DISP32, "d32" },
3224   { OPERAND_TYPE_DISP32S, "d32s" },
3225   { OPERAND_TYPE_DISP64, "d64" },
3226   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3227   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3228   { OPERAND_TYPE_CONTROL, "control reg" },
3229   { OPERAND_TYPE_TEST, "test reg" },
3230   { OPERAND_TYPE_DEBUG, "debug reg" },
3231   { OPERAND_TYPE_FLOATREG, "FReg" },
3232   { OPERAND_TYPE_FLOATACC, "FAcc" },
3233   { OPERAND_TYPE_SREG, "SReg" },
3234   { OPERAND_TYPE_REGMMX, "rMMX" },
3235   { OPERAND_TYPE_REGXMM, "rXMM" },
3236   { OPERAND_TYPE_REGYMM, "rYMM" },
3237   { OPERAND_TYPE_REGZMM, "rZMM" },
3238   { OPERAND_TYPE_REGMASK, "Mask reg" },
3239 };
3240
3241 static void
3242 pt (i386_operand_type t)
3243 {
3244   unsigned int j;
3245   i386_operand_type a;
3246
3247   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3248     {
3249       a = operand_type_and (t, type_names[j].mask);
3250       if (operand_type_equal (&a, &type_names[j].mask))
3251         fprintf (stdout, "%s, ",  type_names[j].name);
3252     }
3253   fflush (stdout);
3254 }
3255
3256 #endif /* DEBUG386 */
3257 \f
3258 static bfd_reloc_code_real_type
3259 reloc (unsigned int size,
3260        int pcrel,
3261        int sign,
3262        bfd_reloc_code_real_type other)
3263 {
3264   if (other != NO_RELOC)
3265     {
3266       reloc_howto_type *rel;
3267
3268       if (size == 8)
3269         switch (other)
3270           {
3271           case BFD_RELOC_X86_64_GOT32:
3272             return BFD_RELOC_X86_64_GOT64;
3273             break;
3274           case BFD_RELOC_X86_64_GOTPLT64:
3275             return BFD_RELOC_X86_64_GOTPLT64;
3276             break;
3277           case BFD_RELOC_X86_64_PLTOFF64:
3278             return BFD_RELOC_X86_64_PLTOFF64;
3279             break;
3280           case BFD_RELOC_X86_64_GOTPC32:
3281             other = BFD_RELOC_X86_64_GOTPC64;
3282             break;
3283           case BFD_RELOC_X86_64_GOTPCREL:
3284             other = BFD_RELOC_X86_64_GOTPCREL64;
3285             break;
3286           case BFD_RELOC_X86_64_TPOFF32:
3287             other = BFD_RELOC_X86_64_TPOFF64;
3288             break;
3289           case BFD_RELOC_X86_64_DTPOFF32:
3290             other = BFD_RELOC_X86_64_DTPOFF64;
3291             break;
3292           default:
3293             break;
3294           }
3295
3296 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3297       if (other == BFD_RELOC_SIZE32)
3298         {
3299           if (size == 8)
3300             other = BFD_RELOC_SIZE64;
3301           if (pcrel)
3302             {
3303               as_bad (_("there are no pc-relative size relocations"));
3304               return NO_RELOC;
3305             }
3306         }
3307 #endif
3308
3309       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3310       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3311         sign = -1;
3312
3313       rel = bfd_reloc_type_lookup (stdoutput, other);
3314       if (!rel)
3315         as_bad (_("unknown relocation (%u)"), other);
3316       else if (size != bfd_get_reloc_size (rel))
3317         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3318                 bfd_get_reloc_size (rel),
3319                 size);
3320       else if (pcrel && !rel->pc_relative)
3321         as_bad (_("non-pc-relative relocation for pc-relative field"));
3322       else if ((rel->complain_on_overflow == complain_overflow_signed
3323                 && !sign)
3324                || (rel->complain_on_overflow == complain_overflow_unsigned
3325                    && sign > 0))
3326         as_bad (_("relocated field and relocation type differ in signedness"));
3327       else
3328         return other;
3329       return NO_RELOC;
3330     }
3331
3332   if (pcrel)
3333     {
3334       if (!sign)
3335         as_bad (_("there are no unsigned pc-relative relocations"));
3336       switch (size)
3337         {
3338         case 1: return BFD_RELOC_8_PCREL;
3339         case 2: return BFD_RELOC_16_PCREL;
3340         case 4: return BFD_RELOC_32_PCREL;
3341         case 8: return BFD_RELOC_64_PCREL;
3342         }
3343       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3344     }
3345   else
3346     {
3347       if (sign > 0)
3348         switch (size)
3349           {
3350           case 4: return BFD_RELOC_X86_64_32S;
3351           }
3352       else
3353         switch (size)
3354           {
3355           case 1: return BFD_RELOC_8;
3356           case 2: return BFD_RELOC_16;
3357           case 4: return BFD_RELOC_32;
3358           case 8: return BFD_RELOC_64;
3359           }
3360       as_bad (_("cannot do %s %u byte relocation"),
3361               sign > 0 ? "signed" : "unsigned", size);
3362     }
3363
3364   return NO_RELOC;
3365 }
3366
3367 /* Here we decide which fixups can be adjusted to make them relative to
3368    the beginning of the section instead of the symbol.  Basically we need
3369    to make sure that the dynamic relocations are done correctly, so in
3370    some cases we force the original symbol to be used.  */
3371
3372 int
3373 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3374 {
3375 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3376   if (!IS_ELF)
3377     return 1;
3378
3379   /* Don't adjust pc-relative references to merge sections in 64-bit
3380      mode.  */
3381   if (use_rela_relocations
3382       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3383       && fixP->fx_pcrel)
3384     return 0;
3385
3386   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3387      and changed later by validate_fix.  */
3388   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3389       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3390     return 0;
3391
3392   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3393      for size relocations.  */
3394   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3395       || fixP->fx_r_type == BFD_RELOC_SIZE64
3396       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3397       || fixP->fx_r_type == BFD_RELOC_386_PLT32
3398       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3399       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3400       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3401       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3402       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3403       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3404       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3405       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3406       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3407       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3408       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3409       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3410       || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3411       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3412       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3413       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3414       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3415       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3416       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3417       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3418       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3419       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3420       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3421       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3422       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3423       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3424       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3425       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3426       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3427     return 0;
3428 #endif
3429   return 1;
3430 }
3431
3432 static int
3433 intel_float_operand (const char *mnemonic)
3434 {
3435   /* Note that the value returned is meaningful only for opcodes with (memory)
3436      operands, hence the code here is free to improperly handle opcodes that
3437      have no operands (for better performance and smaller code). */
3438
3439   if (mnemonic[0] != 'f')
3440     return 0; /* non-math */
3441
3442   switch (mnemonic[1])
3443     {
3444     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3445        the fs segment override prefix not currently handled because no
3446        call path can make opcodes without operands get here */
3447     case 'i':
3448       return 2 /* integer op */;
3449     case 'l':
3450       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3451         return 3; /* fldcw/fldenv */
3452       break;
3453     case 'n':
3454       if (mnemonic[2] != 'o' /* fnop */)
3455         return 3; /* non-waiting control op */
3456       break;
3457     case 'r':
3458       if (mnemonic[2] == 's')
3459         return 3; /* frstor/frstpm */
3460       break;
3461     case 's':
3462       if (mnemonic[2] == 'a')
3463         return 3; /* fsave */
3464       if (mnemonic[2] == 't')
3465         {
3466           switch (mnemonic[3])
3467             {
3468             case 'c': /* fstcw */
3469             case 'd': /* fstdw */
3470             case 'e': /* fstenv */
3471             case 's': /* fsts[gw] */
3472               return 3;
3473             }
3474         }
3475       break;
3476     case 'x':
3477       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3478         return 0; /* fxsave/fxrstor are not really math ops */
3479       break;
3480     }
3481
3482   return 1;
3483 }
3484
3485 /* Build the VEX prefix.  */
3486
3487 static void
3488 build_vex_prefix (const insn_template *t)
3489 {
3490   unsigned int register_specifier;
3491   unsigned int implied_prefix;
3492   unsigned int vector_length;
3493   unsigned int w;
3494
3495   /* Check register specifier.  */
3496   if (i.vex.register_specifier)
3497     {
3498       register_specifier =
3499         ~register_number (i.vex.register_specifier) & 0xf;
3500       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3501     }
3502   else
3503     register_specifier = 0xf;
3504
3505   /* Use 2-byte VEX prefix by swapping destination and source operand
3506      if there are more than 1 register operand.  */
3507   if (i.reg_operands > 1
3508       && i.vec_encoding != vex_encoding_vex3
3509       && i.dir_encoding == dir_encoding_default
3510       && i.operands == i.reg_operands
3511       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3512       && i.tm.opcode_modifier.vexopcode == VEX0F
3513       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3514       && i.rex == REX_B)
3515     {
3516       unsigned int xchg = i.operands - 1;
3517       union i386_op temp_op;
3518       i386_operand_type temp_type;
3519
3520       temp_type = i.types[xchg];
3521       i.types[xchg] = i.types[0];
3522       i.types[0] = temp_type;
3523       temp_op = i.op[xchg];
3524       i.op[xchg] = i.op[0];
3525       i.op[0] = temp_op;
3526
3527       gas_assert (i.rm.mode == 3);
3528
3529       i.rex = REX_R;
3530       xchg = i.rm.regmem;
3531       i.rm.regmem = i.rm.reg;
3532       i.rm.reg = xchg;
3533
3534       if (i.tm.opcode_modifier.d)
3535         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3536                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3537       else /* Use the next insn.  */
3538         i.tm = t[1];
3539     }
3540
3541   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3542      are no memory operands and at least 3 register ones.  */
3543   if (i.reg_operands >= 3
3544       && i.vec_encoding != vex_encoding_vex3
3545       && i.reg_operands == i.operands - i.imm_operands
3546       && i.tm.opcode_modifier.vex
3547       && i.tm.opcode_modifier.commutative
3548       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3549       && i.rex == REX_B
3550       && i.vex.register_specifier
3551       && !(i.vex.register_specifier->reg_flags & RegRex))
3552     {
3553       unsigned int xchg = i.operands - i.reg_operands;
3554       union i386_op temp_op;
3555       i386_operand_type temp_type;
3556
3557       gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3558       gas_assert (!i.tm.opcode_modifier.sae);
3559       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3560                                       &i.types[i.operands - 3]));
3561       gas_assert (i.rm.mode == 3);
3562
3563       temp_type = i.types[xchg];
3564       i.types[xchg] = i.types[xchg + 1];
3565       i.types[xchg + 1] = temp_type;
3566       temp_op = i.op[xchg];
3567       i.op[xchg] = i.op[xchg + 1];
3568       i.op[xchg + 1] = temp_op;
3569
3570       i.rex = 0;
3571       xchg = i.rm.regmem | 8;
3572       i.rm.regmem = ~register_specifier & 0xf;
3573       gas_assert (!(i.rm.regmem & 8));
3574       i.vex.register_specifier += xchg - i.rm.regmem;
3575       register_specifier = ~xchg & 0xf;
3576     }
3577
3578   if (i.tm.opcode_modifier.vex == VEXScalar)
3579     vector_length = avxscalar;
3580   else if (i.tm.opcode_modifier.vex == VEX256)
3581     vector_length = 1;
3582   else
3583     {
3584       unsigned int op;
3585
3586       /* Determine vector length from the last multi-length vector
3587          operand.  */
3588       vector_length = 0;
3589       for (op = t->operands; op--;)
3590         if (t->operand_types[op].bitfield.xmmword
3591             && t->operand_types[op].bitfield.ymmword
3592             && i.types[op].bitfield.ymmword)
3593           {
3594             vector_length = 1;
3595             break;
3596           }
3597     }
3598
3599   switch ((i.tm.base_opcode >> 8) & 0xff)
3600     {
3601     case 0:
3602       implied_prefix = 0;
3603       break;
3604     case DATA_PREFIX_OPCODE:
3605       implied_prefix = 1;
3606       break;
3607     case REPE_PREFIX_OPCODE:
3608       implied_prefix = 2;
3609       break;
3610     case REPNE_PREFIX_OPCODE:
3611       implied_prefix = 3;
3612       break;
3613     default:
3614       abort ();
3615     }
3616
3617   /* Check the REX.W bit and VEXW.  */
3618   if (i.tm.opcode_modifier.vexw == VEXWIG)
3619     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3620   else if (i.tm.opcode_modifier.vexw)
3621     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3622   else
3623     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3624
3625   /* Use 2-byte VEX prefix if possible.  */
3626   if (w == 0
3627       && i.vec_encoding != vex_encoding_vex3
3628       && i.tm.opcode_modifier.vexopcode == VEX0F
3629       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3630     {
3631       /* 2-byte VEX prefix.  */
3632       unsigned int r;
3633
3634       i.vex.length = 2;
3635       i.vex.bytes[0] = 0xc5;
3636
3637       /* Check the REX.R bit.  */
3638       r = (i.rex & REX_R) ? 0 : 1;
3639       i.vex.bytes[1] = (r << 7
3640                         | register_specifier << 3
3641                         | vector_length << 2
3642                         | implied_prefix);
3643     }
3644   else
3645     {
3646       /* 3-byte VEX prefix.  */
3647       unsigned int m;
3648
3649       i.vex.length = 3;
3650
3651       switch (i.tm.opcode_modifier.vexopcode)
3652         {
3653         case VEX0F:
3654           m = 0x1;
3655           i.vex.bytes[0] = 0xc4;
3656           break;
3657         case VEX0F38:
3658           m = 0x2;
3659           i.vex.bytes[0] = 0xc4;
3660           break;
3661         case VEX0F3A:
3662           m = 0x3;
3663           i.vex.bytes[0] = 0xc4;
3664           break;
3665         case XOP08:
3666           m = 0x8;
3667           i.vex.bytes[0] = 0x8f;
3668           break;
3669         case XOP09:
3670           m = 0x9;
3671           i.vex.bytes[0] = 0x8f;
3672           break;
3673         case XOP0A:
3674           m = 0xa;
3675           i.vex.bytes[0] = 0x8f;
3676           break;
3677         default:
3678           abort ();
3679         }
3680
3681       /* The high 3 bits of the second VEX byte are 1's compliment
3682          of RXB bits from REX.  */
3683       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3684
3685       i.vex.bytes[2] = (w << 7
3686                         | register_specifier << 3
3687                         | vector_length << 2
3688                         | implied_prefix);
3689     }
3690 }
3691
3692 static INLINE bfd_boolean
3693 is_evex_encoding (const insn_template *t)
3694 {
3695   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3696          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3697          || t->opcode_modifier.sae;
3698 }
3699
3700 static INLINE bfd_boolean
3701 is_any_vex_encoding (const insn_template *t)
3702 {
3703   return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3704          || is_evex_encoding (t);
3705 }
3706
3707 /* Build the EVEX prefix.  */
3708
3709 static void
3710 build_evex_prefix (void)
3711 {
3712   unsigned int register_specifier;
3713   unsigned int implied_prefix;
3714   unsigned int m, w;
3715   rex_byte vrex_used = 0;
3716
3717   /* Check register specifier.  */
3718   if (i.vex.register_specifier)
3719     {
3720       gas_assert ((i.vrex & REX_X) == 0);
3721
3722       register_specifier = i.vex.register_specifier->reg_num;
3723       if ((i.vex.register_specifier->reg_flags & RegRex))
3724         register_specifier += 8;
3725       /* The upper 16 registers are encoded in the fourth byte of the
3726          EVEX prefix.  */
3727       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3728         i.vex.bytes[3] = 0x8;
3729       register_specifier = ~register_specifier & 0xf;
3730     }
3731   else
3732     {
3733       register_specifier = 0xf;
3734
3735       /* Encode upper 16 vector index register in the fourth byte of
3736          the EVEX prefix.  */
3737       if (!(i.vrex & REX_X))
3738         i.vex.bytes[3] = 0x8;
3739       else
3740         vrex_used |= REX_X;
3741     }
3742
3743   switch ((i.tm.base_opcode >> 8) & 0xff)
3744     {
3745     case 0:
3746       implied_prefix = 0;
3747       break;
3748     case DATA_PREFIX_OPCODE:
3749       implied_prefix = 1;
3750       break;
3751     case REPE_PREFIX_OPCODE:
3752       implied_prefix = 2;
3753       break;
3754     case REPNE_PREFIX_OPCODE:
3755       implied_prefix = 3;
3756       break;
3757     default:
3758       abort ();
3759     }
3760
3761   /* 4 byte EVEX prefix.  */
3762   i.vex.length = 4;
3763   i.vex.bytes[0] = 0x62;
3764
3765   /* mmmm bits.  */
3766   switch (i.tm.opcode_modifier.vexopcode)
3767     {
3768     case VEX0F:
3769       m = 1;
3770       break;
3771     case VEX0F38:
3772       m = 2;
3773       break;
3774     case VEX0F3A:
3775       m = 3;
3776       break;
3777     default:
3778       abort ();
3779       break;
3780     }
3781
3782   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3783      bits from REX.  */
3784   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3785
3786   /* The fifth bit of the second EVEX byte is 1's compliment of the
3787      REX_R bit in VREX.  */
3788   if (!(i.vrex & REX_R))
3789     i.vex.bytes[1] |= 0x10;
3790   else
3791     vrex_used |= REX_R;
3792
3793   if ((i.reg_operands + i.imm_operands) == i.operands)
3794     {
3795       /* When all operands are registers, the REX_X bit in REX is not
3796          used.  We reuse it to encode the upper 16 registers, which is
3797          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3798          as 1's compliment.  */
3799       if ((i.vrex & REX_B))
3800         {
3801           vrex_used |= REX_B;
3802           i.vex.bytes[1] &= ~0x40;
3803         }
3804     }
3805
3806   /* EVEX instructions shouldn't need the REX prefix.  */
3807   i.vrex &= ~vrex_used;
3808   gas_assert (i.vrex == 0);
3809
3810   /* Check the REX.W bit and VEXW.  */
3811   if (i.tm.opcode_modifier.vexw == VEXWIG)
3812     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3813   else if (i.tm.opcode_modifier.vexw)
3814     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3815   else
3816     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3817
3818   /* Encode the U bit.  */
3819   implied_prefix |= 0x4;
3820
3821   /* The third byte of the EVEX prefix.  */
3822   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3823
3824   /* The fourth byte of the EVEX prefix.  */
3825   /* The zeroing-masking bit.  */
3826   if (i.mask && i.mask->zeroing)
3827     i.vex.bytes[3] |= 0x80;
3828
3829   /* Don't always set the broadcast bit if there is no RC.  */
3830   if (!i.rounding)
3831     {
3832       /* Encode the vector length.  */
3833       unsigned int vec_length;
3834
3835       if (!i.tm.opcode_modifier.evex
3836           || i.tm.opcode_modifier.evex == EVEXDYN)
3837         {
3838           unsigned int op;
3839
3840           /* Determine vector length from the last multi-length vector
3841              operand.  */
3842           vec_length = 0;
3843           for (op = i.operands; op--;)
3844             if (i.tm.operand_types[op].bitfield.xmmword
3845                 + i.tm.operand_types[op].bitfield.ymmword
3846                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3847               {
3848                 if (i.types[op].bitfield.zmmword)
3849                   {
3850                     i.tm.opcode_modifier.evex = EVEX512;
3851                     break;
3852                   }
3853                 else if (i.types[op].bitfield.ymmword)
3854                   {
3855                     i.tm.opcode_modifier.evex = EVEX256;
3856                     break;
3857                   }
3858                 else if (i.types[op].bitfield.xmmword)
3859                   {
3860                     i.tm.opcode_modifier.evex = EVEX128;
3861                     break;
3862                   }
3863                 else if (i.broadcast && (int) op == i.broadcast->operand)
3864                   {
3865                     switch (i.broadcast->bytes)
3866                       {
3867                         case 64:
3868                           i.tm.opcode_modifier.evex = EVEX512;
3869                           break;
3870                         case 32:
3871                           i.tm.opcode_modifier.evex = EVEX256;
3872                           break;
3873                         case 16:
3874                           i.tm.opcode_modifier.evex = EVEX128;
3875                           break;
3876                         default:
3877                           abort ();
3878                       }
3879                     break;
3880                   }
3881               }
3882
3883           if (op >= MAX_OPERANDS)
3884             abort ();
3885         }
3886
3887       switch (i.tm.opcode_modifier.evex)
3888         {
3889         case EVEXLIG: /* LL' is ignored */
3890           vec_length = evexlig << 5;
3891           break;
3892         case EVEX128:
3893           vec_length = 0 << 5;
3894           break;
3895         case EVEX256:
3896           vec_length = 1 << 5;
3897           break;
3898         case EVEX512:
3899           vec_length = 2 << 5;
3900           break;
3901         default:
3902           abort ();
3903           break;
3904         }
3905       i.vex.bytes[3] |= vec_length;
3906       /* Encode the broadcast bit.  */
3907       if (i.broadcast)
3908         i.vex.bytes[3] |= 0x10;
3909     }
3910   else
3911     {
3912       if (i.rounding->type != saeonly)
3913         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3914       else
3915         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3916     }
3917
3918   if (i.mask && i.mask->mask)
3919     i.vex.bytes[3] |= i.mask->mask->reg_num;
3920 }
3921
3922 static void
3923 process_immext (void)
3924 {
3925   expressionS *exp;
3926
3927   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3928      which is coded in the same place as an 8-bit immediate field
3929      would be.  Here we fake an 8-bit immediate operand from the
3930      opcode suffix stored in tm.extension_opcode.
3931
3932      AVX instructions also use this encoding, for some of
3933      3 argument instructions.  */
3934
3935   gas_assert (i.imm_operands <= 1
3936               && (i.operands <= 2
3937                   || (is_any_vex_encoding (&i.tm)
3938                       && i.operands <= 4)));
3939
3940   exp = &im_expressions[i.imm_operands++];
3941   i.op[i.operands].imms = exp;
3942   i.types[i.operands] = imm8;
3943   i.operands++;
3944   exp->X_op = O_constant;
3945   exp->X_add_number = i.tm.extension_opcode;
3946   i.tm.extension_opcode = None;
3947 }
3948
3949
3950 static int
3951 check_hle (void)
3952 {
3953   switch (i.tm.opcode_modifier.hleprefixok)
3954     {
3955     default:
3956       abort ();
3957     case HLEPrefixNone:
3958       as_bad (_("invalid instruction `%s' after `%s'"),
3959               i.tm.name, i.hle_prefix);
3960       return 0;
3961     case HLEPrefixLock:
3962       if (i.prefix[LOCK_PREFIX])
3963         return 1;
3964       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3965       return 0;
3966     case HLEPrefixAny:
3967       return 1;
3968     case HLEPrefixRelease:
3969       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3970         {
3971           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3972                   i.tm.name);
3973           return 0;
3974         }
3975       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3976         {
3977           as_bad (_("memory destination needed for instruction `%s'"
3978                     " after `xrelease'"), i.tm.name);
3979           return 0;
3980         }
3981       return 1;
3982     }
3983 }
3984
3985 /* Try the shortest encoding by shortening operand size.  */
3986
3987 static void
3988 optimize_encoding (void)
3989 {
3990   unsigned int j;
3991
3992   if (optimize_for_space
3993       && i.reg_operands == 1
3994       && i.imm_operands == 1
3995       && !i.types[1].bitfield.byte
3996       && i.op[0].imms->X_op == O_constant
3997       && fits_in_imm7 (i.op[0].imms->X_add_number)
3998       && ((i.tm.base_opcode == 0xa8
3999            && i.tm.extension_opcode == None)
4000           || (i.tm.base_opcode == 0xf6
4001               && i.tm.extension_opcode == 0x0)))
4002     {
4003       /* Optimize: -Os:
4004            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4005        */
4006       unsigned int base_regnum = i.op[1].regs->reg_num;
4007       if (flag_code == CODE_64BIT || base_regnum < 4)
4008         {
4009           i.types[1].bitfield.byte = 1;
4010           /* Ignore the suffix.  */
4011           i.suffix = 0;
4012           /* Convert to byte registers.  */
4013           if (i.types[1].bitfield.word)
4014             j = 16;
4015           else if (i.types[1].bitfield.dword)
4016             j = 32;
4017           else
4018             j = 48;
4019           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4020             j += 8;
4021           i.op[1].regs -= j;
4022         }
4023     }
4024   else if (flag_code == CODE_64BIT
4025            && ((i.types[1].bitfield.qword
4026                 && i.reg_operands == 1
4027                 && i.imm_operands == 1
4028                 && i.op[0].imms->X_op == O_constant
4029                 && ((i.tm.base_opcode == 0xb8
4030                      && i.tm.extension_opcode == None
4031                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4032                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4033                         && (((i.tm.base_opcode == 0x24
4034                               || i.tm.base_opcode == 0xa8)
4035                              && i.tm.extension_opcode == None)
4036                             || (i.tm.base_opcode == 0x80
4037                                 && i.tm.extension_opcode == 0x4)
4038                             || ((i.tm.base_opcode == 0xf6
4039                                  || (i.tm.base_opcode | 1) == 0xc7)
4040                                 && i.tm.extension_opcode == 0x0)))
4041                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4042                         && i.tm.base_opcode == 0x83
4043                         && i.tm.extension_opcode == 0x4)))
4044                || (i.types[0].bitfield.qword
4045                    && ((i.reg_operands == 2
4046                         && i.op[0].regs == i.op[1].regs
4047                         && ((i.tm.base_opcode == 0x30
4048                              || i.tm.base_opcode == 0x28)
4049                             && i.tm.extension_opcode == None))
4050                        || (i.reg_operands == 1
4051                            && i.operands == 1
4052                            && i.tm.base_opcode == 0x30
4053                            && i.tm.extension_opcode == None)))))
4054     {
4055       /* Optimize: -O:
4056            andq $imm31, %r64   -> andl $imm31, %r32
4057            andq $imm7, %r64    -> andl $imm7, %r32
4058            testq $imm31, %r64  -> testl $imm31, %r32
4059            xorq %r64, %r64     -> xorl %r32, %r32
4060            subq %r64, %r64     -> subl %r32, %r32
4061            movq $imm31, %r64   -> movl $imm31, %r32
4062            movq $imm32, %r64   -> movl $imm32, %r32
4063         */
4064       i.tm.opcode_modifier.norex64 = 1;
4065       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4066         {
4067           /* Handle
4068                movq $imm31, %r64   -> movl $imm31, %r32
4069                movq $imm32, %r64   -> movl $imm32, %r32
4070            */
4071           i.tm.operand_types[0].bitfield.imm32 = 1;
4072           i.tm.operand_types[0].bitfield.imm32s = 0;
4073           i.tm.operand_types[0].bitfield.imm64 = 0;
4074           i.types[0].bitfield.imm32 = 1;
4075           i.types[0].bitfield.imm32s = 0;
4076           i.types[0].bitfield.imm64 = 0;
4077           i.types[1].bitfield.dword = 1;
4078           i.types[1].bitfield.qword = 0;
4079           if ((i.tm.base_opcode | 1) == 0xc7)
4080             {
4081               /* Handle
4082                    movq $imm31, %r64   -> movl $imm31, %r32
4083                */
4084               i.tm.base_opcode = 0xb8;
4085               i.tm.extension_opcode = None;
4086               i.tm.opcode_modifier.w = 0;
4087               i.tm.opcode_modifier.shortform = 1;
4088               i.tm.opcode_modifier.modrm = 0;
4089             }
4090         }
4091     }
4092   else if (optimize > 1
4093            && !optimize_for_space
4094            && i.reg_operands == 2
4095            && i.op[0].regs == i.op[1].regs
4096            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4097                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4098            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4099     {
4100       /* Optimize: -O2:
4101            andb %rN, %rN  -> testb %rN, %rN
4102            andw %rN, %rN  -> testw %rN, %rN
4103            andq %rN, %rN  -> testq %rN, %rN
4104            orb %rN, %rN   -> testb %rN, %rN
4105            orw %rN, %rN   -> testw %rN, %rN
4106            orq %rN, %rN   -> testq %rN, %rN
4107
4108            and outside of 64-bit mode
4109
4110            andl %rN, %rN  -> testl %rN, %rN
4111            orl %rN, %rN   -> testl %rN, %rN
4112        */
4113       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4114     }
4115   else if (i.reg_operands == 3
4116            && i.op[0].regs == i.op[1].regs
4117            && !i.types[2].bitfield.xmmword
4118            && (i.tm.opcode_modifier.vex
4119                || ((!i.mask || i.mask->zeroing)
4120                    && !i.rounding
4121                    && is_evex_encoding (&i.tm)
4122                    && (i.vec_encoding != vex_encoding_evex
4123                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4124                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4125                        || (i.tm.operand_types[2].bitfield.zmmword
4126                            && i.types[2].bitfield.ymmword))))
4127            && ((i.tm.base_opcode == 0x55
4128                 || i.tm.base_opcode == 0x6655
4129                 || i.tm.base_opcode == 0x66df
4130                 || i.tm.base_opcode == 0x57
4131                 || i.tm.base_opcode == 0x6657
4132                 || i.tm.base_opcode == 0x66ef
4133                 || i.tm.base_opcode == 0x66f8
4134                 || i.tm.base_opcode == 0x66f9
4135                 || i.tm.base_opcode == 0x66fa
4136                 || i.tm.base_opcode == 0x66fb
4137                 || i.tm.base_opcode == 0x42
4138                 || i.tm.base_opcode == 0x6642
4139                 || i.tm.base_opcode == 0x47
4140                 || i.tm.base_opcode == 0x6647)
4141                && i.tm.extension_opcode == None))
4142     {
4143       /* Optimize: -O1:
4144            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4145            vpsubq and vpsubw:
4146              EVEX VOP %zmmM, %zmmM, %zmmN
4147                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4148                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4149              EVEX VOP %ymmM, %ymmM, %ymmN
4150                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4151                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4152              VEX VOP %ymmM, %ymmM, %ymmN
4153                -> VEX VOP %xmmM, %xmmM, %xmmN
4154            VOP, one of vpandn and vpxor:
4155              VEX VOP %ymmM, %ymmM, %ymmN
4156                -> VEX VOP %xmmM, %xmmM, %xmmN
4157            VOP, one of vpandnd and vpandnq:
4158              EVEX VOP %zmmM, %zmmM, %zmmN
4159                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4160                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4161              EVEX VOP %ymmM, %ymmM, %ymmN
4162                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4163                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4164            VOP, one of vpxord and vpxorq:
4165              EVEX VOP %zmmM, %zmmM, %zmmN
4166                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4167                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4168              EVEX VOP %ymmM, %ymmM, %ymmN
4169                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4170                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4171            VOP, one of kxord and kxorq:
4172              VEX VOP %kM, %kM, %kN
4173                -> VEX kxorw %kM, %kM, %kN
4174            VOP, one of kandnd and kandnq:
4175              VEX VOP %kM, %kM, %kN
4176                -> VEX kandnw %kM, %kM, %kN
4177        */
4178       if (is_evex_encoding (&i.tm))
4179         {
4180           if (i.vec_encoding != vex_encoding_evex)
4181             {
4182               i.tm.opcode_modifier.vex = VEX128;
4183               i.tm.opcode_modifier.vexw = VEXW0;
4184               i.tm.opcode_modifier.evex = 0;
4185             }
4186           else if (optimize > 1)
4187             i.tm.opcode_modifier.evex = EVEX128;
4188           else
4189             return;
4190         }
4191       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4192         {
4193           i.tm.base_opcode &= 0xff;
4194           i.tm.opcode_modifier.vexw = VEXW0;
4195         }
4196       else
4197         i.tm.opcode_modifier.vex = VEX128;
4198
4199       if (i.tm.opcode_modifier.vex)
4200         for (j = 0; j < 3; j++)
4201           {
4202             i.types[j].bitfield.xmmword = 1;
4203             i.types[j].bitfield.ymmword = 0;
4204           }
4205     }
4206   else if (i.vec_encoding != vex_encoding_evex
4207            && !i.types[0].bitfield.zmmword
4208            && !i.types[1].bitfield.zmmword
4209            && !i.mask
4210            && !i.broadcast
4211            && is_evex_encoding (&i.tm)
4212            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4213                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4214                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4215                || (i.tm.base_opcode & ~4) == 0x66db
4216                || (i.tm.base_opcode & ~4) == 0x66eb)
4217            && i.tm.extension_opcode == None)
4218     {
4219       /* Optimize: -O1:
4220            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4221            vmovdqu32 and vmovdqu64:
4222              EVEX VOP %xmmM, %xmmN
4223                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4224              EVEX VOP %ymmM, %ymmN
4225                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4226              EVEX VOP %xmmM, mem
4227                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4228              EVEX VOP %ymmM, mem
4229                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4230              EVEX VOP mem, %xmmN
4231                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4232              EVEX VOP mem, %ymmN
4233                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4234            VOP, one of vpand, vpandn, vpor, vpxor:
4235              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4236                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4237              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4238                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4239              EVEX VOP{d,q} mem, %xmmM, %xmmN
4240                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4241              EVEX VOP{d,q} mem, %ymmM, %ymmN
4242                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4243        */
4244       for (j = 0; j < i.operands; j++)
4245         if (operand_type_check (i.types[j], disp)
4246             && i.op[j].disps->X_op == O_constant)
4247           {
4248             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4249                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4250                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4251             int evex_disp8, vex_disp8;
4252             unsigned int memshift = i.memshift;
4253             offsetT n = i.op[j].disps->X_add_number;
4254
4255             evex_disp8 = fits_in_disp8 (n);
4256             i.memshift = 0;
4257             vex_disp8 = fits_in_disp8 (n);
4258             if (evex_disp8 != vex_disp8)
4259               {
4260                 i.memshift = memshift;
4261                 return;
4262               }
4263
4264             i.types[j].bitfield.disp8 = vex_disp8;
4265             break;
4266           }
4267       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4268         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4269       i.tm.opcode_modifier.vex
4270         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4271       i.tm.opcode_modifier.vexw = VEXW0;
4272       /* VPAND, VPOR, and VPXOR are commutative.  */
4273       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4274         i.tm.opcode_modifier.commutative = 1;
4275       i.tm.opcode_modifier.evex = 0;
4276       i.tm.opcode_modifier.masking = 0;
4277       i.tm.opcode_modifier.broadcast = 0;
4278       i.tm.opcode_modifier.disp8memshift = 0;
4279       i.memshift = 0;
4280       if (j < i.operands)
4281         i.types[j].bitfield.disp8
4282           = fits_in_disp8 (i.op[j].disps->X_add_number);
4283     }
4284 }
4285
4286 /* This is the guts of the machine-dependent assembler.  LINE points to a
4287    machine dependent instruction.  This function is supposed to emit
4288    the frags/bytes it assembles to.  */
4289
4290 void
4291 md_assemble (char *line)
4292 {
4293   unsigned int j;
4294   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4295   const insn_template *t;
4296
4297   /* Initialize globals.  */
4298   memset (&i, '\0', sizeof (i));
4299   for (j = 0; j < MAX_OPERANDS; j++)
4300     i.reloc[j] = NO_RELOC;
4301   memset (disp_expressions, '\0', sizeof (disp_expressions));
4302   memset (im_expressions, '\0', sizeof (im_expressions));
4303   save_stack_p = save_stack;
4304
4305   /* First parse an instruction mnemonic & call i386_operand for the operands.
4306      We assume that the scrubber has arranged it so that line[0] is the valid
4307      start of a (possibly prefixed) mnemonic.  */
4308
4309   line = parse_insn (line, mnemonic);
4310   if (line == NULL)
4311     return;
4312   mnem_suffix = i.suffix;
4313
4314   line = parse_operands (line, mnemonic);
4315   this_operand = -1;
4316   xfree (i.memop1_string);
4317   i.memop1_string = NULL;
4318   if (line == NULL)
4319     return;
4320
4321   /* Now we've parsed the mnemonic into a set of templates, and have the
4322      operands at hand.  */
4323
4324   /* All intel opcodes have reversed operands except for "bound" and
4325      "enter".  We also don't reverse intersegment "jmp" and "call"
4326      instructions with 2 immediate operands so that the immediate segment
4327      precedes the offset, as it does when in AT&T mode. */
4328   if (intel_syntax
4329       && i.operands > 1
4330       && (strcmp (mnemonic, "bound") != 0)
4331       && (strcmp (mnemonic, "invlpga") != 0)
4332       && !(operand_type_check (i.types[0], imm)
4333            && operand_type_check (i.types[1], imm)))
4334     swap_operands ();
4335
4336   /* The order of the immediates should be reversed
4337      for 2 immediates extrq and insertq instructions */
4338   if (i.imm_operands == 2
4339       && (strcmp (mnemonic, "extrq") == 0
4340           || strcmp (mnemonic, "insertq") == 0))
4341       swap_2_operands (0, 1);
4342
4343   if (i.imm_operands)
4344     optimize_imm ();
4345
4346   /* Don't optimize displacement for movabs since it only takes 64bit
4347      displacement.  */
4348   if (i.disp_operands
4349       && i.disp_encoding != disp_encoding_32bit
4350       && (flag_code != CODE_64BIT
4351           || strcmp (mnemonic, "movabs") != 0))
4352     optimize_disp ();
4353
4354   /* Next, we find a template that matches the given insn,
4355      making sure the overlap of the given operands types is consistent
4356      with the template operand types.  */
4357
4358   if (!(t = match_template (mnem_suffix)))
4359     return;
4360
4361   if (sse_check != check_none
4362       && !i.tm.opcode_modifier.noavx
4363       && !i.tm.cpu_flags.bitfield.cpuavx
4364       && !i.tm.cpu_flags.bitfield.cpuavx512f
4365       && (i.tm.cpu_flags.bitfield.cpusse
4366           || i.tm.cpu_flags.bitfield.cpusse2
4367           || i.tm.cpu_flags.bitfield.cpusse3
4368           || i.tm.cpu_flags.bitfield.cpussse3
4369           || i.tm.cpu_flags.bitfield.cpusse4_1
4370           || i.tm.cpu_flags.bitfield.cpusse4_2
4371           || i.tm.cpu_flags.bitfield.cpusse4a
4372           || i.tm.cpu_flags.bitfield.cpupclmul
4373           || i.tm.cpu_flags.bitfield.cpuaes
4374           || i.tm.cpu_flags.bitfield.cpusha
4375           || i.tm.cpu_flags.bitfield.cpugfni))
4376     {
4377       (sse_check == check_warning
4378        ? as_warn
4379        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4380     }
4381
4382   /* Zap movzx and movsx suffix.  The suffix has been set from
4383      "word ptr" or "byte ptr" on the source operand in Intel syntax
4384      or extracted from mnemonic in AT&T syntax.  But we'll use
4385      the destination register to choose the suffix for encoding.  */
4386   if ((i.tm.base_opcode & ~9) == 0x0fb6)
4387     {
4388       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
4389          there is no suffix, the default will be byte extension.  */
4390       if (i.reg_operands != 2
4391           && !i.suffix
4392           && intel_syntax)
4393         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4394
4395       i.suffix = 0;
4396     }
4397
4398   if (i.tm.opcode_modifier.fwait)
4399     if (!add_prefix (FWAIT_OPCODE))
4400       return;
4401
4402   /* Check if REP prefix is OK.  */
4403   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4404     {
4405       as_bad (_("invalid instruction `%s' after `%s'"),
4406                 i.tm.name, i.rep_prefix);
4407       return;
4408     }
4409
4410   /* Check for lock without a lockable instruction.  Destination operand
4411      must be memory unless it is xchg (0x86).  */
4412   if (i.prefix[LOCK_PREFIX]
4413       && (!i.tm.opcode_modifier.islockable
4414           || i.mem_operands == 0
4415           || (i.tm.base_opcode != 0x86
4416               && !(i.flags[i.operands - 1] & Operand_Mem))))
4417     {
4418       as_bad (_("expecting lockable instruction after `lock'"));
4419       return;
4420     }
4421
4422   /* Check for data size prefix on VEX/XOP/EVEX encoded insns.  */
4423   if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4424     {
4425       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4426       return;
4427     }
4428
4429   /* Check if HLE prefix is OK.  */
4430   if (i.hle_prefix && !check_hle ())
4431     return;
4432
4433   /* Check BND prefix.  */
4434   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4435     as_bad (_("expecting valid branch instruction after `bnd'"));
4436
4437   /* Check NOTRACK prefix.  */
4438   if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4439     as_bad (_("expecting indirect branch instruction after `notrack'"));
4440
4441   if (i.tm.cpu_flags.bitfield.cpumpx)
4442     {
4443       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4444         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4445       else if (flag_code != CODE_16BIT
4446                ? i.prefix[ADDR_PREFIX]
4447                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4448         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4449     }
4450
4451   /* Insert BND prefix.  */
4452   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4453     {
4454       if (!i.prefix[BND_PREFIX])
4455         add_prefix (BND_PREFIX_OPCODE);
4456       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4457         {
4458           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4459           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4460         }
4461     }
4462
4463   /* Check string instruction segment overrides.  */
4464   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4465     {
4466       gas_assert (i.mem_operands);
4467       if (!check_string ())
4468         return;
4469       i.disp_operands = 0;
4470     }
4471
4472   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4473     optimize_encoding ();
4474
4475   if (!process_suffix ())
4476     return;
4477
4478   /* Update operand types.  */
4479   for (j = 0; j < i.operands; j++)
4480     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4481
4482   /* Make still unresolved immediate matches conform to size of immediate
4483      given in i.suffix.  */
4484   if (!finalize_imm ())
4485     return;
4486
4487   if (i.types[0].bitfield.imm1)
4488     i.imm_operands = 0; /* kludge for shift insns.  */
4489
4490   /* We only need to check those implicit registers for instructions
4491      with 3 operands or less.  */
4492   if (i.operands <= 3)
4493     for (j = 0; j < i.operands; j++)
4494       if (i.types[j].bitfield.instance != InstanceNone
4495           && !i.types[j].bitfield.xmmword)
4496         i.reg_operands--;
4497
4498   /* ImmExt should be processed after SSE2AVX.  */
4499   if (!i.tm.opcode_modifier.sse2avx
4500       && i.tm.opcode_modifier.immext)
4501     process_immext ();
4502
4503   /* For insns with operands there are more diddles to do to the opcode.  */
4504   if (i.operands)
4505     {
4506       if (!process_operands ())
4507         return;
4508     }
4509   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4510     {
4511       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4512       as_warn (_("translating to `%sp'"), i.tm.name);
4513     }
4514
4515   if (is_any_vex_encoding (&i.tm))
4516     {
4517       if (!cpu_arch_flags.bitfield.cpui286)
4518         {
4519           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4520                   i.tm.name);
4521           return;
4522         }
4523
4524       if (i.tm.opcode_modifier.vex)
4525         build_vex_prefix (t);
4526       else
4527         build_evex_prefix ();
4528     }
4529
4530   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4531      instructions may define INT_OPCODE as well, so avoid this corner
4532      case for those instructions that use MODRM.  */
4533   if (i.tm.base_opcode == INT_OPCODE
4534       && !i.tm.opcode_modifier.modrm
4535       && i.op[0].imms->X_add_number == 3)
4536     {
4537       i.tm.base_opcode = INT3_OPCODE;
4538       i.imm_operands = 0;
4539     }
4540
4541   if ((i.tm.opcode_modifier.jump == JUMP
4542        || i.tm.opcode_modifier.jump == JUMP_BYTE
4543        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4544       && i.op[0].disps->X_op == O_constant)
4545     {
4546       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4547          the absolute address given by the constant.  Since ix86 jumps and
4548          calls are pc relative, we need to generate a reloc.  */
4549       i.op[0].disps->X_add_symbol = &abs_symbol;
4550       i.op[0].disps->X_op = O_symbol;
4551     }
4552
4553   if (i.tm.opcode_modifier.rex64)
4554     i.rex |= REX_W;
4555
4556   /* For 8 bit registers we need an empty rex prefix.  Also if the
4557      instruction already has a prefix, we need to convert old
4558      registers to new ones.  */
4559
4560   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4561        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4562       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4563           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4564       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4565            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4566           && i.rex != 0))
4567     {
4568       int x;
4569
4570       i.rex |= REX_OPCODE;
4571       for (x = 0; x < 2; x++)
4572         {
4573           /* Look for 8 bit operand that uses old registers.  */
4574           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4575               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4576             {
4577               /* In case it is "hi" register, give up.  */
4578               if (i.op[x].regs->reg_num > 3)
4579                 as_bad (_("can't encode register '%s%s' in an "
4580                           "instruction requiring REX prefix."),
4581                         register_prefix, i.op[x].regs->reg_name);
4582
4583               /* Otherwise it is equivalent to the extended register.
4584                  Since the encoding doesn't change this is merely
4585                  cosmetic cleanup for debug output.  */
4586
4587               i.op[x].regs = i.op[x].regs + 8;
4588             }
4589         }
4590     }
4591
4592   if (i.rex == 0 && i.rex_encoding)
4593     {
4594       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4595          that uses legacy register.  If it is "hi" register, don't add
4596          the REX_OPCODE byte.  */
4597       int x;
4598       for (x = 0; x < 2; x++)
4599         if (i.types[x].bitfield.class == Reg
4600             && i.types[x].bitfield.byte
4601             && (i.op[x].regs->reg_flags & RegRex64) == 0
4602             && i.op[x].regs->reg_num > 3)
4603           {
4604             i.rex_encoding = FALSE;
4605             break;
4606           }
4607
4608       if (i.rex_encoding)
4609         i.rex = REX_OPCODE;
4610     }
4611
4612   if (i.rex != 0)
4613     add_prefix (REX_OPCODE | i.rex);
4614
4615   /* We are ready to output the insn.  */
4616   output_insn ();
4617
4618   last_insn.seg = now_seg;
4619
4620   if (i.tm.opcode_modifier.isprefix)
4621     {
4622       last_insn.kind = last_insn_prefix;
4623       last_insn.name = i.tm.name;
4624       last_insn.file = as_where (&last_insn.line);
4625     }
4626   else
4627     last_insn.kind = last_insn_other;
4628 }
4629
4630 static char *
4631 parse_insn (char *line, char *mnemonic)
4632 {
4633   char *l = line;
4634   char *token_start = l;
4635   char *mnem_p;
4636   int supported;
4637   const insn_template *t;
4638   char *dot_p = NULL;
4639
4640   while (1)
4641     {
4642       mnem_p = mnemonic;
4643       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4644         {
4645           if (*mnem_p == '.')
4646             dot_p = mnem_p;
4647           mnem_p++;
4648           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4649             {
4650               as_bad (_("no such instruction: `%s'"), token_start);
4651               return NULL;
4652             }
4653           l++;
4654         }
4655       if (!is_space_char (*l)
4656           && *l != END_OF_INSN
4657           && (intel_syntax
4658               || (*l != PREFIX_SEPARATOR
4659                   && *l != ',')))
4660         {
4661           as_bad (_("invalid character %s in mnemonic"),
4662                   output_invalid (*l));
4663           return NULL;
4664         }
4665       if (token_start == l)
4666         {
4667           if (!intel_syntax && *l == PREFIX_SEPARATOR)
4668             as_bad (_("expecting prefix; got nothing"));
4669           else
4670             as_bad (_("expecting mnemonic; got nothing"));
4671           return NULL;
4672         }
4673
4674       /* Look up instruction (or prefix) via hash table.  */
4675       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4676
4677       if (*l != END_OF_INSN
4678           && (!is_space_char (*l) || l[1] != END_OF_INSN)
4679           && current_templates
4680           && current_templates->start->opcode_modifier.isprefix)
4681         {
4682           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4683             {
4684               as_bad ((flag_code != CODE_64BIT
4685                        ? _("`%s' is only supported in 64-bit mode")
4686                        : _("`%s' is not supported in 64-bit mode")),
4687                       current_templates->start->name);
4688               return NULL;
4689             }
4690           /* If we are in 16-bit mode, do not allow addr16 or data16.
4691              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
4692           if ((current_templates->start->opcode_modifier.size == SIZE16
4693                || current_templates->start->opcode_modifier.size == SIZE32)
4694               && flag_code != CODE_64BIT
4695               && ((current_templates->start->opcode_modifier.size == SIZE32)
4696                   ^ (flag_code == CODE_16BIT)))
4697             {
4698               as_bad (_("redundant %s prefix"),
4699                       current_templates->start->name);
4700               return NULL;
4701             }
4702           if (current_templates->start->opcode_length == 0)
4703             {
4704               /* Handle pseudo prefixes.  */
4705               switch (current_templates->start->base_opcode)
4706                 {
4707                 case 0x0:
4708                   /* {disp8} */
4709                   i.disp_encoding = disp_encoding_8bit;
4710                   break;
4711                 case 0x1:
4712                   /* {disp32} */
4713                   i.disp_encoding = disp_encoding_32bit;
4714                   break;
4715                 case 0x2:
4716                   /* {load} */
4717                   i.dir_encoding = dir_encoding_load;
4718                   break;
4719                 case 0x3:
4720                   /* {store} */
4721                   i.dir_encoding = dir_encoding_store;
4722                   break;
4723                 case 0x4:
4724                   /* {vex2} */
4725                   i.vec_encoding = vex_encoding_vex2;
4726                   break;
4727                 case 0x5:
4728                   /* {vex3} */
4729                   i.vec_encoding = vex_encoding_vex3;
4730                   break;
4731                 case 0x6:
4732                   /* {evex} */
4733                   i.vec_encoding = vex_encoding_evex;
4734                   break;
4735                 case 0x7:
4736                   /* {rex} */
4737                   i.rex_encoding = TRUE;
4738                   break;
4739                 case 0x8:
4740                   /* {nooptimize} */
4741                   i.no_optimize = TRUE;
4742                   break;
4743                 default:
4744                   abort ();
4745                 }
4746             }
4747           else
4748             {
4749               /* Add prefix, checking for repeated prefixes.  */
4750               switch (add_prefix (current_templates->start->base_opcode))
4751                 {
4752                 case PREFIX_EXIST:
4753                   return NULL;
4754                 case PREFIX_DS:
4755                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
4756                     i.notrack_prefix = current_templates->start->name;
4757                   break;
4758                 case PREFIX_REP:
4759                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
4760                     i.hle_prefix = current_templates->start->name;
4761                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4762                     i.bnd_prefix = current_templates->start->name;
4763                   else
4764                     i.rep_prefix = current_templates->start->name;
4765                   break;
4766                 default:
4767                   break;
4768                 }
4769             }
4770           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
4771           token_start = ++l;
4772         }
4773       else
4774         break;
4775     }
4776
4777   if (!current_templates)
4778     {
4779       /* Deprecated functionality (new code should use pseudo-prefixes instead):
4780          Check if we should swap operand or force 32bit displacement in
4781          encoding.  */
4782       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4783         i.dir_encoding = dir_encoding_swap;
4784       else if (mnem_p - 3 == dot_p
4785                && dot_p[1] == 'd'
4786                && dot_p[2] == '8')
4787         i.disp_encoding = disp_encoding_8bit;
4788       else if (mnem_p - 4 == dot_p
4789                && dot_p[1] == 'd'
4790                && dot_p[2] == '3'
4791                && dot_p[3] == '2')
4792         i.disp_encoding = disp_encoding_32bit;
4793       else
4794         goto check_suffix;
4795       mnem_p = dot_p;
4796       *dot_p = '\0';
4797       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4798     }
4799
4800   if (!current_templates)
4801     {
4802 check_suffix:
4803       if (mnem_p > mnemonic)
4804         {
4805           /* See if we can get a match by trimming off a suffix.  */
4806           switch (mnem_p[-1])
4807             {
4808             case WORD_MNEM_SUFFIX:
4809               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4810                 i.suffix = SHORT_MNEM_SUFFIX;
4811               else
4812                 /* Fall through.  */
4813               case BYTE_MNEM_SUFFIX:
4814               case QWORD_MNEM_SUFFIX:
4815                 i.suffix = mnem_p[-1];
4816               mnem_p[-1] = '\0';
4817               current_templates = (const templates *) hash_find (op_hash,
4818                                                                  mnemonic);
4819               break;
4820             case SHORT_MNEM_SUFFIX:
4821             case LONG_MNEM_SUFFIX:
4822               if (!intel_syntax)
4823                 {
4824                   i.suffix = mnem_p[-1];
4825                   mnem_p[-1] = '\0';
4826                   current_templates = (const templates *) hash_find (op_hash,
4827                                                                      mnemonic);
4828                 }
4829               break;
4830
4831               /* Intel Syntax.  */
4832             case 'd':
4833               if (intel_syntax)
4834                 {
4835                   if (intel_float_operand (mnemonic) == 1)
4836                     i.suffix = SHORT_MNEM_SUFFIX;
4837                   else
4838                     i.suffix = LONG_MNEM_SUFFIX;
4839                   mnem_p[-1] = '\0';
4840                   current_templates = (const templates *) hash_find (op_hash,
4841                                                                      mnemonic);
4842                 }
4843               break;
4844             }
4845         }
4846
4847       if (!current_templates)
4848         {
4849           as_bad (_("no such instruction: `%s'"), token_start);
4850           return NULL;
4851         }
4852     }
4853
4854   if (current_templates->start->opcode_modifier.jump == JUMP
4855       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4856     {
4857       /* Check for a branch hint.  We allow ",pt" and ",pn" for
4858          predict taken and predict not taken respectively.
4859          I'm not sure that branch hints actually do anything on loop
4860          and jcxz insns (JumpByte) for current Pentium4 chips.  They
4861          may work in the future and it doesn't hurt to accept them
4862          now.  */
4863       if (l[0] == ',' && l[1] == 'p')
4864         {
4865           if (l[2] == 't')
4866             {
4867               if (!add_prefix (DS_PREFIX_OPCODE))
4868                 return NULL;
4869               l += 3;
4870             }
4871           else if (l[2] == 'n')
4872             {
4873               if (!add_prefix (CS_PREFIX_OPCODE))
4874                 return NULL;
4875               l += 3;
4876             }
4877         }
4878     }
4879   /* Any other comma loses.  */
4880   if (*l == ',')
4881     {
4882       as_bad (_("invalid character %s in mnemonic"),
4883               output_invalid (*l));
4884       return NULL;
4885     }
4886
4887   /* Check if instruction is supported on specified architecture.  */
4888   supported = 0;
4889   for (t = current_templates->start; t < current_templates->end; ++t)
4890     {
4891       supported |= cpu_flags_match (t);
4892       if (supported == CPU_FLAGS_PERFECT_MATCH)
4893         {
4894           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4895             as_warn (_("use .code16 to ensure correct addressing mode"));
4896
4897           return l;
4898         }
4899     }
4900
4901   if (!(supported & CPU_FLAGS_64BIT_MATCH))
4902     as_bad (flag_code == CODE_64BIT
4903             ? _("`%s' is not supported in 64-bit mode")
4904             : _("`%s' is only supported in 64-bit mode"),
4905             current_templates->start->name);
4906   else
4907     as_bad (_("`%s' is not supported on `%s%s'"),
4908             current_templates->start->name,
4909             cpu_arch_name ? cpu_arch_name : default_arch,
4910             cpu_sub_arch_name ? cpu_sub_arch_name : "");
4911
4912   return NULL;
4913 }
4914
4915 static char *
4916 parse_operands (char *l, const char *mnemonic)
4917 {
4918   char *token_start;
4919
4920   /* 1 if operand is pending after ','.  */
4921   unsigned int expecting_operand = 0;
4922
4923   /* Non-zero if operand parens not balanced.  */
4924   unsigned int paren_not_balanced;
4925
4926   while (*l != END_OF_INSN)
4927     {
4928       /* Skip optional white space before operand.  */
4929       if (is_space_char (*l))
4930         ++l;
4931       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4932         {
4933           as_bad (_("invalid character %s before operand %d"),
4934                   output_invalid (*l),
4935                   i.operands + 1);
4936           return NULL;
4937         }
4938       token_start = l;  /* After white space.  */
4939       paren_not_balanced = 0;
4940       while (paren_not_balanced || *l != ',')
4941         {
4942           if (*l == END_OF_INSN)
4943             {
4944               if (paren_not_balanced)
4945                 {
4946                   if (!intel_syntax)
4947                     as_bad (_("unbalanced parenthesis in operand %d."),
4948                             i.operands + 1);
4949                   else
4950                     as_bad (_("unbalanced brackets in operand %d."),
4951                             i.operands + 1);
4952                   return NULL;
4953                 }
4954               else
4955                 break;  /* we are done */
4956             }
4957           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4958             {
4959               as_bad (_("invalid character %s in operand %d"),
4960                       output_invalid (*l),
4961                       i.operands + 1);
4962               return NULL;
4963             }
4964           if (!intel_syntax)
4965             {
4966               if (*l == '(')
4967                 ++paren_not_balanced;
4968               if (*l == ')')
4969                 --paren_not_balanced;
4970             }
4971           else
4972             {
4973               if (*l == '[')
4974                 ++paren_not_balanced;
4975               if (*l == ']')
4976                 --paren_not_balanced;
4977             }
4978           l++;
4979         }
4980       if (l != token_start)
4981         {                       /* Yes, we've read in another operand.  */
4982           unsigned int operand_ok;
4983           this_operand = i.operands++;
4984           if (i.operands > MAX_OPERANDS)
4985             {
4986               as_bad (_("spurious operands; (%d operands/instruction max)"),
4987                       MAX_OPERANDS);
4988               return NULL;
4989             }
4990           i.types[this_operand].bitfield.unspecified = 1;
4991           /* Now parse operand adding info to 'i' as we go along.  */
4992           END_STRING_AND_SAVE (l);
4993
4994           if (i.mem_operands > 1)
4995             {
4996               as_bad (_("too many memory references for `%s'"),
4997                       mnemonic);
4998               return 0;
4999             }
5000
5001           if (intel_syntax)
5002             operand_ok =
5003               i386_intel_operand (token_start,
5004                                   intel_float_operand (mnemonic));
5005           else
5006             operand_ok = i386_att_operand (token_start);
5007
5008           RESTORE_END_STRING (l);
5009           if (!operand_ok)
5010             return NULL;
5011         }
5012       else
5013         {
5014           if (expecting_operand)
5015             {
5016             expecting_operand_after_comma:
5017               as_bad (_("expecting operand after ','; got nothing"));
5018               return NULL;
5019             }
5020           if (*l == ',')
5021             {
5022               as_bad (_("expecting operand before ','; got nothing"));
5023               return NULL;
5024             }
5025         }
5026
5027       /* Now *l must be either ',' or END_OF_INSN.  */
5028       if (*l == ',')
5029         {
5030           if (*++l == END_OF_INSN)
5031             {
5032               /* Just skip it, if it's \n complain.  */
5033               goto expecting_operand_after_comma;
5034             }
5035           expecting_operand = 1;
5036         }
5037     }
5038   return l;
5039 }
5040
5041 static void
5042 swap_2_operands (int xchg1, int xchg2)
5043 {
5044   union i386_op temp_op;
5045   i386_operand_type temp_type;
5046   unsigned int temp_flags;
5047   enum bfd_reloc_code_real temp_reloc;
5048
5049   temp_type = i.types[xchg2];
5050   i.types[xchg2] = i.types[xchg1];
5051   i.types[xchg1] = temp_type;
5052
5053   temp_flags = i.flags[xchg2];
5054   i.flags[xchg2] = i.flags[xchg1];
5055   i.flags[xchg1] = temp_flags;
5056
5057   temp_op = i.op[xchg2];
5058   i.op[xchg2] = i.op[xchg1];
5059   i.op[xchg1] = temp_op;
5060
5061   temp_reloc = i.reloc[xchg2];
5062   i.reloc[xchg2] = i.reloc[xchg1];
5063   i.reloc[xchg1] = temp_reloc;
5064
5065   if (i.mask)
5066     {
5067       if (i.mask->operand == xchg1)
5068         i.mask->operand = xchg2;
5069       else if (i.mask->operand == xchg2)
5070         i.mask->operand = xchg1;
5071     }
5072   if (i.broadcast)
5073     {
5074       if (i.broadcast->operand == xchg1)
5075         i.broadcast->operand = xchg2;
5076       else if (i.broadcast->operand == xchg2)
5077         i.broadcast->operand = xchg1;
5078     }
5079   if (i.rounding)
5080     {
5081       if (i.rounding->operand == xchg1)
5082         i.rounding->operand = xchg2;
5083       else if (i.rounding->operand == xchg2)
5084         i.rounding->operand = xchg1;
5085     }
5086 }
5087
5088 static void
5089 swap_operands (void)
5090 {
5091   switch (i.operands)
5092     {
5093     case 5:
5094     case 4:
5095       swap_2_operands (1, i.operands - 2);
5096       /* Fall through.  */
5097     case 3:
5098     case 2:
5099       swap_2_operands (0, i.operands - 1);
5100       break;
5101     default:
5102       abort ();
5103     }
5104
5105   if (i.mem_operands == 2)
5106     {
5107       const seg_entry *temp_seg;
5108       temp_seg = i.seg[0];
5109       i.seg[0] = i.seg[1];
5110       i.seg[1] = temp_seg;
5111     }
5112 }
5113
5114 /* Try to ensure constant immediates are represented in the smallest
5115    opcode possible.  */
5116 static void
5117 optimize_imm (void)
5118 {
5119   char guess_suffix = 0;
5120   int op;
5121
5122   if (i.suffix)
5123     guess_suffix = i.suffix;
5124   else if (i.reg_operands)
5125     {
5126       /* Figure out a suffix from the last register operand specified.
5127          We can't do this properly yet, i.e. excluding special register
5128          instances, but the following works for instructions with
5129          immediates.  In any case, we can't set i.suffix yet.  */
5130       for (op = i.operands; --op >= 0;)
5131         if (i.types[op].bitfield.class != Reg)
5132           continue;
5133         else if (i.types[op].bitfield.byte)
5134           {
5135             guess_suffix = BYTE_MNEM_SUFFIX;
5136             break;
5137           }
5138         else if (i.types[op].bitfield.word)
5139           {
5140             guess_suffix = WORD_MNEM_SUFFIX;
5141             break;
5142           }
5143         else if (i.types[op].bitfield.dword)
5144           {
5145             guess_suffix = LONG_MNEM_SUFFIX;
5146             break;
5147           }
5148         else if (i.types[op].bitfield.qword)
5149           {
5150             guess_suffix = QWORD_MNEM_SUFFIX;
5151             break;
5152           }
5153     }
5154   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5155     guess_suffix = WORD_MNEM_SUFFIX;
5156
5157   for (op = i.operands; --op >= 0;)
5158     if (operand_type_check (i.types[op], imm))
5159       {
5160         switch (i.op[op].imms->X_op)
5161           {
5162           case O_constant:
5163             /* If a suffix is given, this operand may be shortened.  */
5164             switch (guess_suffix)
5165               {
5166               case LONG_MNEM_SUFFIX:
5167                 i.types[op].bitfield.imm32 = 1;
5168                 i.types[op].bitfield.imm64 = 1;
5169                 break;
5170               case WORD_MNEM_SUFFIX:
5171                 i.types[op].bitfield.imm16 = 1;
5172                 i.types[op].bitfield.imm32 = 1;
5173                 i.types[op].bitfield.imm32s = 1;
5174                 i.types[op].bitfield.imm64 = 1;
5175                 break;
5176               case BYTE_MNEM_SUFFIX:
5177                 i.types[op].bitfield.imm8 = 1;
5178                 i.types[op].bitfield.imm8s = 1;
5179                 i.types[op].bitfield.imm16 = 1;
5180                 i.types[op].bitfield.imm32 = 1;
5181                 i.types[op].bitfield.imm32s = 1;
5182                 i.types[op].bitfield.imm64 = 1;
5183                 break;
5184               }
5185
5186             /* If this operand is at most 16 bits, convert it
5187                to a signed 16 bit number before trying to see
5188                whether it will fit in an even smaller size.
5189                This allows a 16-bit operand such as $0xffe0 to
5190                be recognised as within Imm8S range.  */
5191             if ((i.types[op].bitfield.imm16)
5192                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5193               {
5194                 i.op[op].imms->X_add_number =
5195                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5196               }
5197 #ifdef BFD64
5198             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5199             if ((i.types[op].bitfield.imm32)
5200                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5201                     == 0))
5202               {
5203                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5204                                                 ^ ((offsetT) 1 << 31))
5205                                                - ((offsetT) 1 << 31));
5206               }
5207 #endif
5208             i.types[op]
5209               = operand_type_or (i.types[op],
5210                                  smallest_imm_type (i.op[op].imms->X_add_number));
5211
5212             /* We must avoid matching of Imm32 templates when 64bit
5213                only immediate is available.  */
5214             if (guess_suffix == QWORD_MNEM_SUFFIX)
5215               i.types[op].bitfield.imm32 = 0;
5216             break;
5217
5218           case O_absent:
5219           case O_register:
5220             abort ();
5221
5222             /* Symbols and expressions.  */
5223           default:
5224             /* Convert symbolic operand to proper sizes for matching, but don't
5225                prevent matching a set of insns that only supports sizes other
5226                than those matching the insn suffix.  */
5227             {
5228               i386_operand_type mask, allowed;
5229               const insn_template *t;
5230
5231               operand_type_set (&mask, 0);
5232               operand_type_set (&allowed, 0);
5233
5234               for (t = current_templates->start;
5235                    t < current_templates->end;
5236                    ++t)
5237                 {
5238                   allowed = operand_type_or (allowed, t->operand_types[op]);
5239                   allowed = operand_type_and (allowed, anyimm);
5240                 }
5241               switch (guess_suffix)
5242                 {
5243                 case QWORD_MNEM_SUFFIX:
5244                   mask.bitfield.imm64 = 1;
5245                   mask.bitfield.imm32s = 1;
5246                   break;
5247                 case LONG_MNEM_SUFFIX:
5248                   mask.bitfield.imm32 = 1;
5249                   break;
5250                 case WORD_MNEM_SUFFIX:
5251                   mask.bitfield.imm16 = 1;
5252                   break;
5253                 case BYTE_MNEM_SUFFIX:
5254                   mask.bitfield.imm8 = 1;
5255                   break;
5256                 default:
5257                   break;
5258                 }
5259               allowed = operand_type_and (mask, allowed);
5260               if (!operand_type_all_zero (&allowed))
5261                 i.types[op] = operand_type_and (i.types[op], mask);
5262             }
5263             break;
5264           }
5265       }
5266 }
5267
5268 /* Try to use the smallest displacement type too.  */
5269 static void
5270 optimize_disp (void)
5271 {
5272   int op;
5273
5274   for (op = i.operands; --op >= 0;)
5275     if (operand_type_check (i.types[op], disp))
5276       {
5277         if (i.op[op].disps->X_op == O_constant)
5278           {
5279             offsetT op_disp = i.op[op].disps->X_add_number;
5280
5281             if (i.types[op].bitfield.disp16
5282                 && (op_disp & ~(offsetT) 0xffff) == 0)
5283               {
5284                 /* If this operand is at most 16 bits, convert
5285                    to a signed 16 bit number and don't use 64bit
5286                    displacement.  */
5287                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5288                 i.types[op].bitfield.disp64 = 0;
5289               }
5290 #ifdef BFD64
5291             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5292             if (i.types[op].bitfield.disp32
5293                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5294               {
5295                 /* If this operand is at most 32 bits, convert
5296                    to a signed 32 bit number and don't use 64bit
5297                    displacement.  */
5298                 op_disp &= (((offsetT) 2 << 31) - 1);
5299                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5300                 i.types[op].bitfield.disp64 = 0;
5301               }
5302 #endif
5303             if (!op_disp && i.types[op].bitfield.baseindex)
5304               {
5305                 i.types[op].bitfield.disp8 = 0;
5306                 i.types[op].bitfield.disp16 = 0;
5307                 i.types[op].bitfield.disp32 = 0;
5308                 i.types[op].bitfield.disp32s = 0;
5309                 i.types[op].bitfield.disp64 = 0;
5310                 i.op[op].disps = 0;
5311                 i.disp_operands--;
5312               }
5313             else if (flag_code == CODE_64BIT)
5314               {
5315                 if (fits_in_signed_long (op_disp))
5316                   {
5317                     i.types[op].bitfield.disp64 = 0;
5318                     i.types[op].bitfield.disp32s = 1;
5319                   }
5320                 if (i.prefix[ADDR_PREFIX]
5321                     && fits_in_unsigned_long (op_disp))
5322                   i.types[op].bitfield.disp32 = 1;
5323               }
5324             if ((i.types[op].bitfield.disp32
5325                  || i.types[op].bitfield.disp32s
5326                  || i.types[op].bitfield.disp16)
5327                 && fits_in_disp8 (op_disp))
5328               i.types[op].bitfield.disp8 = 1;
5329           }
5330         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5331                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5332           {
5333             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5334                          i.op[op].disps, 0, i.reloc[op]);
5335             i.types[op].bitfield.disp8 = 0;
5336             i.types[op].bitfield.disp16 = 0;
5337             i.types[op].bitfield.disp32 = 0;
5338             i.types[op].bitfield.disp32s = 0;
5339             i.types[op].bitfield.disp64 = 0;
5340           }
5341         else
5342           /* We only support 64bit displacement on constants.  */
5343           i.types[op].bitfield.disp64 = 0;
5344       }
5345 }
5346
5347 /* Return 1 if there is a match in broadcast bytes between operand
5348    GIVEN and instruction template T.   */
5349
5350 static INLINE int
5351 match_broadcast_size (const insn_template *t, unsigned int given)
5352 {
5353   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5354            && i.types[given].bitfield.byte)
5355           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5356               && i.types[given].bitfield.word)
5357           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5358               && i.types[given].bitfield.dword)
5359           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5360               && i.types[given].bitfield.qword));
5361 }
5362
5363 /* Check if operands are valid for the instruction.  */
5364
5365 static int
5366 check_VecOperands (const insn_template *t)
5367 {
5368   unsigned int op;
5369   i386_cpu_flags cpu;
5370   static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5371
5372   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5373      any one operand are implicity requiring AVX512VL support if the actual
5374      operand size is YMMword or XMMword.  Since this function runs after
5375      template matching, there's no need to check for YMMword/XMMword in
5376      the template.  */
5377   cpu = cpu_flags_and (t->cpu_flags, avx512);
5378   if (!cpu_flags_all_zero (&cpu)
5379       && !t->cpu_flags.bitfield.cpuavx512vl
5380       && !cpu_arch_flags.bitfield.cpuavx512vl)
5381     {
5382       for (op = 0; op < t->operands; ++op)
5383         {
5384           if (t->operand_types[op].bitfield.zmmword
5385               && (i.types[op].bitfield.ymmword
5386                   || i.types[op].bitfield.xmmword))
5387             {
5388               i.error = unsupported;
5389               return 1;
5390             }
5391         }
5392     }
5393
5394   /* Without VSIB byte, we can't have a vector register for index.  */
5395   if (!t->opcode_modifier.vecsib
5396       && i.index_reg
5397       && (i.index_reg->reg_type.bitfield.xmmword
5398           || i.index_reg->reg_type.bitfield.ymmword
5399           || i.index_reg->reg_type.bitfield.zmmword))
5400     {
5401       i.error = unsupported_vector_index_register;
5402       return 1;
5403     }
5404
5405   /* Check if default mask is allowed.  */
5406   if (t->opcode_modifier.nodefmask
5407       && (!i.mask || i.mask->mask->reg_num == 0))
5408     {
5409       i.error = no_default_mask;
5410       return 1;
5411     }
5412
5413   /* For VSIB byte, we need a vector register for index, and all vector
5414      registers must be distinct.  */
5415   if (t->opcode_modifier.vecsib)
5416     {
5417       if (!i.index_reg
5418           || !((t->opcode_modifier.vecsib == VecSIB128
5419                 && i.index_reg->reg_type.bitfield.xmmword)
5420                || (t->opcode_modifier.vecsib == VecSIB256
5421                    && i.index_reg->reg_type.bitfield.ymmword)
5422                || (t->opcode_modifier.vecsib == VecSIB512
5423                    && i.index_reg->reg_type.bitfield.zmmword)))
5424       {
5425         i.error = invalid_vsib_address;
5426         return 1;
5427       }
5428
5429       gas_assert (i.reg_operands == 2 || i.mask);
5430       if (i.reg_operands == 2 && !i.mask)
5431         {
5432           gas_assert (i.types[0].bitfield.class == RegSIMD);
5433           gas_assert (i.types[0].bitfield.xmmword
5434                       || i.types[0].bitfield.ymmword);
5435           gas_assert (i.types[2].bitfield.class == RegSIMD);
5436           gas_assert (i.types[2].bitfield.xmmword
5437                       || i.types[2].bitfield.ymmword);
5438           if (operand_check == check_none)
5439             return 0;
5440           if (register_number (i.op[0].regs)
5441               != register_number (i.index_reg)
5442               && register_number (i.op[2].regs)
5443                  != register_number (i.index_reg)
5444               && register_number (i.op[0].regs)
5445                  != register_number (i.op[2].regs))
5446             return 0;
5447           if (operand_check == check_error)
5448             {
5449               i.error = invalid_vector_register_set;
5450               return 1;
5451             }
5452           as_warn (_("mask, index, and destination registers should be distinct"));
5453         }
5454       else if (i.reg_operands == 1 && i.mask)
5455         {
5456           if (i.types[1].bitfield.class == RegSIMD
5457               && (i.types[1].bitfield.xmmword
5458                   || i.types[1].bitfield.ymmword
5459                   || i.types[1].bitfield.zmmword)
5460               && (register_number (i.op[1].regs)
5461                   == register_number (i.index_reg)))
5462             {
5463               if (operand_check == check_error)
5464                 {
5465                   i.error = invalid_vector_register_set;
5466                   return 1;
5467                 }
5468               if (operand_check != check_none)
5469                 as_warn (_("index and destination registers should be distinct"));
5470             }
5471         }
5472     }
5473
5474   /* Check if broadcast is supported by the instruction and is applied
5475      to the memory operand.  */
5476   if (i.broadcast)
5477     {
5478       i386_operand_type type, overlap;
5479
5480       /* Check if specified broadcast is supported in this instruction,
5481          and its broadcast bytes match the memory operand.  */
5482       op = i.broadcast->operand;
5483       if (!t->opcode_modifier.broadcast
5484           || !(i.flags[op] & Operand_Mem)
5485           || (!i.types[op].bitfield.unspecified
5486               && !match_broadcast_size (t, op)))
5487         {
5488         bad_broadcast:
5489           i.error = unsupported_broadcast;
5490           return 1;
5491         }
5492
5493       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5494                             * i.broadcast->type);
5495       operand_type_set (&type, 0);
5496       switch (i.broadcast->bytes)
5497         {
5498         case 2:
5499           type.bitfield.word = 1;
5500           break;
5501         case 4:
5502           type.bitfield.dword = 1;
5503           break;
5504         case 8:
5505           type.bitfield.qword = 1;
5506           break;
5507         case 16:
5508           type.bitfield.xmmword = 1;
5509           break;
5510         case 32:
5511           type.bitfield.ymmword = 1;
5512           break;
5513         case 64:
5514           type.bitfield.zmmword = 1;
5515           break;
5516         default:
5517           goto bad_broadcast;
5518         }
5519
5520       overlap = operand_type_and (type, t->operand_types[op]);
5521       if (operand_type_all_zero (&overlap))
5522           goto bad_broadcast;
5523
5524       if (t->opcode_modifier.checkregsize)
5525         {
5526           unsigned int j;
5527
5528           type.bitfield.baseindex = 1;
5529           for (j = 0; j < i.operands; ++j)
5530             {
5531               if (j != op
5532                   && !operand_type_register_match(i.types[j],
5533                                                   t->operand_types[j],
5534                                                   type,
5535                                                   t->operand_types[op]))
5536                 goto bad_broadcast;
5537             }
5538         }
5539     }
5540   /* If broadcast is supported in this instruction, we need to check if
5541      operand of one-element size isn't specified without broadcast.  */
5542   else if (t->opcode_modifier.broadcast && i.mem_operands)
5543     {
5544       /* Find memory operand.  */
5545       for (op = 0; op < i.operands; op++)
5546         if (i.flags[op] & Operand_Mem)
5547           break;
5548       gas_assert (op < i.operands);
5549       /* Check size of the memory operand.  */
5550       if (match_broadcast_size (t, op))
5551         {
5552           i.error = broadcast_needed;
5553           return 1;
5554         }
5555     }
5556   else
5557     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5558
5559   /* Check if requested masking is supported.  */
5560   if (i.mask)
5561     {
5562       switch (t->opcode_modifier.masking)
5563         {
5564         case BOTH_MASKING:
5565           break;
5566         case MERGING_MASKING:
5567           if (i.mask->zeroing)
5568             {
5569         case 0:
5570               i.error = unsupported_masking;
5571               return 1;
5572             }
5573           break;
5574         case DYNAMIC_MASKING:
5575           /* Memory destinations allow only merging masking.  */
5576           if (i.mask->zeroing && i.mem_operands)
5577             {
5578               /* Find memory operand.  */
5579               for (op = 0; op < i.operands; op++)
5580                 if (i.flags[op] & Operand_Mem)
5581                   break;
5582               gas_assert (op < i.operands);
5583               if (op == i.operands - 1)
5584                 {
5585                   i.error = unsupported_masking;
5586                   return 1;
5587                 }
5588             }
5589           break;
5590         default:
5591           abort ();
5592         }
5593     }
5594
5595   /* Check if masking is applied to dest operand.  */
5596   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5597     {
5598       i.error = mask_not_on_destination;
5599       return 1;
5600     }
5601
5602   /* Check RC/SAE.  */
5603   if (i.rounding)
5604     {
5605       if (!t->opcode_modifier.sae
5606           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5607         {
5608           i.error = unsupported_rc_sae;
5609           return 1;
5610         }
5611       /* If the instruction has several immediate operands and one of
5612          them is rounding, the rounding operand should be the last
5613          immediate operand.  */
5614       if (i.imm_operands > 1
5615           && i.rounding->operand != (int) (i.imm_operands - 1))
5616         {
5617           i.error = rc_sae_operand_not_last_imm;
5618           return 1;
5619         }
5620     }
5621
5622   /* Check vector Disp8 operand.  */
5623   if (t->opcode_modifier.disp8memshift
5624       && i.disp_encoding != disp_encoding_32bit)
5625     {
5626       if (i.broadcast)
5627         i.memshift = t->opcode_modifier.broadcast - 1;
5628       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5629         i.memshift = t->opcode_modifier.disp8memshift;
5630       else
5631         {
5632           const i386_operand_type *type = NULL;
5633
5634           i.memshift = 0;
5635           for (op = 0; op < i.operands; op++)
5636             if (i.flags[op] & Operand_Mem)
5637               {
5638                 if (t->opcode_modifier.evex == EVEXLIG)
5639                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5640                 else if (t->operand_types[op].bitfield.xmmword
5641                          + t->operand_types[op].bitfield.ymmword
5642                          + t->operand_types[op].bitfield.zmmword <= 1)
5643                   type = &t->operand_types[op];
5644                 else if (!i.types[op].bitfield.unspecified)
5645                   type = &i.types[op];
5646               }
5647             else if (i.types[op].bitfield.class == RegSIMD
5648                      && t->opcode_modifier.evex != EVEXLIG)
5649               {
5650                 if (i.types[op].bitfield.zmmword)
5651                   i.memshift = 6;
5652                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5653                   i.memshift = 5;
5654                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5655                   i.memshift = 4;
5656               }
5657
5658           if (type)
5659             {
5660               if (type->bitfield.zmmword)
5661                 i.memshift = 6;
5662               else if (type->bitfield.ymmword)
5663                 i.memshift = 5;
5664               else if (type->bitfield.xmmword)
5665                 i.memshift = 4;
5666             }
5667
5668           /* For the check in fits_in_disp8().  */
5669           if (i.memshift == 0)
5670             i.memshift = -1;
5671         }
5672
5673       for (op = 0; op < i.operands; op++)
5674         if (operand_type_check (i.types[op], disp)
5675             && i.op[op].disps->X_op == O_constant)
5676           {
5677             if (fits_in_disp8 (i.op[op].disps->X_add_number))
5678               {
5679                 i.types[op].bitfield.disp8 = 1;
5680                 return 0;
5681               }
5682             i.types[op].bitfield.disp8 = 0;
5683           }
5684     }
5685
5686   i.memshift = 0;
5687
5688   return 0;
5689 }
5690
5691 /* Check if operands are valid for the instruction.  Update VEX
5692    operand types.  */
5693
5694 static int
5695 VEX_check_operands (const insn_template *t)
5696 {
5697   if (i.vec_encoding == vex_encoding_evex)
5698     {
5699       /* This instruction must be encoded with EVEX prefix.  */
5700       if (!is_evex_encoding (t))
5701         {
5702           i.error = unsupported;
5703           return 1;
5704         }
5705       return 0;
5706     }
5707
5708   if (!t->opcode_modifier.vex)
5709     {
5710       /* This instruction template doesn't have VEX prefix.  */
5711       if (i.vec_encoding != vex_encoding_default)
5712         {
5713           i.error = unsupported;
5714           return 1;
5715         }
5716       return 0;
5717     }
5718
5719   /* Check the special Imm4 cases; must be the first operand.  */
5720   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5721     {
5722       if (i.op[0].imms->X_op != O_constant
5723           || !fits_in_imm4 (i.op[0].imms->X_add_number))
5724         {
5725           i.error = bad_imm4;
5726           return 1;
5727         }
5728
5729       /* Turn off Imm<N> so that update_imm won't complain.  */
5730       operand_type_set (&i.types[0], 0);
5731     }
5732
5733   return 0;
5734 }
5735
5736 static const insn_template *
5737 match_template (char mnem_suffix)
5738 {
5739   /* Points to template once we've found it.  */
5740   const insn_template *t;
5741   i386_operand_type overlap0, overlap1, overlap2, overlap3;
5742   i386_operand_type overlap4;
5743   unsigned int found_reverse_match;
5744   i386_opcode_modifier suffix_check;
5745   i386_operand_type operand_types [MAX_OPERANDS];
5746   int addr_prefix_disp;
5747   unsigned int j;
5748   unsigned int found_cpu_match, size_match;
5749   unsigned int check_register;
5750   enum i386_error specific_error = 0;
5751
5752 #if MAX_OPERANDS != 5
5753 # error "MAX_OPERANDS must be 5."
5754 #endif
5755
5756   found_reverse_match = 0;
5757   addr_prefix_disp = -1;
5758
5759   /* Prepare for mnemonic suffix check.  */
5760   memset (&suffix_check, 0, sizeof (suffix_check));
5761   switch (mnem_suffix)
5762     {
5763     case BYTE_MNEM_SUFFIX:
5764       suffix_check.no_bsuf = 1;
5765       break;
5766     case WORD_MNEM_SUFFIX:
5767       suffix_check.no_wsuf = 1;
5768       break;
5769     case SHORT_MNEM_SUFFIX:
5770       suffix_check.no_ssuf = 1;
5771       break;
5772     case LONG_MNEM_SUFFIX:
5773       suffix_check.no_lsuf = 1;
5774       break;
5775     case QWORD_MNEM_SUFFIX:
5776       suffix_check.no_qsuf = 1;
5777       break;
5778     default:
5779       /* NB: In Intel syntax, normally we can check for memory operand
5780          size when there is no mnemonic suffix.  But jmp and call have
5781          2 different encodings with Dword memory operand size, one with
5782          No_ldSuf and the other without.  i.suffix is set to
5783          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
5784       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5785         suffix_check.no_ldsuf = 1;
5786     }
5787
5788   /* Must have right number of operands.  */
5789   i.error = number_of_operands_mismatch;
5790
5791   for (t = current_templates->start; t < current_templates->end; t++)
5792     {
5793       addr_prefix_disp = -1;
5794       found_reverse_match = 0;
5795
5796       if (i.operands != t->operands)
5797         continue;
5798
5799       /* Check processor support.  */
5800       i.error = unsupported;
5801       found_cpu_match = (cpu_flags_match (t)
5802                          == CPU_FLAGS_PERFECT_MATCH);
5803       if (!found_cpu_match)
5804         continue;
5805
5806       /* Check AT&T mnemonic.   */
5807       i.error = unsupported_with_intel_mnemonic;
5808       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5809         continue;
5810
5811       /* Check AT&T/Intel syntax and Intel64/AMD64 ISA.   */
5812       i.error = unsupported_syntax;
5813       if ((intel_syntax && t->opcode_modifier.attsyntax)
5814           || (!intel_syntax && t->opcode_modifier.intelsyntax)
5815           || (intel64 && t->opcode_modifier.amd64)
5816           || (!intel64 && t->opcode_modifier.intel64))
5817         continue;
5818
5819       /* Check the suffix.  */
5820       i.error = invalid_instruction_suffix;
5821       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5822           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5823           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5824           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5825           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5826           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5827         continue;
5828
5829       size_match = operand_size_match (t);
5830       if (!size_match)
5831         continue;
5832
5833       /* This is intentionally not
5834
5835          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5836
5837          as the case of a missing * on the operand is accepted (perhaps with
5838          a warning, issued further down).  */
5839       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5840         {
5841           i.error = operand_type_mismatch;
5842           continue;
5843         }
5844
5845       for (j = 0; j < MAX_OPERANDS; j++)
5846         operand_types[j] = t->operand_types[j];
5847
5848       /* In general, don't allow 64-bit operands in 32-bit mode.  */
5849       if (i.suffix == QWORD_MNEM_SUFFIX
5850           && flag_code != CODE_64BIT
5851           && (intel_syntax
5852               ? (!t->opcode_modifier.ignoresize
5853                  && !t->opcode_modifier.broadcast
5854                  && !intel_float_operand (t->name))
5855               : intel_float_operand (t->name) != 2)
5856           && ((operand_types[0].bitfield.class != RegMMX
5857                && operand_types[0].bitfield.class != RegSIMD)
5858               || (operand_types[t->operands > 1].bitfield.class != RegMMX
5859                   && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5860           && (t->base_opcode != 0x0fc7
5861               || t->extension_opcode != 1 /* cmpxchg8b */))
5862         continue;
5863
5864       /* In general, don't allow 32-bit operands on pre-386.  */
5865       else if (i.suffix == LONG_MNEM_SUFFIX
5866                && !cpu_arch_flags.bitfield.cpui386
5867                && (intel_syntax
5868                    ? (!t->opcode_modifier.ignoresize
5869                       && !intel_float_operand (t->name))
5870                    : intel_float_operand (t->name) != 2)
5871                && ((operand_types[0].bitfield.class != RegMMX
5872                     && operand_types[0].bitfield.class != RegSIMD)
5873                    || (operand_types[t->operands > 1].bitfield.class != RegMMX
5874                        && operand_types[t->operands > 1].bitfield.class
5875                           != RegSIMD)))
5876         continue;
5877
5878       /* Do not verify operands when there are none.  */
5879       else
5880         {
5881           if (!t->operands)
5882             /* We've found a match; break out of loop.  */
5883             break;
5884         }
5885
5886       if (!t->opcode_modifier.jump
5887           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5888         {
5889           /* There should be only one Disp operand.  */
5890           for (j = 0; j < MAX_OPERANDS; j++)
5891             if (operand_type_check (operand_types[j], disp))
5892               break;
5893           if (j < MAX_OPERANDS)
5894             {
5895               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5896
5897               addr_prefix_disp = j;
5898
5899               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5900                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
5901               switch (flag_code)
5902                 {
5903                 case CODE_16BIT:
5904                   override = !override;
5905                   /* Fall through.  */
5906                 case CODE_32BIT:
5907                   if (operand_types[j].bitfield.disp32
5908                       && operand_types[j].bitfield.disp16)
5909                     {
5910                       operand_types[j].bitfield.disp16 = override;
5911                       operand_types[j].bitfield.disp32 = !override;
5912                     }
5913                   operand_types[j].bitfield.disp32s = 0;
5914                   operand_types[j].bitfield.disp64 = 0;
5915                   break;
5916
5917                 case CODE_64BIT:
5918                   if (operand_types[j].bitfield.disp32s
5919                       || operand_types[j].bitfield.disp64)
5920                     {
5921                       operand_types[j].bitfield.disp64 &= !override;
5922                       operand_types[j].bitfield.disp32s &= !override;
5923                       operand_types[j].bitfield.disp32 = override;
5924                     }
5925                   operand_types[j].bitfield.disp16 = 0;
5926                   break;
5927                 }
5928             }
5929         }
5930
5931       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
5932       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5933         continue;
5934
5935       /* We check register size if needed.  */
5936       if (t->opcode_modifier.checkregsize)
5937         {
5938           check_register = (1 << t->operands) - 1;
5939           if (i.broadcast)
5940             check_register &= ~(1 << i.broadcast->operand);
5941         }
5942       else
5943         check_register = 0;
5944
5945       overlap0 = operand_type_and (i.types[0], operand_types[0]);
5946       switch (t->operands)
5947         {
5948         case 1:
5949           if (!operand_type_match (overlap0, i.types[0]))
5950             continue;
5951           break;
5952         case 2:
5953           /* xchg %eax, %eax is a special case. It is an alias for nop
5954              only in 32bit mode and we can use opcode 0x90.  In 64bit
5955              mode, we can't use 0x90 for xchg %eax, %eax since it should
5956              zero-extend %eax to %rax.  */
5957           if (flag_code == CODE_64BIT
5958               && t->base_opcode == 0x90
5959               && i.types[0].bitfield.instance == Accum
5960               && i.types[0].bitfield.dword
5961               && i.types[1].bitfield.instance == Accum
5962               && i.types[1].bitfield.dword)
5963             continue;
5964           /* xrelease mov %eax, <disp> is another special case. It must not
5965              match the accumulator-only encoding of mov.  */
5966           if (flag_code != CODE_64BIT
5967               && i.hle_prefix
5968               && t->base_opcode == 0xa0
5969               && i.types[0].bitfield.instance == Accum
5970               && (i.flags[1] & Operand_Mem))
5971             continue;
5972           /* Fall through.  */
5973
5974         case 3:
5975           if (!(size_match & MATCH_STRAIGHT))
5976             goto check_reverse;
5977           /* Reverse direction of operands if swapping is possible in the first
5978              place (operands need to be symmetric) and
5979              - the load form is requested, and the template is a store form,
5980              - the store form is requested, and the template is a load form,
5981              - the non-default (swapped) form is requested.  */
5982           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5983           if (t->opcode_modifier.d && i.reg_operands == i.operands
5984               && !operand_type_all_zero (&overlap1))
5985             switch (i.dir_encoding)
5986               {
5987               case dir_encoding_load:
5988                 if (operand_type_check (operand_types[i.operands - 1], anymem)
5989                     || t->opcode_modifier.regmem)
5990                   goto check_reverse;
5991                 break;
5992
5993               case dir_encoding_store:
5994                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5995                     && !t->opcode_modifier.regmem)
5996                   goto check_reverse;
5997                 break;
5998
5999               case dir_encoding_swap:
6000                 goto check_reverse;
6001
6002               case dir_encoding_default:
6003                 break;
6004               }
6005           /* If we want store form, we skip the current load.  */
6006           if ((i.dir_encoding == dir_encoding_store
6007                || i.dir_encoding == dir_encoding_swap)
6008               && i.mem_operands == 0
6009               && t->opcode_modifier.load)
6010             continue;
6011           /* Fall through.  */
6012         case 4:
6013         case 5:
6014           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6015           if (!operand_type_match (overlap0, i.types[0])
6016               || !operand_type_match (overlap1, i.types[1])
6017               || ((check_register & 3) == 3
6018                   && !operand_type_register_match (i.types[0],
6019                                                    operand_types[0],
6020                                                    i.types[1],
6021                                                    operand_types[1])))
6022             {
6023               /* Check if other direction is valid ...  */
6024               if (!t->opcode_modifier.d)
6025                 continue;
6026
6027 check_reverse:
6028               if (!(size_match & MATCH_REVERSE))
6029                 continue;
6030               /* Try reversing direction of operands.  */
6031               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6032               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6033               if (!operand_type_match (overlap0, i.types[0])
6034                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6035                   || (check_register
6036                       && !operand_type_register_match (i.types[0],
6037                                                        operand_types[i.operands - 1],
6038                                                        i.types[i.operands - 1],
6039                                                        operand_types[0])))
6040                 {
6041                   /* Does not match either direction.  */
6042                   continue;
6043                 }
6044               /* found_reverse_match holds which of D or FloatR
6045                  we've found.  */
6046               if (!t->opcode_modifier.d)
6047                 found_reverse_match = 0;
6048               else if (operand_types[0].bitfield.tbyte)
6049                 found_reverse_match = Opcode_FloatD;
6050               else if (operand_types[0].bitfield.xmmword
6051                        || operand_types[i.operands - 1].bitfield.xmmword
6052                        || operand_types[0].bitfield.class == RegMMX
6053                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6054                        || is_any_vex_encoding(t))
6055                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6056                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6057               else
6058                 found_reverse_match = Opcode_D;
6059               if (t->opcode_modifier.floatr)
6060                 found_reverse_match |= Opcode_FloatR;
6061             }
6062           else
6063             {
6064               /* Found a forward 2 operand match here.  */
6065               switch (t->operands)
6066                 {
6067                 case 5:
6068                   overlap4 = operand_type_and (i.types[4],
6069                                                operand_types[4]);
6070                   /* Fall through.  */
6071                 case 4:
6072                   overlap3 = operand_type_and (i.types[3],
6073                                                operand_types[3]);
6074                   /* Fall through.  */
6075                 case 3:
6076                   overlap2 = operand_type_and (i.types[2],
6077                                                operand_types[2]);
6078                   break;
6079                 }
6080
6081               switch (t->operands)
6082                 {
6083                 case 5:
6084                   if (!operand_type_match (overlap4, i.types[4])
6085                       || !operand_type_register_match (i.types[3],
6086                                                        operand_types[3],
6087                                                        i.types[4],
6088                                                        operand_types[4]))
6089                     continue;
6090                   /* Fall through.  */
6091                 case 4:
6092                   if (!operand_type_match (overlap3, i.types[3])
6093                       || ((check_register & 0xa) == 0xa
6094                           && !operand_type_register_match (i.types[1],
6095                                                             operand_types[1],
6096                                                             i.types[3],
6097                                                             operand_types[3]))
6098                       || ((check_register & 0xc) == 0xc
6099                           && !operand_type_register_match (i.types[2],
6100                                                             operand_types[2],
6101                                                             i.types[3],
6102                                                             operand_types[3])))
6103                     continue;
6104                   /* Fall through.  */
6105                 case 3:
6106                   /* Here we make use of the fact that there are no
6107                      reverse match 3 operand instructions.  */
6108                   if (!operand_type_match (overlap2, i.types[2])
6109                       || ((check_register & 5) == 5
6110                           && !operand_type_register_match (i.types[0],
6111                                                             operand_types[0],
6112                                                             i.types[2],
6113                                                             operand_types[2]))
6114                       || ((check_register & 6) == 6
6115                           && !operand_type_register_match (i.types[1],
6116                                                             operand_types[1],
6117                                                             i.types[2],
6118                                                             operand_types[2])))
6119                     continue;
6120                   break;
6121                 }
6122             }
6123           /* Found either forward/reverse 2, 3 or 4 operand match here:
6124              slip through to break.  */
6125         }
6126       if (!found_cpu_match)
6127         continue;
6128
6129       /* Check if vector and VEX operands are valid.  */
6130       if (check_VecOperands (t) || VEX_check_operands (t))
6131         {
6132           specific_error = i.error;
6133           continue;
6134         }
6135
6136       /* We've found a match; break out of loop.  */
6137       break;
6138     }
6139
6140   if (t == current_templates->end)
6141     {
6142       /* We found no match.  */
6143       const char *err_msg;
6144       switch (specific_error ? specific_error : i.error)
6145         {
6146         default:
6147           abort ();
6148         case operand_size_mismatch:
6149           err_msg = _("operand size mismatch");
6150           break;
6151         case operand_type_mismatch:
6152           err_msg = _("operand type mismatch");
6153           break;
6154         case register_type_mismatch:
6155           err_msg = _("register type mismatch");
6156           break;
6157         case number_of_operands_mismatch:
6158           err_msg = _("number of operands mismatch");
6159           break;
6160         case invalid_instruction_suffix:
6161           err_msg = _("invalid instruction suffix");
6162           break;
6163         case bad_imm4:
6164           err_msg = _("constant doesn't fit in 4 bits");
6165           break;
6166         case unsupported_with_intel_mnemonic:
6167           err_msg = _("unsupported with Intel mnemonic");
6168           break;
6169         case unsupported_syntax:
6170           err_msg = _("unsupported syntax");
6171           break;
6172         case unsupported:
6173           as_bad (_("unsupported instruction `%s'"),
6174                   current_templates->start->name);
6175           return NULL;
6176         case invalid_vsib_address:
6177           err_msg = _("invalid VSIB address");
6178           break;
6179         case invalid_vector_register_set:
6180           err_msg = _("mask, index, and destination registers must be distinct");
6181           break;
6182         case unsupported_vector_index_register:
6183           err_msg = _("unsupported vector index register");
6184           break;
6185         case unsupported_broadcast:
6186           err_msg = _("unsupported broadcast");
6187           break;
6188         case broadcast_needed:
6189           err_msg = _("broadcast is needed for operand of such type");
6190           break;
6191         case unsupported_masking:
6192           err_msg = _("unsupported masking");
6193           break;
6194         case mask_not_on_destination:
6195           err_msg = _("mask not on destination operand");
6196           break;
6197         case no_default_mask:
6198           err_msg = _("default mask isn't allowed");
6199           break;
6200         case unsupported_rc_sae:
6201           err_msg = _("unsupported static rounding/sae");
6202           break;
6203         case rc_sae_operand_not_last_imm:
6204           if (intel_syntax)
6205             err_msg = _("RC/SAE operand must precede immediate operands");
6206           else
6207             err_msg = _("RC/SAE operand must follow immediate operands");
6208           break;
6209         case invalid_register_operand:
6210           err_msg = _("invalid register operand");
6211           break;
6212         }
6213       as_bad (_("%s for `%s'"), err_msg,
6214               current_templates->start->name);
6215       return NULL;
6216     }
6217
6218   if (!quiet_warnings)
6219     {
6220       if (!intel_syntax
6221           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6222         as_warn (_("indirect %s without `*'"), t->name);
6223
6224       if (t->opcode_modifier.isprefix
6225           && t->opcode_modifier.ignoresize)
6226         {
6227           /* Warn them that a data or address size prefix doesn't
6228              affect assembly of the next line of code.  */
6229           as_warn (_("stand-alone `%s' prefix"), t->name);
6230         }
6231     }
6232
6233   /* Copy the template we found.  */
6234   i.tm = *t;
6235
6236   if (addr_prefix_disp != -1)
6237     i.tm.operand_types[addr_prefix_disp]
6238       = operand_types[addr_prefix_disp];
6239
6240   if (found_reverse_match)
6241     {
6242       /* If we found a reverse match we must alter the opcode direction
6243          bit and clear/flip the regmem modifier one.  found_reverse_match
6244          holds bits to change (different for int & float insns).  */
6245
6246       i.tm.base_opcode ^= found_reverse_match;
6247
6248       i.tm.operand_types[0] = operand_types[i.operands - 1];
6249       i.tm.operand_types[i.operands - 1] = operand_types[0];
6250
6251       /* Certain SIMD insns have their load forms specified in the opcode
6252          table, and hence we need to _set_ RegMem instead of clearing it.
6253          We need to avoid setting the bit though on insns like KMOVW.  */
6254       i.tm.opcode_modifier.regmem
6255         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6256           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6257           && !i.tm.opcode_modifier.regmem;
6258     }
6259
6260   return t;
6261 }
6262
6263 static int
6264 check_string (void)
6265 {
6266   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6267   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6268
6269   if (i.seg[op] != NULL && i.seg[op] != &es)
6270     {
6271       as_bad (_("`%s' operand %u must use `%ses' segment"),
6272               i.tm.name,
6273               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6274               register_prefix);
6275       return 0;
6276     }
6277
6278   /* There's only ever one segment override allowed per instruction.
6279      This instruction possibly has a legal segment override on the
6280      second operand, so copy the segment to where non-string
6281      instructions store it, allowing common code.  */
6282   i.seg[op] = i.seg[1];
6283
6284   return 1;
6285 }
6286
6287 static int
6288 process_suffix (void)
6289 {
6290   /* If matched instruction specifies an explicit instruction mnemonic
6291      suffix, use it.  */
6292   if (i.tm.opcode_modifier.size == SIZE16)
6293     i.suffix = WORD_MNEM_SUFFIX;
6294   else if (i.tm.opcode_modifier.size == SIZE32)
6295     i.suffix = LONG_MNEM_SUFFIX;
6296   else if (i.tm.opcode_modifier.size == SIZE64)
6297     i.suffix = QWORD_MNEM_SUFFIX;
6298   else if (i.reg_operands
6299            && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6300     {
6301       /* If there's no instruction mnemonic suffix we try to invent one
6302          based on GPR operands.  */
6303       if (!i.suffix)
6304         {
6305           /* We take i.suffix from the last register operand specified,
6306              Destination register type is more significant than source
6307              register type.  crc32 in SSE4.2 prefers source register
6308              type. */
6309           if (i.tm.base_opcode == 0xf20f38f0
6310               && i.types[0].bitfield.class == Reg)
6311             {
6312               if (i.types[0].bitfield.byte)
6313                 i.suffix = BYTE_MNEM_SUFFIX;
6314               else if (i.types[0].bitfield.word)
6315                 i.suffix = WORD_MNEM_SUFFIX;
6316               else if (i.types[0].bitfield.dword)
6317                 i.suffix = LONG_MNEM_SUFFIX;
6318               else if (i.types[0].bitfield.qword)
6319                 i.suffix = QWORD_MNEM_SUFFIX;
6320             }
6321
6322           if (!i.suffix)
6323             {
6324               int op;
6325
6326               if (i.tm.base_opcode == 0xf20f38f0)
6327                 {
6328                   /* We have to know the operand size for crc32.  */
6329                   as_bad (_("ambiguous memory operand size for `%s`"),
6330                           i.tm.name);
6331                   return 0;
6332                 }
6333
6334               for (op = i.operands; --op >= 0;)
6335                 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6336                     || i.tm.operand_types[op].bitfield.instance == Accum)
6337                   {
6338                     if (i.types[op].bitfield.class != Reg)
6339                       continue;
6340                     if (i.types[op].bitfield.byte)
6341                       i.suffix = BYTE_MNEM_SUFFIX;
6342                     else if (i.types[op].bitfield.word)
6343                       i.suffix = WORD_MNEM_SUFFIX;
6344                     else if (i.types[op].bitfield.dword)
6345                       i.suffix = LONG_MNEM_SUFFIX;
6346                     else if (i.types[op].bitfield.qword)
6347                       i.suffix = QWORD_MNEM_SUFFIX;
6348                     else
6349                       continue;
6350                     break;
6351                   }
6352             }
6353         }
6354       else if (i.suffix == BYTE_MNEM_SUFFIX)
6355         {
6356           if (intel_syntax
6357               && i.tm.opcode_modifier.ignoresize
6358               && i.tm.opcode_modifier.no_bsuf)
6359             i.suffix = 0;
6360           else if (!check_byte_reg ())
6361             return 0;
6362         }
6363       else if (i.suffix == LONG_MNEM_SUFFIX)
6364         {
6365           if (intel_syntax
6366               && i.tm.opcode_modifier.ignoresize
6367               && i.tm.opcode_modifier.no_lsuf
6368               && !i.tm.opcode_modifier.todword
6369               && !i.tm.opcode_modifier.toqword)
6370             i.suffix = 0;
6371           else if (!check_long_reg ())
6372             return 0;
6373         }
6374       else if (i.suffix == QWORD_MNEM_SUFFIX)
6375         {
6376           if (intel_syntax
6377               && i.tm.opcode_modifier.ignoresize
6378               && i.tm.opcode_modifier.no_qsuf
6379               && !i.tm.opcode_modifier.todword
6380               && !i.tm.opcode_modifier.toqword)
6381             i.suffix = 0;
6382           else if (!check_qword_reg ())
6383             return 0;
6384         }
6385       else if (i.suffix == WORD_MNEM_SUFFIX)
6386         {
6387           if (intel_syntax
6388               && i.tm.opcode_modifier.ignoresize
6389               && i.tm.opcode_modifier.no_wsuf)
6390             i.suffix = 0;
6391           else if (!check_word_reg ())
6392             return 0;
6393         }
6394       else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6395         /* Do nothing if the instruction is going to ignore the prefix.  */
6396         ;
6397       else
6398         abort ();
6399     }
6400   else if (i.tm.opcode_modifier.defaultsize
6401            && !i.suffix
6402            /* exclude fldenv/frstor/fsave/fstenv */
6403            && i.tm.opcode_modifier.no_ssuf
6404            /* exclude sysret */
6405            && i.tm.base_opcode != 0x0f07)
6406     {
6407       i.suffix = stackop_size;
6408       if (stackop_size == LONG_MNEM_SUFFIX)
6409         {
6410           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6411              .code16gcc directive to support 16-bit mode with
6412              32-bit address.  For IRET without a suffix, generate
6413              16-bit IRET (opcode 0xcf) to return from an interrupt
6414              handler.  */
6415           if (i.tm.base_opcode == 0xcf)
6416             {
6417               i.suffix = WORD_MNEM_SUFFIX;
6418               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6419             }
6420           /* Warn about changed behavior for segment register push/pop.  */
6421           else if ((i.tm.base_opcode | 1) == 0x07)
6422             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6423                      i.tm.name);
6424         }
6425     }
6426   else if (intel_syntax
6427            && !i.suffix
6428            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6429                || i.tm.opcode_modifier.jump == JUMP_BYTE
6430                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6431                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6432                    && i.tm.extension_opcode <= 3)))
6433     {
6434       switch (flag_code)
6435         {
6436         case CODE_64BIT:
6437           if (!i.tm.opcode_modifier.no_qsuf)
6438             {
6439               i.suffix = QWORD_MNEM_SUFFIX;
6440               break;
6441             }
6442           /* Fall through.  */
6443         case CODE_32BIT:
6444           if (!i.tm.opcode_modifier.no_lsuf)
6445             i.suffix = LONG_MNEM_SUFFIX;
6446           break;
6447         case CODE_16BIT:
6448           if (!i.tm.opcode_modifier.no_wsuf)
6449             i.suffix = WORD_MNEM_SUFFIX;
6450           break;
6451         }
6452     }
6453
6454   if (!i.suffix)
6455     {
6456       if (!intel_syntax)
6457         {
6458           if (i.tm.opcode_modifier.w)
6459             {
6460               as_bad (_("no instruction mnemonic suffix given and "
6461                         "no register operands; can't size instruction"));
6462               return 0;
6463             }
6464         }
6465       else
6466         {
6467           unsigned int suffixes;
6468
6469           suffixes = !i.tm.opcode_modifier.no_bsuf;
6470           if (!i.tm.opcode_modifier.no_wsuf)
6471             suffixes |= 1 << 1;
6472           if (!i.tm.opcode_modifier.no_lsuf)
6473             suffixes |= 1 << 2;
6474           if (!i.tm.opcode_modifier.no_ldsuf)
6475             suffixes |= 1 << 3;
6476           if (!i.tm.opcode_modifier.no_ssuf)
6477             suffixes |= 1 << 4;
6478           if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6479             suffixes |= 1 << 5;
6480
6481           /* There are more than suffix matches.  */
6482           if (i.tm.opcode_modifier.w
6483               || ((suffixes & (suffixes - 1))
6484                   && !i.tm.opcode_modifier.defaultsize
6485                   && !i.tm.opcode_modifier.ignoresize))
6486             {
6487               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6488               return 0;
6489             }
6490         }
6491     }
6492
6493   /* Change the opcode based on the operand size given by i.suffix.  */
6494   switch (i.suffix)
6495     {
6496     /* Size floating point instruction.  */
6497     case LONG_MNEM_SUFFIX:
6498       if (i.tm.opcode_modifier.floatmf)
6499         {
6500           i.tm.base_opcode ^= 4;
6501           break;
6502         }
6503     /* fall through */
6504     case WORD_MNEM_SUFFIX:
6505     case QWORD_MNEM_SUFFIX:
6506       /* It's not a byte, select word/dword operation.  */
6507       if (i.tm.opcode_modifier.w)
6508         {
6509           if (i.tm.opcode_modifier.shortform)
6510             i.tm.base_opcode |= 8;
6511           else
6512             i.tm.base_opcode |= 1;
6513         }
6514     /* fall through */
6515     case SHORT_MNEM_SUFFIX:
6516       /* Now select between word & dword operations via the operand
6517          size prefix, except for instructions that will ignore this
6518          prefix anyway.  */
6519       if (i.reg_operands > 0
6520           && i.types[0].bitfield.class == Reg
6521           && i.tm.opcode_modifier.addrprefixopreg
6522           && (i.tm.operand_types[0].bitfield.instance == Accum
6523               || i.operands == 1))
6524         {
6525           /* The address size override prefix changes the size of the
6526              first operand.  */
6527           if ((flag_code == CODE_32BIT
6528                && i.op[0].regs->reg_type.bitfield.word)
6529               || (flag_code != CODE_32BIT
6530                   && i.op[0].regs->reg_type.bitfield.dword))
6531             if (!add_prefix (ADDR_PREFIX_OPCODE))
6532               return 0;
6533         }
6534       else if (i.suffix != QWORD_MNEM_SUFFIX
6535                && !i.tm.opcode_modifier.ignoresize
6536                && !i.tm.opcode_modifier.floatmf
6537                && !is_any_vex_encoding (&i.tm)
6538                && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6539                    || (flag_code == CODE_64BIT
6540                        && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6541         {
6542           unsigned int prefix = DATA_PREFIX_OPCODE;
6543
6544           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6545             prefix = ADDR_PREFIX_OPCODE;
6546
6547           if (!add_prefix (prefix))
6548             return 0;
6549         }
6550
6551       /* Set mode64 for an operand.  */
6552       if (i.suffix == QWORD_MNEM_SUFFIX
6553           && flag_code == CODE_64BIT
6554           && !i.tm.opcode_modifier.norex64
6555           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
6556              need rex64. */
6557           && ! (i.operands == 2
6558                 && i.tm.base_opcode == 0x90
6559                 && i.tm.extension_opcode == None
6560                 && i.types[0].bitfield.instance == Accum
6561                 && i.types[0].bitfield.qword
6562                 && i.types[1].bitfield.instance == Accum
6563                 && i.types[1].bitfield.qword))
6564         i.rex |= REX_W;
6565
6566       break;
6567     }
6568
6569   if (i.reg_operands != 0
6570       && i.operands > 1
6571       && i.tm.opcode_modifier.addrprefixopreg
6572       && i.tm.operand_types[0].bitfield.instance != Accum)
6573     {
6574       /* Check invalid register operand when the address size override
6575          prefix changes the size of register operands.  */
6576       unsigned int op;
6577       enum { need_word, need_dword, need_qword } need;
6578
6579       if (flag_code == CODE_32BIT)
6580         need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6581       else
6582         {
6583           if (i.prefix[ADDR_PREFIX])
6584             need = need_dword;
6585           else
6586             need = flag_code == CODE_64BIT ? need_qword : need_word;
6587         }
6588
6589       for (op = 0; op < i.operands; op++)
6590         if (i.types[op].bitfield.class == Reg
6591             && ((need == need_word
6592                  && !i.op[op].regs->reg_type.bitfield.word)
6593                 || (need == need_dword
6594                     && !i.op[op].regs->reg_type.bitfield.dword)
6595                 || (need == need_qword
6596                     && !i.op[op].regs->reg_type.bitfield.qword)))
6597           {
6598             as_bad (_("invalid register operand size for `%s'"),
6599                     i.tm.name);
6600             return 0;
6601           }
6602     }
6603
6604   return 1;
6605 }
6606
6607 static int
6608 check_byte_reg (void)
6609 {
6610   int op;
6611
6612   for (op = i.operands; --op >= 0;)
6613     {
6614       /* Skip non-register operands. */
6615       if (i.types[op].bitfield.class != Reg)
6616         continue;
6617
6618       /* If this is an eight bit register, it's OK.  If it's the 16 or
6619          32 bit version of an eight bit register, we will just use the
6620          low portion, and that's OK too.  */
6621       if (i.types[op].bitfield.byte)
6622         continue;
6623
6624       /* I/O port address operands are OK too.  */
6625       if (i.tm.operand_types[op].bitfield.instance == RegD
6626           && i.tm.operand_types[op].bitfield.word)
6627         continue;
6628
6629       /* crc32 doesn't generate this warning.  */
6630       if (i.tm.base_opcode == 0xf20f38f0)
6631         continue;
6632
6633       if ((i.types[op].bitfield.word
6634            || i.types[op].bitfield.dword
6635            || i.types[op].bitfield.qword)
6636           && i.op[op].regs->reg_num < 4
6637           /* Prohibit these changes in 64bit mode, since the lowering
6638              would be more complicated.  */
6639           && flag_code != CODE_64BIT)
6640         {
6641 #if REGISTER_WARNINGS
6642           if (!quiet_warnings)
6643             as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6644                      register_prefix,
6645                      (i.op[op].regs + (i.types[op].bitfield.word
6646                                        ? REGNAM_AL - REGNAM_AX
6647                                        : REGNAM_AL - REGNAM_EAX))->reg_name,
6648                      register_prefix,
6649                      i.op[op].regs->reg_name,
6650                      i.suffix);
6651 #endif
6652           continue;
6653         }
6654       /* Any other register is bad.  */
6655       if (i.types[op].bitfield.class == Reg
6656           || i.types[op].bitfield.class == RegMMX
6657           || i.types[op].bitfield.class == RegSIMD
6658           || i.types[op].bitfield.class == SReg
6659           || i.types[op].bitfield.class == RegCR
6660           || i.types[op].bitfield.class == RegDR
6661           || i.types[op].bitfield.class == RegTR)
6662         {
6663           as_bad (_("`%s%s' not allowed with `%s%c'"),
6664                   register_prefix,
6665                   i.op[op].regs->reg_name,
6666                   i.tm.name,
6667                   i.suffix);
6668           return 0;
6669         }
6670     }
6671   return 1;
6672 }
6673
6674 static int
6675 check_long_reg (void)
6676 {
6677   int op;
6678
6679   for (op = i.operands; --op >= 0;)
6680     /* Skip non-register operands. */
6681     if (i.types[op].bitfield.class != Reg)
6682       continue;
6683     /* Reject eight bit registers, except where the template requires
6684        them. (eg. movzb)  */
6685     else if (i.types[op].bitfield.byte
6686              && (i.tm.operand_types[op].bitfield.class == Reg
6687                  || i.tm.operand_types[op].bitfield.instance == Accum)
6688              && (i.tm.operand_types[op].bitfield.word
6689                  || i.tm.operand_types[op].bitfield.dword))
6690       {
6691         as_bad (_("`%s%s' not allowed with `%s%c'"),
6692                 register_prefix,
6693                 i.op[op].regs->reg_name,
6694                 i.tm.name,
6695                 i.suffix);
6696         return 0;
6697       }
6698     /* Warn if the e prefix on a general reg is missing.  */
6699     else if ((!quiet_warnings || flag_code == CODE_64BIT)
6700              && i.types[op].bitfield.word
6701              && (i.tm.operand_types[op].bitfield.class == Reg
6702                  || i.tm.operand_types[op].bitfield.instance == Accum)
6703              && i.tm.operand_types[op].bitfield.dword)
6704       {
6705         /* Prohibit these changes in the 64bit mode, since the
6706            lowering is more complicated.  */
6707         if (flag_code == CODE_64BIT)
6708           {
6709             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6710                     register_prefix, i.op[op].regs->reg_name,
6711                     i.suffix);
6712             return 0;
6713           }
6714 #if REGISTER_WARNINGS
6715         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6716                  register_prefix,
6717                  (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6718                  register_prefix, i.op[op].regs->reg_name, i.suffix);
6719 #endif
6720       }
6721     /* Warn if the r prefix on a general reg is present.  */
6722     else if (i.types[op].bitfield.qword
6723              && (i.tm.operand_types[op].bitfield.class == Reg
6724                  || i.tm.operand_types[op].bitfield.instance == Accum)
6725              && i.tm.operand_types[op].bitfield.dword)
6726       {
6727         if (intel_syntax
6728             && i.tm.opcode_modifier.toqword
6729             && i.types[0].bitfield.class != RegSIMD)
6730           {
6731             /* Convert to QWORD.  We want REX byte. */
6732             i.suffix = QWORD_MNEM_SUFFIX;
6733           }
6734         else
6735           {
6736             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6737                     register_prefix, i.op[op].regs->reg_name,
6738                     i.suffix);
6739             return 0;
6740           }
6741       }
6742   return 1;
6743 }
6744
6745 static int
6746 check_qword_reg (void)
6747 {
6748   int op;
6749
6750   for (op = i.operands; --op >= 0; )
6751     /* Skip non-register operands. */
6752     if (i.types[op].bitfield.class != Reg)
6753       continue;
6754     /* Reject eight bit registers, except where the template requires
6755        them. (eg. movzb)  */
6756     else if (i.types[op].bitfield.byte
6757              && (i.tm.operand_types[op].bitfield.class == Reg
6758                  || i.tm.operand_types[op].bitfield.instance == Accum)
6759              && (i.tm.operand_types[op].bitfield.word
6760                  || i.tm.operand_types[op].bitfield.dword))
6761       {
6762         as_bad (_("`%s%s' not allowed with `%s%c'"),
6763                 register_prefix,
6764                 i.op[op].regs->reg_name,
6765                 i.tm.name,
6766                 i.suffix);
6767         return 0;
6768       }
6769     /* Warn if the r prefix on a general reg is missing.  */
6770     else if ((i.types[op].bitfield.word
6771               || i.types[op].bitfield.dword)
6772              && (i.tm.operand_types[op].bitfield.class == Reg
6773                  || i.tm.operand_types[op].bitfield.instance == Accum)
6774              && i.tm.operand_types[op].bitfield.qword)
6775       {
6776         /* Prohibit these changes in the 64bit mode, since the
6777            lowering is more complicated.  */
6778         if (intel_syntax
6779             && i.tm.opcode_modifier.todword
6780             && i.types[0].bitfield.class != RegSIMD)
6781           {
6782             /* Convert to DWORD.  We don't want REX byte. */
6783             i.suffix = LONG_MNEM_SUFFIX;
6784           }
6785         else
6786           {
6787             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6788                     register_prefix, i.op[op].regs->reg_name,
6789                     i.suffix);
6790             return 0;
6791           }
6792       }
6793   return 1;
6794 }
6795
6796 static int
6797 check_word_reg (void)
6798 {
6799   int op;
6800   for (op = i.operands; --op >= 0;)
6801     /* Skip non-register operands. */
6802     if (i.types[op].bitfield.class != Reg)
6803       continue;
6804     /* Reject eight bit registers, except where the template requires
6805        them. (eg. movzb)  */
6806     else if (i.types[op].bitfield.byte
6807              && (i.tm.operand_types[op].bitfield.class == Reg
6808                  || i.tm.operand_types[op].bitfield.instance == Accum)
6809              && (i.tm.operand_types[op].bitfield.word
6810                  || i.tm.operand_types[op].bitfield.dword))
6811       {
6812         as_bad (_("`%s%s' not allowed with `%s%c'"),
6813                 register_prefix,
6814                 i.op[op].regs->reg_name,
6815                 i.tm.name,
6816                 i.suffix);
6817         return 0;
6818       }
6819     /* Warn if the e or r prefix on a general reg is present.  */
6820     else if ((!quiet_warnings || flag_code == CODE_64BIT)
6821              && (i.types[op].bitfield.dword
6822                  || i.types[op].bitfield.qword)
6823              && (i.tm.operand_types[op].bitfield.class == Reg
6824                  || i.tm.operand_types[op].bitfield.instance == Accum)
6825              && i.tm.operand_types[op].bitfield.word)
6826       {
6827         /* Prohibit these changes in the 64bit mode, since the
6828            lowering is more complicated.  */
6829         if (flag_code == CODE_64BIT)
6830           {
6831             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6832                     register_prefix, i.op[op].regs->reg_name,
6833                     i.suffix);
6834             return 0;
6835           }
6836 #if REGISTER_WARNINGS
6837         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6838                  register_prefix,
6839                  (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6840                  register_prefix, i.op[op].regs->reg_name, i.suffix);
6841 #endif
6842       }
6843   return 1;
6844 }
6845
6846 static int
6847 update_imm (unsigned int j)
6848 {
6849   i386_operand_type overlap = i.types[j];
6850   if ((overlap.bitfield.imm8
6851        || overlap.bitfield.imm8s
6852        || overlap.bitfield.imm16
6853        || overlap.bitfield.imm32
6854        || overlap.bitfield.imm32s
6855        || overlap.bitfield.imm64)
6856       && !operand_type_equal (&overlap, &imm8)
6857       && !operand_type_equal (&overlap, &imm8s)
6858       && !operand_type_equal (&overlap, &imm16)
6859       && !operand_type_equal (&overlap, &imm32)
6860       && !operand_type_equal (&overlap, &imm32s)
6861       && !operand_type_equal (&overlap, &imm64))
6862     {
6863       if (i.suffix)
6864         {
6865           i386_operand_type temp;
6866
6867           operand_type_set (&temp, 0);
6868           if (i.suffix == BYTE_MNEM_SUFFIX)
6869             {
6870               temp.bitfield.imm8 = overlap.bitfield.imm8;
6871               temp.bitfield.imm8s = overlap.bitfield.imm8s;
6872             }
6873           else if (i.suffix == WORD_MNEM_SUFFIX)
6874             temp.bitfield.imm16 = overlap.bitfield.imm16;
6875           else if (i.suffix == QWORD_MNEM_SUFFIX)
6876             {
6877               temp.bitfield.imm64 = overlap.bitfield.imm64;
6878               temp.bitfield.imm32s = overlap.bitfield.imm32s;
6879             }
6880           else
6881             temp.bitfield.imm32 = overlap.bitfield.imm32;
6882           overlap = temp;
6883         }
6884       else if (operand_type_equal (&overlap, &imm16_32_32s)
6885                || operand_type_equal (&overlap, &imm16_32)
6886                || operand_type_equal (&overlap, &imm16_32s))
6887         {
6888           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6889             overlap = imm16;
6890           else
6891             overlap = imm32s;
6892         }
6893       if (!operand_type_equal (&overlap, &imm8)
6894           && !operand_type_equal (&overlap, &imm8s)
6895           && !operand_type_equal (&overlap, &imm16)
6896           && !operand_type_equal (&overlap, &imm32)
6897           && !operand_type_equal (&overlap, &imm32s)
6898           && !operand_type_equal (&overlap, &imm64))
6899         {
6900           as_bad (_("no instruction mnemonic suffix given; "
6901                     "can't determine immediate size"));
6902           return 0;
6903         }
6904     }
6905   i.types[j] = overlap;
6906
6907   return 1;
6908 }
6909
6910 static int
6911 finalize_imm (void)
6912 {
6913   unsigned int j, n;
6914
6915   /* Update the first 2 immediate operands.  */
6916   n = i.operands > 2 ? 2 : i.operands;
6917   if (n)
6918     {
6919       for (j = 0; j < n; j++)
6920         if (update_imm (j) == 0)
6921           return 0;
6922
6923       /* The 3rd operand can't be immediate operand.  */
6924       gas_assert (operand_type_check (i.types[2], imm) == 0);
6925     }
6926
6927   return 1;
6928 }
6929
6930 static int
6931 process_operands (void)
6932 {
6933   /* Default segment register this instruction will use for memory
6934      accesses.  0 means unknown.  This is only for optimizing out
6935      unnecessary segment overrides.  */
6936   const seg_entry *default_seg = 0;
6937
6938   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6939     {
6940       unsigned int dupl = i.operands;
6941       unsigned int dest = dupl - 1;
6942       unsigned int j;
6943
6944       /* The destination must be an xmm register.  */
6945       gas_assert (i.reg_operands
6946                   && MAX_OPERANDS > dupl
6947                   && operand_type_equal (&i.types[dest], &regxmm));
6948
6949       if (i.tm.operand_types[0].bitfield.instance == Accum
6950           && i.tm.operand_types[0].bitfield.xmmword)
6951         {
6952           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6953             {
6954               /* Keep xmm0 for instructions with VEX prefix and 3
6955                  sources.  */
6956               i.tm.operand_types[0].bitfield.instance = InstanceNone;
6957               i.tm.operand_types[0].bitfield.class = RegSIMD;
6958               goto duplicate;
6959             }
6960           else
6961             {
6962               /* We remove the first xmm0 and keep the number of
6963                  operands unchanged, which in fact duplicates the
6964                  destination.  */
6965               for (j = 1; j < i.operands; j++)
6966                 {
6967                   i.op[j - 1] = i.op[j];
6968                   i.types[j - 1] = i.types[j];
6969                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6970                   i.flags[j - 1] = i.flags[j];
6971                 }
6972             }
6973         }
6974       else if (i.tm.opcode_modifier.implicit1stxmm0)
6975         {
6976           gas_assert ((MAX_OPERANDS - 1) > dupl
6977                       && (i.tm.opcode_modifier.vexsources
6978                           == VEX3SOURCES));
6979
6980           /* Add the implicit xmm0 for instructions with VEX prefix
6981              and 3 sources.  */
6982           for (j = i.operands; j > 0; j--)
6983             {
6984               i.op[j] = i.op[j - 1];
6985               i.types[j] = i.types[j - 1];
6986               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6987               i.flags[j] = i.flags[j - 1];
6988             }
6989           i.op[0].regs
6990             = (const reg_entry *) hash_find (reg_hash, "xmm0");
6991           i.types[0] = regxmm;
6992           i.tm.operand_types[0] = regxmm;
6993
6994           i.operands += 2;
6995           i.reg_operands += 2;
6996           i.tm.operands += 2;
6997
6998           dupl++;
6999           dest++;
7000           i.op[dupl] = i.op[dest];
7001           i.types[dupl] = i.types[dest];
7002           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7003           i.flags[dupl] = i.flags[dest];
7004         }
7005       else
7006         {
7007 duplicate:
7008           i.operands++;
7009           i.reg_operands++;
7010           i.tm.operands++;
7011
7012           i.op[dupl] = i.op[dest];
7013           i.types[dupl] = i.types[dest];
7014           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7015           i.flags[dupl] = i.flags[dest];
7016         }
7017
7018        if (i.tm.opcode_modifier.immext)
7019          process_immext ();
7020     }
7021   else if (i.tm.operand_types[0].bitfield.instance == Accum
7022            && i.tm.operand_types[0].bitfield.xmmword)
7023     {
7024       unsigned int j;
7025
7026       for (j = 1; j < i.operands; j++)
7027         {
7028           i.op[j - 1] = i.op[j];
7029           i.types[j - 1] = i.types[j];
7030
7031           /* We need to adjust fields in i.tm since they are used by
7032              build_modrm_byte.  */
7033           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7034
7035           i.flags[j - 1] = i.flags[j];
7036         }
7037
7038       i.operands--;
7039       i.reg_operands--;
7040       i.tm.operands--;
7041     }
7042   else if (i.tm.opcode_modifier.implicitquadgroup)
7043     {
7044       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7045
7046       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7047       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7048       regnum = register_number (i.op[1].regs);
7049       first_reg_in_group = regnum & ~3;
7050       last_reg_in_group = first_reg_in_group + 3;
7051       if (regnum != first_reg_in_group)
7052         as_warn (_("source register `%s%s' implicitly denotes"
7053                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7054                  register_prefix, i.op[1].regs->reg_name,
7055                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7056                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7057                  i.tm.name);
7058     }
7059   else if (i.tm.opcode_modifier.regkludge)
7060     {
7061       /* The imul $imm, %reg instruction is converted into
7062          imul $imm, %reg, %reg, and the clr %reg instruction
7063          is converted into xor %reg, %reg.  */
7064
7065       unsigned int first_reg_op;
7066
7067       if (operand_type_check (i.types[0], reg))
7068         first_reg_op = 0;
7069       else
7070         first_reg_op = 1;
7071       /* Pretend we saw the extra register operand.  */
7072       gas_assert (i.reg_operands == 1
7073                   && i.op[first_reg_op + 1].regs == 0);
7074       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7075       i.types[first_reg_op + 1] = i.types[first_reg_op];
7076       i.operands++;
7077       i.reg_operands++;
7078     }
7079
7080   if (i.tm.opcode_modifier.modrm)
7081     {
7082       /* The opcode is completed (modulo i.tm.extension_opcode which
7083          must be put into the modrm byte).  Now, we make the modrm and
7084          index base bytes based on all the info we've collected.  */
7085
7086       default_seg = build_modrm_byte ();
7087     }
7088   else if (i.types[0].bitfield.class == SReg)
7089     {
7090       if (flag_code != CODE_64BIT
7091           ? i.tm.base_opcode == POP_SEG_SHORT
7092             && i.op[0].regs->reg_num == 1
7093           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7094             && i.op[0].regs->reg_num < 4)
7095         {
7096           as_bad (_("you can't `%s %s%s'"),
7097                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7098           return 0;
7099         }
7100       if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7101         {
7102           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7103           i.tm.opcode_length = 2;
7104         }
7105       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7106     }
7107   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7108     {
7109       default_seg = &ds;
7110     }
7111   else if (i.tm.opcode_modifier.isstring)
7112     {
7113       /* For the string instructions that allow a segment override
7114          on one of their operands, the default segment is ds.  */
7115       default_seg = &ds;
7116     }
7117   else if (i.tm.opcode_modifier.shortform)
7118     {
7119       /* The register or float register operand is in operand
7120          0 or 1.  */
7121       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7122
7123       /* Register goes in low 3 bits of opcode.  */
7124       i.tm.base_opcode |= i.op[op].regs->reg_num;
7125       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7126         i.rex |= REX_B;
7127       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7128         {
7129           /* Warn about some common errors, but press on regardless.
7130              The first case can be generated by gcc (<= 2.8.1).  */
7131           if (i.operands == 2)
7132             {
7133               /* Reversed arguments on faddp, fsubp, etc.  */
7134               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7135                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7136                        register_prefix, i.op[intel_syntax].regs->reg_name);
7137             }
7138           else
7139             {
7140               /* Extraneous `l' suffix on fp insn.  */
7141               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7142                        register_prefix, i.op[0].regs->reg_name);
7143             }
7144         }
7145     }
7146
7147   if (i.tm.base_opcode == 0x8d /* lea */
7148       && i.seg[0]
7149       && !quiet_warnings)
7150     as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7151
7152   /* If a segment was explicitly specified, and the specified segment
7153      is not the default, use an opcode prefix to select it.  If we
7154      never figured out what the default segment is, then default_seg
7155      will be zero at this point, and the specified segment prefix will
7156      always be used.  */
7157   if ((i.seg[0]) && (i.seg[0] != default_seg))
7158     {
7159       if (!add_prefix (i.seg[0]->seg_prefix))
7160         return 0;
7161     }
7162   return 1;
7163 }
7164
7165 static const seg_entry *
7166 build_modrm_byte (void)
7167 {
7168   const seg_entry *default_seg = 0;
7169   unsigned int source, dest;
7170   int vex_3_sources;
7171
7172   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7173   if (vex_3_sources)
7174     {
7175       unsigned int nds, reg_slot;
7176       expressionS *exp;
7177
7178       dest = i.operands - 1;
7179       nds = dest - 1;
7180
7181       /* There are 2 kinds of instructions:
7182          1. 5 operands: 4 register operands or 3 register operands
7183          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7184          VexW0 or VexW1.  The destination must be either XMM, YMM or
7185          ZMM register.
7186          2. 4 operands: 4 register operands or 3 register operands
7187          plus 1 memory operand, with VexXDS.  */
7188       gas_assert ((i.reg_operands == 4
7189                    || (i.reg_operands == 3 && i.mem_operands == 1))
7190                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7191                   && i.tm.opcode_modifier.vexw
7192                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7193
7194       /* If VexW1 is set, the first non-immediate operand is the source and
7195          the second non-immediate one is encoded in the immediate operand.  */
7196       if (i.tm.opcode_modifier.vexw == VEXW1)
7197         {
7198           source = i.imm_operands;
7199           reg_slot = i.imm_operands + 1;
7200         }
7201       else
7202         {
7203           source = i.imm_operands + 1;
7204           reg_slot = i.imm_operands;
7205         }
7206
7207       if (i.imm_operands == 0)
7208         {
7209           /* When there is no immediate operand, generate an 8bit
7210              immediate operand to encode the first operand.  */
7211           exp = &im_expressions[i.imm_operands++];
7212           i.op[i.operands].imms = exp;
7213           i.types[i.operands] = imm8;
7214           i.operands++;
7215
7216           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7217           exp->X_op = O_constant;
7218           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7219           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7220         }
7221       else
7222         {
7223           gas_assert (i.imm_operands == 1);
7224           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7225           gas_assert (!i.tm.opcode_modifier.immext);
7226
7227           /* Turn on Imm8 again so that output_imm will generate it.  */
7228           i.types[0].bitfield.imm8 = 1;
7229
7230           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7231           i.op[0].imms->X_add_number
7232               |= register_number (i.op[reg_slot].regs) << 4;
7233           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7234         }
7235
7236       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7237       i.vex.register_specifier = i.op[nds].regs;
7238     }
7239   else
7240     source = dest = 0;
7241
7242   /* i.reg_operands MUST be the number of real register operands;
7243      implicit registers do not count.  If there are 3 register
7244      operands, it must be a instruction with VexNDS.  For a
7245      instruction with VexNDD, the destination register is encoded
7246      in VEX prefix.  If there are 4 register operands, it must be
7247      a instruction with VEX prefix and 3 sources.  */
7248   if (i.mem_operands == 0
7249       && ((i.reg_operands == 2
7250            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7251           || (i.reg_operands == 3
7252               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7253           || (i.reg_operands == 4 && vex_3_sources)))
7254     {
7255       switch (i.operands)
7256         {
7257         case 2:
7258           source = 0;
7259           break;
7260         case 3:
7261           /* When there are 3 operands, one of them may be immediate,
7262              which may be the first or the last operand.  Otherwise,
7263              the first operand must be shift count register (cl) or it
7264              is an instruction with VexNDS. */
7265           gas_assert (i.imm_operands == 1
7266                       || (i.imm_operands == 0
7267                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7268                               || (i.types[0].bitfield.instance == RegC
7269                                   && i.types[0].bitfield.byte))));
7270           if (operand_type_check (i.types[0], imm)
7271               || (i.types[0].bitfield.instance == RegC
7272                   && i.types[0].bitfield.byte))
7273             source = 1;
7274           else
7275             source = 0;
7276           break;
7277         case 4:
7278           /* When there are 4 operands, the first two must be 8bit
7279              immediate operands. The source operand will be the 3rd
7280              one.
7281
7282              For instructions with VexNDS, if the first operand
7283              an imm8, the source operand is the 2nd one.  If the last
7284              operand is imm8, the source operand is the first one.  */
7285           gas_assert ((i.imm_operands == 2
7286                        && i.types[0].bitfield.imm8
7287                        && i.types[1].bitfield.imm8)
7288                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7289                           && i.imm_operands == 1
7290                           && (i.types[0].bitfield.imm8
7291                               || i.types[i.operands - 1].bitfield.imm8
7292                               || i.rounding)));
7293           if (i.imm_operands == 2)
7294             source = 2;
7295           else
7296             {
7297               if (i.types[0].bitfield.imm8)
7298                 source = 1;
7299               else
7300                 source = 0;
7301             }
7302           break;
7303         case 5:
7304           if (is_evex_encoding (&i.tm))
7305             {
7306               /* For EVEX instructions, when there are 5 operands, the
7307                  first one must be immediate operand.  If the second one
7308                  is immediate operand, the source operand is the 3th
7309                  one.  If the last one is immediate operand, the source
7310                  operand is the 2nd one.  */
7311               gas_assert (i.imm_operands == 2
7312                           && i.tm.opcode_modifier.sae
7313                           && operand_type_check (i.types[0], imm));
7314               if (operand_type_check (i.types[1], imm))
7315                 source = 2;
7316               else if (operand_type_check (i.types[4], imm))
7317                 source = 1;
7318               else
7319                 abort ();
7320             }
7321           break;
7322         default:
7323           abort ();
7324         }
7325
7326       if (!vex_3_sources)
7327         {
7328           dest = source + 1;
7329
7330           /* RC/SAE operand could be between DEST and SRC.  That happens
7331              when one operand is GPR and the other one is XMM/YMM/ZMM
7332              register.  */
7333           if (i.rounding && i.rounding->operand == (int) dest)
7334             dest++;
7335
7336           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7337             {
7338               /* For instructions with VexNDS, the register-only source
7339                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7340                  register.  It is encoded in VEX prefix.  */
7341
7342               i386_operand_type op;
7343               unsigned int vvvv;
7344
7345               /* Check register-only source operand when two source
7346                  operands are swapped.  */
7347               if (!i.tm.operand_types[source].bitfield.baseindex
7348                   && i.tm.operand_types[dest].bitfield.baseindex)
7349                 {
7350                   vvvv = source;
7351                   source = dest;
7352                 }
7353               else
7354                 vvvv = dest;
7355
7356               op = i.tm.operand_types[vvvv];
7357               if ((dest + 1) >= i.operands
7358                   || ((op.bitfield.class != Reg
7359                        || (!op.bitfield.dword && !op.bitfield.qword))
7360                       && op.bitfield.class != RegSIMD
7361                       && !operand_type_equal (&op, &regmask)))
7362                 abort ();
7363               i.vex.register_specifier = i.op[vvvv].regs;
7364               dest++;
7365             }
7366         }
7367
7368       i.rm.mode = 3;
7369       /* One of the register operands will be encoded in the i.rm.reg
7370          field, the other in the combined i.rm.mode and i.rm.regmem
7371          fields.  If no form of this instruction supports a memory
7372          destination operand, then we assume the source operand may
7373          sometimes be a memory operand and so we need to store the
7374          destination in the i.rm.reg field.  */
7375       if (!i.tm.opcode_modifier.regmem
7376           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7377         {
7378           i.rm.reg = i.op[dest].regs->reg_num;
7379           i.rm.regmem = i.op[source].regs->reg_num;
7380           if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7381                || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7382             i.has_regmmx = TRUE;
7383           else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7384                    || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7385             {
7386               if (i.types[dest].bitfield.zmmword
7387                   || i.types[source].bitfield.zmmword)
7388                 i.has_regzmm = TRUE;
7389               else if (i.types[dest].bitfield.ymmword
7390                        || i.types[source].bitfield.ymmword)
7391                 i.has_regymm = TRUE;
7392               else
7393                 i.has_regxmm = TRUE;
7394             }
7395           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7396             i.rex |= REX_R;
7397           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7398             i.vrex |= REX_R;
7399           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7400             i.rex |= REX_B;
7401           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7402             i.vrex |= REX_B;
7403         }
7404       else
7405         {
7406           i.rm.reg = i.op[source].regs->reg_num;
7407           i.rm.regmem = i.op[dest].regs->reg_num;
7408           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7409             i.rex |= REX_B;
7410           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7411             i.vrex |= REX_B;
7412           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7413             i.rex |= REX_R;
7414           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7415             i.vrex |= REX_R;
7416         }
7417       if (flag_code != CODE_64BIT && (i.rex & REX_R))
7418         {
7419           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7420             abort ();
7421           i.rex &= ~REX_R;
7422           add_prefix (LOCK_PREFIX_OPCODE);
7423         }
7424     }
7425   else
7426     {                   /* If it's not 2 reg operands...  */
7427       unsigned int mem;
7428
7429       if (i.mem_operands)
7430         {
7431           unsigned int fake_zero_displacement = 0;
7432           unsigned int op;
7433
7434           for (op = 0; op < i.operands; op++)
7435             if (i.flags[op] & Operand_Mem)
7436               break;
7437           gas_assert (op < i.operands);
7438
7439           if (i.tm.opcode_modifier.vecsib)
7440             {
7441               if (i.index_reg->reg_num == RegIZ)
7442                 abort ();
7443
7444               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7445               if (!i.base_reg)
7446                 {
7447                   i.sib.base = NO_BASE_REGISTER;
7448                   i.sib.scale = i.log2_scale_factor;
7449                   i.types[op].bitfield.disp8 = 0;
7450                   i.types[op].bitfield.disp16 = 0;
7451                   i.types[op].bitfield.disp64 = 0;
7452                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7453                     {
7454                       /* Must be 32 bit */
7455                       i.types[op].bitfield.disp32 = 1;
7456                       i.types[op].bitfield.disp32s = 0;
7457                     }
7458                   else
7459                     {
7460                       i.types[op].bitfield.disp32 = 0;
7461                       i.types[op].bitfield.disp32s = 1;
7462                     }
7463                 }
7464               i.sib.index = i.index_reg->reg_num;
7465               if ((i.index_reg->reg_flags & RegRex) != 0)
7466                 i.rex |= REX_X;
7467               if ((i.index_reg->reg_flags & RegVRex) != 0)
7468                 i.vrex |= REX_X;
7469             }
7470
7471           default_seg = &ds;
7472
7473           if (i.base_reg == 0)
7474             {
7475               i.rm.mode = 0;
7476               if (!i.disp_operands)
7477                 fake_zero_displacement = 1;
7478               if (i.index_reg == 0)
7479                 {
7480                   i386_operand_type newdisp;
7481
7482                   gas_assert (!i.tm.opcode_modifier.vecsib);
7483                   /* Operand is just <disp>  */
7484                   if (flag_code == CODE_64BIT)
7485                     {
7486                       /* 64bit mode overwrites the 32bit absolute
7487                          addressing by RIP relative addressing and
7488                          absolute addressing is encoded by one of the
7489                          redundant SIB forms.  */
7490                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7491                       i.sib.base = NO_BASE_REGISTER;
7492                       i.sib.index = NO_INDEX_REGISTER;
7493                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7494                     }
7495                   else if ((flag_code == CODE_16BIT)
7496                            ^ (i.prefix[ADDR_PREFIX] != 0))
7497                     {
7498                       i.rm.regmem = NO_BASE_REGISTER_16;
7499                       newdisp = disp16;
7500                     }
7501                   else
7502                     {
7503                       i.rm.regmem = NO_BASE_REGISTER;
7504                       newdisp = disp32;
7505                     }
7506                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
7507                   i.types[op] = operand_type_or (i.types[op], newdisp);
7508                 }
7509               else if (!i.tm.opcode_modifier.vecsib)
7510                 {
7511                   /* !i.base_reg && i.index_reg  */
7512                   if (i.index_reg->reg_num == RegIZ)
7513                     i.sib.index = NO_INDEX_REGISTER;
7514                   else
7515                     i.sib.index = i.index_reg->reg_num;
7516                   i.sib.base = NO_BASE_REGISTER;
7517                   i.sib.scale = i.log2_scale_factor;
7518                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7519                   i.types[op].bitfield.disp8 = 0;
7520                   i.types[op].bitfield.disp16 = 0;
7521                   i.types[op].bitfield.disp64 = 0;
7522                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7523                     {
7524                       /* Must be 32 bit */
7525                       i.types[op].bitfield.disp32 = 1;
7526                       i.types[op].bitfield.disp32s = 0;
7527                     }
7528                   else
7529                     {
7530                       i.types[op].bitfield.disp32 = 0;
7531                       i.types[op].bitfield.disp32s = 1;
7532                     }
7533                   if ((i.index_reg->reg_flags & RegRex) != 0)
7534                     i.rex |= REX_X;
7535                 }
7536             }
7537           /* RIP addressing for 64bit mode.  */
7538           else if (i.base_reg->reg_num == RegIP)
7539             {
7540               gas_assert (!i.tm.opcode_modifier.vecsib);
7541               i.rm.regmem = NO_BASE_REGISTER;
7542               i.types[op].bitfield.disp8 = 0;
7543               i.types[op].bitfield.disp16 = 0;
7544               i.types[op].bitfield.disp32 = 0;
7545               i.types[op].bitfield.disp32s = 1;
7546               i.types[op].bitfield.disp64 = 0;
7547               i.flags[op] |= Operand_PCrel;
7548               if (! i.disp_operands)
7549                 fake_zero_displacement = 1;
7550             }
7551           else if (i.base_reg->reg_type.bitfield.word)
7552             {
7553               gas_assert (!i.tm.opcode_modifier.vecsib);
7554               switch (i.base_reg->reg_num)
7555                 {
7556                 case 3: /* (%bx)  */
7557                   if (i.index_reg == 0)
7558                     i.rm.regmem = 7;
7559                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
7560                     i.rm.regmem = i.index_reg->reg_num - 6;
7561                   break;
7562                 case 5: /* (%bp)  */
7563                   default_seg = &ss;
7564                   if (i.index_reg == 0)
7565                     {
7566                       i.rm.regmem = 6;
7567                       if (operand_type_check (i.types[op], disp) == 0)
7568                         {
7569                           /* fake (%bp) into 0(%bp)  */
7570                           i.types[op].bitfield.disp8 = 1;
7571                           fake_zero_displacement = 1;
7572                         }
7573                     }
7574                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
7575                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7576                   break;
7577                 default: /* (%si) -> 4 or (%di) -> 5  */
7578                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7579                 }
7580               i.rm.mode = mode_from_disp_size (i.types[op]);
7581             }
7582           else /* i.base_reg and 32/64 bit mode  */
7583             {
7584               if (flag_code == CODE_64BIT
7585                   && operand_type_check (i.types[op], disp))
7586                 {
7587                   i.types[op].bitfield.disp16 = 0;
7588                   i.types[op].bitfield.disp64 = 0;
7589                   if (i.prefix[ADDR_PREFIX] == 0)
7590                     {
7591                       i.types[op].bitfield.disp32 = 0;
7592                       i.types[op].bitfield.disp32s = 1;
7593                     }
7594                   else
7595                     {
7596                       i.types[op].bitfield.disp32 = 1;
7597                       i.types[op].bitfield.disp32s = 0;
7598                     }
7599                 }
7600
7601               if (!i.tm.opcode_modifier.vecsib)
7602                 i.rm.regmem = i.base_reg->reg_num;
7603               if ((i.base_reg->reg_flags & RegRex) != 0)
7604                 i.rex |= REX_B;
7605               i.sib.base = i.base_reg->reg_num;
7606               /* x86-64 ignores REX prefix bit here to avoid decoder
7607                  complications.  */
7608               if (!(i.base_reg->reg_flags & RegRex)
7609                   && (i.base_reg->reg_num == EBP_REG_NUM
7610                    || i.base_reg->reg_num == ESP_REG_NUM))
7611                   default_seg = &ss;
7612               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7613                 {
7614                   fake_zero_displacement = 1;
7615                   i.types[op].bitfield.disp8 = 1;
7616                 }
7617               i.sib.scale = i.log2_scale_factor;
7618               if (i.index_reg == 0)
7619                 {
7620                   gas_assert (!i.tm.opcode_modifier.vecsib);
7621                   /* <disp>(%esp) becomes two byte modrm with no index
7622                      register.  We've already stored the code for esp
7623                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7624                      Any base register besides %esp will not use the
7625                      extra modrm byte.  */
7626                   i.sib.index = NO_INDEX_REGISTER;
7627                 }
7628               else if (!i.tm.opcode_modifier.vecsib)
7629                 {
7630                   if (i.index_reg->reg_num == RegIZ)
7631                     i.sib.index = NO_INDEX_REGISTER;
7632                   else
7633                     i.sib.index = i.index_reg->reg_num;
7634                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7635                   if ((i.index_reg->reg_flags & RegRex) != 0)
7636                     i.rex |= REX_X;
7637                 }
7638
7639               if (i.disp_operands
7640                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7641                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7642                 i.rm.mode = 0;
7643               else
7644                 {
7645                   if (!fake_zero_displacement
7646                       && !i.disp_operands
7647                       && i.disp_encoding)
7648                     {
7649                       fake_zero_displacement = 1;
7650                       if (i.disp_encoding == disp_encoding_8bit)
7651                         i.types[op].bitfield.disp8 = 1;
7652                       else
7653                         i.types[op].bitfield.disp32 = 1;
7654                     }
7655                   i.rm.mode = mode_from_disp_size (i.types[op]);
7656                 }
7657             }
7658
7659           if (fake_zero_displacement)
7660             {
7661               /* Fakes a zero displacement assuming that i.types[op]
7662                  holds the correct displacement size.  */
7663               expressionS *exp;
7664
7665               gas_assert (i.op[op].disps == 0);
7666               exp = &disp_expressions[i.disp_operands++];
7667               i.op[op].disps = exp;
7668               exp->X_op = O_constant;
7669               exp->X_add_number = 0;
7670               exp->X_add_symbol = (symbolS *) 0;
7671               exp->X_op_symbol = (symbolS *) 0;
7672             }
7673
7674           mem = op;
7675         }
7676       else
7677         mem = ~0;
7678
7679       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7680         {
7681           if (operand_type_check (i.types[0], imm))
7682             i.vex.register_specifier = NULL;
7683           else
7684             {
7685               /* VEX.vvvv encodes one of the sources when the first
7686                  operand is not an immediate.  */
7687               if (i.tm.opcode_modifier.vexw == VEXW0)
7688                 i.vex.register_specifier = i.op[0].regs;
7689               else
7690                 i.vex.register_specifier = i.op[1].regs;
7691             }
7692
7693           /* Destination is a XMM register encoded in the ModRM.reg
7694              and VEX.R bit.  */
7695           i.rm.reg = i.op[2].regs->reg_num;
7696           if ((i.op[2].regs->reg_flags & RegRex) != 0)
7697             i.rex |= REX_R;
7698
7699           /* ModRM.rm and VEX.B encodes the other source.  */
7700           if (!i.mem_operands)
7701             {
7702               i.rm.mode = 3;
7703
7704               if (i.tm.opcode_modifier.vexw == VEXW0)
7705                 i.rm.regmem = i.op[1].regs->reg_num;
7706               else
7707                 i.rm.regmem = i.op[0].regs->reg_num;
7708
7709               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7710                 i.rex |= REX_B;
7711             }
7712         }
7713       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7714         {
7715           i.vex.register_specifier = i.op[2].regs;
7716           if (!i.mem_operands)
7717             {
7718               i.rm.mode = 3;
7719               i.rm.regmem = i.op[1].regs->reg_num;
7720               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7721                 i.rex |= REX_B;
7722             }
7723         }
7724       /* Fill in i.rm.reg or i.rm.regmem field with register operand
7725          (if any) based on i.tm.extension_opcode.  Again, we must be
7726          careful to make sure that segment/control/debug/test/MMX
7727          registers are coded into the i.rm.reg field.  */
7728       else if (i.reg_operands)
7729         {
7730           unsigned int op;
7731           unsigned int vex_reg = ~0;
7732
7733           for (op = 0; op < i.operands; op++)
7734             {
7735               if (i.types[op].bitfield.class == Reg
7736                   || i.types[op].bitfield.class == RegBND
7737                   || i.types[op].bitfield.class == RegMask
7738                   || i.types[op].bitfield.class == SReg
7739                   || i.types[op].bitfield.class == RegCR
7740                   || i.types[op].bitfield.class == RegDR
7741                   || i.types[op].bitfield.class == RegTR)
7742                 break;
7743               if (i.types[op].bitfield.class == RegSIMD)
7744                 {
7745                   if (i.types[op].bitfield.zmmword)
7746                     i.has_regzmm = TRUE;
7747                   else if (i.types[op].bitfield.ymmword)
7748                     i.has_regymm = TRUE;
7749                   else
7750                     i.has_regxmm = TRUE;
7751                   break;
7752                 }
7753               if (i.types[op].bitfield.class == RegMMX)
7754                 {
7755                   i.has_regmmx = TRUE;
7756                   break;
7757                 }
7758             }
7759
7760           if (vex_3_sources)
7761             op = dest;
7762           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7763             {
7764               /* For instructions with VexNDS, the register-only
7765                  source operand is encoded in VEX prefix. */
7766               gas_assert (mem != (unsigned int) ~0);
7767
7768               if (op > mem)
7769                 {
7770                   vex_reg = op++;
7771                   gas_assert (op < i.operands);
7772                 }
7773               else
7774                 {
7775                   /* Check register-only source operand when two source
7776                      operands are swapped.  */
7777                   if (!i.tm.operand_types[op].bitfield.baseindex
7778                       && i.tm.operand_types[op + 1].bitfield.baseindex)
7779                     {
7780                       vex_reg = op;
7781                       op += 2;
7782                       gas_assert (mem == (vex_reg + 1)
7783                                   && op < i.operands);
7784                     }
7785                   else
7786                     {
7787                       vex_reg = op + 1;
7788                       gas_assert (vex_reg < i.operands);
7789                     }
7790                 }
7791             }
7792           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7793             {
7794               /* For instructions with VexNDD, the register destination
7795                  is encoded in VEX prefix.  */
7796               if (i.mem_operands == 0)
7797                 {
7798                   /* There is no memory operand.  */
7799                   gas_assert ((op + 2) == i.operands);
7800                   vex_reg = op + 1;
7801                 }
7802               else
7803                 {
7804                   /* There are only 2 non-immediate operands.  */
7805                   gas_assert (op < i.imm_operands + 2
7806                               && i.operands == i.imm_operands + 2);
7807                   vex_reg = i.imm_operands + 1;
7808                 }
7809             }
7810           else
7811             gas_assert (op < i.operands);
7812
7813           if (vex_reg != (unsigned int) ~0)
7814             {
7815               i386_operand_type *type = &i.tm.operand_types[vex_reg];
7816
7817               if ((type->bitfield.class != Reg
7818                    || (!type->bitfield.dword && !type->bitfield.qword))
7819                   && type->bitfield.class != RegSIMD
7820                   && !operand_type_equal (type, &regmask))
7821                 abort ();
7822
7823               i.vex.register_specifier = i.op[vex_reg].regs;
7824             }
7825
7826           /* Don't set OP operand twice.  */
7827           if (vex_reg != op)
7828             {
7829               /* If there is an extension opcode to put here, the
7830                  register number must be put into the regmem field.  */
7831               if (i.tm.extension_opcode != None)
7832                 {
7833                   i.rm.regmem = i.op[op].regs->reg_num;
7834                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7835                     i.rex |= REX_B;
7836                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7837                     i.vrex |= REX_B;
7838                 }
7839               else
7840                 {
7841                   i.rm.reg = i.op[op].regs->reg_num;
7842                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7843                     i.rex |= REX_R;
7844                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7845                     i.vrex |= REX_R;
7846                 }
7847             }
7848
7849           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7850              must set it to 3 to indicate this is a register operand
7851              in the regmem field.  */
7852           if (!i.mem_operands)
7853             i.rm.mode = 3;
7854         }
7855
7856       /* Fill in i.rm.reg field with extension opcode (if any).  */
7857       if (i.tm.extension_opcode != None)
7858         i.rm.reg = i.tm.extension_opcode;
7859     }
7860   return default_seg;
7861 }
7862
7863 static unsigned int
7864 flip_code16 (unsigned int code16)
7865 {
7866   gas_assert (i.tm.operands == 1);
7867
7868   return !(i.prefix[REX_PREFIX] & REX_W)
7869          && (code16 ? i.tm.operand_types[0].bitfield.disp32
7870                       || i.tm.operand_types[0].bitfield.disp32s
7871                     : i.tm.operand_types[0].bitfield.disp16)
7872          ? CODE16 : 0;
7873 }
7874
7875 static void
7876 output_branch (void)
7877 {
7878   char *p;
7879   int size;
7880   int code16;
7881   int prefix;
7882   relax_substateT subtype;
7883   symbolS *sym;
7884   offsetT off;
7885
7886   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7887   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7888
7889   prefix = 0;
7890   if (i.prefix[DATA_PREFIX] != 0)
7891     {
7892       prefix = 1;
7893       i.prefixes -= 1;
7894       code16 ^= flip_code16(code16);
7895     }
7896   /* Pentium4 branch hints.  */
7897   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7898       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7899     {
7900       prefix++;
7901       i.prefixes--;
7902     }
7903   if (i.prefix[REX_PREFIX] != 0)
7904     {
7905       prefix++;
7906       i.prefixes--;
7907     }
7908
7909   /* BND prefixed jump.  */
7910   if (i.prefix[BND_PREFIX] != 0)
7911     {
7912       prefix++;
7913       i.prefixes--;
7914     }
7915
7916   if (i.prefixes != 0)
7917     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7918
7919   /* It's always a symbol;  End frag & setup for relax.
7920      Make sure there is enough room in this frag for the largest
7921      instruction we may generate in md_convert_frag.  This is 2
7922      bytes for the opcode and room for the prefix and largest
7923      displacement.  */
7924   frag_grow (prefix + 2 + 4);
7925   /* Prefix and 1 opcode byte go in fr_fix.  */
7926   p = frag_more (prefix + 1);
7927   if (i.prefix[DATA_PREFIX] != 0)
7928     *p++ = DATA_PREFIX_OPCODE;
7929   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7930       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7931     *p++ = i.prefix[SEG_PREFIX];
7932   if (i.prefix[BND_PREFIX] != 0)
7933     *p++ = BND_PREFIX_OPCODE;
7934   if (i.prefix[REX_PREFIX] != 0)
7935     *p++ = i.prefix[REX_PREFIX];
7936   *p = i.tm.base_opcode;
7937
7938   if ((unsigned char) *p == JUMP_PC_RELATIVE)
7939     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7940   else if (cpu_arch_flags.bitfield.cpui386)
7941     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7942   else
7943     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7944   subtype |= code16;
7945
7946   sym = i.op[0].disps->X_add_symbol;
7947   off = i.op[0].disps->X_add_number;
7948
7949   if (i.op[0].disps->X_op != O_constant
7950       && i.op[0].disps->X_op != O_symbol)
7951     {
7952       /* Handle complex expressions.  */
7953       sym = make_expr_symbol (i.op[0].disps);
7954       off = 0;
7955     }
7956
7957   /* 1 possible extra opcode + 4 byte displacement go in var part.
7958      Pass reloc in fr_var.  */
7959   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7960 }
7961
7962 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7963 /* Return TRUE iff PLT32 relocation should be used for branching to
7964    symbol S.  */
7965
7966 static bfd_boolean
7967 need_plt32_p (symbolS *s)
7968 {
7969   /* PLT32 relocation is ELF only.  */
7970   if (!IS_ELF)
7971     return FALSE;
7972
7973 #ifdef TE_SOLARIS
7974   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7975      krtld support it.  */
7976   return FALSE;
7977 #endif
7978
7979   /* Since there is no need to prepare for PLT branch on x86-64, we
7980      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7981      be used as a marker for 32-bit PC-relative branches.  */
7982   if (!object_64bit)
7983     return FALSE;
7984
7985   /* Weak or undefined symbol need PLT32 relocation.  */
7986   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7987     return TRUE;
7988
7989   /* Non-global symbol doesn't need PLT32 relocation.  */
7990   if (! S_IS_EXTERNAL (s))
7991     return FALSE;
7992
7993   /* Other global symbols need PLT32 relocation.  NB: Symbol with
7994      non-default visibilities are treated as normal global symbol
7995      so that PLT32 relocation can be used as a marker for 32-bit
7996      PC-relative branches.  It is useful for linker relaxation.  */
7997   return TRUE;
7998 }
7999 #endif
8000
8001 static void
8002 output_jump (void)
8003 {
8004   char *p;
8005   int size;
8006   fixS *fixP;
8007   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8008
8009   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8010     {
8011       /* This is a loop or jecxz type instruction.  */
8012       size = 1;
8013       if (i.prefix[ADDR_PREFIX] != 0)
8014         {
8015           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8016           i.prefixes -= 1;
8017         }
8018       /* Pentium4 branch hints.  */
8019       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8020           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8021         {
8022           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8023           i.prefixes--;
8024         }
8025     }
8026   else
8027     {
8028       int code16;
8029
8030       code16 = 0;
8031       if (flag_code == CODE_16BIT)
8032         code16 = CODE16;
8033
8034       if (i.prefix[DATA_PREFIX] != 0)
8035         {
8036           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8037           i.prefixes -= 1;
8038           code16 ^= flip_code16(code16);
8039         }
8040
8041       size = 4;
8042       if (code16)
8043         size = 2;
8044     }
8045
8046   /* BND prefixed jump.  */
8047   if (i.prefix[BND_PREFIX] != 0)
8048     {
8049       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8050       i.prefixes -= 1;
8051     }
8052
8053   if (i.prefix[REX_PREFIX] != 0)
8054     {
8055       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8056       i.prefixes -= 1;
8057     }
8058
8059   if (i.prefixes != 0)
8060     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8061
8062   p = frag_more (i.tm.opcode_length + size);
8063   switch (i.tm.opcode_length)
8064     {
8065     case 2:
8066       *p++ = i.tm.base_opcode >> 8;
8067       /* Fall through.  */
8068     case 1:
8069       *p++ = i.tm.base_opcode;
8070       break;
8071     default:
8072       abort ();
8073     }
8074
8075 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8076   if (size == 4
8077       && jump_reloc == NO_RELOC
8078       && need_plt32_p (i.op[0].disps->X_add_symbol))
8079     jump_reloc = BFD_RELOC_X86_64_PLT32;
8080 #endif
8081
8082   jump_reloc = reloc (size, 1, 1, jump_reloc);
8083
8084   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8085                       i.op[0].disps, 1, jump_reloc);
8086
8087   /* All jumps handled here are signed, but don't use a signed limit
8088      check for 32 and 16 bit jumps as we want to allow wrap around at
8089      4G and 64k respectively.  */
8090   if (size == 1)
8091     fixP->fx_signed = 1;
8092 }
8093
8094 static void
8095 output_interseg_jump (void)
8096 {
8097   char *p;
8098   int size;
8099   int prefix;
8100   int code16;
8101
8102   code16 = 0;
8103   if (flag_code == CODE_16BIT)
8104     code16 = CODE16;
8105
8106   prefix = 0;
8107   if (i.prefix[DATA_PREFIX] != 0)
8108     {
8109       prefix = 1;
8110       i.prefixes -= 1;
8111       code16 ^= CODE16;
8112     }
8113
8114   gas_assert (!i.prefix[REX_PREFIX]);
8115
8116   size = 4;
8117   if (code16)
8118     size = 2;
8119
8120   if (i.prefixes != 0)
8121     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8122
8123   /* 1 opcode; 2 segment; offset  */
8124   p = frag_more (prefix + 1 + 2 + size);
8125
8126   if (i.prefix[DATA_PREFIX] != 0)
8127     *p++ = DATA_PREFIX_OPCODE;
8128
8129   if (i.prefix[REX_PREFIX] != 0)
8130     *p++ = i.prefix[REX_PREFIX];
8131
8132   *p++ = i.tm.base_opcode;
8133   if (i.op[1].imms->X_op == O_constant)
8134     {
8135       offsetT n = i.op[1].imms->X_add_number;
8136
8137       if (size == 2
8138           && !fits_in_unsigned_word (n)
8139           && !fits_in_signed_word (n))
8140         {
8141           as_bad (_("16-bit jump out of range"));
8142           return;
8143         }
8144       md_number_to_chars (p, n, size);
8145     }
8146   else
8147     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8148                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8149   if (i.op[0].imms->X_op != O_constant)
8150     as_bad (_("can't handle non absolute segment in `%s'"),
8151             i.tm.name);
8152   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8153 }
8154
8155 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8156 void
8157 x86_cleanup (void)
8158 {
8159   char *p;
8160   asection *seg = now_seg;
8161   subsegT subseg = now_subseg;
8162   asection *sec;
8163   unsigned int alignment, align_size_1;
8164   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8165   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8166   unsigned int padding;
8167
8168   if (!IS_ELF || !x86_used_note)
8169     return;
8170
8171   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8172
8173   /* The .note.gnu.property section layout:
8174
8175      Field      Length          Contents
8176      ----       ----            ----
8177      n_namsz    4               4
8178      n_descsz   4               The note descriptor size
8179      n_type     4               NT_GNU_PROPERTY_TYPE_0
8180      n_name     4               "GNU"
8181      n_desc     n_descsz        The program property array
8182      ....       ....            ....
8183    */
8184
8185   /* Create the .note.gnu.property section.  */
8186   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8187   bfd_set_section_flags (sec,
8188                          (SEC_ALLOC
8189                           | SEC_LOAD
8190                           | SEC_DATA
8191                           | SEC_HAS_CONTENTS
8192                           | SEC_READONLY));
8193
8194   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8195     {
8196       align_size_1 = 7;
8197       alignment = 3;
8198     }
8199   else
8200     {
8201       align_size_1 = 3;
8202       alignment = 2;
8203     }
8204
8205   bfd_set_section_alignment (sec, alignment);
8206   elf_section_type (sec) = SHT_NOTE;
8207
8208   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8209                                   + 4-byte data  */
8210   isa_1_descsz_raw = 4 + 4 + 4;
8211   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8212   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8213
8214   feature_2_descsz_raw = isa_1_descsz;
8215   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8216                                       + 4-byte data  */
8217   feature_2_descsz_raw += 4 + 4 + 4;
8218   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8219   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8220                       & ~align_size_1);
8221
8222   descsz = feature_2_descsz;
8223   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8224   p = frag_more (4 + 4 + 4 + 4 + descsz);
8225
8226   /* Write n_namsz.  */
8227   md_number_to_chars (p, (valueT) 4, 4);
8228
8229   /* Write n_descsz.  */
8230   md_number_to_chars (p + 4, (valueT) descsz, 4);
8231
8232   /* Write n_type.  */
8233   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8234
8235   /* Write n_name.  */
8236   memcpy (p + 4 * 3, "GNU", 4);
8237
8238   /* Write 4-byte type.  */
8239   md_number_to_chars (p + 4 * 4,
8240                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8241
8242   /* Write 4-byte data size.  */
8243   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8244
8245   /* Write 4-byte data.  */
8246   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8247
8248   /* Zero out paddings.  */
8249   padding = isa_1_descsz - isa_1_descsz_raw;
8250   if (padding)
8251     memset (p + 4 * 7, 0, padding);
8252
8253   /* Write 4-byte type.  */
8254   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8255                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8256
8257   /* Write 4-byte data size.  */
8258   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8259
8260   /* Write 4-byte data.  */
8261   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8262                       (valueT) x86_feature_2_used, 4);
8263
8264   /* Zero out paddings.  */
8265   padding = feature_2_descsz - feature_2_descsz_raw;
8266   if (padding)
8267     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8268
8269   /* We probably can't restore the current segment, for there likely
8270      isn't one yet...  */
8271   if (seg && subseg)
8272     subseg_set (seg, subseg);
8273 }
8274 #endif
8275
8276 static unsigned int
8277 encoding_length (const fragS *start_frag, offsetT start_off,
8278                  const char *frag_now_ptr)
8279 {
8280   unsigned int len = 0;
8281
8282   if (start_frag != frag_now)
8283     {
8284       const fragS *fr = start_frag;
8285
8286       do {
8287         len += fr->fr_fix;
8288         fr = fr->fr_next;
8289       } while (fr && fr != frag_now);
8290     }
8291
8292   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8293 }
8294
8295 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8296    be macro-fused with conditional jumps.  */
8297
8298 static int
8299 maybe_fused_with_jcc_p (void)
8300 {
8301   /* No RIP address.  */
8302   if (i.base_reg && i.base_reg->reg_num == RegIP)
8303     return 0;
8304
8305   /* No VEX/EVEX encoding.  */
8306   if (is_any_vex_encoding (&i.tm))
8307     return 0;
8308
8309   /* and, add, sub with destination register.  */
8310   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8311       || i.tm.base_opcode <= 5
8312       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8313       || ((i.tm.base_opcode | 3) == 0x83
8314           && ((i.tm.extension_opcode | 1) == 0x5
8315               || i.tm.extension_opcode == 0x0)))
8316     return (i.types[1].bitfield.class == Reg
8317             || i.types[1].bitfield.instance == Accum);
8318
8319   /* test, cmp with any register.  */
8320   if ((i.tm.base_opcode | 1) == 0x85
8321       || (i.tm.base_opcode | 1) == 0xa9
8322       || ((i.tm.base_opcode | 1) == 0xf7
8323           && i.tm.extension_opcode == 0)
8324       || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8325       || ((i.tm.base_opcode | 3) == 0x83
8326           && (i.tm.extension_opcode == 0x7)))
8327     return (i.types[0].bitfield.class == Reg
8328             || i.types[0].bitfield.instance == Accum
8329             || i.types[1].bitfield.class == Reg
8330             || i.types[1].bitfield.instance == Accum);
8331
8332   /* inc, dec with any register.   */
8333   if ((i.tm.cpu_flags.bitfield.cpuno64
8334        && (i.tm.base_opcode | 0xf) == 0x4f)
8335       || ((i.tm.base_opcode | 1) == 0xff
8336           && i.tm.extension_opcode <= 0x1))
8337     return (i.types[0].bitfield.class == Reg
8338             || i.types[0].bitfield.instance == Accum);
8339
8340   return 0;
8341 }
8342
8343 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
8344
8345 static int
8346 add_fused_jcc_padding_frag_p (void)
8347 {
8348   /* NB: Don't work with COND_JUMP86 without i386.  */
8349   if (!align_branch_power
8350       || now_seg == absolute_section
8351       || !cpu_arch_flags.bitfield.cpui386
8352       || !(align_branch & align_branch_fused_bit))
8353     return 0;
8354
8355   if (maybe_fused_with_jcc_p ())
8356     {
8357       if (last_insn.kind == last_insn_other
8358           || last_insn.seg != now_seg)
8359         return 1;
8360       if (flag_debug)
8361         as_warn_where (last_insn.file, last_insn.line,
8362                        _("`%s` skips -malign-branch-boundary on `%s`"),
8363                        last_insn.name, i.tm.name);
8364     }
8365
8366   return 0;
8367 }
8368
8369 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
8370
8371 static int
8372 add_branch_prefix_frag_p (void)
8373 {
8374   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
8375      to PadLock instructions since they include prefixes in opcode.  */
8376   if (!align_branch_power
8377       || !align_branch_prefix_size
8378       || now_seg == absolute_section
8379       || i.tm.cpu_flags.bitfield.cpupadlock
8380       || !cpu_arch_flags.bitfield.cpui386)
8381     return 0;
8382
8383   /* Don't add prefix if it is a prefix or there is no operand in case
8384      that segment prefix is special.  */
8385   if (!i.operands || i.tm.opcode_modifier.isprefix)
8386     return 0;
8387
8388   if (last_insn.kind == last_insn_other
8389       || last_insn.seg != now_seg)
8390     return 1;
8391
8392   if (flag_debug)
8393     as_warn_where (last_insn.file, last_insn.line,
8394                    _("`%s` skips -malign-branch-boundary on `%s`"),
8395                    last_insn.name, i.tm.name);
8396
8397   return 0;
8398 }
8399
8400 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
8401
8402 static int
8403 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8404 {
8405   int add_padding;
8406
8407   /* NB: Don't work with COND_JUMP86 without i386.  */
8408   if (!align_branch_power
8409       || now_seg == absolute_section
8410       || !cpu_arch_flags.bitfield.cpui386)
8411     return 0;
8412
8413   add_padding = 0;
8414
8415   /* Check for jcc and direct jmp.  */
8416   if (i.tm.opcode_modifier.jump == JUMP)
8417     {
8418       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8419         {
8420           *branch_p = align_branch_jmp;
8421           add_padding = align_branch & align_branch_jmp_bit;
8422         }
8423       else
8424         {
8425           *branch_p = align_branch_jcc;
8426           if ((align_branch & align_branch_jcc_bit))
8427             add_padding = 1;
8428         }
8429     }
8430   else if (is_any_vex_encoding (&i.tm))
8431     return 0;
8432   else if ((i.tm.base_opcode | 1) == 0xc3)
8433     {
8434       /* Near ret.  */
8435       *branch_p = align_branch_ret;
8436       if ((align_branch & align_branch_ret_bit))
8437         add_padding = 1;
8438     }
8439   else
8440     {
8441       /* Check for indirect jmp, direct and indirect calls.  */
8442       if (i.tm.base_opcode == 0xe8)
8443         {
8444           /* Direct call.  */
8445           *branch_p = align_branch_call;
8446           if ((align_branch & align_branch_call_bit))
8447             add_padding = 1;
8448         }
8449       else if (i.tm.base_opcode == 0xff
8450                && (i.tm.extension_opcode == 2
8451                    || i.tm.extension_opcode == 4))
8452         {
8453           /* Indirect call and jmp.  */
8454           *branch_p = align_branch_indirect;
8455           if ((align_branch & align_branch_indirect_bit))
8456             add_padding = 1;
8457         }
8458
8459       if (add_padding
8460           && i.disp_operands
8461           && tls_get_addr
8462           && (i.op[0].disps->X_op == O_symbol
8463               || (i.op[0].disps->X_op == O_subtract
8464                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
8465         {
8466           symbolS *s = i.op[0].disps->X_add_symbol;
8467           /* No padding to call to global or undefined tls_get_addr.  */
8468           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8469               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8470             return 0;
8471         }
8472     }
8473
8474   if (add_padding
8475       && last_insn.kind != last_insn_other
8476       && last_insn.seg == now_seg)
8477     {
8478       if (flag_debug)
8479         as_warn_where (last_insn.file, last_insn.line,
8480                        _("`%s` skips -malign-branch-boundary on `%s`"),
8481                        last_insn.name, i.tm.name);
8482       return 0;
8483     }
8484
8485   return add_padding;
8486 }
8487
8488 static void
8489 output_insn (void)
8490 {
8491   fragS *insn_start_frag;
8492   offsetT insn_start_off;
8493   fragS *fragP = NULL;
8494   enum align_branch_kind branch = align_branch_none;
8495
8496 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8497   if (IS_ELF && x86_used_note)
8498     {
8499       if (i.tm.cpu_flags.bitfield.cpucmov)
8500         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8501       if (i.tm.cpu_flags.bitfield.cpusse)
8502         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8503       if (i.tm.cpu_flags.bitfield.cpusse2)
8504         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8505       if (i.tm.cpu_flags.bitfield.cpusse3)
8506         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8507       if (i.tm.cpu_flags.bitfield.cpussse3)
8508         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8509       if (i.tm.cpu_flags.bitfield.cpusse4_1)
8510         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8511       if (i.tm.cpu_flags.bitfield.cpusse4_2)
8512         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8513       if (i.tm.cpu_flags.bitfield.cpuavx)
8514         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8515       if (i.tm.cpu_flags.bitfield.cpuavx2)
8516         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8517       if (i.tm.cpu_flags.bitfield.cpufma)
8518         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8519       if (i.tm.cpu_flags.bitfield.cpuavx512f)
8520         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8521       if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8522         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8523       if (i.tm.cpu_flags.bitfield.cpuavx512er)
8524         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8525       if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8526         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8527       if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8528         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8529       if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8530         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8531       if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8532         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8533       if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8534         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8535       if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8536         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8537       if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8538         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8539       if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8540         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8541       if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8542         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8543       if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8544         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8545       if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8546         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8547       if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8548         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8549
8550       if (i.tm.cpu_flags.bitfield.cpu8087
8551           || i.tm.cpu_flags.bitfield.cpu287
8552           || i.tm.cpu_flags.bitfield.cpu387
8553           || i.tm.cpu_flags.bitfield.cpu687
8554           || i.tm.cpu_flags.bitfield.cpufisttp)
8555         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8556       if (i.has_regmmx
8557           || i.tm.base_opcode == 0xf77 /* emms */
8558           || i.tm.base_opcode == 0xf0e /* femms */)
8559         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8560       if (i.has_regxmm)
8561         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8562       if (i.has_regymm)
8563         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8564       if (i.has_regzmm)
8565         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8566       if (i.tm.cpu_flags.bitfield.cpufxsr)
8567         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8568       if (i.tm.cpu_flags.bitfield.cpuxsave)
8569         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8570       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8571         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8572       if (i.tm.cpu_flags.bitfield.cpuxsavec)
8573         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8574     }
8575 #endif
8576
8577   /* Tie dwarf2 debug info to the address at the start of the insn.
8578      We can't do this after the insn has been output as the current
8579      frag may have been closed off.  eg. by frag_var.  */
8580   dwarf2_emit_insn (0);
8581
8582   insn_start_frag = frag_now;
8583   insn_start_off = frag_now_fix ();
8584
8585   if (add_branch_padding_frag_p (&branch))
8586     {
8587       char *p;
8588       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
8589       unsigned int max_branch_padding_size = 14;
8590
8591       /* Align section to boundary.  */
8592       record_alignment (now_seg, align_branch_power);
8593
8594       /* Make room for padding.  */
8595       frag_grow (max_branch_padding_size);
8596
8597       /* Start of the padding.  */
8598       p = frag_more (0);
8599
8600       fragP = frag_now;
8601
8602       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8603                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8604                 NULL, 0, p);
8605
8606       fragP->tc_frag_data.branch_type = branch;
8607       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8608     }
8609
8610   /* Output jumps.  */
8611   if (i.tm.opcode_modifier.jump == JUMP)
8612     output_branch ();
8613   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8614            || i.tm.opcode_modifier.jump == JUMP_DWORD)
8615     output_jump ();
8616   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8617     output_interseg_jump ();
8618   else
8619     {
8620       /* Output normal instructions here.  */
8621       char *p;
8622       unsigned char *q;
8623       unsigned int j;
8624       unsigned int prefix;
8625
8626       if (avoid_fence
8627           && (i.tm.base_opcode == 0xfaee8
8628               || i.tm.base_opcode == 0xfaef0
8629               || i.tm.base_opcode == 0xfaef8))
8630         {
8631           /* Encode lfence, mfence, and sfence as
8632              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
8633           offsetT val = 0x240483f0ULL;
8634           p = frag_more (5);
8635           md_number_to_chars (p, val, 5);
8636           return;
8637         }
8638
8639       /* Some processors fail on LOCK prefix. This options makes
8640          assembler ignore LOCK prefix and serves as a workaround.  */
8641       if (omit_lock_prefix)
8642         {
8643           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8644             return;
8645           i.prefix[LOCK_PREFIX] = 0;
8646         }
8647
8648       if (branch)
8649         /* Skip if this is a branch.  */
8650         ;
8651       else if (add_fused_jcc_padding_frag_p ())
8652         {
8653           /* Make room for padding.  */
8654           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8655           p = frag_more (0);
8656
8657           fragP = frag_now;
8658
8659           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8660                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8661                     NULL, 0, p);
8662
8663           fragP->tc_frag_data.branch_type = align_branch_fused;
8664           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8665         }
8666       else if (add_branch_prefix_frag_p ())
8667         {
8668           unsigned int max_prefix_size = align_branch_prefix_size;
8669
8670           /* Make room for padding.  */
8671           frag_grow (max_prefix_size);
8672           p = frag_more (0);
8673
8674           fragP = frag_now;
8675
8676           frag_var (rs_machine_dependent, max_prefix_size, 0,
8677                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8678                     NULL, 0, p);
8679
8680           fragP->tc_frag_data.max_bytes = max_prefix_size;
8681         }
8682
8683       /* Since the VEX/EVEX prefix contains the implicit prefix, we
8684          don't need the explicit prefix.  */
8685       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8686         {
8687           switch (i.tm.opcode_length)
8688             {
8689             case 3:
8690               if (i.tm.base_opcode & 0xff000000)
8691                 {
8692                   prefix = (i.tm.base_opcode >> 24) & 0xff;
8693                   if (!i.tm.cpu_flags.bitfield.cpupadlock
8694                       || prefix != REPE_PREFIX_OPCODE
8695                       || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8696                     add_prefix (prefix);
8697                 }
8698               break;
8699             case 2:
8700               if ((i.tm.base_opcode & 0xff0000) != 0)
8701                 {
8702                   prefix = (i.tm.base_opcode >> 16) & 0xff;
8703                   add_prefix (prefix);
8704                 }
8705               break;
8706             case 1:
8707               break;
8708             case 0:
8709               /* Check for pseudo prefixes.  */
8710               as_bad_where (insn_start_frag->fr_file,
8711                             insn_start_frag->fr_line,
8712                              _("pseudo prefix without instruction"));
8713               return;
8714             default:
8715               abort ();
8716             }
8717
8718 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8719           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8720              R_X86_64_GOTTPOFF relocation so that linker can safely
8721              perform IE->LE optimization.  */
8722           if (x86_elf_abi == X86_64_X32_ABI
8723               && i.operands == 2
8724               && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8725               && i.prefix[REX_PREFIX] == 0)
8726             add_prefix (REX_OPCODE);
8727 #endif
8728
8729           /* The prefix bytes.  */
8730           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8731             if (*q)
8732               FRAG_APPEND_1_CHAR (*q);
8733         }
8734       else
8735         {
8736           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8737             if (*q)
8738               switch (j)
8739                 {
8740                 case REX_PREFIX:
8741                   /* REX byte is encoded in VEX prefix.  */
8742                   break;
8743                 case SEG_PREFIX:
8744                 case ADDR_PREFIX:
8745                   FRAG_APPEND_1_CHAR (*q);
8746                   break;
8747                 default:
8748                   /* There should be no other prefixes for instructions
8749                      with VEX prefix.  */
8750                   abort ();
8751                 }
8752
8753           /* For EVEX instructions i.vrex should become 0 after
8754              build_evex_prefix.  For VEX instructions upper 16 registers
8755              aren't available, so VREX should be 0.  */
8756           if (i.vrex)
8757             abort ();
8758           /* Now the VEX prefix.  */
8759           p = frag_more (i.vex.length);
8760           for (j = 0; j < i.vex.length; j++)
8761             p[j] = i.vex.bytes[j];
8762         }
8763
8764       /* Now the opcode; be careful about word order here!  */
8765       if (i.tm.opcode_length == 1)
8766         {
8767           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8768         }
8769       else
8770         {
8771           switch (i.tm.opcode_length)
8772             {
8773             case 4:
8774               p = frag_more (4);
8775               *p++ = (i.tm.base_opcode >> 24) & 0xff;
8776               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8777               break;
8778             case 3:
8779               p = frag_more (3);
8780               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8781               break;
8782             case 2:
8783               p = frag_more (2);
8784               break;
8785             default:
8786               abort ();
8787               break;
8788             }
8789
8790           /* Put out high byte first: can't use md_number_to_chars!  */
8791           *p++ = (i.tm.base_opcode >> 8) & 0xff;
8792           *p = i.tm.base_opcode & 0xff;
8793         }
8794
8795       /* Now the modrm byte and sib byte (if present).  */
8796       if (i.tm.opcode_modifier.modrm)
8797         {
8798           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8799                                | i.rm.reg << 3
8800                                | i.rm.mode << 6));
8801           /* If i.rm.regmem == ESP (4)
8802              && i.rm.mode != (Register mode)
8803              && not 16 bit
8804              ==> need second modrm byte.  */
8805           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8806               && i.rm.mode != 3
8807               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8808             FRAG_APPEND_1_CHAR ((i.sib.base << 0
8809                                  | i.sib.index << 3
8810                                  | i.sib.scale << 6));
8811         }
8812
8813       if (i.disp_operands)
8814         output_disp (insn_start_frag, insn_start_off);
8815
8816       if (i.imm_operands)
8817         output_imm (insn_start_frag, insn_start_off);
8818
8819       /*
8820        * frag_now_fix () returning plain abs_section_offset when we're in the
8821        * absolute section, and abs_section_offset not getting updated as data
8822        * gets added to the frag breaks the logic below.
8823        */
8824       if (now_seg != absolute_section)
8825         {
8826           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8827           if (j > 15)
8828             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8829                      j);
8830           else if (fragP)
8831             {
8832               /* NB: Don't add prefix with GOTPC relocation since
8833                  output_disp() above depends on the fixed encoding
8834                  length.  Can't add prefix with TLS relocation since
8835                  it breaks TLS linker optimization.  */
8836               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8837               /* Prefix count on the current instruction.  */
8838               unsigned int count = i.vex.length;
8839               unsigned int k;
8840               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8841                 /* REX byte is encoded in VEX/EVEX prefix.  */
8842                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8843                   count++;
8844
8845               /* Count prefixes for extended opcode maps.  */
8846               if (!i.vex.length)
8847                 switch (i.tm.opcode_length)
8848                   {
8849                   case 3:
8850                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8851                       {
8852                         count++;
8853                         switch ((i.tm.base_opcode >> 8) & 0xff)
8854                           {
8855                           case 0x38:
8856                           case 0x3a:
8857                             count++;
8858                             break;
8859                           default:
8860                             break;
8861                           }
8862                       }
8863                     break;
8864                   case 2:
8865                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8866                       count++;
8867                     break;
8868                   case 1:
8869                     break;
8870                   default:
8871                     abort ();
8872                   }
8873
8874               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8875                   == BRANCH_PREFIX)
8876                 {
8877                   /* Set the maximum prefix size in BRANCH_PREFIX
8878                      frag.  */
8879                   if (fragP->tc_frag_data.max_bytes > max)
8880                     fragP->tc_frag_data.max_bytes = max;
8881                   if (fragP->tc_frag_data.max_bytes > count)
8882                     fragP->tc_frag_data.max_bytes -= count;
8883                   else
8884                     fragP->tc_frag_data.max_bytes = 0;
8885                 }
8886               else
8887                 {
8888                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
8889                      frag.  */
8890                   unsigned int max_prefix_size;
8891                   if (align_branch_prefix_size > max)
8892                     max_prefix_size = max;
8893                   else
8894                     max_prefix_size = align_branch_prefix_size;
8895                   if (max_prefix_size > count)
8896                     fragP->tc_frag_data.max_prefix_length
8897                       = max_prefix_size - count;
8898                 }
8899
8900               /* Use existing segment prefix if possible.  Use CS
8901                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
8902                  segment prefix with ESP/EBP base register and use DS
8903                  segment prefix without ESP/EBP base register.  */
8904               if (i.prefix[SEG_PREFIX])
8905                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8906               else if (flag_code == CODE_64BIT)
8907                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8908               else if (i.base_reg
8909                        && (i.base_reg->reg_num == 4
8910                            || i.base_reg->reg_num == 5))
8911                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8912               else
8913                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8914             }
8915         }
8916     }
8917
8918   /* NB: Don't work with COND_JUMP86 without i386.  */
8919   if (align_branch_power
8920       && now_seg != absolute_section
8921       && cpu_arch_flags.bitfield.cpui386)
8922     {
8923       /* Terminate each frag so that we can add prefix and check for
8924          fused jcc.  */
8925       frag_wane (frag_now);
8926       frag_new (0);
8927     }
8928
8929 #ifdef DEBUG386
8930   if (flag_debug)
8931     {
8932       pi ("" /*line*/, &i);
8933     }
8934 #endif /* DEBUG386  */
8935 }
8936
8937 /* Return the size of the displacement operand N.  */
8938
8939 static int
8940 disp_size (unsigned int n)
8941 {
8942   int size = 4;
8943
8944   if (i.types[n].bitfield.disp64)
8945     size = 8;
8946   else if (i.types[n].bitfield.disp8)
8947     size = 1;
8948   else if (i.types[n].bitfield.disp16)
8949     size = 2;
8950   return size;
8951 }
8952
8953 /* Return the size of the immediate operand N.  */
8954
8955 static int
8956 imm_size (unsigned int n)
8957 {
8958   int size = 4;
8959   if (i.types[n].bitfield.imm64)
8960     size = 8;
8961   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8962     size = 1;
8963   else if (i.types[n].bitfield.imm16)
8964     size = 2;
8965   return size;
8966 }
8967
8968 static void
8969 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8970 {
8971   char *p;
8972   unsigned int n;
8973
8974   for (n = 0; n < i.operands; n++)
8975     {
8976       if (operand_type_check (i.types[n], disp))
8977         {
8978           if (i.op[n].disps->X_op == O_constant)
8979             {
8980               int size = disp_size (n);
8981               offsetT val = i.op[n].disps->X_add_number;
8982
8983               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8984                                      size);
8985               p = frag_more (size);
8986               md_number_to_chars (p, val, size);
8987             }
8988           else
8989             {
8990               enum bfd_reloc_code_real reloc_type;
8991               int size = disp_size (n);
8992               int sign = i.types[n].bitfield.disp32s;
8993               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8994               fixS *fixP;
8995
8996               /* We can't have 8 bit displacement here.  */
8997               gas_assert (!i.types[n].bitfield.disp8);
8998
8999               /* The PC relative address is computed relative
9000                  to the instruction boundary, so in case immediate
9001                  fields follows, we need to adjust the value.  */
9002               if (pcrel && i.imm_operands)
9003                 {
9004                   unsigned int n1;
9005                   int sz = 0;
9006
9007                   for (n1 = 0; n1 < i.operands; n1++)
9008                     if (operand_type_check (i.types[n1], imm))
9009                       {
9010                         /* Only one immediate is allowed for PC
9011                            relative address.  */
9012                         gas_assert (sz == 0);
9013                         sz = imm_size (n1);
9014                         i.op[n].disps->X_add_number -= sz;
9015                       }
9016                   /* We should find the immediate.  */
9017                   gas_assert (sz != 0);
9018                 }
9019
9020               p = frag_more (size);
9021               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9022               if (GOT_symbol
9023                   && GOT_symbol == i.op[n].disps->X_add_symbol
9024                   && (((reloc_type == BFD_RELOC_32
9025                         || reloc_type == BFD_RELOC_X86_64_32S
9026                         || (reloc_type == BFD_RELOC_64
9027                             && object_64bit))
9028                        && (i.op[n].disps->X_op == O_symbol
9029                            || (i.op[n].disps->X_op == O_add
9030                                && ((symbol_get_value_expression
9031                                     (i.op[n].disps->X_op_symbol)->X_op)
9032                                    == O_subtract))))
9033                       || reloc_type == BFD_RELOC_32_PCREL))
9034                 {
9035                   if (!object_64bit)
9036                     {
9037                       reloc_type = BFD_RELOC_386_GOTPC;
9038                       i.has_gotpc_tls_reloc = TRUE;
9039                       i.op[n].imms->X_add_number +=
9040                         encoding_length (insn_start_frag, insn_start_off, p);
9041                     }
9042                   else if (reloc_type == BFD_RELOC_64)
9043                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9044                   else
9045                     /* Don't do the adjustment for x86-64, as there
9046                        the pcrel addressing is relative to the _next_
9047                        insn, and that is taken care of in other code.  */
9048                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9049                 }
9050               else if (align_branch_power)
9051                 {
9052                   switch (reloc_type)
9053                     {
9054                     case BFD_RELOC_386_TLS_GD:
9055                     case BFD_RELOC_386_TLS_LDM:
9056                     case BFD_RELOC_386_TLS_IE:
9057                     case BFD_RELOC_386_TLS_IE_32:
9058                     case BFD_RELOC_386_TLS_GOTIE:
9059                     case BFD_RELOC_386_TLS_GOTDESC:
9060                     case BFD_RELOC_386_TLS_DESC_CALL:
9061                     case BFD_RELOC_X86_64_TLSGD:
9062                     case BFD_RELOC_X86_64_TLSLD:
9063                     case BFD_RELOC_X86_64_GOTTPOFF:
9064                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9065                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9066                       i.has_gotpc_tls_reloc = TRUE;
9067                     default:
9068                       break;
9069                     }
9070                 }
9071               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9072                                   size, i.op[n].disps, pcrel,
9073                                   reloc_type);
9074               /* Check for "call/jmp *mem", "mov mem, %reg",
9075                  "test %reg, mem" and "binop mem, %reg" where binop
9076                  is one of adc, add, and, cmp, or, sbb, sub, xor
9077                  instructions without data prefix.  Always generate
9078                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9079               if (i.prefix[DATA_PREFIX] == 0
9080                   && (generate_relax_relocations
9081                       || (!object_64bit
9082                           && i.rm.mode == 0
9083                           && i.rm.regmem == 5))
9084                   && (i.rm.mode == 2
9085                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9086                   && ((i.operands == 1
9087                        && i.tm.base_opcode == 0xff
9088                        && (i.rm.reg == 2 || i.rm.reg == 4))
9089                       || (i.operands == 2
9090                           && (i.tm.base_opcode == 0x8b
9091                               || i.tm.base_opcode == 0x85
9092                               || (i.tm.base_opcode & 0xc7) == 0x03))))
9093                 {
9094                   if (object_64bit)
9095                     {
9096                       fixP->fx_tcbit = i.rex != 0;
9097                       if (i.base_reg
9098                           && (i.base_reg->reg_num == RegIP))
9099                       fixP->fx_tcbit2 = 1;
9100                     }
9101                   else
9102                     fixP->fx_tcbit2 = 1;
9103                 }
9104             }
9105         }
9106     }
9107 }
9108
9109 static void
9110 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9111 {
9112   char *p;
9113   unsigned int n;
9114
9115   for (n = 0; n < i.operands; n++)
9116     {
9117       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9118       if (i.rounding && (int) n == i.rounding->operand)
9119         continue;
9120
9121       if (operand_type_check (i.types[n], imm))
9122         {
9123           if (i.op[n].imms->X_op == O_constant)
9124             {
9125               int size = imm_size (n);
9126               offsetT val;
9127
9128               val = offset_in_range (i.op[n].imms->X_add_number,
9129                                      size);
9130               p = frag_more (size);
9131               md_number_to_chars (p, val, size);
9132             }
9133           else
9134             {
9135               /* Not absolute_section.
9136                  Need a 32-bit fixup (don't support 8bit
9137                  non-absolute imms).  Try to support other
9138                  sizes ...  */
9139               enum bfd_reloc_code_real reloc_type;
9140               int size = imm_size (n);
9141               int sign;
9142
9143               if (i.types[n].bitfield.imm32s
9144                   && (i.suffix == QWORD_MNEM_SUFFIX
9145                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9146                 sign = 1;
9147               else
9148                 sign = 0;
9149
9150               p = frag_more (size);
9151               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9152
9153               /*   This is tough to explain.  We end up with this one if we
9154                * have operands that look like
9155                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9156                * obtain the absolute address of the GOT, and it is strongly
9157                * preferable from a performance point of view to avoid using
9158                * a runtime relocation for this.  The actual sequence of
9159                * instructions often look something like:
9160                *
9161                *        call    .L66
9162                * .L66:
9163                *        popl    %ebx
9164                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9165                *
9166                *   The call and pop essentially return the absolute address
9167                * of the label .L66 and store it in %ebx.  The linker itself
9168                * will ultimately change the first operand of the addl so
9169                * that %ebx points to the GOT, but to keep things simple, the
9170                * .o file must have this operand set so that it generates not
9171                * the absolute address of .L66, but the absolute address of
9172                * itself.  This allows the linker itself simply treat a GOTPC
9173                * relocation as asking for a pcrel offset to the GOT to be
9174                * added in, and the addend of the relocation is stored in the
9175                * operand field for the instruction itself.
9176                *
9177                *   Our job here is to fix the operand so that it would add
9178                * the correct offset so that %ebx would point to itself.  The
9179                * thing that is tricky is that .-.L66 will point to the
9180                * beginning of the instruction, so we need to further modify
9181                * the operand so that it will point to itself.  There are
9182                * other cases where you have something like:
9183                *
9184                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9185                *
9186                * and here no correction would be required.  Internally in
9187                * the assembler we treat operands of this form as not being
9188                * pcrel since the '.' is explicitly mentioned, and I wonder
9189                * whether it would simplify matters to do it this way.  Who
9190                * knows.  In earlier versions of the PIC patches, the
9191                * pcrel_adjust field was used to store the correction, but
9192                * since the expression is not pcrel, I felt it would be
9193                * confusing to do it this way.  */
9194
9195               if ((reloc_type == BFD_RELOC_32
9196                    || reloc_type == BFD_RELOC_X86_64_32S
9197                    || reloc_type == BFD_RELOC_64)
9198                   && GOT_symbol
9199                   && GOT_symbol == i.op[n].imms->X_add_symbol
9200                   && (i.op[n].imms->X_op == O_symbol
9201                       || (i.op[n].imms->X_op == O_add
9202                           && ((symbol_get_value_expression
9203                                (i.op[n].imms->X_op_symbol)->X_op)
9204                               == O_subtract))))
9205                 {
9206                   if (!object_64bit)
9207                     reloc_type = BFD_RELOC_386_GOTPC;
9208                   else if (size == 4)
9209                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9210                   else if (size == 8)
9211                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9212                   i.has_gotpc_tls_reloc = TRUE;
9213                   i.op[n].imms->X_add_number +=
9214                     encoding_length (insn_start_frag, insn_start_off, p);
9215                 }
9216               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9217                            i.op[n].imms, 0, reloc_type);
9218             }
9219         }
9220     }
9221 }
9222 \f
9223 /* x86_cons_fix_new is called via the expression parsing code when a
9224    reloc is needed.  We use this hook to get the correct .got reloc.  */
9225 static int cons_sign = -1;
9226
9227 void
9228 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9229                   expressionS *exp, bfd_reloc_code_real_type r)
9230 {
9231   r = reloc (len, 0, cons_sign, r);
9232
9233 #ifdef TE_PE
9234   if (exp->X_op == O_secrel)
9235     {
9236       exp->X_op = O_symbol;
9237       r = BFD_RELOC_32_SECREL;
9238     }
9239 #endif
9240
9241   fix_new_exp (frag, off, len, exp, 0, r);
9242 }
9243
9244 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9245    purpose of the `.dc.a' internal pseudo-op.  */
9246
9247 int
9248 x86_address_bytes (void)
9249 {
9250   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9251     return 4;
9252   return stdoutput->arch_info->bits_per_address / 8;
9253 }
9254
9255 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9256     || defined (LEX_AT)
9257 # define lex_got(reloc, adjust, types) NULL
9258 #else
9259 /* Parse operands of the form
9260    <symbol>@GOTOFF+<nnn>
9261    and similar .plt or .got references.
9262
9263    If we find one, set up the correct relocation in RELOC and copy the
9264    input string, minus the `@GOTOFF' into a malloc'd buffer for
9265    parsing by the calling routine.  Return this buffer, and if ADJUST
9266    is non-null set it to the length of the string we removed from the
9267    input line.  Otherwise return NULL.  */
9268 static char *
9269 lex_got (enum bfd_reloc_code_real *rel,
9270          int *adjust,
9271          i386_operand_type *types)
9272 {
9273   /* Some of the relocations depend on the size of what field is to
9274      be relocated.  But in our callers i386_immediate and i386_displacement
9275      we don't yet know the operand size (this will be set by insn
9276      matching).  Hence we record the word32 relocation here,
9277      and adjust the reloc according to the real size in reloc().  */
9278   static const struct {
9279     const char *str;
9280     int len;
9281     const enum bfd_reloc_code_real rel[2];
9282     const i386_operand_type types64;
9283   } gotrel[] = {
9284 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9285     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
9286                                         BFD_RELOC_SIZE32 },
9287       OPERAND_TYPE_IMM32_64 },
9288 #endif
9289     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
9290                                        BFD_RELOC_X86_64_PLTOFF64 },
9291       OPERAND_TYPE_IMM64 },
9292     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
9293                                        BFD_RELOC_X86_64_PLT32    },
9294       OPERAND_TYPE_IMM32_32S_DISP32 },
9295     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
9296                                        BFD_RELOC_X86_64_GOTPLT64 },
9297       OPERAND_TYPE_IMM64_DISP64 },
9298     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
9299                                        BFD_RELOC_X86_64_GOTOFF64 },
9300       OPERAND_TYPE_IMM64_DISP64 },
9301     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9302                                        BFD_RELOC_X86_64_GOTPCREL },
9303       OPERAND_TYPE_IMM32_32S_DISP32 },
9304     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
9305                                        BFD_RELOC_X86_64_TLSGD    },
9306       OPERAND_TYPE_IMM32_32S_DISP32 },
9307     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
9308                                        _dummy_first_bfd_reloc_code_real },
9309       OPERAND_TYPE_NONE },
9310     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
9311                                        BFD_RELOC_X86_64_TLSLD    },
9312       OPERAND_TYPE_IMM32_32S_DISP32 },
9313     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9314                                        BFD_RELOC_X86_64_GOTTPOFF },
9315       OPERAND_TYPE_IMM32_32S_DISP32 },
9316     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
9317                                        BFD_RELOC_X86_64_TPOFF32  },
9318       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9319     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
9320                                        _dummy_first_bfd_reloc_code_real },
9321       OPERAND_TYPE_NONE },
9322     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
9323                                        BFD_RELOC_X86_64_DTPOFF32 },
9324       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9325     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9326                                        _dummy_first_bfd_reloc_code_real },
9327       OPERAND_TYPE_NONE },
9328     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9329                                        _dummy_first_bfd_reloc_code_real },
9330       OPERAND_TYPE_NONE },
9331     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
9332                                        BFD_RELOC_X86_64_GOT32    },
9333       OPERAND_TYPE_IMM32_32S_64_DISP32 },
9334     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
9335                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9336       OPERAND_TYPE_IMM32_32S_DISP32 },
9337     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
9338                                        BFD_RELOC_X86_64_TLSDESC_CALL },
9339       OPERAND_TYPE_IMM32_32S_DISP32 },
9340   };
9341   char *cp;
9342   unsigned int j;
9343
9344 #if defined (OBJ_MAYBE_ELF)
9345   if (!IS_ELF)
9346     return NULL;
9347 #endif
9348
9349   for (cp = input_line_pointer; *cp != '@'; cp++)
9350     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9351       return NULL;
9352
9353   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9354     {
9355       int len = gotrel[j].len;
9356       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9357         {
9358           if (gotrel[j].rel[object_64bit] != 0)
9359             {
9360               int first, second;
9361               char *tmpbuf, *past_reloc;
9362
9363               *rel = gotrel[j].rel[object_64bit];
9364
9365               if (types)
9366                 {
9367                   if (flag_code != CODE_64BIT)
9368                     {
9369                       types->bitfield.imm32 = 1;
9370                       types->bitfield.disp32 = 1;
9371                     }
9372                   else
9373                     *types = gotrel[j].types64;
9374                 }
9375
9376               if (j != 0 && GOT_symbol == NULL)
9377                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9378
9379               /* The length of the first part of our input line.  */
9380               first = cp - input_line_pointer;
9381
9382               /* The second part goes from after the reloc token until
9383                  (and including) an end_of_line char or comma.  */
9384               past_reloc = cp + 1 + len;
9385               cp = past_reloc;
9386               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9387                 ++cp;
9388               second = cp + 1 - past_reloc;
9389
9390               /* Allocate and copy string.  The trailing NUL shouldn't
9391                  be necessary, but be safe.  */
9392               tmpbuf = XNEWVEC (char, first + second + 2);
9393               memcpy (tmpbuf, input_line_pointer, first);
9394               if (second != 0 && *past_reloc != ' ')
9395                 /* Replace the relocation token with ' ', so that
9396                    errors like foo@GOTOFF1 will be detected.  */
9397                 tmpbuf[first++] = ' ';
9398               else
9399                 /* Increment length by 1 if the relocation token is
9400                    removed.  */
9401                 len++;
9402               if (adjust)
9403                 *adjust = len;
9404               memcpy (tmpbuf + first, past_reloc, second);
9405               tmpbuf[first + second] = '\0';
9406               return tmpbuf;
9407             }
9408
9409           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9410                   gotrel[j].str, 1 << (5 + object_64bit));
9411           return NULL;
9412         }
9413     }
9414
9415   /* Might be a symbol version string.  Don't as_bad here.  */
9416   return NULL;
9417 }
9418 #endif
9419
9420 #ifdef TE_PE
9421 #ifdef lex_got
9422 #undef lex_got
9423 #endif
9424 /* Parse operands of the form
9425    <symbol>@SECREL32+<nnn>
9426
9427    If we find one, set up the correct relocation in RELOC and copy the
9428    input string, minus the `@SECREL32' into a malloc'd buffer for
9429    parsing by the calling routine.  Return this buffer, and if ADJUST
9430    is non-null set it to the length of the string we removed from the
9431    input line.  Otherwise return NULL.
9432
9433    This function is copied from the ELF version above adjusted for PE targets.  */
9434
9435 static char *
9436 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9437          int *adjust ATTRIBUTE_UNUSED,
9438          i386_operand_type *types)
9439 {
9440   static const struct
9441   {
9442     const char *str;
9443     int len;
9444     const enum bfd_reloc_code_real rel[2];
9445     const i386_operand_type types64;
9446   }
9447   gotrel[] =
9448   {
9449     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
9450                                           BFD_RELOC_32_SECREL },
9451       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9452   };
9453
9454   char *cp;
9455   unsigned j;
9456
9457   for (cp = input_line_pointer; *cp != '@'; cp++)
9458     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9459       return NULL;
9460
9461   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9462     {
9463       int len = gotrel[j].len;
9464
9465       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9466         {
9467           if (gotrel[j].rel[object_64bit] != 0)
9468             {
9469               int first, second;
9470               char *tmpbuf, *past_reloc;
9471
9472               *rel = gotrel[j].rel[object_64bit];
9473               if (adjust)
9474                 *adjust = len;
9475
9476               if (types)
9477                 {
9478                   if (flag_code != CODE_64BIT)
9479                     {
9480                       types->bitfield.imm32 = 1;
9481                       types->bitfield.disp32 = 1;
9482                     }
9483                   else
9484                     *types = gotrel[j].types64;
9485                 }
9486
9487               /* The length of the first part of our input line.  */
9488               first = cp - input_line_pointer;
9489
9490               /* The second part goes from after the reloc token until
9491                  (and including) an end_of_line char or comma.  */
9492               past_reloc = cp + 1 + len;
9493               cp = past_reloc;
9494               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9495                 ++cp;
9496               second = cp + 1 - past_reloc;
9497
9498               /* Allocate and copy string.  The trailing NUL shouldn't
9499                  be necessary, but be safe.  */
9500               tmpbuf = XNEWVEC (char, first + second + 2);
9501               memcpy (tmpbuf, input_line_pointer, first);
9502               if (second != 0 && *past_reloc != ' ')
9503                 /* Replace the relocation token with ' ', so that
9504                    errors like foo@SECLREL321 will be detected.  */
9505                 tmpbuf[first++] = ' ';
9506               memcpy (tmpbuf + first, past_reloc, second);
9507               tmpbuf[first + second] = '\0';
9508               return tmpbuf;
9509             }
9510
9511           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9512                   gotrel[j].str, 1 << (5 + object_64bit));
9513           return NULL;
9514         }
9515     }
9516
9517   /* Might be a symbol version string.  Don't as_bad here.  */
9518   return NULL;
9519 }
9520
9521 #endif /* TE_PE */
9522
9523 bfd_reloc_code_real_type
9524 x86_cons (expressionS *exp, int size)
9525 {
9526   bfd_reloc_code_real_type got_reloc = NO_RELOC;
9527
9528   intel_syntax = -intel_syntax;
9529
9530   exp->X_md = 0;
9531   if (size == 4 || (object_64bit && size == 8))
9532     {
9533       /* Handle @GOTOFF and the like in an expression.  */
9534       char *save;
9535       char *gotfree_input_line;
9536       int adjust = 0;
9537
9538       save = input_line_pointer;
9539       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9540       if (gotfree_input_line)
9541         input_line_pointer = gotfree_input_line;
9542
9543       expression (exp);
9544
9545       if (gotfree_input_line)
9546         {
9547           /* expression () has merrily parsed up to the end of line,
9548              or a comma - in the wrong buffer.  Transfer how far
9549              input_line_pointer has moved to the right buffer.  */
9550           input_line_pointer = (save
9551                                 + (input_line_pointer - gotfree_input_line)
9552                                 + adjust);
9553           free (gotfree_input_line);
9554           if (exp->X_op == O_constant
9555               || exp->X_op == O_absent
9556               || exp->X_op == O_illegal
9557               || exp->X_op == O_register
9558               || exp->X_op == O_big)
9559             {
9560               char c = *input_line_pointer;
9561               *input_line_pointer = 0;
9562               as_bad (_("missing or invalid expression `%s'"), save);
9563               *input_line_pointer = c;
9564             }
9565           else if ((got_reloc == BFD_RELOC_386_PLT32
9566                     || got_reloc == BFD_RELOC_X86_64_PLT32)
9567                    && exp->X_op != O_symbol)
9568             {
9569               char c = *input_line_pointer;
9570               *input_line_pointer = 0;
9571               as_bad (_("invalid PLT expression `%s'"), save);
9572               *input_line_pointer = c;
9573             }
9574         }
9575     }
9576   else
9577     expression (exp);
9578
9579   intel_syntax = -intel_syntax;
9580
9581   if (intel_syntax)
9582     i386_intel_simplify (exp);
9583
9584   return got_reloc;
9585 }
9586
9587 static void
9588 signed_cons (int size)
9589 {
9590   if (flag_code == CODE_64BIT)
9591     cons_sign = 1;
9592   cons (size);
9593   cons_sign = -1;
9594 }
9595
9596 #ifdef TE_PE
9597 static void
9598 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9599 {
9600   expressionS exp;
9601
9602   do
9603     {
9604       expression (&exp);
9605       if (exp.X_op == O_symbol)
9606         exp.X_op = O_secrel;
9607
9608       emit_expr (&exp, 4);
9609     }
9610   while (*input_line_pointer++ == ',');
9611
9612   input_line_pointer--;
9613   demand_empty_rest_of_line ();
9614 }
9615 #endif
9616
9617 /* Handle Vector operations.  */
9618
9619 static char *
9620 check_VecOperations (char *op_string, char *op_end)
9621 {
9622   const reg_entry *mask;
9623   const char *saved;
9624   char *end_op;
9625
9626   while (*op_string
9627          && (op_end == NULL || op_string < op_end))
9628     {
9629       saved = op_string;
9630       if (*op_string == '{')
9631         {
9632           op_string++;
9633
9634           /* Check broadcasts.  */
9635           if (strncmp (op_string, "1to", 3) == 0)
9636             {
9637               int bcst_type;
9638
9639               if (i.broadcast)
9640                 goto duplicated_vec_op;
9641
9642               op_string += 3;
9643               if (*op_string == '8')
9644                 bcst_type = 8;
9645               else if (*op_string == '4')
9646                 bcst_type = 4;
9647               else if (*op_string == '2')
9648                 bcst_type = 2;
9649               else if (*op_string == '1'
9650                        && *(op_string+1) == '6')
9651                 {
9652                   bcst_type = 16;
9653                   op_string++;
9654                 }
9655               else
9656                 {
9657                   as_bad (_("Unsupported broadcast: `%s'"), saved);
9658                   return NULL;
9659                 }
9660               op_string++;
9661
9662               broadcast_op.type = bcst_type;
9663               broadcast_op.operand = this_operand;
9664               broadcast_op.bytes = 0;
9665               i.broadcast = &broadcast_op;
9666             }
9667           /* Check masking operation.  */
9668           else if ((mask = parse_register (op_string, &end_op)) != NULL)
9669             {
9670               /* k0 can't be used for write mask.  */
9671               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9672                 {
9673                   as_bad (_("`%s%s' can't be used for write mask"),
9674                           register_prefix, mask->reg_name);
9675                   return NULL;
9676                 }
9677
9678               if (!i.mask)
9679                 {
9680                   mask_op.mask = mask;
9681                   mask_op.zeroing = 0;
9682                   mask_op.operand = this_operand;
9683                   i.mask = &mask_op;
9684                 }
9685               else
9686                 {
9687                   if (i.mask->mask)
9688                     goto duplicated_vec_op;
9689
9690                   i.mask->mask = mask;
9691
9692                   /* Only "{z}" is allowed here.  No need to check
9693                      zeroing mask explicitly.  */
9694                   if (i.mask->operand != this_operand)
9695                     {
9696                       as_bad (_("invalid write mask `%s'"), saved);
9697                       return NULL;
9698                     }
9699                 }
9700
9701               op_string = end_op;
9702             }
9703           /* Check zeroing-flag for masking operation.  */
9704           else if (*op_string == 'z')
9705             {
9706               if (!i.mask)
9707                 {
9708                   mask_op.mask = NULL;
9709                   mask_op.zeroing = 1;
9710                   mask_op.operand = this_operand;
9711                   i.mask = &mask_op;
9712                 }
9713               else
9714                 {
9715                   if (i.mask->zeroing)
9716                     {
9717                     duplicated_vec_op:
9718                       as_bad (_("duplicated `%s'"), saved);
9719                       return NULL;
9720                     }
9721
9722                   i.mask->zeroing = 1;
9723
9724                   /* Only "{%k}" is allowed here.  No need to check mask
9725                      register explicitly.  */
9726                   if (i.mask->operand != this_operand)
9727                     {
9728                       as_bad (_("invalid zeroing-masking `%s'"),
9729                               saved);
9730                       return NULL;
9731                     }
9732                 }
9733
9734               op_string++;
9735             }
9736           else
9737             goto unknown_vec_op;
9738
9739           if (*op_string != '}')
9740             {
9741               as_bad (_("missing `}' in `%s'"), saved);
9742               return NULL;
9743             }
9744           op_string++;
9745
9746           /* Strip whitespace since the addition of pseudo prefixes
9747              changed how the scrubber treats '{'.  */
9748           if (is_space_char (*op_string))
9749             ++op_string;
9750
9751           continue;
9752         }
9753     unknown_vec_op:
9754       /* We don't know this one.  */
9755       as_bad (_("unknown vector operation: `%s'"), saved);
9756       return NULL;
9757     }
9758
9759   if (i.mask && i.mask->zeroing && !i.mask->mask)
9760     {
9761       as_bad (_("zeroing-masking only allowed with write mask"));
9762       return NULL;
9763     }
9764
9765   return op_string;
9766 }
9767
9768 static int
9769 i386_immediate (char *imm_start)
9770 {
9771   char *save_input_line_pointer;
9772   char *gotfree_input_line;
9773   segT exp_seg = 0;
9774   expressionS *exp;
9775   i386_operand_type types;
9776
9777   operand_type_set (&types, ~0);
9778
9779   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9780     {
9781       as_bad (_("at most %d immediate operands are allowed"),
9782               MAX_IMMEDIATE_OPERANDS);
9783       return 0;
9784     }
9785
9786   exp = &im_expressions[i.imm_operands++];
9787   i.op[this_operand].imms = exp;
9788
9789   if (is_space_char (*imm_start))
9790     ++imm_start;
9791
9792   save_input_line_pointer = input_line_pointer;
9793   input_line_pointer = imm_start;
9794
9795   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9796   if (gotfree_input_line)
9797     input_line_pointer = gotfree_input_line;
9798
9799   exp_seg = expression (exp);
9800
9801   SKIP_WHITESPACE ();
9802
9803   /* Handle vector operations.  */
9804   if (*input_line_pointer == '{')
9805     {
9806       input_line_pointer = check_VecOperations (input_line_pointer,
9807                                                 NULL);
9808       if (input_line_pointer == NULL)
9809         return 0;
9810     }
9811
9812   if (*input_line_pointer)
9813     as_bad (_("junk `%s' after expression"), input_line_pointer);
9814
9815   input_line_pointer = save_input_line_pointer;
9816   if (gotfree_input_line)
9817     {
9818       free (gotfree_input_line);
9819
9820       if (exp->X_op == O_constant || exp->X_op == O_register)
9821         exp->X_op = O_illegal;
9822     }
9823
9824   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9825 }
9826
9827 static int
9828 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9829                          i386_operand_type types, const char *imm_start)
9830 {
9831   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9832     {
9833       if (imm_start)
9834         as_bad (_("missing or invalid immediate expression `%s'"),
9835                 imm_start);
9836       return 0;
9837     }
9838   else if (exp->X_op == O_constant)
9839     {
9840       /* Size it properly later.  */
9841       i.types[this_operand].bitfield.imm64 = 1;
9842       /* If not 64bit, sign extend val.  */
9843       if (flag_code != CODE_64BIT
9844           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9845         exp->X_add_number
9846           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9847     }
9848 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9849   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9850            && exp_seg != absolute_section
9851            && exp_seg != text_section
9852            && exp_seg != data_section
9853            && exp_seg != bss_section
9854            && exp_seg != undefined_section
9855            && !bfd_is_com_section (exp_seg))
9856     {
9857       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9858       return 0;
9859     }
9860 #endif
9861   else if (!intel_syntax && exp_seg == reg_section)
9862     {
9863       if (imm_start)
9864         as_bad (_("illegal immediate register operand %s"), imm_start);
9865       return 0;
9866     }
9867   else
9868     {
9869       /* This is an address.  The size of the address will be
9870          determined later, depending on destination register,
9871          suffix, or the default for the section.  */
9872       i.types[this_operand].bitfield.imm8 = 1;
9873       i.types[this_operand].bitfield.imm16 = 1;
9874       i.types[this_operand].bitfield.imm32 = 1;
9875       i.types[this_operand].bitfield.imm32s = 1;
9876       i.types[this_operand].bitfield.imm64 = 1;
9877       i.types[this_operand] = operand_type_and (i.types[this_operand],
9878                                                 types);
9879     }
9880
9881   return 1;
9882 }
9883
9884 static char *
9885 i386_scale (char *scale)
9886 {
9887   offsetT val;
9888   char *save = input_line_pointer;
9889
9890   input_line_pointer = scale;
9891   val = get_absolute_expression ();
9892
9893   switch (val)
9894     {
9895     case 1:
9896       i.log2_scale_factor = 0;
9897       break;
9898     case 2:
9899       i.log2_scale_factor = 1;
9900       break;
9901     case 4:
9902       i.log2_scale_factor = 2;
9903       break;
9904     case 8:
9905       i.log2_scale_factor = 3;
9906       break;
9907     default:
9908       {
9909         char sep = *input_line_pointer;
9910
9911         *input_line_pointer = '\0';
9912         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9913                 scale);
9914         *input_line_pointer = sep;
9915         input_line_pointer = save;
9916         return NULL;
9917       }
9918     }
9919   if (i.log2_scale_factor != 0 && i.index_reg == 0)
9920     {
9921       as_warn (_("scale factor of %d without an index register"),
9922                1 << i.log2_scale_factor);
9923       i.log2_scale_factor = 0;
9924     }
9925   scale = input_line_pointer;
9926   input_line_pointer = save;
9927   return scale;
9928 }
9929
9930 static int
9931 i386_displacement (char *disp_start, char *disp_end)
9932 {
9933   expressionS *exp;
9934   segT exp_seg = 0;
9935   char *save_input_line_pointer;
9936   char *gotfree_input_line;
9937   int override;
9938   i386_operand_type bigdisp, types = anydisp;
9939   int ret;
9940
9941   if (i.disp_operands == MAX_MEMORY_OPERANDS)
9942     {
9943       as_bad (_("at most %d displacement operands are allowed"),
9944               MAX_MEMORY_OPERANDS);
9945       return 0;
9946     }
9947
9948   operand_type_set (&bigdisp, 0);
9949   if (i.jumpabsolute
9950       || i.types[this_operand].bitfield.baseindex
9951       || (current_templates->start->opcode_modifier.jump != JUMP
9952           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9953     {
9954       i386_addressing_mode ();
9955       override = (i.prefix[ADDR_PREFIX] != 0);
9956       if (flag_code == CODE_64BIT)
9957         {
9958           if (!override)
9959             {
9960               bigdisp.bitfield.disp32s = 1;
9961               bigdisp.bitfield.disp64 = 1;
9962             }
9963           else
9964             bigdisp.bitfield.disp32 = 1;
9965         }
9966       else if ((flag_code == CODE_16BIT) ^ override)
9967           bigdisp.bitfield.disp16 = 1;
9968       else
9969           bigdisp.bitfield.disp32 = 1;
9970     }
9971   else
9972     {
9973       /* For PC-relative branches, the width of the displacement may be
9974          dependent upon data size, but is never dependent upon address size.
9975          Also make sure to not unintentionally match against a non-PC-relative
9976          branch template.  */
9977       static templates aux_templates;
9978       const insn_template *t = current_templates->start;
9979       bfd_boolean has_intel64 = FALSE;
9980
9981       aux_templates.start = t;
9982       while (++t < current_templates->end)
9983         {
9984           if (t->opcode_modifier.jump
9985               != current_templates->start->opcode_modifier.jump)
9986             break;
9987           if (t->opcode_modifier.intel64)
9988             has_intel64 = TRUE;
9989         }
9990       if (t < current_templates->end)
9991         {
9992           aux_templates.end = t;
9993           current_templates = &aux_templates;
9994         }
9995
9996       override = (i.prefix[DATA_PREFIX] != 0);
9997       if (flag_code == CODE_64BIT)
9998         {
9999           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10000               && (!intel64 || !has_intel64))
10001             bigdisp.bitfield.disp16 = 1;
10002           else
10003             bigdisp.bitfield.disp32s = 1;
10004         }
10005       else
10006         {
10007           if (!override)
10008             override = (i.suffix == (flag_code != CODE_16BIT
10009                                      ? WORD_MNEM_SUFFIX
10010                                      : LONG_MNEM_SUFFIX));
10011           bigdisp.bitfield.disp32 = 1;
10012           if ((flag_code == CODE_16BIT) ^ override)
10013             {
10014               bigdisp.bitfield.disp32 = 0;
10015               bigdisp.bitfield.disp16 = 1;
10016             }
10017         }
10018     }
10019   i.types[this_operand] = operand_type_or (i.types[this_operand],
10020                                            bigdisp);
10021
10022   exp = &disp_expressions[i.disp_operands];
10023   i.op[this_operand].disps = exp;
10024   i.disp_operands++;
10025   save_input_line_pointer = input_line_pointer;
10026   input_line_pointer = disp_start;
10027   END_STRING_AND_SAVE (disp_end);
10028
10029 #ifndef GCC_ASM_O_HACK
10030 #define GCC_ASM_O_HACK 0
10031 #endif
10032 #if GCC_ASM_O_HACK
10033   END_STRING_AND_SAVE (disp_end + 1);
10034   if (i.types[this_operand].bitfield.baseIndex
10035       && displacement_string_end[-1] == '+')
10036     {
10037       /* This hack is to avoid a warning when using the "o"
10038          constraint within gcc asm statements.
10039          For instance:
10040
10041          #define _set_tssldt_desc(n,addr,limit,type) \
10042          __asm__ __volatile__ ( \
10043          "movw %w2,%0\n\t" \
10044          "movw %w1,2+%0\n\t" \
10045          "rorl $16,%1\n\t" \
10046          "movb %b1,4+%0\n\t" \
10047          "movb %4,5+%0\n\t" \
10048          "movb $0,6+%0\n\t" \
10049          "movb %h1,7+%0\n\t" \
10050          "rorl $16,%1" \
10051          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10052
10053          This works great except that the output assembler ends
10054          up looking a bit weird if it turns out that there is
10055          no offset.  You end up producing code that looks like:
10056
10057          #APP
10058          movw $235,(%eax)
10059          movw %dx,2+(%eax)
10060          rorl $16,%edx
10061          movb %dl,4+(%eax)
10062          movb $137,5+(%eax)
10063          movb $0,6+(%eax)
10064          movb %dh,7+(%eax)
10065          rorl $16,%edx
10066          #NO_APP
10067
10068          So here we provide the missing zero.  */
10069
10070       *displacement_string_end = '0';
10071     }
10072 #endif
10073   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10074   if (gotfree_input_line)
10075     input_line_pointer = gotfree_input_line;
10076
10077   exp_seg = expression (exp);
10078
10079   SKIP_WHITESPACE ();
10080   if (*input_line_pointer)
10081     as_bad (_("junk `%s' after expression"), input_line_pointer);
10082 #if GCC_ASM_O_HACK
10083   RESTORE_END_STRING (disp_end + 1);
10084 #endif
10085   input_line_pointer = save_input_line_pointer;
10086   if (gotfree_input_line)
10087     {
10088       free (gotfree_input_line);
10089
10090       if (exp->X_op == O_constant || exp->X_op == O_register)
10091         exp->X_op = O_illegal;
10092     }
10093
10094   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10095
10096   RESTORE_END_STRING (disp_end);
10097
10098   return ret;
10099 }
10100
10101 static int
10102 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10103                             i386_operand_type types, const char *disp_start)
10104 {
10105   i386_operand_type bigdisp;
10106   int ret = 1;
10107
10108   /* We do this to make sure that the section symbol is in
10109      the symbol table.  We will ultimately change the relocation
10110      to be relative to the beginning of the section.  */
10111   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10112       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10113       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10114     {
10115       if (exp->X_op != O_symbol)
10116         goto inv_disp;
10117
10118       if (S_IS_LOCAL (exp->X_add_symbol)
10119           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10120           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10121         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10122       exp->X_op = O_subtract;
10123       exp->X_op_symbol = GOT_symbol;
10124       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10125         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10126       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10127         i.reloc[this_operand] = BFD_RELOC_64;
10128       else
10129         i.reloc[this_operand] = BFD_RELOC_32;
10130     }
10131
10132   else if (exp->X_op == O_absent
10133            || exp->X_op == O_illegal
10134            || exp->X_op == O_big)
10135     {
10136     inv_disp:
10137       as_bad (_("missing or invalid displacement expression `%s'"),
10138               disp_start);
10139       ret = 0;
10140     }
10141
10142   else if (flag_code == CODE_64BIT
10143            && !i.prefix[ADDR_PREFIX]
10144            && exp->X_op == O_constant)
10145     {
10146       /* Since displacement is signed extended to 64bit, don't allow
10147          disp32 and turn off disp32s if they are out of range.  */
10148       i.types[this_operand].bitfield.disp32 = 0;
10149       if (!fits_in_signed_long (exp->X_add_number))
10150         {
10151           i.types[this_operand].bitfield.disp32s = 0;
10152           if (i.types[this_operand].bitfield.baseindex)
10153             {
10154               as_bad (_("0x%lx out range of signed 32bit displacement"),
10155                       (long) exp->X_add_number);
10156               ret = 0;
10157             }
10158         }
10159     }
10160
10161 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10162   else if (exp->X_op != O_constant
10163            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10164            && exp_seg != absolute_section
10165            && exp_seg != text_section
10166            && exp_seg != data_section
10167            && exp_seg != bss_section
10168            && exp_seg != undefined_section
10169            && !bfd_is_com_section (exp_seg))
10170     {
10171       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10172       ret = 0;
10173     }
10174 #endif
10175
10176   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10177       /* Constants get taken care of by optimize_disp().  */
10178       && exp->X_op != O_constant)
10179     i.types[this_operand].bitfield.disp8 = 1;
10180
10181   /* Check if this is a displacement only operand.  */
10182   bigdisp = i.types[this_operand];
10183   bigdisp.bitfield.disp8 = 0;
10184   bigdisp.bitfield.disp16 = 0;
10185   bigdisp.bitfield.disp32 = 0;
10186   bigdisp.bitfield.disp32s = 0;
10187   bigdisp.bitfield.disp64 = 0;
10188   if (operand_type_all_zero (&bigdisp))
10189     i.types[this_operand] = operand_type_and (i.types[this_operand],
10190                                               types);
10191
10192   return ret;
10193 }
10194
10195 /* Return the active addressing mode, taking address override and
10196    registers forming the address into consideration.  Update the
10197    address override prefix if necessary.  */
10198
10199 static enum flag_code
10200 i386_addressing_mode (void)
10201 {
10202   enum flag_code addr_mode;
10203
10204   if (i.prefix[ADDR_PREFIX])
10205     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10206   else
10207     {
10208       addr_mode = flag_code;
10209
10210 #if INFER_ADDR_PREFIX
10211       if (i.mem_operands == 0)
10212         {
10213           /* Infer address prefix from the first memory operand.  */
10214           const reg_entry *addr_reg = i.base_reg;
10215
10216           if (addr_reg == NULL)
10217             addr_reg = i.index_reg;
10218
10219           if (addr_reg)
10220             {
10221               if (addr_reg->reg_type.bitfield.dword)
10222                 addr_mode = CODE_32BIT;
10223               else if (flag_code != CODE_64BIT
10224                        && addr_reg->reg_type.bitfield.word)
10225                 addr_mode = CODE_16BIT;
10226
10227               if (addr_mode != flag_code)
10228                 {
10229                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10230                   i.prefixes += 1;
10231                   /* Change the size of any displacement too.  At most one
10232                      of Disp16 or Disp32 is set.
10233                      FIXME.  There doesn't seem to be any real need for
10234                      separate Disp16 and Disp32 flags.  The same goes for
10235                      Imm16 and Imm32.  Removing them would probably clean
10236                      up the code quite a lot.  */
10237                   if (flag_code != CODE_64BIT
10238                       && (i.types[this_operand].bitfield.disp16
10239                           || i.types[this_operand].bitfield.disp32))
10240                     i.types[this_operand]
10241                       = operand_type_xor (i.types[this_operand], disp16_32);
10242                 }
10243             }
10244         }
10245 #endif
10246     }
10247
10248   return addr_mode;
10249 }
10250
10251 /* Make sure the memory operand we've been dealt is valid.
10252    Return 1 on success, 0 on a failure.  */
10253
10254 static int
10255 i386_index_check (const char *operand_string)
10256 {
10257   const char *kind = "base/index";
10258   enum flag_code addr_mode = i386_addressing_mode ();
10259
10260   if (current_templates->start->opcode_modifier.isstring
10261       && !current_templates->start->cpu_flags.bitfield.cpupadlock
10262       && (current_templates->end[-1].opcode_modifier.isstring
10263           || i.mem_operands))
10264     {
10265       /* Memory operands of string insns are special in that they only allow
10266          a single register (rDI, rSI, or rBX) as their memory address.  */
10267       const reg_entry *expected_reg;
10268       static const char *di_si[][2] =
10269         {
10270           { "esi", "edi" },
10271           { "si", "di" },
10272           { "rsi", "rdi" }
10273         };
10274       static const char *bx[] = { "ebx", "bx", "rbx" };
10275
10276       kind = "string address";
10277
10278       if (current_templates->start->opcode_modifier.repprefixok)
10279         {
10280           int es_op = current_templates->end[-1].opcode_modifier.isstring
10281                       - IS_STRING_ES_OP0;
10282           int op = 0;
10283
10284           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10285               || ((!i.mem_operands != !intel_syntax)
10286                   && current_templates->end[-1].operand_types[1]
10287                      .bitfield.baseindex))
10288             op = 1;
10289           expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10290         }
10291       else
10292         expected_reg = hash_find (reg_hash, bx[addr_mode]);
10293
10294       if (i.base_reg != expected_reg
10295           || i.index_reg
10296           || operand_type_check (i.types[this_operand], disp))
10297         {
10298           /* The second memory operand must have the same size as
10299              the first one.  */
10300           if (i.mem_operands
10301               && i.base_reg
10302               && !((addr_mode == CODE_64BIT
10303                     && i.base_reg->reg_type.bitfield.qword)
10304                    || (addr_mode == CODE_32BIT
10305                        ? i.base_reg->reg_type.bitfield.dword
10306                        : i.base_reg->reg_type.bitfield.word)))
10307             goto bad_address;
10308
10309           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10310                    operand_string,
10311                    intel_syntax ? '[' : '(',
10312                    register_prefix,
10313                    expected_reg->reg_name,
10314                    intel_syntax ? ']' : ')');
10315           return 1;
10316         }
10317       else
10318         return 1;
10319
10320 bad_address:
10321       as_bad (_("`%s' is not a valid %s expression"),
10322               operand_string, kind);
10323       return 0;
10324     }
10325   else
10326     {
10327       if (addr_mode != CODE_16BIT)
10328         {
10329           /* 32-bit/64-bit checks.  */
10330           if ((i.base_reg
10331                && ((addr_mode == CODE_64BIT
10332                     ? !i.base_reg->reg_type.bitfield.qword
10333                     : !i.base_reg->reg_type.bitfield.dword)
10334                    || (i.index_reg && i.base_reg->reg_num == RegIP)
10335                    || i.base_reg->reg_num == RegIZ))
10336               || (i.index_reg
10337                   && !i.index_reg->reg_type.bitfield.xmmword
10338                   && !i.index_reg->reg_type.bitfield.ymmword
10339                   && !i.index_reg->reg_type.bitfield.zmmword
10340                   && ((addr_mode == CODE_64BIT
10341                        ? !i.index_reg->reg_type.bitfield.qword
10342                        : !i.index_reg->reg_type.bitfield.dword)
10343                       || !i.index_reg->reg_type.bitfield.baseindex)))
10344             goto bad_address;
10345
10346           /* bndmk, bndldx, and bndstx have special restrictions. */
10347           if (current_templates->start->base_opcode == 0xf30f1b
10348               || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10349             {
10350               /* They cannot use RIP-relative addressing. */
10351               if (i.base_reg && i.base_reg->reg_num == RegIP)
10352                 {
10353                   as_bad (_("`%s' cannot be used here"), operand_string);
10354                   return 0;
10355                 }
10356
10357               /* bndldx and bndstx ignore their scale factor. */
10358               if (current_templates->start->base_opcode != 0xf30f1b
10359                   && i.log2_scale_factor)
10360                 as_warn (_("register scaling is being ignored here"));
10361             }
10362         }
10363       else
10364         {
10365           /* 16-bit checks.  */
10366           if ((i.base_reg
10367                && (!i.base_reg->reg_type.bitfield.word
10368                    || !i.base_reg->reg_type.bitfield.baseindex))
10369               || (i.index_reg
10370                   && (!i.index_reg->reg_type.bitfield.word
10371                       || !i.index_reg->reg_type.bitfield.baseindex
10372                       || !(i.base_reg
10373                            && i.base_reg->reg_num < 6
10374                            && i.index_reg->reg_num >= 6
10375                            && i.log2_scale_factor == 0))))
10376             goto bad_address;
10377         }
10378     }
10379   return 1;
10380 }
10381
10382 /* Handle vector immediates.  */
10383
10384 static int
10385 RC_SAE_immediate (const char *imm_start)
10386 {
10387   unsigned int match_found, j;
10388   const char *pstr = imm_start;
10389   expressionS *exp;
10390
10391   if (*pstr != '{')
10392     return 0;
10393
10394   pstr++;
10395   match_found = 0;
10396   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10397     {
10398       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10399         {
10400           if (!i.rounding)
10401             {
10402               rc_op.type = RC_NamesTable[j].type;
10403               rc_op.operand = this_operand;
10404               i.rounding = &rc_op;
10405             }
10406           else
10407             {
10408               as_bad (_("duplicated `%s'"), imm_start);
10409               return 0;
10410             }
10411           pstr += RC_NamesTable[j].len;
10412           match_found = 1;
10413           break;
10414         }
10415     }
10416   if (!match_found)
10417     return 0;
10418
10419   if (*pstr++ != '}')
10420     {
10421       as_bad (_("Missing '}': '%s'"), imm_start);
10422       return 0;
10423     }
10424   /* RC/SAE immediate string should contain nothing more.  */;
10425   if (*pstr != 0)
10426     {
10427       as_bad (_("Junk after '}': '%s'"), imm_start);
10428       return 0;
10429     }
10430
10431   exp = &im_expressions[i.imm_operands++];
10432   i.op[this_operand].imms = exp;
10433
10434   exp->X_op = O_constant;
10435   exp->X_add_number = 0;
10436   exp->X_add_symbol = (symbolS *) 0;
10437   exp->X_op_symbol = (symbolS *) 0;
10438
10439   i.types[this_operand].bitfield.imm8 = 1;
10440   return 1;
10441 }
10442
10443 /* Only string instructions can have a second memory operand, so
10444    reduce current_templates to just those if it contains any.  */
10445 static int
10446 maybe_adjust_templates (void)
10447 {
10448   const insn_template *t;
10449
10450   gas_assert (i.mem_operands == 1);
10451
10452   for (t = current_templates->start; t < current_templates->end; ++t)
10453     if (t->opcode_modifier.isstring)
10454       break;
10455
10456   if (t < current_templates->end)
10457     {
10458       static templates aux_templates;
10459       bfd_boolean recheck;
10460
10461       aux_templates.start = t;
10462       for (; t < current_templates->end; ++t)
10463         if (!t->opcode_modifier.isstring)
10464           break;
10465       aux_templates.end = t;
10466
10467       /* Determine whether to re-check the first memory operand.  */
10468       recheck = (aux_templates.start != current_templates->start
10469                  || t != current_templates->end);
10470
10471       current_templates = &aux_templates;
10472
10473       if (recheck)
10474         {
10475           i.mem_operands = 0;
10476           if (i.memop1_string != NULL
10477               && i386_index_check (i.memop1_string) == 0)
10478             return 0;
10479           i.mem_operands = 1;
10480         }
10481     }
10482
10483   return 1;
10484 }
10485
10486 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
10487    on error.  */
10488
10489 static int
10490 i386_att_operand (char *operand_string)
10491 {
10492   const reg_entry *r;
10493   char *end_op;
10494   char *op_string = operand_string;
10495
10496   if (is_space_char (*op_string))
10497     ++op_string;
10498
10499   /* We check for an absolute prefix (differentiating,
10500      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
10501   if (*op_string == ABSOLUTE_PREFIX)
10502     {
10503       ++op_string;
10504       if (is_space_char (*op_string))
10505         ++op_string;
10506       i.jumpabsolute = TRUE;
10507     }
10508
10509   /* Check if operand is a register.  */
10510   if ((r = parse_register (op_string, &end_op)) != NULL)
10511     {
10512       i386_operand_type temp;
10513
10514       /* Check for a segment override by searching for ':' after a
10515          segment register.  */
10516       op_string = end_op;
10517       if (is_space_char (*op_string))
10518         ++op_string;
10519       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10520         {
10521           switch (r->reg_num)
10522             {
10523             case 0:
10524               i.seg[i.mem_operands] = &es;
10525               break;
10526             case 1:
10527               i.seg[i.mem_operands] = &cs;
10528               break;
10529             case 2:
10530               i.seg[i.mem_operands] = &ss;
10531               break;
10532             case 3:
10533               i.seg[i.mem_operands] = &ds;
10534               break;
10535             case 4:
10536               i.seg[i.mem_operands] = &fs;
10537               break;
10538             case 5:
10539               i.seg[i.mem_operands] = &gs;
10540               break;
10541             }
10542
10543           /* Skip the ':' and whitespace.  */
10544           ++op_string;
10545           if (is_space_char (*op_string))
10546             ++op_string;
10547
10548           if (!is_digit_char (*op_string)
10549               && !is_identifier_char (*op_string)
10550               && *op_string != '('
10551               && *op_string != ABSOLUTE_PREFIX)
10552             {
10553               as_bad (_("bad memory operand `%s'"), op_string);
10554               return 0;
10555             }
10556           /* Handle case of %es:*foo.  */
10557           if (*op_string == ABSOLUTE_PREFIX)
10558             {
10559               ++op_string;
10560               if (is_space_char (*op_string))
10561                 ++op_string;
10562               i.jumpabsolute = TRUE;
10563             }
10564           goto do_memory_reference;
10565         }
10566
10567       /* Handle vector operations.  */
10568       if (*op_string == '{')
10569         {
10570           op_string = check_VecOperations (op_string, NULL);
10571           if (op_string == NULL)
10572             return 0;
10573         }
10574
10575       if (*op_string)
10576         {
10577           as_bad (_("junk `%s' after register"), op_string);
10578           return 0;
10579         }
10580       temp = r->reg_type;
10581       temp.bitfield.baseindex = 0;
10582       i.types[this_operand] = operand_type_or (i.types[this_operand],
10583                                                temp);
10584       i.types[this_operand].bitfield.unspecified = 0;
10585       i.op[this_operand].regs = r;
10586       i.reg_operands++;
10587     }
10588   else if (*op_string == REGISTER_PREFIX)
10589     {
10590       as_bad (_("bad register name `%s'"), op_string);
10591       return 0;
10592     }
10593   else if (*op_string == IMMEDIATE_PREFIX)
10594     {
10595       ++op_string;
10596       if (i.jumpabsolute)
10597         {
10598           as_bad (_("immediate operand illegal with absolute jump"));
10599           return 0;
10600         }
10601       if (!i386_immediate (op_string))
10602         return 0;
10603     }
10604   else if (RC_SAE_immediate (operand_string))
10605     {
10606       /* If it is a RC or SAE immediate, do nothing.  */
10607       ;
10608     }
10609   else if (is_digit_char (*op_string)
10610            || is_identifier_char (*op_string)
10611            || *op_string == '"'
10612            || *op_string == '(')
10613     {
10614       /* This is a memory reference of some sort.  */
10615       char *base_string;
10616
10617       /* Start and end of displacement string expression (if found).  */
10618       char *displacement_string_start;
10619       char *displacement_string_end;
10620       char *vop_start;
10621
10622     do_memory_reference:
10623       if (i.mem_operands == 1 && !maybe_adjust_templates ())
10624         return 0;
10625       if ((i.mem_operands == 1
10626            && !current_templates->start->opcode_modifier.isstring)
10627           || i.mem_operands == 2)
10628         {
10629           as_bad (_("too many memory references for `%s'"),
10630                   current_templates->start->name);
10631           return 0;
10632         }
10633
10634       /* Check for base index form.  We detect the base index form by
10635          looking for an ')' at the end of the operand, searching
10636          for the '(' matching it, and finding a REGISTER_PREFIX or ','
10637          after the '('.  */
10638       base_string = op_string + strlen (op_string);
10639
10640       /* Handle vector operations.  */
10641       vop_start = strchr (op_string, '{');
10642       if (vop_start && vop_start < base_string)
10643         {
10644           if (check_VecOperations (vop_start, base_string) == NULL)
10645             return 0;
10646           base_string = vop_start;
10647         }
10648
10649       --base_string;
10650       if (is_space_char (*base_string))
10651         --base_string;
10652
10653       /* If we only have a displacement, set-up for it to be parsed later.  */
10654       displacement_string_start = op_string;
10655       displacement_string_end = base_string + 1;
10656
10657       if (*base_string == ')')
10658         {
10659           char *temp_string;
10660           unsigned int parens_balanced = 1;
10661           /* We've already checked that the number of left & right ()'s are
10662              equal, so this loop will not be infinite.  */
10663           do
10664             {
10665               base_string--;
10666               if (*base_string == ')')
10667                 parens_balanced++;
10668               if (*base_string == '(')
10669                 parens_balanced--;
10670             }
10671           while (parens_balanced);
10672
10673           temp_string = base_string;
10674
10675           /* Skip past '(' and whitespace.  */
10676           ++base_string;
10677           if (is_space_char (*base_string))
10678             ++base_string;
10679
10680           if (*base_string == ','
10681               || ((i.base_reg = parse_register (base_string, &end_op))
10682                   != NULL))
10683             {
10684               displacement_string_end = temp_string;
10685
10686               i.types[this_operand].bitfield.baseindex = 1;
10687
10688               if (i.base_reg)
10689                 {
10690                   base_string = end_op;
10691                   if (is_space_char (*base_string))
10692                     ++base_string;
10693                 }
10694
10695               /* There may be an index reg or scale factor here.  */
10696               if (*base_string == ',')
10697                 {
10698                   ++base_string;
10699                   if (is_space_char (*base_string))
10700                     ++base_string;
10701
10702                   if ((i.index_reg = parse_register (base_string, &end_op))
10703                       != NULL)
10704                     {
10705                       base_string = end_op;
10706                       if (is_space_char (*base_string))
10707                         ++base_string;
10708                       if (*base_string == ',')
10709                         {
10710                           ++base_string;
10711                           if (is_space_char (*base_string))
10712                             ++base_string;
10713                         }
10714                       else if (*base_string != ')')
10715                         {
10716                           as_bad (_("expecting `,' or `)' "
10717                                     "after index register in `%s'"),
10718                                   operand_string);
10719                           return 0;
10720                         }
10721                     }
10722                   else if (*base_string == REGISTER_PREFIX)
10723                     {
10724                       end_op = strchr (base_string, ',');
10725                       if (end_op)
10726                         *end_op = '\0';
10727                       as_bad (_("bad register name `%s'"), base_string);
10728                       return 0;
10729                     }
10730
10731                   /* Check for scale factor.  */
10732                   if (*base_string != ')')
10733                     {
10734                       char *end_scale = i386_scale (base_string);
10735
10736                       if (!end_scale)
10737                         return 0;
10738
10739                       base_string = end_scale;
10740                       if (is_space_char (*base_string))
10741                         ++base_string;
10742                       if (*base_string != ')')
10743                         {
10744                           as_bad (_("expecting `)' "
10745                                     "after scale factor in `%s'"),
10746                                   operand_string);
10747                           return 0;
10748                         }
10749                     }
10750                   else if (!i.index_reg)
10751                     {
10752                       as_bad (_("expecting index register or scale factor "
10753                                 "after `,'; got '%c'"),
10754                               *base_string);
10755                       return 0;
10756                     }
10757                 }
10758               else if (*base_string != ')')
10759                 {
10760                   as_bad (_("expecting `,' or `)' "
10761                             "after base register in `%s'"),
10762                           operand_string);
10763                   return 0;
10764                 }
10765             }
10766           else if (*base_string == REGISTER_PREFIX)
10767             {
10768               end_op = strchr (base_string, ',');
10769               if (end_op)
10770                 *end_op = '\0';
10771               as_bad (_("bad register name `%s'"), base_string);
10772               return 0;
10773             }
10774         }
10775
10776       /* If there's an expression beginning the operand, parse it,
10777          assuming displacement_string_start and
10778          displacement_string_end are meaningful.  */
10779       if (displacement_string_start != displacement_string_end)
10780         {
10781           if (!i386_displacement (displacement_string_start,
10782                                   displacement_string_end))
10783             return 0;
10784         }
10785
10786       /* Special case for (%dx) while doing input/output op.  */
10787       if (i.base_reg
10788           && i.base_reg->reg_type.bitfield.instance == RegD
10789           && i.base_reg->reg_type.bitfield.word
10790           && i.index_reg == 0
10791           && i.log2_scale_factor == 0
10792           && i.seg[i.mem_operands] == 0
10793           && !operand_type_check (i.types[this_operand], disp))
10794         {
10795           i.types[this_operand] = i.base_reg->reg_type;
10796           return 1;
10797         }
10798
10799       if (i386_index_check (operand_string) == 0)
10800         return 0;
10801       i.flags[this_operand] |= Operand_Mem;
10802       if (i.mem_operands == 0)
10803         i.memop1_string = xstrdup (operand_string);
10804       i.mem_operands++;
10805     }
10806   else
10807     {
10808       /* It's not a memory operand; argh!  */
10809       as_bad (_("invalid char %s beginning operand %d `%s'"),
10810               output_invalid (*op_string),
10811               this_operand + 1,
10812               op_string);
10813       return 0;
10814     }
10815   return 1;                     /* Normal return.  */
10816 }
10817 \f
10818 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10819    that an rs_machine_dependent frag may reach.  */
10820
10821 unsigned int
10822 i386_frag_max_var (fragS *frag)
10823 {
10824   /* The only relaxable frags are for jumps.
10825      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
10826   gas_assert (frag->fr_type == rs_machine_dependent);
10827   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10828 }
10829
10830 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10831 static int
10832 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10833 {
10834   /* STT_GNU_IFUNC symbol must go through PLT.  */
10835   if ((symbol_get_bfdsym (fr_symbol)->flags
10836        & BSF_GNU_INDIRECT_FUNCTION) != 0)
10837     return 0;
10838
10839   if (!S_IS_EXTERNAL (fr_symbol))
10840     /* Symbol may be weak or local.  */
10841     return !S_IS_WEAK (fr_symbol);
10842
10843   /* Global symbols with non-default visibility can't be preempted. */
10844   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10845     return 1;
10846
10847   if (fr_var != NO_RELOC)
10848     switch ((enum bfd_reloc_code_real) fr_var)
10849       {
10850       case BFD_RELOC_386_PLT32:
10851       case BFD_RELOC_X86_64_PLT32:
10852         /* Symbol with PLT relocation may be preempted. */
10853         return 0;
10854       default:
10855         abort ();
10856       }
10857
10858   /* Global symbols with default visibility in a shared library may be
10859      preempted by another definition.  */
10860   return !shared;
10861 }
10862 #endif
10863
10864 /* Return the next non-empty frag.  */
10865
10866 static fragS *
10867 i386_next_non_empty_frag (fragS *fragP)
10868 {
10869   /* There may be a frag with a ".fill 0" when there is no room in
10870      the current frag for frag_grow in output_insn.  */
10871   for (fragP = fragP->fr_next;
10872        (fragP != NULL
10873         && fragP->fr_type == rs_fill
10874         && fragP->fr_fix == 0);
10875        fragP = fragP->fr_next)
10876     ;
10877   return fragP;
10878 }
10879
10880 /* Return the next jcc frag after BRANCH_PADDING.  */
10881
10882 static fragS *
10883 i386_next_jcc_frag (fragS *fragP)
10884 {
10885   if (!fragP)
10886     return NULL;
10887
10888   if (fragP->fr_type == rs_machine_dependent
10889       && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10890           == BRANCH_PADDING))
10891     {
10892       fragP = i386_next_non_empty_frag (fragP);
10893       if (fragP->fr_type != rs_machine_dependent)
10894         return NULL;
10895       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10896         return fragP;
10897     }
10898
10899   return NULL;
10900 }
10901
10902 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
10903
10904 static void
10905 i386_classify_machine_dependent_frag (fragS *fragP)
10906 {
10907   fragS *cmp_fragP;
10908   fragS *pad_fragP;
10909   fragS *branch_fragP;
10910   fragS *next_fragP;
10911   unsigned int max_prefix_length;
10912
10913   if (fragP->tc_frag_data.classified)
10914     return;
10915
10916   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
10917      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
10918   for (next_fragP = fragP;
10919        next_fragP != NULL;
10920        next_fragP = next_fragP->fr_next)
10921     {
10922       next_fragP->tc_frag_data.classified = 1;
10923       if (next_fragP->fr_type == rs_machine_dependent)
10924         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10925           {
10926           case BRANCH_PADDING:
10927             /* The BRANCH_PADDING frag must be followed by a branch
10928                frag.  */
10929             branch_fragP = i386_next_non_empty_frag (next_fragP);
10930             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10931             break;
10932           case FUSED_JCC_PADDING:
10933             /* Check if this is a fused jcc:
10934                FUSED_JCC_PADDING
10935                CMP like instruction
10936                BRANCH_PADDING
10937                COND_JUMP
10938                */
10939             cmp_fragP = i386_next_non_empty_frag (next_fragP);
10940             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10941             branch_fragP = i386_next_jcc_frag (pad_fragP);
10942             if (branch_fragP)
10943               {
10944                 /* The BRANCH_PADDING frag is merged with the
10945                    FUSED_JCC_PADDING frag.  */
10946                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10947                 /* CMP like instruction size.  */
10948                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10949                 frag_wane (pad_fragP);
10950                 /* Skip to branch_fragP.  */
10951                 next_fragP = branch_fragP;
10952               }
10953             else if (next_fragP->tc_frag_data.max_prefix_length)
10954               {
10955                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10956                    a fused jcc.  */
10957                 next_fragP->fr_subtype
10958                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10959                 next_fragP->tc_frag_data.max_bytes
10960                   = next_fragP->tc_frag_data.max_prefix_length;
10961                 /* This will be updated in the BRANCH_PREFIX scan.  */
10962                 next_fragP->tc_frag_data.max_prefix_length = 0;
10963               }
10964             else
10965               frag_wane (next_fragP);
10966             break;
10967           }
10968     }
10969
10970   /* Stop if there is no BRANCH_PREFIX.  */
10971   if (!align_branch_prefix_size)
10972     return;
10973
10974   /* Scan for BRANCH_PREFIX.  */
10975   for (; fragP != NULL; fragP = fragP->fr_next)
10976     {
10977       if (fragP->fr_type != rs_machine_dependent
10978           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10979               != BRANCH_PREFIX))
10980         continue;
10981
10982       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
10983          COND_JUMP_PREFIX.  */
10984       max_prefix_length = 0;
10985       for (next_fragP = fragP;
10986            next_fragP != NULL;
10987            next_fragP = next_fragP->fr_next)
10988         {
10989           if (next_fragP->fr_type == rs_fill)
10990             /* Skip rs_fill frags.  */
10991             continue;
10992           else if (next_fragP->fr_type != rs_machine_dependent)
10993             /* Stop for all other frags.  */
10994             break;
10995
10996           /* rs_machine_dependent frags.  */
10997           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10998               == BRANCH_PREFIX)
10999             {
11000               /* Count BRANCH_PREFIX frags.  */
11001               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11002                 {
11003                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11004                   frag_wane (next_fragP);
11005                 }
11006               else
11007                 max_prefix_length
11008                   += next_fragP->tc_frag_data.max_bytes;
11009             }
11010           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11011                     == BRANCH_PADDING)
11012                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11013                        == FUSED_JCC_PADDING))
11014             {
11015               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11016               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11017               break;
11018             }
11019           else
11020             /* Stop for other rs_machine_dependent frags.  */
11021             break;
11022         }
11023
11024       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11025
11026       /* Skip to the next frag.  */
11027       fragP = next_fragP;
11028     }
11029 }
11030
11031 /* Compute padding size for
11032
11033         FUSED_JCC_PADDING
11034         CMP like instruction
11035         BRANCH_PADDING
11036         COND_JUMP/UNCOND_JUMP
11037
11038    or
11039
11040         BRANCH_PADDING
11041         COND_JUMP/UNCOND_JUMP
11042  */
11043
11044 static int
11045 i386_branch_padding_size (fragS *fragP, offsetT address)
11046 {
11047   unsigned int offset, size, padding_size;
11048   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11049
11050   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11051   if (!address)
11052     address = fragP->fr_address;
11053   address += fragP->fr_fix;
11054
11055   /* CMP like instrunction size.  */
11056   size = fragP->tc_frag_data.cmp_size;
11057
11058   /* The base size of the branch frag.  */
11059   size += branch_fragP->fr_fix;
11060
11061   /* Add opcode and displacement bytes for the rs_machine_dependent
11062      branch frag.  */
11063   if (branch_fragP->fr_type == rs_machine_dependent)
11064     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11065
11066   /* Check if branch is within boundary and doesn't end at the last
11067      byte.  */
11068   offset = address & ((1U << align_branch_power) - 1);
11069   if ((offset + size) >= (1U << align_branch_power))
11070     /* Padding needed to avoid crossing boundary.  */
11071     padding_size = (1U << align_branch_power) - offset;
11072   else
11073     /* No padding needed.  */
11074     padding_size = 0;
11075
11076   /* The return value may be saved in tc_frag_data.length which is
11077      unsigned byte.  */
11078   if (!fits_in_unsigned_byte (padding_size))
11079     abort ();
11080
11081   return padding_size;
11082 }
11083
11084 /* i386_generic_table_relax_frag()
11085
11086    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11087    grow/shrink padding to align branch frags.  Hand others to
11088    relax_frag().  */
11089
11090 long
11091 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11092 {
11093   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11094       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11095     {
11096       long padding_size = i386_branch_padding_size (fragP, 0);
11097       long grow = padding_size - fragP->tc_frag_data.length;
11098
11099       /* When the BRANCH_PREFIX frag is used, the computed address
11100          must match the actual address and there should be no padding.  */
11101       if (fragP->tc_frag_data.padding_address
11102           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11103               || padding_size))
11104         abort ();
11105
11106       /* Update the padding size.  */
11107       if (grow)
11108         fragP->tc_frag_data.length = padding_size;
11109
11110       return grow;
11111     }
11112   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11113     {
11114       fragS *padding_fragP, *next_fragP;
11115       long padding_size, left_size, last_size;
11116
11117       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11118       if (!padding_fragP)
11119         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11120         return (fragP->tc_frag_data.length
11121                 - fragP->tc_frag_data.last_length);
11122
11123       /* Compute the relative address of the padding frag in the very
11124         first time where the BRANCH_PREFIX frag sizes are zero.  */
11125       if (!fragP->tc_frag_data.padding_address)
11126         fragP->tc_frag_data.padding_address
11127           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11128
11129       /* First update the last length from the previous interation.  */
11130       left_size = fragP->tc_frag_data.prefix_length;
11131       for (next_fragP = fragP;
11132            next_fragP != padding_fragP;
11133            next_fragP = next_fragP->fr_next)
11134         if (next_fragP->fr_type == rs_machine_dependent
11135             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11136                 == BRANCH_PREFIX))
11137           {
11138             if (left_size)
11139               {
11140                 int max = next_fragP->tc_frag_data.max_bytes;
11141                 if (max)
11142                   {
11143                     int size;
11144                     if (max > left_size)
11145                       size = left_size;
11146                     else
11147                       size = max;
11148                     left_size -= size;
11149                     next_fragP->tc_frag_data.last_length = size;
11150                   }
11151               }
11152             else
11153               next_fragP->tc_frag_data.last_length = 0;
11154           }
11155
11156       /* Check the padding size for the padding frag.  */
11157       padding_size = i386_branch_padding_size
11158         (padding_fragP, (fragP->fr_address
11159                          + fragP->tc_frag_data.padding_address));
11160
11161       last_size = fragP->tc_frag_data.prefix_length;
11162       /* Check if there is change from the last interation.  */
11163       if (padding_size == last_size)
11164         {
11165           /* Update the expected address of the padding frag.  */
11166           padding_fragP->tc_frag_data.padding_address
11167             = (fragP->fr_address + padding_size
11168                + fragP->tc_frag_data.padding_address);
11169           return 0;
11170         }
11171
11172       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11173         {
11174           /* No padding if there is no sufficient room.  Clear the
11175              expected address of the padding frag.  */
11176           padding_fragP->tc_frag_data.padding_address = 0;
11177           padding_size = 0;
11178         }
11179       else
11180         /* Store the expected address of the padding frag.  */
11181         padding_fragP->tc_frag_data.padding_address
11182           = (fragP->fr_address + padding_size
11183              + fragP->tc_frag_data.padding_address);
11184
11185       fragP->tc_frag_data.prefix_length = padding_size;
11186
11187       /* Update the length for the current interation.  */
11188       left_size = padding_size;
11189       for (next_fragP = fragP;
11190            next_fragP != padding_fragP;
11191            next_fragP = next_fragP->fr_next)
11192         if (next_fragP->fr_type == rs_machine_dependent
11193             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11194                 == BRANCH_PREFIX))
11195           {
11196             if (left_size)
11197               {
11198                 int max = next_fragP->tc_frag_data.max_bytes;
11199                 if (max)
11200                   {
11201                     int size;
11202                     if (max > left_size)
11203                       size = left_size;
11204                     else
11205                       size = max;
11206                     left_size -= size;
11207                     next_fragP->tc_frag_data.length = size;
11208                   }
11209               }
11210             else
11211               next_fragP->tc_frag_data.length = 0;
11212           }
11213
11214       return (fragP->tc_frag_data.length
11215               - fragP->tc_frag_data.last_length);
11216     }
11217   return relax_frag (segment, fragP, stretch);
11218 }
11219
11220 /* md_estimate_size_before_relax()
11221
11222    Called just before relax() for rs_machine_dependent frags.  The x86
11223    assembler uses these frags to handle variable size jump
11224    instructions.
11225
11226    Any symbol that is now undefined will not become defined.
11227    Return the correct fr_subtype in the frag.
11228    Return the initial "guess for variable size of frag" to caller.
11229    The guess is actually the growth beyond the fixed part.  Whatever
11230    we do to grow the fixed or variable part contributes to our
11231    returned value.  */
11232
11233 int
11234 md_estimate_size_before_relax (fragS *fragP, segT segment)
11235 {
11236   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11237       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11238       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11239     {
11240       i386_classify_machine_dependent_frag (fragP);
11241       return fragP->tc_frag_data.length;
11242     }
11243
11244   /* We've already got fragP->fr_subtype right;  all we have to do is
11245      check for un-relaxable symbols.  On an ELF system, we can't relax
11246      an externally visible symbol, because it may be overridden by a
11247      shared library.  */
11248   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11249 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11250       || (IS_ELF
11251           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11252                                                 fragP->fr_var))
11253 #endif
11254 #if defined (OBJ_COFF) && defined (TE_PE)
11255       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11256           && S_IS_WEAK (fragP->fr_symbol))
11257 #endif
11258       )
11259     {
11260       /* Symbol is undefined in this segment, or we need to keep a
11261          reloc so that weak symbols can be overridden.  */
11262       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11263       enum bfd_reloc_code_real reloc_type;
11264       unsigned char *opcode;
11265       int old_fr_fix;
11266
11267       if (fragP->fr_var != NO_RELOC)
11268         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11269       else if (size == 2)
11270         reloc_type = BFD_RELOC_16_PCREL;
11271 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11272       else if (need_plt32_p (fragP->fr_symbol))
11273         reloc_type = BFD_RELOC_X86_64_PLT32;
11274 #endif
11275       else
11276         reloc_type = BFD_RELOC_32_PCREL;
11277
11278       old_fr_fix = fragP->fr_fix;
11279       opcode = (unsigned char *) fragP->fr_opcode;
11280
11281       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11282         {
11283         case UNCOND_JUMP:
11284           /* Make jmp (0xeb) a (d)word displacement jump.  */
11285           opcode[0] = 0xe9;
11286           fragP->fr_fix += size;
11287           fix_new (fragP, old_fr_fix, size,
11288                    fragP->fr_symbol,
11289                    fragP->fr_offset, 1,
11290                    reloc_type);
11291           break;
11292
11293         case COND_JUMP86:
11294           if (size == 2
11295               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11296             {
11297               /* Negate the condition, and branch past an
11298                  unconditional jump.  */
11299               opcode[0] ^= 1;
11300               opcode[1] = 3;
11301               /* Insert an unconditional jump.  */
11302               opcode[2] = 0xe9;
11303               /* We added two extra opcode bytes, and have a two byte
11304                  offset.  */
11305               fragP->fr_fix += 2 + 2;
11306               fix_new (fragP, old_fr_fix + 2, 2,
11307                        fragP->fr_symbol,
11308                        fragP->fr_offset, 1,
11309                        reloc_type);
11310               break;
11311             }
11312           /* Fall through.  */
11313
11314         case COND_JUMP:
11315           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11316             {
11317               fixS *fixP;
11318
11319               fragP->fr_fix += 1;
11320               fixP = fix_new (fragP, old_fr_fix, 1,
11321                               fragP->fr_symbol,
11322                               fragP->fr_offset, 1,
11323                               BFD_RELOC_8_PCREL);
11324               fixP->fx_signed = 1;
11325               break;
11326             }
11327
11328           /* This changes the byte-displacement jump 0x7N
11329              to the (d)word-displacement jump 0x0f,0x8N.  */
11330           opcode[1] = opcode[0] + 0x10;
11331           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11332           /* We've added an opcode byte.  */
11333           fragP->fr_fix += 1 + size;
11334           fix_new (fragP, old_fr_fix + 1, size,
11335                    fragP->fr_symbol,
11336                    fragP->fr_offset, 1,
11337                    reloc_type);
11338           break;
11339
11340         default:
11341           BAD_CASE (fragP->fr_subtype);
11342           break;
11343         }
11344       frag_wane (fragP);
11345       return fragP->fr_fix - old_fr_fix;
11346     }
11347
11348   /* Guess size depending on current relax state.  Initially the relax
11349      state will correspond to a short jump and we return 1, because
11350      the variable part of the frag (the branch offset) is one byte
11351      long.  However, we can relax a section more than once and in that
11352      case we must either set fr_subtype back to the unrelaxed state,
11353      or return the value for the appropriate branch.  */
11354   return md_relax_table[fragP->fr_subtype].rlx_length;
11355 }
11356
11357 /* Called after relax() is finished.
11358
11359    In:  Address of frag.
11360         fr_type == rs_machine_dependent.
11361         fr_subtype is what the address relaxed to.
11362
11363    Out: Any fixSs and constants are set up.
11364         Caller will turn frag into a ".space 0".  */
11365
11366 void
11367 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11368                  fragS *fragP)
11369 {
11370   unsigned char *opcode;
11371   unsigned char *where_to_put_displacement = NULL;
11372   offsetT target_address;
11373   offsetT opcode_address;
11374   unsigned int extension = 0;
11375   offsetT displacement_from_opcode_start;
11376
11377   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11378       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11379       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11380     {
11381       /* Generate nop padding.  */
11382       unsigned int size = fragP->tc_frag_data.length;
11383       if (size)
11384         {
11385           if (size > fragP->tc_frag_data.max_bytes)
11386             abort ();
11387
11388           if (flag_debug)
11389             {
11390               const char *msg;
11391               const char *branch = "branch";
11392               const char *prefix = "";
11393               fragS *padding_fragP;
11394               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11395                   == BRANCH_PREFIX)
11396                 {
11397                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11398                   switch (fragP->tc_frag_data.default_prefix)
11399                     {
11400                     default:
11401                       abort ();
11402                       break;
11403                     case CS_PREFIX_OPCODE:
11404                       prefix = " cs";
11405                       break;
11406                     case DS_PREFIX_OPCODE:
11407                       prefix = " ds";
11408                       break;
11409                     case ES_PREFIX_OPCODE:
11410                       prefix = " es";
11411                       break;
11412                     case FS_PREFIX_OPCODE:
11413                       prefix = " fs";
11414                       break;
11415                     case GS_PREFIX_OPCODE:
11416                       prefix = " gs";
11417                       break;
11418                     case SS_PREFIX_OPCODE:
11419                       prefix = " ss";
11420                       break;
11421                     }
11422                   if (padding_fragP)
11423                     msg = _("%s:%u: add %d%s at 0x%llx to align "
11424                             "%s within %d-byte boundary\n");
11425                   else
11426                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
11427                             "align %s within %d-byte boundary\n");
11428                 }
11429               else
11430                 {
11431                   padding_fragP = fragP;
11432                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11433                           "%s within %d-byte boundary\n");
11434                 }
11435
11436               if (padding_fragP)
11437                 switch (padding_fragP->tc_frag_data.branch_type)
11438                   {
11439                   case align_branch_jcc:
11440                     branch = "jcc";
11441                     break;
11442                   case align_branch_fused:
11443                     branch = "fused jcc";
11444                     break;
11445                   case align_branch_jmp:
11446                     branch = "jmp";
11447                     break;
11448                   case align_branch_call:
11449                     branch = "call";
11450                     break;
11451                   case align_branch_indirect:
11452                     branch = "indiret branch";
11453                     break;
11454                   case align_branch_ret:
11455                     branch = "ret";
11456                     break;
11457                   default:
11458                     break;
11459                   }
11460
11461               fprintf (stdout, msg,
11462                        fragP->fr_file, fragP->fr_line, size, prefix,
11463                        (long long) fragP->fr_address, branch,
11464                        1 << align_branch_power);
11465             }
11466           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11467             memset (fragP->fr_opcode,
11468                     fragP->tc_frag_data.default_prefix, size);
11469           else
11470             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11471                                 size, 0);
11472           fragP->fr_fix += size;
11473         }
11474       return;
11475     }
11476
11477   opcode = (unsigned char *) fragP->fr_opcode;
11478
11479   /* Address we want to reach in file space.  */
11480   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11481
11482   /* Address opcode resides at in file space.  */
11483   opcode_address = fragP->fr_address + fragP->fr_fix;
11484
11485   /* Displacement from opcode start to fill into instruction.  */
11486   displacement_from_opcode_start = target_address - opcode_address;
11487
11488   if ((fragP->fr_subtype & BIG) == 0)
11489     {
11490       /* Don't have to change opcode.  */
11491       extension = 1;            /* 1 opcode + 1 displacement  */
11492       where_to_put_displacement = &opcode[1];
11493     }
11494   else
11495     {
11496       if (no_cond_jump_promotion
11497           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11498         as_warn_where (fragP->fr_file, fragP->fr_line,
11499                        _("long jump required"));
11500
11501       switch (fragP->fr_subtype)
11502         {
11503         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11504           extension = 4;                /* 1 opcode + 4 displacement  */
11505           opcode[0] = 0xe9;
11506           where_to_put_displacement = &opcode[1];
11507           break;
11508
11509         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11510           extension = 2;                /* 1 opcode + 2 displacement  */
11511           opcode[0] = 0xe9;
11512           where_to_put_displacement = &opcode[1];
11513           break;
11514
11515         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11516         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11517           extension = 5;                /* 2 opcode + 4 displacement  */
11518           opcode[1] = opcode[0] + 0x10;
11519           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11520           where_to_put_displacement = &opcode[2];
11521           break;
11522
11523         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11524           extension = 3;                /* 2 opcode + 2 displacement  */
11525           opcode[1] = opcode[0] + 0x10;
11526           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11527           where_to_put_displacement = &opcode[2];
11528           break;
11529
11530         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11531           extension = 4;
11532           opcode[0] ^= 1;
11533           opcode[1] = 3;
11534           opcode[2] = 0xe9;
11535           where_to_put_displacement = &opcode[3];
11536           break;
11537
11538         default:
11539           BAD_CASE (fragP->fr_subtype);
11540           break;
11541         }
11542     }
11543
11544   /* If size if less then four we are sure that the operand fits,
11545      but if it's 4, then it could be that the displacement is larger
11546      then -/+ 2GB.  */
11547   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11548       && object_64bit
11549       && ((addressT) (displacement_from_opcode_start - extension
11550                       + ((addressT) 1 << 31))
11551           > (((addressT) 2 << 31) - 1)))
11552     {
11553       as_bad_where (fragP->fr_file, fragP->fr_line,
11554                     _("jump target out of range"));
11555       /* Make us emit 0.  */
11556       displacement_from_opcode_start = extension;
11557     }
11558   /* Now put displacement after opcode.  */
11559   md_number_to_chars ((char *) where_to_put_displacement,
11560                       (valueT) (displacement_from_opcode_start - extension),
11561                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11562   fragP->fr_fix += extension;
11563 }
11564 \f
11565 /* Apply a fixup (fixP) to segment data, once it has been determined
11566    by our caller that we have all the info we need to fix it up.
11567
11568    Parameter valP is the pointer to the value of the bits.
11569
11570    On the 386, immediates, displacements, and data pointers are all in
11571    the same (little-endian) format, so we don't need to care about which
11572    we are handling.  */
11573
11574 void
11575 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11576 {
11577   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11578   valueT value = *valP;
11579
11580 #if !defined (TE_Mach)
11581   if (fixP->fx_pcrel)
11582     {
11583       switch (fixP->fx_r_type)
11584         {
11585         default:
11586           break;
11587
11588         case BFD_RELOC_64:
11589           fixP->fx_r_type = BFD_RELOC_64_PCREL;
11590           break;
11591         case BFD_RELOC_32:
11592         case BFD_RELOC_X86_64_32S:
11593           fixP->fx_r_type = BFD_RELOC_32_PCREL;
11594           break;
11595         case BFD_RELOC_16:
11596           fixP->fx_r_type = BFD_RELOC_16_PCREL;
11597           break;
11598         case BFD_RELOC_8:
11599           fixP->fx_r_type = BFD_RELOC_8_PCREL;
11600           break;
11601         }
11602     }
11603
11604   if (fixP->fx_addsy != NULL
11605       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11606           || fixP->fx_r_type == BFD_RELOC_64_PCREL
11607           || fixP->fx_r_type == BFD_RELOC_16_PCREL
11608           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11609       && !use_rela_relocations)
11610     {
11611       /* This is a hack.  There should be a better way to handle this.
11612          This covers for the fact that bfd_install_relocation will
11613          subtract the current location (for partial_inplace, PC relative
11614          relocations); see more below.  */
11615 #ifndef OBJ_AOUT
11616       if (IS_ELF
11617 #ifdef TE_PE
11618           || OUTPUT_FLAVOR == bfd_target_coff_flavour
11619 #endif
11620           )
11621         value += fixP->fx_where + fixP->fx_frag->fr_address;
11622 #endif
11623 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11624       if (IS_ELF)
11625         {
11626           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11627
11628           if ((sym_seg == seg
11629                || (symbol_section_p (fixP->fx_addsy)
11630                    && sym_seg != absolute_section))
11631               && !generic_force_reloc (fixP))
11632             {
11633               /* Yes, we add the values in twice.  This is because
11634                  bfd_install_relocation subtracts them out again.  I think
11635                  bfd_install_relocation is broken, but I don't dare change
11636                  it.  FIXME.  */
11637               value += fixP->fx_where + fixP->fx_frag->fr_address;
11638             }
11639         }
11640 #endif
11641 #if defined (OBJ_COFF) && defined (TE_PE)
11642       /* For some reason, the PE format does not store a
11643          section address offset for a PC relative symbol.  */
11644       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11645           || S_IS_WEAK (fixP->fx_addsy))
11646         value += md_pcrel_from (fixP);
11647 #endif
11648     }
11649 #if defined (OBJ_COFF) && defined (TE_PE)
11650   if (fixP->fx_addsy != NULL
11651       && S_IS_WEAK (fixP->fx_addsy)
11652       /* PR 16858: Do not modify weak function references.  */
11653       && ! fixP->fx_pcrel)
11654     {
11655 #if !defined (TE_PEP)
11656       /* For x86 PE weak function symbols are neither PC-relative
11657          nor do they set S_IS_FUNCTION.  So the only reliable way
11658          to detect them is to check the flags of their containing
11659          section.  */
11660       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11661           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11662         ;
11663       else
11664 #endif
11665       value -= S_GET_VALUE (fixP->fx_addsy);
11666     }
11667 #endif
11668
11669   /* Fix a few things - the dynamic linker expects certain values here,
11670      and we must not disappoint it.  */
11671 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11672   if (IS_ELF && fixP->fx_addsy)
11673     switch (fixP->fx_r_type)
11674       {
11675       case BFD_RELOC_386_PLT32:
11676       case BFD_RELOC_X86_64_PLT32:
11677         /* Make the jump instruction point to the address of the operand.
11678            At runtime we merely add the offset to the actual PLT entry.
11679            NB: Subtract the offset size only for jump instructions.  */
11680         if (fixP->fx_pcrel)
11681           value = -4;
11682         break;
11683
11684       case BFD_RELOC_386_TLS_GD:
11685       case BFD_RELOC_386_TLS_LDM:
11686       case BFD_RELOC_386_TLS_IE_32:
11687       case BFD_RELOC_386_TLS_IE:
11688       case BFD_RELOC_386_TLS_GOTIE:
11689       case BFD_RELOC_386_TLS_GOTDESC:
11690       case BFD_RELOC_X86_64_TLSGD:
11691       case BFD_RELOC_X86_64_TLSLD:
11692       case BFD_RELOC_X86_64_GOTTPOFF:
11693       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11694         value = 0; /* Fully resolved at runtime.  No addend.  */
11695         /* Fallthrough */
11696       case BFD_RELOC_386_TLS_LE:
11697       case BFD_RELOC_386_TLS_LDO_32:
11698       case BFD_RELOC_386_TLS_LE_32:
11699       case BFD_RELOC_X86_64_DTPOFF32:
11700       case BFD_RELOC_X86_64_DTPOFF64:
11701       case BFD_RELOC_X86_64_TPOFF32:
11702       case BFD_RELOC_X86_64_TPOFF64:
11703         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11704         break;
11705
11706       case BFD_RELOC_386_TLS_DESC_CALL:
11707       case BFD_RELOC_X86_64_TLSDESC_CALL:
11708         value = 0; /* Fully resolved at runtime.  No addend.  */
11709         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11710         fixP->fx_done = 0;
11711         return;
11712
11713       case BFD_RELOC_VTABLE_INHERIT:
11714       case BFD_RELOC_VTABLE_ENTRY:
11715         fixP->fx_done = 0;
11716         return;
11717
11718       default:
11719         break;
11720       }
11721 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
11722   *valP = value;
11723 #endif /* !defined (TE_Mach)  */
11724
11725   /* Are we finished with this relocation now?  */
11726   if (fixP->fx_addsy == NULL)
11727     fixP->fx_done = 1;
11728 #if defined (OBJ_COFF) && defined (TE_PE)
11729   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11730     {
11731       fixP->fx_done = 0;
11732       /* Remember value for tc_gen_reloc.  */
11733       fixP->fx_addnumber = value;
11734       /* Clear out the frag for now.  */
11735       value = 0;
11736     }
11737 #endif
11738   else if (use_rela_relocations)
11739     {
11740       fixP->fx_no_overflow = 1;
11741       /* Remember value for tc_gen_reloc.  */
11742       fixP->fx_addnumber = value;
11743       value = 0;
11744     }
11745
11746   md_number_to_chars (p, value, fixP->fx_size);
11747 }
11748 \f
11749 const char *
11750 md_atof (int type, char *litP, int *sizeP)
11751 {
11752   /* This outputs the LITTLENUMs in REVERSE order;
11753      in accord with the bigendian 386.  */
11754   return ieee_md_atof (type, litP, sizeP, FALSE);
11755 }
11756 \f
11757 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11758
11759 static char *
11760 output_invalid (int c)
11761 {
11762   if (ISPRINT (c))
11763     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11764               "'%c'", c);
11765   else
11766     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11767               "(0x%x)", (unsigned char) c);
11768   return output_invalid_buf;
11769 }
11770
11771 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11772
11773 static const reg_entry *
11774 parse_real_register (char *reg_string, char **end_op)
11775 {
11776   char *s = reg_string;
11777   char *p;
11778   char reg_name_given[MAX_REG_NAME_SIZE + 1];
11779   const reg_entry *r;
11780
11781   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
11782   if (*s == REGISTER_PREFIX)
11783     ++s;
11784
11785   if (is_space_char (*s))
11786     ++s;
11787
11788   p = reg_name_given;
11789   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11790     {
11791       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11792         return (const reg_entry *) NULL;
11793       s++;
11794     }
11795
11796   /* For naked regs, make sure that we are not dealing with an identifier.
11797      This prevents confusing an identifier like `eax_var' with register
11798      `eax'.  */
11799   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11800     return (const reg_entry *) NULL;
11801
11802   *end_op = s;
11803
11804   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11805
11806   /* Handle floating point regs, allowing spaces in the (i) part.  */
11807   if (r == i386_regtab /* %st is first entry of table  */)
11808     {
11809       if (!cpu_arch_flags.bitfield.cpu8087
11810           && !cpu_arch_flags.bitfield.cpu287
11811           && !cpu_arch_flags.bitfield.cpu387)
11812         return (const reg_entry *) NULL;
11813
11814       if (is_space_char (*s))
11815         ++s;
11816       if (*s == '(')
11817         {
11818           ++s;
11819           if (is_space_char (*s))
11820             ++s;
11821           if (*s >= '0' && *s <= '7')
11822             {
11823               int fpr = *s - '0';
11824               ++s;
11825               if (is_space_char (*s))
11826                 ++s;
11827               if (*s == ')')
11828                 {
11829                   *end_op = s + 1;
11830                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11831                   know (r);
11832                   return r + fpr;
11833                 }
11834             }
11835           /* We have "%st(" then garbage.  */
11836           return (const reg_entry *) NULL;
11837         }
11838     }
11839
11840   if (r == NULL || allow_pseudo_reg)
11841     return r;
11842
11843   if (operand_type_all_zero (&r->reg_type))
11844     return (const reg_entry *) NULL;
11845
11846   if ((r->reg_type.bitfield.dword
11847        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11848        || r->reg_type.bitfield.class == RegCR
11849        || r->reg_type.bitfield.class == RegDR
11850        || r->reg_type.bitfield.class == RegTR)
11851       && !cpu_arch_flags.bitfield.cpui386)
11852     return (const reg_entry *) NULL;
11853
11854   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11855     return (const reg_entry *) NULL;
11856
11857   if (!cpu_arch_flags.bitfield.cpuavx512f)
11858     {
11859       if (r->reg_type.bitfield.zmmword
11860           || r->reg_type.bitfield.class == RegMask)
11861         return (const reg_entry *) NULL;
11862
11863       if (!cpu_arch_flags.bitfield.cpuavx)
11864         {
11865           if (r->reg_type.bitfield.ymmword)
11866             return (const reg_entry *) NULL;
11867
11868           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11869             return (const reg_entry *) NULL;
11870         }
11871     }
11872
11873   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11874     return (const reg_entry *) NULL;
11875
11876   /* Don't allow fake index register unless allow_index_reg isn't 0. */
11877   if (!allow_index_reg && r->reg_num == RegIZ)
11878     return (const reg_entry *) NULL;
11879
11880   /* Upper 16 vector registers are only available with VREX in 64bit
11881      mode, and require EVEX encoding.  */
11882   if (r->reg_flags & RegVRex)
11883     {
11884       if (!cpu_arch_flags.bitfield.cpuavx512f
11885           || flag_code != CODE_64BIT)
11886         return (const reg_entry *) NULL;
11887
11888       i.vec_encoding = vex_encoding_evex;
11889     }
11890
11891   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11892       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11893       && flag_code != CODE_64BIT)
11894     return (const reg_entry *) NULL;
11895
11896   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11897       && !intel_syntax)
11898     return (const reg_entry *) NULL;
11899
11900   return r;
11901 }
11902
11903 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11904
11905 static const reg_entry *
11906 parse_register (char *reg_string, char **end_op)
11907 {
11908   const reg_entry *r;
11909
11910   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11911     r = parse_real_register (reg_string, end_op);
11912   else
11913     r = NULL;
11914   if (!r)
11915     {
11916       char *save = input_line_pointer;
11917       char c;
11918       symbolS *symbolP;
11919
11920       input_line_pointer = reg_string;
11921       c = get_symbol_name (&reg_string);
11922       symbolP = symbol_find (reg_string);
11923       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11924         {
11925           const expressionS *e = symbol_get_value_expression (symbolP);
11926
11927           know (e->X_op == O_register);
11928           know (e->X_add_number >= 0
11929                 && (valueT) e->X_add_number < i386_regtab_size);
11930           r = i386_regtab + e->X_add_number;
11931           if ((r->reg_flags & RegVRex))
11932             i.vec_encoding = vex_encoding_evex;
11933           *end_op = input_line_pointer;
11934         }
11935       *input_line_pointer = c;
11936       input_line_pointer = save;
11937     }
11938   return r;
11939 }
11940
11941 int
11942 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11943 {
11944   const reg_entry *r;
11945   char *end = input_line_pointer;
11946
11947   *end = *nextcharP;
11948   r = parse_register (name, &input_line_pointer);
11949   if (r && end <= input_line_pointer)
11950     {
11951       *nextcharP = *input_line_pointer;
11952       *input_line_pointer = 0;
11953       e->X_op = O_register;
11954       e->X_add_number = r - i386_regtab;
11955       return 1;
11956     }
11957   input_line_pointer = end;
11958   *end = 0;
11959   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11960 }
11961
11962 void
11963 md_operand (expressionS *e)
11964 {
11965   char *end;
11966   const reg_entry *r;
11967
11968   switch (*input_line_pointer)
11969     {
11970     case REGISTER_PREFIX:
11971       r = parse_real_register (input_line_pointer, &end);
11972       if (r)
11973         {
11974           e->X_op = O_register;
11975           e->X_add_number = r - i386_regtab;
11976           input_line_pointer = end;
11977         }
11978       break;
11979
11980     case '[':
11981       gas_assert (intel_syntax);
11982       end = input_line_pointer++;
11983       expression (e);
11984       if (*input_line_pointer == ']')
11985         {
11986           ++input_line_pointer;
11987           e->X_op_symbol = make_expr_symbol (e);
11988           e->X_add_symbol = NULL;
11989           e->X_add_number = 0;
11990           e->X_op = O_index;
11991         }
11992       else
11993         {
11994           e->X_op = O_absent;
11995           input_line_pointer = end;
11996         }
11997       break;
11998     }
11999 }
12000
12001 \f
12002 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12003 const char *md_shortopts = "kVQ:sqnO::";
12004 #else
12005 const char *md_shortopts = "qnO::";
12006 #endif
12007
12008 #define OPTION_32 (OPTION_MD_BASE + 0)
12009 #define OPTION_64 (OPTION_MD_BASE + 1)
12010 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12011 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12012 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12013 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12014 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12015 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12016 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12017 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12018 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12019 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12020 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12021 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12022 #define OPTION_X32 (OPTION_MD_BASE + 14)
12023 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12024 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12025 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12026 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12027 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12028 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12029 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12030 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12031 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12032 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12033 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12034 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12035 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12036 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12037 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12038 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12039
12040 struct option md_longopts[] =
12041 {
12042   {"32", no_argument, NULL, OPTION_32},
12043 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12044      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12045   {"64", no_argument, NULL, OPTION_64},
12046 #endif
12047 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12048   {"x32", no_argument, NULL, OPTION_X32},
12049   {"mshared", no_argument, NULL, OPTION_MSHARED},
12050   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12051 #endif
12052   {"divide", no_argument, NULL, OPTION_DIVIDE},
12053   {"march", required_argument, NULL, OPTION_MARCH},
12054   {"mtune", required_argument, NULL, OPTION_MTUNE},
12055   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12056   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12057   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12058   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12059   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12060   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12061   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12062   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12063   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12064   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12065   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12066   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12067 # if defined (TE_PE) || defined (TE_PEP)
12068   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12069 #endif
12070   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12071   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12072   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12073   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12074   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12075   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12076   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12077   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12078   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12079   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12080   {NULL, no_argument, NULL, 0}
12081 };
12082 size_t md_longopts_size = sizeof (md_longopts);
12083
12084 int
12085 md_parse_option (int c, const char *arg)
12086 {
12087   unsigned int j;
12088   char *arch, *next, *saved, *type;
12089
12090   switch (c)
12091     {
12092     case 'n':
12093       optimize_align_code = 0;
12094       break;
12095
12096     case 'q':
12097       quiet_warnings = 1;
12098       break;
12099
12100 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12101       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12102          should be emitted or not.  FIXME: Not implemented.  */
12103     case 'Q':
12104       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12105         return 0;
12106       break;
12107
12108       /* -V: SVR4 argument to print version ID.  */
12109     case 'V':
12110       print_version_id ();
12111       break;
12112
12113       /* -k: Ignore for FreeBSD compatibility.  */
12114     case 'k':
12115       break;
12116
12117     case 's':
12118       /* -s: On i386 Solaris, this tells the native assembler to use
12119          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12120       break;
12121
12122     case OPTION_MSHARED:
12123       shared = 1;
12124       break;
12125
12126     case OPTION_X86_USED_NOTE:
12127       if (strcasecmp (arg, "yes") == 0)
12128         x86_used_note = 1;
12129       else if (strcasecmp (arg, "no") == 0)
12130         x86_used_note = 0;
12131       else
12132         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12133       break;
12134
12135
12136 #endif
12137 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12138      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12139     case OPTION_64:
12140       {
12141         const char **list, **l;
12142
12143         list = bfd_target_list ();
12144         for (l = list; *l != NULL; l++)
12145           if (CONST_STRNEQ (*l, "elf64-x86-64")
12146               || strcmp (*l, "coff-x86-64") == 0
12147               || strcmp (*l, "pe-x86-64") == 0
12148               || strcmp (*l, "pei-x86-64") == 0
12149               || strcmp (*l, "mach-o-x86-64") == 0)
12150             {
12151               default_arch = "x86_64";
12152               break;
12153             }
12154         if (*l == NULL)
12155           as_fatal (_("no compiled in support for x86_64"));
12156         free (list);
12157       }
12158       break;
12159 #endif
12160
12161 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12162     case OPTION_X32:
12163       if (IS_ELF)
12164         {
12165           const char **list, **l;
12166
12167           list = bfd_target_list ();
12168           for (l = list; *l != NULL; l++)
12169             if (CONST_STRNEQ (*l, "elf32-x86-64"))
12170               {
12171                 default_arch = "x86_64:32";
12172                 break;
12173               }
12174           if (*l == NULL)
12175             as_fatal (_("no compiled in support for 32bit x86_64"));
12176           free (list);
12177         }
12178       else
12179         as_fatal (_("32bit x86_64 is only supported for ELF"));
12180       break;
12181 #endif
12182
12183     case OPTION_32:
12184       default_arch = "i386";
12185       break;
12186
12187     case OPTION_DIVIDE:
12188 #ifdef SVR4_COMMENT_CHARS
12189       {
12190         char *n, *t;
12191         const char *s;
12192
12193         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12194         t = n;
12195         for (s = i386_comment_chars; *s != '\0'; s++)
12196           if (*s != '/')
12197             *t++ = *s;
12198         *t = '\0';
12199         i386_comment_chars = n;
12200       }
12201 #endif
12202       break;
12203
12204     case OPTION_MARCH:
12205       saved = xstrdup (arg);
12206       arch = saved;
12207       /* Allow -march=+nosse.  */
12208       if (*arch == '+')
12209         arch++;
12210       do
12211         {
12212           if (*arch == '.')
12213             as_fatal (_("invalid -march= option: `%s'"), arg);
12214           next = strchr (arch, '+');
12215           if (next)
12216             *next++ = '\0';
12217           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12218             {
12219               if (strcmp (arch, cpu_arch [j].name) == 0)
12220                 {
12221                   /* Processor.  */
12222                   if (! cpu_arch[j].flags.bitfield.cpui386)
12223                     continue;
12224
12225                   cpu_arch_name = cpu_arch[j].name;
12226                   cpu_sub_arch_name = NULL;
12227                   cpu_arch_flags = cpu_arch[j].flags;
12228                   cpu_arch_isa = cpu_arch[j].type;
12229                   cpu_arch_isa_flags = cpu_arch[j].flags;
12230                   if (!cpu_arch_tune_set)
12231                     {
12232                       cpu_arch_tune = cpu_arch_isa;
12233                       cpu_arch_tune_flags = cpu_arch_isa_flags;
12234                     }
12235                   break;
12236                 }
12237               else if (*cpu_arch [j].name == '.'
12238                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
12239                 {
12240                   /* ISA extension.  */
12241                   i386_cpu_flags flags;
12242
12243                   flags = cpu_flags_or (cpu_arch_flags,
12244                                         cpu_arch[j].flags);
12245
12246                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12247                     {
12248                       if (cpu_sub_arch_name)
12249                         {
12250                           char *name = cpu_sub_arch_name;
12251                           cpu_sub_arch_name = concat (name,
12252                                                       cpu_arch[j].name,
12253                                                       (const char *) NULL);
12254                           free (name);
12255                         }
12256                       else
12257                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12258                       cpu_arch_flags = flags;
12259                       cpu_arch_isa_flags = flags;
12260                     }
12261                   else
12262                     cpu_arch_isa_flags
12263                       = cpu_flags_or (cpu_arch_isa_flags,
12264                                       cpu_arch[j].flags);
12265                   break;
12266                 }
12267             }
12268
12269           if (j >= ARRAY_SIZE (cpu_arch))
12270             {
12271               /* Disable an ISA extension.  */
12272               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12273                 if (strcmp (arch, cpu_noarch [j].name) == 0)
12274                   {
12275                     i386_cpu_flags flags;
12276
12277                     flags = cpu_flags_and_not (cpu_arch_flags,
12278                                                cpu_noarch[j].flags);
12279                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12280                       {
12281                         if (cpu_sub_arch_name)
12282                           {
12283                             char *name = cpu_sub_arch_name;
12284                             cpu_sub_arch_name = concat (arch,
12285                                                         (const char *) NULL);
12286                             free (name);
12287                           }
12288                         else
12289                           cpu_sub_arch_name = xstrdup (arch);
12290                         cpu_arch_flags = flags;
12291                         cpu_arch_isa_flags = flags;
12292                       }
12293                     break;
12294                   }
12295
12296               if (j >= ARRAY_SIZE (cpu_noarch))
12297                 j = ARRAY_SIZE (cpu_arch);
12298             }
12299
12300           if (j >= ARRAY_SIZE (cpu_arch))
12301             as_fatal (_("invalid -march= option: `%s'"), arg);
12302
12303           arch = next;
12304         }
12305       while (next != NULL);
12306       free (saved);
12307       break;
12308
12309     case OPTION_MTUNE:
12310       if (*arg == '.')
12311         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12312       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12313         {
12314           if (strcmp (arg, cpu_arch [j].name) == 0)
12315             {
12316               cpu_arch_tune_set = 1;
12317               cpu_arch_tune = cpu_arch [j].type;
12318               cpu_arch_tune_flags = cpu_arch[j].flags;
12319               break;
12320             }
12321         }
12322       if (j >= ARRAY_SIZE (cpu_arch))
12323         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12324       break;
12325
12326     case OPTION_MMNEMONIC:
12327       if (strcasecmp (arg, "att") == 0)
12328         intel_mnemonic = 0;
12329       else if (strcasecmp (arg, "intel") == 0)
12330         intel_mnemonic = 1;
12331       else
12332         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12333       break;
12334
12335     case OPTION_MSYNTAX:
12336       if (strcasecmp (arg, "att") == 0)
12337         intel_syntax = 0;
12338       else if (strcasecmp (arg, "intel") == 0)
12339         intel_syntax = 1;
12340       else
12341         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12342       break;
12343
12344     case OPTION_MINDEX_REG:
12345       allow_index_reg = 1;
12346       break;
12347
12348     case OPTION_MNAKED_REG:
12349       allow_naked_reg = 1;
12350       break;
12351
12352     case OPTION_MSSE2AVX:
12353       sse2avx = 1;
12354       break;
12355
12356     case OPTION_MSSE_CHECK:
12357       if (strcasecmp (arg, "error") == 0)
12358         sse_check = check_error;
12359       else if (strcasecmp (arg, "warning") == 0)
12360         sse_check = check_warning;
12361       else if (strcasecmp (arg, "none") == 0)
12362         sse_check = check_none;
12363       else
12364         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12365       break;
12366
12367     case OPTION_MOPERAND_CHECK:
12368       if (strcasecmp (arg, "error") == 0)
12369         operand_check = check_error;
12370       else if (strcasecmp (arg, "warning") == 0)
12371         operand_check = check_warning;
12372       else if (strcasecmp (arg, "none") == 0)
12373         operand_check = check_none;
12374       else
12375         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12376       break;
12377
12378     case OPTION_MAVXSCALAR:
12379       if (strcasecmp (arg, "128") == 0)
12380         avxscalar = vex128;
12381       else if (strcasecmp (arg, "256") == 0)
12382         avxscalar = vex256;
12383       else
12384         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12385       break;
12386
12387     case OPTION_MVEXWIG:
12388       if (strcmp (arg, "0") == 0)
12389         vexwig = vexw0;
12390       else if (strcmp (arg, "1") == 0)
12391         vexwig = vexw1;
12392       else
12393         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12394       break;
12395
12396     case OPTION_MADD_BND_PREFIX:
12397       add_bnd_prefix = 1;
12398       break;
12399
12400     case OPTION_MEVEXLIG:
12401       if (strcmp (arg, "128") == 0)
12402         evexlig = evexl128;
12403       else if (strcmp (arg, "256") == 0)
12404         evexlig = evexl256;
12405       else  if (strcmp (arg, "512") == 0)
12406         evexlig = evexl512;
12407       else
12408         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12409       break;
12410
12411     case OPTION_MEVEXRCIG:
12412       if (strcmp (arg, "rne") == 0)
12413         evexrcig = rne;
12414       else if (strcmp (arg, "rd") == 0)
12415         evexrcig = rd;
12416       else if (strcmp (arg, "ru") == 0)
12417         evexrcig = ru;
12418       else if (strcmp (arg, "rz") == 0)
12419         evexrcig = rz;
12420       else
12421         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12422       break;
12423
12424     case OPTION_MEVEXWIG:
12425       if (strcmp (arg, "0") == 0)
12426         evexwig = evexw0;
12427       else if (strcmp (arg, "1") == 0)
12428         evexwig = evexw1;
12429       else
12430         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12431       break;
12432
12433 # if defined (TE_PE) || defined (TE_PEP)
12434     case OPTION_MBIG_OBJ:
12435       use_big_obj = 1;
12436       break;
12437 #endif
12438
12439     case OPTION_MOMIT_LOCK_PREFIX:
12440       if (strcasecmp (arg, "yes") == 0)
12441         omit_lock_prefix = 1;
12442       else if (strcasecmp (arg, "no") == 0)
12443         omit_lock_prefix = 0;
12444       else
12445         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12446       break;
12447
12448     case OPTION_MFENCE_AS_LOCK_ADD:
12449       if (strcasecmp (arg, "yes") == 0)
12450         avoid_fence = 1;
12451       else if (strcasecmp (arg, "no") == 0)
12452         avoid_fence = 0;
12453       else
12454         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12455       break;
12456
12457     case OPTION_MRELAX_RELOCATIONS:
12458       if (strcasecmp (arg, "yes") == 0)
12459         generate_relax_relocations = 1;
12460       else if (strcasecmp (arg, "no") == 0)
12461         generate_relax_relocations = 0;
12462       else
12463         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12464       break;
12465
12466     case OPTION_MALIGN_BRANCH_BOUNDARY:
12467       {
12468         char *end;
12469         long int align = strtoul (arg, &end, 0);
12470         if (*end == '\0')
12471           {
12472             if (align == 0)
12473               {
12474                 align_branch_power = 0;
12475                 break;
12476               }
12477             else if (align >= 16)
12478               {
12479                 int align_power;
12480                 for (align_power = 0;
12481                      (align & 1) == 0;
12482                      align >>= 1, align_power++)
12483                   continue;
12484                 /* Limit alignment power to 31.  */
12485                 if (align == 1 && align_power < 32)
12486                   {
12487                     align_branch_power = align_power;
12488                     break;
12489                   }
12490               }
12491           }
12492         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12493       }
12494       break;
12495
12496     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12497       {
12498         char *end;
12499         int align = strtoul (arg, &end, 0);
12500         /* Some processors only support 5 prefixes.  */
12501         if (*end == '\0' && align >= 0 && align < 6)
12502           {
12503             align_branch_prefix_size = align;
12504             break;
12505           }
12506         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12507                   arg);
12508       }
12509       break;
12510
12511     case OPTION_MALIGN_BRANCH:
12512       align_branch = 0;
12513       saved = xstrdup (arg);
12514       type = saved;
12515       do
12516         {
12517           next = strchr (type, '+');
12518           if (next)
12519             *next++ = '\0';
12520           if (strcasecmp (type, "jcc") == 0)
12521             align_branch |= align_branch_jcc_bit;
12522           else if (strcasecmp (type, "fused") == 0)
12523             align_branch |= align_branch_fused_bit;
12524           else if (strcasecmp (type, "jmp") == 0)
12525             align_branch |= align_branch_jmp_bit;
12526           else if (strcasecmp (type, "call") == 0)
12527             align_branch |= align_branch_call_bit;
12528           else if (strcasecmp (type, "ret") == 0)
12529             align_branch |= align_branch_ret_bit;
12530           else if (strcasecmp (type, "indirect") == 0)
12531             align_branch |= align_branch_indirect_bit;
12532           else
12533             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12534           type = next;
12535         }
12536       while (next != NULL);
12537       free (saved);
12538       break;
12539
12540     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12541       align_branch_power = 5;
12542       align_branch_prefix_size = 5;
12543       align_branch = (align_branch_jcc_bit
12544                       | align_branch_fused_bit
12545                       | align_branch_jmp_bit);
12546       break;
12547
12548     case OPTION_MAMD64:
12549       intel64 = 0;
12550       break;
12551
12552     case OPTION_MINTEL64:
12553       intel64 = 1;
12554       break;
12555
12556     case 'O':
12557       if (arg == NULL)
12558         {
12559           optimize = 1;
12560           /* Turn off -Os.  */
12561           optimize_for_space = 0;
12562         }
12563       else if (*arg == 's')
12564         {
12565           optimize_for_space = 1;
12566           /* Turn on all encoding optimizations.  */
12567           optimize = INT_MAX;
12568         }
12569       else
12570         {
12571           optimize = atoi (arg);
12572           /* Turn off -Os.  */
12573           optimize_for_space = 0;
12574         }
12575       break;
12576
12577     default:
12578       return 0;
12579     }
12580   return 1;
12581 }
12582
12583 #define MESSAGE_TEMPLATE \
12584 "                                                                                "
12585
12586 static char *
12587 output_message (FILE *stream, char *p, char *message, char *start,
12588                 int *left_p, const char *name, int len)
12589 {
12590   int size = sizeof (MESSAGE_TEMPLATE);
12591   int left = *left_p;
12592
12593   /* Reserve 2 spaces for ", " or ",\0" */
12594   left -= len + 2;
12595
12596   /* Check if there is any room.  */
12597   if (left >= 0)
12598     {
12599       if (p != start)
12600         {
12601           *p++ = ',';
12602           *p++ = ' ';
12603         }
12604       p = mempcpy (p, name, len);
12605     }
12606   else
12607     {
12608       /* Output the current message now and start a new one.  */
12609       *p++ = ',';
12610       *p = '\0';
12611       fprintf (stream, "%s\n", message);
12612       p = start;
12613       left = size - (start - message) - len - 2;
12614
12615       gas_assert (left >= 0);
12616
12617       p = mempcpy (p, name, len);
12618     }
12619
12620   *left_p = left;
12621   return p;
12622 }
12623
12624 static void
12625 show_arch (FILE *stream, int ext, int check)
12626 {
12627   static char message[] = MESSAGE_TEMPLATE;
12628   char *start = message + 27;
12629   char *p;
12630   int size = sizeof (MESSAGE_TEMPLATE);
12631   int left;
12632   const char *name;
12633   int len;
12634   unsigned int j;
12635
12636   p = start;
12637   left = size - (start - message);
12638   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12639     {
12640       /* Should it be skipped?  */
12641       if (cpu_arch [j].skip)
12642         continue;
12643
12644       name = cpu_arch [j].name;
12645       len = cpu_arch [j].len;
12646       if (*name == '.')
12647         {
12648           /* It is an extension.  Skip if we aren't asked to show it.  */
12649           if (ext)
12650             {
12651               name++;
12652               len--;
12653             }
12654           else
12655             continue;
12656         }
12657       else if (ext)
12658         {
12659           /* It is an processor.  Skip if we show only extension.  */
12660           continue;
12661         }
12662       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12663         {
12664           /* It is an impossible processor - skip.  */
12665           continue;
12666         }
12667
12668       p = output_message (stream, p, message, start, &left, name, len);
12669     }
12670
12671   /* Display disabled extensions.  */
12672   if (ext)
12673     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12674       {
12675         name = cpu_noarch [j].name;
12676         len = cpu_noarch [j].len;
12677         p = output_message (stream, p, message, start, &left, name,
12678                             len);
12679       }
12680
12681   *p = '\0';
12682   fprintf (stream, "%s\n", message);
12683 }
12684
12685 void
12686 md_show_usage (FILE *stream)
12687 {
12688 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12689   fprintf (stream, _("\
12690   -Qy, -Qn                ignored\n\
12691   -V                      print assembler version number\n\
12692   -k                      ignored\n"));
12693 #endif
12694   fprintf (stream, _("\
12695   -n                      Do not optimize code alignment\n\
12696   -q                      quieten some warnings\n"));
12697 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12698   fprintf (stream, _("\
12699   -s                      ignored\n"));
12700 #endif
12701 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12702                       || defined (TE_PE) || defined (TE_PEP))
12703   fprintf (stream, _("\
12704   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
12705 #endif
12706 #ifdef SVR4_COMMENT_CHARS
12707   fprintf (stream, _("\
12708   --divide                do not treat `/' as a comment character\n"));
12709 #else
12710   fprintf (stream, _("\
12711   --divide                ignored\n"));
12712 #endif
12713   fprintf (stream, _("\
12714   -march=CPU[,+EXTENSION...]\n\
12715                           generate code for CPU and EXTENSION, CPU is one of:\n"));
12716   show_arch (stream, 0, 1);
12717   fprintf (stream, _("\
12718                           EXTENSION is combination of:\n"));
12719   show_arch (stream, 1, 0);
12720   fprintf (stream, _("\
12721   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
12722   show_arch (stream, 0, 0);
12723   fprintf (stream, _("\
12724   -msse2avx               encode SSE instructions with VEX prefix\n"));
12725   fprintf (stream, _("\
12726   -msse-check=[none|error|warning] (default: warning)\n\
12727                           check SSE instructions\n"));
12728   fprintf (stream, _("\
12729   -moperand-check=[none|error|warning] (default: warning)\n\
12730                           check operand combinations for validity\n"));
12731   fprintf (stream, _("\
12732   -mavxscalar=[128|256] (default: 128)\n\
12733                           encode scalar AVX instructions with specific vector\n\
12734                            length\n"));
12735   fprintf (stream, _("\
12736   -mvexwig=[0|1] (default: 0)\n\
12737                           encode VEX instructions with specific VEX.W value\n\
12738                            for VEX.W bit ignored instructions\n"));
12739   fprintf (stream, _("\
12740   -mevexlig=[128|256|512] (default: 128)\n\
12741                           encode scalar EVEX instructions with specific vector\n\
12742                            length\n"));
12743   fprintf (stream, _("\
12744   -mevexwig=[0|1] (default: 0)\n\
12745                           encode EVEX instructions with specific EVEX.W value\n\
12746                            for EVEX.W bit ignored instructions\n"));
12747   fprintf (stream, _("\
12748   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12749                           encode EVEX instructions with specific EVEX.RC value\n\
12750                            for SAE-only ignored instructions\n"));
12751   fprintf (stream, _("\
12752   -mmnemonic=[att|intel] "));
12753   if (SYSV386_COMPAT)
12754     fprintf (stream, _("(default: att)\n"));
12755   else
12756     fprintf (stream, _("(default: intel)\n"));
12757   fprintf (stream, _("\
12758                           use AT&T/Intel mnemonic\n"));
12759   fprintf (stream, _("\
12760   -msyntax=[att|intel] (default: att)\n\
12761                           use AT&T/Intel syntax\n"));
12762   fprintf (stream, _("\
12763   -mindex-reg             support pseudo index registers\n"));
12764   fprintf (stream, _("\
12765   -mnaked-reg             don't require `%%' prefix for registers\n"));
12766   fprintf (stream, _("\
12767   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
12768 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12769   fprintf (stream, _("\
12770   -mshared                disable branch optimization for shared code\n"));
12771   fprintf (stream, _("\
12772   -mx86-used-note=[no|yes] "));
12773   if (DEFAULT_X86_USED_NOTE)
12774     fprintf (stream, _("(default: yes)\n"));
12775   else
12776     fprintf (stream, _("(default: no)\n"));
12777   fprintf (stream, _("\
12778                           generate x86 used ISA and feature properties\n"));
12779 #endif
12780 #if defined (TE_PE) || defined (TE_PEP)
12781   fprintf (stream, _("\
12782   -mbig-obj               generate big object files\n"));
12783 #endif
12784   fprintf (stream, _("\
12785   -momit-lock-prefix=[no|yes] (default: no)\n\
12786                           strip all lock prefixes\n"));
12787   fprintf (stream, _("\
12788   -mfence-as-lock-add=[no|yes] (default: no)\n\
12789                           encode lfence, mfence and sfence as\n\
12790                            lock addl $0x0, (%%{re}sp)\n"));
12791   fprintf (stream, _("\
12792   -mrelax-relocations=[no|yes] "));
12793   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12794     fprintf (stream, _("(default: yes)\n"));
12795   else
12796     fprintf (stream, _("(default: no)\n"));
12797   fprintf (stream, _("\
12798                           generate relax relocations\n"));
12799   fprintf (stream, _("\
12800   -malign-branch-boundary=NUM (default: 0)\n\
12801                           align branches within NUM byte boundary\n"));
12802   fprintf (stream, _("\
12803   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12804                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
12805                            indirect\n\
12806                           specify types of branches to align\n"));
12807   fprintf (stream, _("\
12808   -malign-branch-prefix-size=NUM (default: 5)\n\
12809                           align branches with NUM prefixes per instruction\n"));
12810   fprintf (stream, _("\
12811   -mbranches-within-32B-boundaries\n\
12812                           align branches within 32 byte boundary\n"));
12813   fprintf (stream, _("\
12814   -mamd64                 accept only AMD64 ISA [default]\n"));
12815   fprintf (stream, _("\
12816   -mintel64               accept only Intel64 ISA\n"));
12817 }
12818
12819 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12820      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12821      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12822
12823 /* Pick the target format to use.  */
12824
12825 const char *
12826 i386_target_format (void)
12827 {
12828   if (!strncmp (default_arch, "x86_64", 6))
12829     {
12830       update_code_flag (CODE_64BIT, 1);
12831       if (default_arch[6] == '\0')
12832         x86_elf_abi = X86_64_ABI;
12833       else
12834         x86_elf_abi = X86_64_X32_ABI;
12835     }
12836   else if (!strcmp (default_arch, "i386"))
12837     update_code_flag (CODE_32BIT, 1);
12838   else if (!strcmp (default_arch, "iamcu"))
12839     {
12840       update_code_flag (CODE_32BIT, 1);
12841       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12842         {
12843           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12844           cpu_arch_name = "iamcu";
12845           cpu_sub_arch_name = NULL;
12846           cpu_arch_flags = iamcu_flags;
12847           cpu_arch_isa = PROCESSOR_IAMCU;
12848           cpu_arch_isa_flags = iamcu_flags;
12849           if (!cpu_arch_tune_set)
12850             {
12851               cpu_arch_tune = cpu_arch_isa;
12852               cpu_arch_tune_flags = cpu_arch_isa_flags;
12853             }
12854         }
12855       else if (cpu_arch_isa != PROCESSOR_IAMCU)
12856         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12857                   cpu_arch_name);
12858     }
12859   else
12860     as_fatal (_("unknown architecture"));
12861
12862   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12863     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12864   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12865     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12866
12867   switch (OUTPUT_FLAVOR)
12868     {
12869 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12870     case bfd_target_aout_flavour:
12871       return AOUT_TARGET_FORMAT;
12872 #endif
12873 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12874 # if defined (TE_PE) || defined (TE_PEP)
12875     case bfd_target_coff_flavour:
12876       if (flag_code == CODE_64BIT)
12877         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12878       else
12879         return "pe-i386";
12880 # elif defined (TE_GO32)
12881     case bfd_target_coff_flavour:
12882       return "coff-go32";
12883 # else
12884     case bfd_target_coff_flavour:
12885       return "coff-i386";
12886 # endif
12887 #endif
12888 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12889     case bfd_target_elf_flavour:
12890       {
12891         const char *format;
12892
12893         switch (x86_elf_abi)
12894           {
12895           default:
12896             format = ELF_TARGET_FORMAT;
12897 #ifndef TE_SOLARIS
12898             tls_get_addr = "___tls_get_addr";
12899 #endif
12900             break;
12901           case X86_64_ABI:
12902             use_rela_relocations = 1;
12903             object_64bit = 1;
12904 #ifndef TE_SOLARIS
12905             tls_get_addr = "__tls_get_addr";
12906 #endif
12907             format = ELF_TARGET_FORMAT64;
12908             break;
12909           case X86_64_X32_ABI:
12910             use_rela_relocations = 1;
12911             object_64bit = 1;
12912 #ifndef TE_SOLARIS
12913             tls_get_addr = "__tls_get_addr";
12914 #endif
12915             disallow_64bit_reloc = 1;
12916             format = ELF_TARGET_FORMAT32;
12917             break;
12918           }
12919         if (cpu_arch_isa == PROCESSOR_L1OM)
12920           {
12921             if (x86_elf_abi != X86_64_ABI)
12922               as_fatal (_("Intel L1OM is 64bit only"));
12923             return ELF_TARGET_L1OM_FORMAT;
12924           }
12925         else if (cpu_arch_isa == PROCESSOR_K1OM)
12926           {
12927             if (x86_elf_abi != X86_64_ABI)
12928               as_fatal (_("Intel K1OM is 64bit only"));
12929             return ELF_TARGET_K1OM_FORMAT;
12930           }
12931         else if (cpu_arch_isa == PROCESSOR_IAMCU)
12932           {
12933             if (x86_elf_abi != I386_ABI)
12934               as_fatal (_("Intel MCU is 32bit only"));
12935             return ELF_TARGET_IAMCU_FORMAT;
12936           }
12937         else
12938           return format;
12939       }
12940 #endif
12941 #if defined (OBJ_MACH_O)
12942     case bfd_target_mach_o_flavour:
12943       if (flag_code == CODE_64BIT)
12944         {
12945           use_rela_relocations = 1;
12946           object_64bit = 1;
12947           return "mach-o-x86-64";
12948         }
12949       else
12950         return "mach-o-i386";
12951 #endif
12952     default:
12953       abort ();
12954       return NULL;
12955     }
12956 }
12957
12958 #endif /* OBJ_MAYBE_ more than one  */
12959 \f
12960 symbolS *
12961 md_undefined_symbol (char *name)
12962 {
12963   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12964       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12965       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12966       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12967     {
12968       if (!GOT_symbol)
12969         {
12970           if (symbol_find (name))
12971             as_bad (_("GOT already in symbol table"));
12972           GOT_symbol = symbol_new (name, undefined_section,
12973                                    (valueT) 0, &zero_address_frag);
12974         };
12975       return GOT_symbol;
12976     }
12977   return 0;
12978 }
12979
12980 /* Round up a section size to the appropriate boundary.  */
12981
12982 valueT
12983 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
12984 {
12985 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12986   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
12987     {
12988       /* For a.out, force the section size to be aligned.  If we don't do
12989          this, BFD will align it for us, but it will not write out the
12990          final bytes of the section.  This may be a bug in BFD, but it is
12991          easier to fix it here since that is how the other a.out targets
12992          work.  */
12993       int align;
12994
12995       align = bfd_section_alignment (segment);
12996       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
12997     }
12998 #endif
12999
13000   return size;
13001 }
13002
13003 /* On the i386, PC-relative offsets are relative to the start of the
13004    next instruction.  That is, the address of the offset, plus its
13005    size, since the offset is always the last part of the insn.  */
13006
13007 long
13008 md_pcrel_from (fixS *fixP)
13009 {
13010   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13011 }
13012
13013 #ifndef I386COFF
13014
13015 static void
13016 s_bss (int ignore ATTRIBUTE_UNUSED)
13017 {
13018   int temp;
13019
13020 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13021   if (IS_ELF)
13022     obj_elf_section_change_hook ();
13023 #endif
13024   temp = get_absolute_expression ();
13025   subseg_set (bss_section, (subsegT) temp);
13026   demand_empty_rest_of_line ();
13027 }
13028
13029 #endif
13030
13031 /* Remember constant directive.  */
13032
13033 void
13034 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13035 {
13036   if (last_insn.kind != last_insn_directive
13037       && (bfd_section_flags (now_seg) & SEC_CODE))
13038     {
13039       last_insn.seg = now_seg;
13040       last_insn.kind = last_insn_directive;
13041       last_insn.name = "constant directive";
13042       last_insn.file = as_where (&last_insn.line);
13043     }
13044 }
13045
13046 void
13047 i386_validate_fix (fixS *fixp)
13048 {
13049   if (fixp->fx_subsy)
13050     {
13051       if (fixp->fx_subsy == GOT_symbol)
13052         {
13053           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13054             {
13055               if (!object_64bit)
13056                 abort ();
13057 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13058               if (fixp->fx_tcbit2)
13059                 fixp->fx_r_type = (fixp->fx_tcbit
13060                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13061                                    : BFD_RELOC_X86_64_GOTPCRELX);
13062               else
13063 #endif
13064                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13065             }
13066           else
13067             {
13068               if (!object_64bit)
13069                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13070               else
13071                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13072             }
13073           fixp->fx_subsy = 0;
13074         }
13075     }
13076 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13077   else if (!object_64bit)
13078     {
13079       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13080           && fixp->fx_tcbit2)
13081         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13082     }
13083 #endif
13084 }
13085
13086 arelent *
13087 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13088 {
13089   arelent *rel;
13090   bfd_reloc_code_real_type code;
13091
13092   switch (fixp->fx_r_type)
13093     {
13094 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13095     case BFD_RELOC_SIZE32:
13096     case BFD_RELOC_SIZE64:
13097       if (S_IS_DEFINED (fixp->fx_addsy)
13098           && !S_IS_EXTERNAL (fixp->fx_addsy))
13099         {
13100           /* Resolve size relocation against local symbol to size of
13101              the symbol plus addend.  */
13102           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13103           if (fixp->fx_r_type == BFD_RELOC_SIZE32
13104               && !fits_in_unsigned_long (value))
13105             as_bad_where (fixp->fx_file, fixp->fx_line,
13106                           _("symbol size computation overflow"));
13107           fixp->fx_addsy = NULL;
13108           fixp->fx_subsy = NULL;
13109           md_apply_fix (fixp, (valueT *) &value, NULL);
13110           return NULL;
13111         }
13112 #endif
13113       /* Fall through.  */
13114
13115     case BFD_RELOC_X86_64_PLT32:
13116     case BFD_RELOC_X86_64_GOT32:
13117     case BFD_RELOC_X86_64_GOTPCREL:
13118     case BFD_RELOC_X86_64_GOTPCRELX:
13119     case BFD_RELOC_X86_64_REX_GOTPCRELX:
13120     case BFD_RELOC_386_PLT32:
13121     case BFD_RELOC_386_GOT32:
13122     case BFD_RELOC_386_GOT32X:
13123     case BFD_RELOC_386_GOTOFF:
13124     case BFD_RELOC_386_GOTPC:
13125     case BFD_RELOC_386_TLS_GD:
13126     case BFD_RELOC_386_TLS_LDM:
13127     case BFD_RELOC_386_TLS_LDO_32:
13128     case BFD_RELOC_386_TLS_IE_32:
13129     case BFD_RELOC_386_TLS_IE:
13130     case BFD_RELOC_386_TLS_GOTIE:
13131     case BFD_RELOC_386_TLS_LE_32:
13132     case BFD_RELOC_386_TLS_LE:
13133     case BFD_RELOC_386_TLS_GOTDESC:
13134     case BFD_RELOC_386_TLS_DESC_CALL:
13135     case BFD_RELOC_X86_64_TLSGD:
13136     case BFD_RELOC_X86_64_TLSLD:
13137     case BFD_RELOC_X86_64_DTPOFF32:
13138     case BFD_RELOC_X86_64_DTPOFF64:
13139     case BFD_RELOC_X86_64_GOTTPOFF:
13140     case BFD_RELOC_X86_64_TPOFF32:
13141     case BFD_RELOC_X86_64_TPOFF64:
13142     case BFD_RELOC_X86_64_GOTOFF64:
13143     case BFD_RELOC_X86_64_GOTPC32:
13144     case BFD_RELOC_X86_64_GOT64:
13145     case BFD_RELOC_X86_64_GOTPCREL64:
13146     case BFD_RELOC_X86_64_GOTPC64:
13147     case BFD_RELOC_X86_64_GOTPLT64:
13148     case BFD_RELOC_X86_64_PLTOFF64:
13149     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13150     case BFD_RELOC_X86_64_TLSDESC_CALL:
13151     case BFD_RELOC_RVA:
13152     case BFD_RELOC_VTABLE_ENTRY:
13153     case BFD_RELOC_VTABLE_INHERIT:
13154 #ifdef TE_PE
13155     case BFD_RELOC_32_SECREL:
13156 #endif
13157       code = fixp->fx_r_type;
13158       break;
13159     case BFD_RELOC_X86_64_32S:
13160       if (!fixp->fx_pcrel)
13161         {
13162           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
13163           code = fixp->fx_r_type;
13164           break;
13165         }
13166       /* Fall through.  */
13167     default:
13168       if (fixp->fx_pcrel)
13169         {
13170           switch (fixp->fx_size)
13171             {
13172             default:
13173               as_bad_where (fixp->fx_file, fixp->fx_line,
13174                             _("can not do %d byte pc-relative relocation"),
13175                             fixp->fx_size);
13176               code = BFD_RELOC_32_PCREL;
13177               break;
13178             case 1: code = BFD_RELOC_8_PCREL;  break;
13179             case 2: code = BFD_RELOC_16_PCREL; break;
13180             case 4: code = BFD_RELOC_32_PCREL; break;
13181 #ifdef BFD64
13182             case 8: code = BFD_RELOC_64_PCREL; break;
13183 #endif
13184             }
13185         }
13186       else
13187         {
13188           switch (fixp->fx_size)
13189             {
13190             default:
13191               as_bad_where (fixp->fx_file, fixp->fx_line,
13192                             _("can not do %d byte relocation"),
13193                             fixp->fx_size);
13194               code = BFD_RELOC_32;
13195               break;
13196             case 1: code = BFD_RELOC_8;  break;
13197             case 2: code = BFD_RELOC_16; break;
13198             case 4: code = BFD_RELOC_32; break;
13199 #ifdef BFD64
13200             case 8: code = BFD_RELOC_64; break;
13201 #endif
13202             }
13203         }
13204       break;
13205     }
13206
13207   if ((code == BFD_RELOC_32
13208        || code == BFD_RELOC_32_PCREL
13209        || code == BFD_RELOC_X86_64_32S)
13210       && GOT_symbol
13211       && fixp->fx_addsy == GOT_symbol)
13212     {
13213       if (!object_64bit)
13214         code = BFD_RELOC_386_GOTPC;
13215       else
13216         code = BFD_RELOC_X86_64_GOTPC32;
13217     }
13218   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13219       && GOT_symbol
13220       && fixp->fx_addsy == GOT_symbol)
13221     {
13222       code = BFD_RELOC_X86_64_GOTPC64;
13223     }
13224
13225   rel = XNEW (arelent);
13226   rel->sym_ptr_ptr = XNEW (asymbol *);
13227   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13228
13229   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13230
13231   if (!use_rela_relocations)
13232     {
13233       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13234          vtable entry to be used in the relocation's section offset.  */
13235       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13236         rel->address = fixp->fx_offset;
13237 #if defined (OBJ_COFF) && defined (TE_PE)
13238       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13239         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13240       else
13241 #endif
13242       rel->addend = 0;
13243     }
13244   /* Use the rela in 64bit mode.  */
13245   else
13246     {
13247       if (disallow_64bit_reloc)
13248         switch (code)
13249           {
13250           case BFD_RELOC_X86_64_DTPOFF64:
13251           case BFD_RELOC_X86_64_TPOFF64:
13252           case BFD_RELOC_64_PCREL:
13253           case BFD_RELOC_X86_64_GOTOFF64:
13254           case BFD_RELOC_X86_64_GOT64:
13255           case BFD_RELOC_X86_64_GOTPCREL64:
13256           case BFD_RELOC_X86_64_GOTPC64:
13257           case BFD_RELOC_X86_64_GOTPLT64:
13258           case BFD_RELOC_X86_64_PLTOFF64:
13259             as_bad_where (fixp->fx_file, fixp->fx_line,
13260                           _("cannot represent relocation type %s in x32 mode"),
13261                           bfd_get_reloc_code_name (code));
13262             break;
13263           default:
13264             break;
13265           }
13266
13267       if (!fixp->fx_pcrel)
13268         rel->addend = fixp->fx_offset;
13269       else
13270         switch (code)
13271           {
13272           case BFD_RELOC_X86_64_PLT32:
13273           case BFD_RELOC_X86_64_GOT32:
13274           case BFD_RELOC_X86_64_GOTPCREL:
13275           case BFD_RELOC_X86_64_GOTPCRELX:
13276           case BFD_RELOC_X86_64_REX_GOTPCRELX:
13277           case BFD_RELOC_X86_64_TLSGD:
13278           case BFD_RELOC_X86_64_TLSLD:
13279           case BFD_RELOC_X86_64_GOTTPOFF:
13280           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13281           case BFD_RELOC_X86_64_TLSDESC_CALL:
13282             rel->addend = fixp->fx_offset - fixp->fx_size;
13283             break;
13284           default:
13285             rel->addend = (section->vma
13286                            - fixp->fx_size
13287                            + fixp->fx_addnumber
13288                            + md_pcrel_from (fixp));
13289             break;
13290           }
13291     }
13292
13293   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13294   if (rel->howto == NULL)
13295     {
13296       as_bad_where (fixp->fx_file, fixp->fx_line,
13297                     _("cannot represent relocation type %s"),
13298                     bfd_get_reloc_code_name (code));
13299       /* Set howto to a garbage value so that we can keep going.  */
13300       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13301       gas_assert (rel->howto != NULL);
13302     }
13303
13304   return rel;
13305 }
13306
13307 #include "tc-i386-intel.c"
13308
13309 void
13310 tc_x86_parse_to_dw2regnum (expressionS *exp)
13311 {
13312   int saved_naked_reg;
13313   char saved_register_dot;
13314
13315   saved_naked_reg = allow_naked_reg;
13316   allow_naked_reg = 1;
13317   saved_register_dot = register_chars['.'];
13318   register_chars['.'] = '.';
13319   allow_pseudo_reg = 1;
13320   expression_and_evaluate (exp);
13321   allow_pseudo_reg = 0;
13322   register_chars['.'] = saved_register_dot;
13323   allow_naked_reg = saved_naked_reg;
13324
13325   if (exp->X_op == O_register && exp->X_add_number >= 0)
13326     {
13327       if ((addressT) exp->X_add_number < i386_regtab_size)
13328         {
13329           exp->X_op = O_constant;
13330           exp->X_add_number = i386_regtab[exp->X_add_number]
13331                               .dw2_regnum[flag_code >> 1];
13332         }
13333       else
13334         exp->X_op = O_illegal;
13335     }
13336 }
13337
13338 void
13339 tc_x86_frame_initial_instructions (void)
13340 {
13341   static unsigned int sp_regno[2];
13342
13343   if (!sp_regno[flag_code >> 1])
13344     {
13345       char *saved_input = input_line_pointer;
13346       char sp[][4] = {"esp", "rsp"};
13347       expressionS exp;
13348
13349       input_line_pointer = sp[flag_code >> 1];
13350       tc_x86_parse_to_dw2regnum (&exp);
13351       gas_assert (exp.X_op == O_constant);
13352       sp_regno[flag_code >> 1] = exp.X_add_number;
13353       input_line_pointer = saved_input;
13354     }
13355
13356   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13357   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13358 }
13359
13360 int
13361 x86_dwarf2_addr_size (void)
13362 {
13363 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13364   if (x86_elf_abi == X86_64_X32_ABI)
13365     return 4;
13366 #endif
13367   return bfd_arch_bits_per_address (stdoutput) / 8;
13368 }
13369
13370 int
13371 i386_elf_section_type (const char *str, size_t len)
13372 {
13373   if (flag_code == CODE_64BIT
13374       && len == sizeof ("unwind") - 1
13375       && strncmp (str, "unwind", 6) == 0)
13376     return SHT_X86_64_UNWIND;
13377
13378   return -1;
13379 }
13380
13381 #ifdef TE_SOLARIS
13382 void
13383 i386_solaris_fix_up_eh_frame (segT sec)
13384 {
13385   if (flag_code == CODE_64BIT)
13386     elf_section_type (sec) = SHT_X86_64_UNWIND;
13387 }
13388 #endif
13389
13390 #ifdef TE_PE
13391 void
13392 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13393 {
13394   expressionS exp;
13395
13396   exp.X_op = O_secrel;
13397   exp.X_add_symbol = symbol;
13398   exp.X_add_number = 0;
13399   emit_expr (&exp, size);
13400 }
13401 #endif
13402
13403 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13404 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
13405
13406 bfd_vma
13407 x86_64_section_letter (int letter, const char **ptr_msg)
13408 {
13409   if (flag_code == CODE_64BIT)
13410     {
13411       if (letter == 'l')
13412         return SHF_X86_64_LARGE;
13413
13414       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13415     }
13416   else
13417     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13418   return -1;
13419 }
13420
13421 bfd_vma
13422 x86_64_section_word (char *str, size_t len)
13423 {
13424   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13425     return SHF_X86_64_LARGE;
13426
13427   return -1;
13428 }
13429
13430 static void
13431 handle_large_common (int small ATTRIBUTE_UNUSED)
13432 {
13433   if (flag_code != CODE_64BIT)
13434     {
13435       s_comm_internal (0, elf_common_parse);
13436       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13437     }
13438   else
13439     {
13440       static segT lbss_section;
13441       asection *saved_com_section_ptr = elf_com_section_ptr;
13442       asection *saved_bss_section = bss_section;
13443
13444       if (lbss_section == NULL)
13445         {
13446           flagword applicable;
13447           segT seg = now_seg;
13448           subsegT subseg = now_subseg;
13449
13450           /* The .lbss section is for local .largecomm symbols.  */
13451           lbss_section = subseg_new (".lbss", 0);
13452           applicable = bfd_applicable_section_flags (stdoutput);
13453           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13454           seg_info (lbss_section)->bss = 1;
13455
13456           subseg_set (seg, subseg);
13457         }
13458
13459       elf_com_section_ptr = &_bfd_elf_large_com_section;
13460       bss_section = lbss_section;
13461
13462       s_comm_internal (0, elf_common_parse);
13463
13464       elf_com_section_ptr = saved_com_section_ptr;
13465       bss_section = saved_bss_section;
13466     }
13467 }
13468 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */