x86: Support VEX base opcode length > 1
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
CommitLineData
b534c6d3 1/* tc-i386.c -- Assemble code for the Intel 80386
b3adc24a 2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
252b5132
RH
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
ec2655a6 8 the Free Software Foundation; either version 3, or (at your option)
252b5132
RH
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
4b4da160
NC
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
252b5132 20
47926f60
KH
21/* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
3e73aa7c 23 x86_64 support by Jan Hubicka (jh@suse.cz)
0f10071e 24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
47926f60
KH
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
252b5132 27
252b5132 28#include "as.h"
3882b010 29#include "safe-ctype.h"
252b5132 30#include "subsegs.h"
316e2c05 31#include "dwarf2dbg.h"
54cfded0 32#include "dw2gencfi.h"
d2b2c203 33#include "elf/x86-64.h"
40fb9820 34#include "opcodes/i386-init.h"
252b5132 35
41fd2579
L
36#ifdef HAVE_LIMITS_H
37#include <limits.h>
38#else
39#ifdef HAVE_SYS_PARAM_H
40#include <sys/param.h>
41#endif
42#ifndef INT_MAX
43#define INT_MAX (int) (((unsigned) (-1)) >> 1)
44#endif
45#endif
46
c3332e24 47#ifndef INFER_ADDR_PREFIX
eecb386c 48#define INFER_ADDR_PREFIX 1
c3332e24
AM
49#endif
50
29b0f896
AM
51#ifndef DEFAULT_ARCH
52#define DEFAULT_ARCH "i386"
246fcdee 53#endif
252b5132 54
edde18a5
AM
55#ifndef INLINE
56#if __GNUC__ >= 2
57#define INLINE __inline__
58#else
59#define INLINE
60#endif
61#endif
62
6305a203
L
63/* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
42164a71 67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
6305a203
L
68#define WAIT_PREFIX 0
69#define SEG_PREFIX 1
70#define ADDR_PREFIX 2
71#define DATA_PREFIX 3
c32fa91d 72#define REP_PREFIX 4
42164a71 73#define HLE_PREFIX REP_PREFIX
7e8b059b 74#define BND_PREFIX REP_PREFIX
c32fa91d 75#define LOCK_PREFIX 5
4e9ac44a
L
76#define REX_PREFIX 6 /* must come last. */
77#define MAX_PREFIXES 7 /* max prefixes per opcode */
6305a203
L
78
79/* we define the syntax here (modulo base,index,scale syntax) */
80#define REGISTER_PREFIX '%'
81#define IMMEDIATE_PREFIX '$'
82#define ABSOLUTE_PREFIX '*'
83
84/* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86#define WORD_MNEM_SUFFIX 'w'
87#define BYTE_MNEM_SUFFIX 'b'
88#define SHORT_MNEM_SUFFIX 's'
89#define LONG_MNEM_SUFFIX 'l'
90#define QWORD_MNEM_SUFFIX 'q'
6305a203
L
91/* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93#define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95#define END_OF_INSN '\0'
96
79dec6b7
JB
97/* This matches the C -> StaticRounding alias in the opcode table. */
98#define commutative staticrounding
99
6305a203
L
100/*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107typedef struct
108{
d3ce72d0
NC
109 const insn_template *start;
110 const insn_template *end;
6305a203
L
111}
112templates;
113
114/* 386 operand encoding bytes: see 386 book for details of this. */
115typedef struct
116{
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120}
121modrm_byte;
122
123/* x86-64 extension prefix. */
124typedef int rex_byte;
125
6305a203
L
126/* 386 opcode byte to code indirect addressing. */
127typedef struct
128{
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132}
133sib_byte;
134
6305a203
L
135/* x86 arch names, types and features */
136typedef struct
137{
138 const char *name; /* arch name */
8a2c8fef 139 unsigned int len; /* arch string length */
6305a203
L
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
8a2c8fef 142 unsigned int skip; /* show_arch should skip this. */
6305a203
L
143}
144arch_entry;
145
293f5f65
L
146/* Used to turn off indicated flags. */
147typedef struct
148{
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152}
153noarch_entry;
154
78f12dd3 155static void update_code_flag (int, int);
e3bb37b5
L
156static void set_code_flag (int);
157static void set_16bit_gcc_code_flag (int);
158static void set_intel_syntax (int);
1efbbeb4 159static void set_intel_mnemonic (int);
db51cc60 160static void set_allow_index_reg (int);
7bab8ab5 161static void set_check (int);
e3bb37b5 162static void set_cpu_arch (int);
6482c264 163#ifdef TE_PE
e3bb37b5 164static void pe_directive_secrel (int);
6482c264 165#endif
e3bb37b5
L
166static void signed_cons (int);
167static char *output_invalid (int c);
ee86248c
JB
168static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
a7619375 172static int i386_att_operand (char *);
e3bb37b5 173static int i386_intel_operand (char *, int);
ee86248c
JB
174static int i386_intel_simplify (expressionS *);
175static int i386_intel_parse_name (const char *, expressionS *);
e3bb37b5
L
176static const reg_entry *parse_register (char *, char **);
177static char *parse_insn (char *, char *);
178static char *parse_operands (char *, const char *);
179static void swap_operands (void);
4d456e3d 180static void swap_2_operands (int, int);
48bcea9f 181static enum flag_code i386_addressing_mode (void);
e3bb37b5
L
182static void optimize_imm (void);
183static void optimize_disp (void);
83b16ac6 184static const insn_template *match_template (char);
e3bb37b5
L
185static int check_string (void);
186static int process_suffix (void);
187static int check_byte_reg (void);
188static int check_long_reg (void);
189static int check_qword_reg (void);
190static int check_word_reg (void);
191static int finalize_imm (void);
192static int process_operands (void);
193static const seg_entry *build_modrm_byte (void);
194static void output_insn (void);
195static void output_imm (fragS *, offsetT);
196static void output_disp (fragS *, offsetT);
29b0f896 197#ifndef I386COFF
e3bb37b5 198static void s_bss (int);
252b5132 199#endif
17d4e2a2
L
200#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201static void handle_large_common (int small ATTRIBUTE_UNUSED);
b4a3a7b4
L
202
203/* GNU_PROPERTY_X86_ISA_1_USED. */
204static unsigned int x86_isa_1_used;
205/* GNU_PROPERTY_X86_FEATURE_2_USED. */
206static unsigned int x86_feature_2_used;
207/* Generate x86 used ISA and feature properties. */
208static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
17d4e2a2 209#endif
252b5132 210
a847613f 211static const char *default_arch = DEFAULT_ARCH;
3e73aa7c 212
8a6fb3f9
JB
213/* parse_register() returns this when a register alias cannot be used. */
214static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
43234a1e
L
217/* This struct describes rounding control and SAE in the instruction. */
218struct RC_Operation
219{
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229};
230
231static struct RC_Operation rc_op;
232
233/* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236struct Mask_Operation
237{
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242};
243
244static struct Mask_Operation mask_op;
245
246/* The struct describes broadcasting, applied to OPERAND. FACTOR is
247 broadcast factor. */
248struct Broadcast_Operation
249{
8e6e0792 250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
43234a1e
L
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
4a1b91ea
L
255
256 /* Number of bytes to broadcast. */
257 int bytes;
43234a1e
L
258};
259
260static struct Broadcast_Operation broadcast_op;
261
c0f3af97
L
262/* VEX prefix. */
263typedef struct
264{
43234a1e
L
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
c0f3af97
L
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270} vex_prefix;
271
252b5132 272/* 'md_assemble ()' gathers together information and puts it into a
47926f60 273 i386_insn. */
252b5132 274
520dc8e8
AM
275union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
a65babc9
L
282enum i386_error
283 {
86e026a4 284 operand_size_mismatch,
a65babc9
L
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
a65babc9
L
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
6c30d220
L
292 unsupported,
293 invalid_vsib_address,
7bab8ab5 294 invalid_vector_register_set,
43234a1e
L
295 unsupported_vector_index_register,
296 unsupported_broadcast,
43234a1e
L
297 broadcast_needed,
298 unsupported_masking,
299 mask_not_on_destination,
300 no_default_mask,
301 unsupported_rc_sae,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
a65babc9
L
304 };
305
252b5132
RH
306struct _i386_insn
307 {
47926f60 308 /* TM holds the template for the insn were currently assembling. */
d3ce72d0 309 insn_template tm;
252b5132 310
7d5e4556
L
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
252b5132
RH
313 char suffix;
314
47926f60 315 /* OPERANDS gives the number of given operands. */
252b5132
RH
316 unsigned int operands;
317
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
47926f60 320 operands. */
252b5132
RH
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
322
323 /* TYPES [i] is the type (see above #defines) which tells us how to
520dc8e8 324 use OP[i] for the corresponding operand. */
40fb9820 325 i386_operand_type types[MAX_OPERANDS];
252b5132 326
520dc8e8
AM
327 /* Displacement expression, immediate expression, or register for each
328 operand. */
329 union i386_op op[MAX_OPERANDS];
252b5132 330
3e73aa7c
JH
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333#define Operand_PCrel 1
c48dadc9 334#define Operand_Mem 2
3e73aa7c 335
252b5132 336 /* Relocation type for operand */
f86103b7 337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
252b5132 338
252b5132
RH
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
344
345 /* SEG gives the seg_entries of this insn. They are zero unless
47926f60 346 explicit segment overrides are given. */
ce8a8b2f 347 const seg_entry *seg[2];
252b5132 348
8325cc63
JB
349 /* Copied first memory operand string, for re-checking. */
350 char *memop1_string;
351
252b5132
RH
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
356
50128d0c
JB
357 /* Register is in low 3 bits of opcode. */
358 bfd_boolean short_form;
359
6f2f06be
JB
360 /* The operand to a branch insn indicates an absolute branch. */
361 bfd_boolean jumpabsolute;
362
b4a3a7b4
L
363 /* Has MMX register operands. */
364 bfd_boolean has_regmmx;
365
366 /* Has XMM register operands. */
367 bfd_boolean has_regxmm;
368
369 /* Has YMM register operands. */
370 bfd_boolean has_regymm;
371
372 /* Has ZMM register operands. */
373 bfd_boolean has_regzmm;
374
e379e5f3
L
375 /* Has GOTPC or TLS relocation. */
376 bfd_boolean has_gotpc_tls_reloc;
377
252b5132 378 /* RM and SIB are the modrm byte and the sib byte where the
c1e679ec 379 addressing modes of this insn are encoded. */
252b5132 380 modrm_byte rm;
3e73aa7c 381 rex_byte rex;
43234a1e 382 rex_byte vrex;
252b5132 383 sib_byte sib;
c0f3af97 384 vex_prefix vex;
b6169b20 385
43234a1e
L
386 /* Masking attributes. */
387 struct Mask_Operation *mask;
388
389 /* Rounding control and SAE attributes. */
390 struct RC_Operation *rounding;
391
392 /* Broadcasting attributes. */
393 struct Broadcast_Operation *broadcast;
394
395 /* Compressed disp8*N attribute. */
396 unsigned int memshift;
397
86fa6981
L
398 /* Prefer load or store in encoding. */
399 enum
400 {
401 dir_encoding_default = 0,
402 dir_encoding_load,
64c49ab3
JB
403 dir_encoding_store,
404 dir_encoding_swap
86fa6981 405 } dir_encoding;
891edac4 406
a501d77e
L
407 /* Prefer 8bit or 32bit displacement in encoding. */
408 enum
409 {
410 disp_encoding_default = 0,
411 disp_encoding_8bit,
412 disp_encoding_32bit
413 } disp_encoding;
f8a5c266 414
6b6b6807
L
415 /* Prefer the REX byte in encoding. */
416 bfd_boolean rex_encoding;
417
b6f8c7c4
L
418 /* Disable instruction size optimization. */
419 bfd_boolean no_optimize;
420
86fa6981
L
421 /* How to encode vector instructions. */
422 enum
423 {
424 vex_encoding_default = 0,
42e04b36 425 vex_encoding_vex,
86fa6981 426 vex_encoding_vex3,
da4977e0
JB
427 vex_encoding_evex,
428 vex_encoding_error
86fa6981
L
429 } vec_encoding;
430
d5de92cf
L
431 /* REP prefix. */
432 const char *rep_prefix;
433
165de32a
L
434 /* HLE prefix. */
435 const char *hle_prefix;
42164a71 436
7e8b059b
L
437 /* Have BND prefix. */
438 const char *bnd_prefix;
439
04ef582a
L
440 /* Have NOTRACK prefix. */
441 const char *notrack_prefix;
442
891edac4 443 /* Error message. */
a65babc9 444 enum i386_error error;
252b5132
RH
445 };
446
447typedef struct _i386_insn i386_insn;
448
43234a1e
L
449/* Link RC type with corresponding string, that'll be looked for in
450 asm. */
451struct RC_name
452{
453 enum rc_type type;
454 const char *name;
455 unsigned int len;
456};
457
458static const struct RC_name RC_NamesTable[] =
459{
460 { rne, STRING_COMMA_LEN ("rn-sae") },
461 { rd, STRING_COMMA_LEN ("rd-sae") },
462 { ru, STRING_COMMA_LEN ("ru-sae") },
463 { rz, STRING_COMMA_LEN ("rz-sae") },
464 { saeonly, STRING_COMMA_LEN ("sae") },
465};
466
252b5132
RH
467/* List of chars besides those in app.c:symbol_chars that can start an
468 operand. Used to prevent the scrubber eating vital white-space. */
86fa6981 469const char extra_symbol_chars[] = "*%-([{}"
252b5132 470#ifdef LEX_AT
32137342
NC
471 "@"
472#endif
473#ifdef LEX_QM
474 "?"
252b5132 475#endif
32137342 476 ;
252b5132 477
29b0f896
AM
478#if (defined (TE_I386AIX) \
479 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
3896cfd5 480 && !defined (TE_GNU) \
29b0f896 481 && !defined (TE_LINUX) \
8d63c93e 482 && !defined (TE_NACL) \
29b0f896 483 && !defined (TE_FreeBSD) \
5b806d27 484 && !defined (TE_DragonFly) \
29b0f896 485 && !defined (TE_NetBSD)))
252b5132 486/* This array holds the chars that always start a comment. If the
b3b91714
AM
487 pre-processor is disabled, these aren't very useful. The option
488 --divide will remove '/' from this list. */
489const char *i386_comment_chars = "#/";
490#define SVR4_COMMENT_CHARS 1
252b5132 491#define PREFIX_SEPARATOR '\\'
252b5132 492
b3b91714
AM
493#else
494const char *i386_comment_chars = "#";
495#define PREFIX_SEPARATOR '/'
496#endif
497
252b5132
RH
498/* This array holds the chars that only start a comment at the beginning of
499 a line. If the line seems to have the form '# 123 filename'
ce8a8b2f
AM
500 .line and .file directives will appear in the pre-processed output.
501 Note that input_file.c hand checks for '#' at the beginning of the
252b5132 502 first line of the input file. This is because the compiler outputs
ce8a8b2f
AM
503 #NO_APP at the beginning of its output.
504 Also note that comments started like this one will always work if
252b5132 505 '/' isn't otherwise defined. */
b3b91714 506const char line_comment_chars[] = "#/";
252b5132 507
63a0b638 508const char line_separator_chars[] = ";";
252b5132 509
ce8a8b2f
AM
510/* Chars that can be used to separate mant from exp in floating point
511 nums. */
252b5132
RH
512const char EXP_CHARS[] = "eE";
513
ce8a8b2f
AM
514/* Chars that mean this number is a floating point constant
515 As in 0f12.456
516 or 0d1.2345e12. */
252b5132
RH
517const char FLT_CHARS[] = "fFdDxX";
518
ce8a8b2f 519/* Tables for lexical analysis. */
252b5132
RH
520static char mnemonic_chars[256];
521static char register_chars[256];
522static char operand_chars[256];
523static char identifier_chars[256];
524static char digit_chars[256];
525
ce8a8b2f 526/* Lexical macros. */
252b5132
RH
527#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
528#define is_operand_char(x) (operand_chars[(unsigned char) x])
529#define is_register_char(x) (register_chars[(unsigned char) x])
530#define is_space_char(x) ((x) == ' ')
531#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
532#define is_digit_char(x) (digit_chars[(unsigned char) x])
533
0234cb7c 534/* All non-digit non-letter characters that may occur in an operand. */
252b5132
RH
535static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
536
537/* md_assemble() always leaves the strings it's passed unaltered. To
538 effect this we maintain a stack of saved characters that we've smashed
539 with '\0's (indicating end of strings for various sub-fields of the
47926f60 540 assembler instruction). */
252b5132 541static char save_stack[32];
ce8a8b2f 542static char *save_stack_p;
252b5132
RH
543#define END_STRING_AND_SAVE(s) \
544 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
545#define RESTORE_END_STRING(s) \
546 do { *(s) = *--save_stack_p; } while (0)
547
47926f60 548/* The instruction we're assembling. */
252b5132
RH
549static i386_insn i;
550
551/* Possible templates for current insn. */
552static const templates *current_templates;
553
31b2323c
L
554/* Per instruction expressionS buffers: max displacements & immediates. */
555static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
556static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
252b5132 557
47926f60 558/* Current operand we are working on. */
ee86248c 559static int this_operand = -1;
252b5132 560
3e73aa7c
JH
561/* We support four different modes. FLAG_CODE variable is used to distinguish
562 these. */
563
564enum flag_code {
565 CODE_32BIT,
566 CODE_16BIT,
567 CODE_64BIT };
568
569static enum flag_code flag_code;
4fa24527 570static unsigned int object_64bit;
862be3fb 571static unsigned int disallow_64bit_reloc;
3e73aa7c 572static int use_rela_relocations = 0;
e379e5f3
L
573/* __tls_get_addr/___tls_get_addr symbol for TLS. */
574static const char *tls_get_addr;
3e73aa7c 575
7af8ed2d
NC
576#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
577 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
578 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
579
351f65ca
L
580/* The ELF ABI to use. */
581enum x86_elf_abi
582{
583 I386_ABI,
7f56bc95
L
584 X86_64_ABI,
585 X86_64_X32_ABI
351f65ca
L
586};
587
588static enum x86_elf_abi x86_elf_abi = I386_ABI;
7af8ed2d 589#endif
351f65ca 590
167ad85b
TG
591#if defined (TE_PE) || defined (TE_PEP)
592/* Use big object file format. */
593static int use_big_obj = 0;
594#endif
595
8dcea932
L
596#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
597/* 1 if generating code for a shared library. */
598static int shared = 0;
599#endif
600
47926f60
KH
601/* 1 for intel syntax,
602 0 if att syntax. */
603static int intel_syntax = 0;
252b5132 604
4b5aaf5f
L
605static enum x86_64_isa
606{
607 amd64 = 1, /* AMD64 ISA. */
608 intel64 /* Intel64 ISA. */
609} isa64;
e89c5eaa 610
1efbbeb4
L
611/* 1 for intel mnemonic,
612 0 if att mnemonic. */
613static int intel_mnemonic = !SYSV386_COMPAT;
614
a60de03c
JB
615/* 1 if pseudo registers are permitted. */
616static int allow_pseudo_reg = 0;
617
47926f60
KH
618/* 1 if register prefix % not required. */
619static int allow_naked_reg = 0;
252b5132 620
33eaf5de 621/* 1 if the assembler should add BND prefix for all control-transferring
7e8b059b
L
622 instructions supporting it, even if this prefix wasn't specified
623 explicitly. */
624static int add_bnd_prefix = 0;
625
ba104c83 626/* 1 if pseudo index register, eiz/riz, is allowed . */
db51cc60
L
627static int allow_index_reg = 0;
628
d022bddd
IT
629/* 1 if the assembler should ignore LOCK prefix, even if it was
630 specified explicitly. */
631static int omit_lock_prefix = 0;
632
e4e00185
AS
633/* 1 if the assembler should encode lfence, mfence, and sfence as
634 "lock addl $0, (%{re}sp)". */
635static int avoid_fence = 0;
636
ae531041
L
637/* 1 if lfence should be inserted after every load. */
638static int lfence_after_load = 0;
639
640/* Non-zero if lfence should be inserted before indirect branch. */
641static enum lfence_before_indirect_branch_kind
642 {
643 lfence_branch_none = 0,
644 lfence_branch_register,
645 lfence_branch_memory,
646 lfence_branch_all
647 }
648lfence_before_indirect_branch;
649
650/* Non-zero if lfence should be inserted before ret. */
651static enum lfence_before_ret_kind
652 {
653 lfence_before_ret_none = 0,
654 lfence_before_ret_not,
a09f656b 655 lfence_before_ret_or,
656 lfence_before_ret_shl
ae531041
L
657 }
658lfence_before_ret;
659
660/* Types of previous instruction is .byte or prefix. */
e379e5f3
L
661static struct
662 {
663 segT seg;
664 const char *file;
665 const char *name;
666 unsigned int line;
667 enum last_insn_kind
668 {
669 last_insn_other = 0,
670 last_insn_directive,
671 last_insn_prefix
672 } kind;
673 } last_insn;
674
0cb4071e
L
675/* 1 if the assembler should generate relax relocations. */
676
677static int generate_relax_relocations
678 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
679
7bab8ab5 680static enum check_kind
daf50ae7 681 {
7bab8ab5
JB
682 check_none = 0,
683 check_warning,
684 check_error
daf50ae7 685 }
7bab8ab5 686sse_check, operand_check = check_warning;
daf50ae7 687
e379e5f3
L
688/* Non-zero if branches should be aligned within power of 2 boundary. */
689static int align_branch_power = 0;
690
691/* Types of branches to align. */
692enum align_branch_kind
693 {
694 align_branch_none = 0,
695 align_branch_jcc = 1,
696 align_branch_fused = 2,
697 align_branch_jmp = 3,
698 align_branch_call = 4,
699 align_branch_indirect = 5,
700 align_branch_ret = 6
701 };
702
703/* Type bits of branches to align. */
704enum align_branch_bit
705 {
706 align_branch_jcc_bit = 1 << align_branch_jcc,
707 align_branch_fused_bit = 1 << align_branch_fused,
708 align_branch_jmp_bit = 1 << align_branch_jmp,
709 align_branch_call_bit = 1 << align_branch_call,
710 align_branch_indirect_bit = 1 << align_branch_indirect,
711 align_branch_ret_bit = 1 << align_branch_ret
712 };
713
714static unsigned int align_branch = (align_branch_jcc_bit
715 | align_branch_fused_bit
716 | align_branch_jmp_bit);
717
79d72f45
HL
718/* Types of condition jump used by macro-fusion. */
719enum mf_jcc_kind
720 {
721 mf_jcc_jo = 0, /* base opcode 0x70 */
722 mf_jcc_jc, /* base opcode 0x72 */
723 mf_jcc_je, /* base opcode 0x74 */
724 mf_jcc_jna, /* base opcode 0x76 */
725 mf_jcc_js, /* base opcode 0x78 */
726 mf_jcc_jp, /* base opcode 0x7a */
727 mf_jcc_jl, /* base opcode 0x7c */
728 mf_jcc_jle, /* base opcode 0x7e */
729 };
730
731/* Types of compare flag-modifying insntructions used by macro-fusion. */
732enum mf_cmp_kind
733 {
734 mf_cmp_test_and, /* test/cmp */
735 mf_cmp_alu_cmp, /* add/sub/cmp */
736 mf_cmp_incdec /* inc/dec */
737 };
738
e379e5f3
L
739/* The maximum padding size for fused jcc. CMP like instruction can
740 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
741 prefixes. */
742#define MAX_FUSED_JCC_PADDING_SIZE 20
743
744/* The maximum number of prefixes added for an instruction. */
745static unsigned int align_branch_prefix_size = 5;
746
b6f8c7c4
L
747/* Optimization:
748 1. Clear the REX_W bit with register operand if possible.
749 2. Above plus use 128bit vector instruction to clear the full vector
750 register.
751 */
752static int optimize = 0;
753
754/* Optimization:
755 1. Clear the REX_W bit with register operand if possible.
756 2. Above plus use 128bit vector instruction to clear the full vector
757 register.
758 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
759 "testb $imm7,%r8".
760 */
761static int optimize_for_space = 0;
762
2ca3ace5
L
763/* Register prefix used for error message. */
764static const char *register_prefix = "%";
765
47926f60
KH
766/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
767 leave, push, and pop instructions so that gcc has the same stack
768 frame as in 32 bit mode. */
769static char stackop_size = '\0';
eecb386c 770
12b55ccc
L
771/* Non-zero to optimize code alignment. */
772int optimize_align_code = 1;
773
47926f60
KH
774/* Non-zero to quieten some warnings. */
775static int quiet_warnings = 0;
a38cf1db 776
47926f60
KH
777/* CPU name. */
778static const char *cpu_arch_name = NULL;
6305a203 779static char *cpu_sub_arch_name = NULL;
a38cf1db 780
47926f60 781/* CPU feature flags. */
40fb9820
L
782static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
783
ccc9c027
L
784/* If we have selected a cpu we are generating instructions for. */
785static int cpu_arch_tune_set = 0;
786
9103f4f4 787/* Cpu we are generating instructions for. */
fbf3f584 788enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
9103f4f4
L
789
790/* CPU feature flags of cpu we are generating instructions for. */
40fb9820 791static i386_cpu_flags cpu_arch_tune_flags;
9103f4f4 792
ccc9c027 793/* CPU instruction set architecture used. */
fbf3f584 794enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
ccc9c027 795
9103f4f4 796/* CPU feature flags of instruction set architecture used. */
fbf3f584 797i386_cpu_flags cpu_arch_isa_flags;
9103f4f4 798
fddf5b5b
AM
799/* If set, conditional jumps are not automatically promoted to handle
800 larger than a byte offset. */
801static unsigned int no_cond_jump_promotion = 0;
802
c0f3af97
L
803/* Encode SSE instructions with VEX prefix. */
804static unsigned int sse2avx;
805
539f890d
L
806/* Encode scalar AVX instructions with specific vector length. */
807static enum
808 {
809 vex128 = 0,
810 vex256
811 } avxscalar;
812
03751133
L
813/* Encode VEX WIG instructions with specific vex.w. */
814static enum
815 {
816 vexw0 = 0,
817 vexw1
818 } vexwig;
819
43234a1e
L
820/* Encode scalar EVEX LIG instructions with specific vector length. */
821static enum
822 {
823 evexl128 = 0,
824 evexl256,
825 evexl512
826 } evexlig;
827
828/* Encode EVEX WIG instructions with specific evex.w. */
829static enum
830 {
831 evexw0 = 0,
832 evexw1
833 } evexwig;
834
d3d3c6db
IT
835/* Value to encode in EVEX RC bits, for SAE-only instructions. */
836static enum rc_type evexrcig = rne;
837
29b0f896 838/* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
87c245cc 839static symbolS *GOT_symbol;
29b0f896 840
a4447b93
RH
841/* The dwarf2 return column, adjusted for 32 or 64 bit. */
842unsigned int x86_dwarf2_return_column;
843
844/* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
845int x86_cie_data_alignment;
846
252b5132 847/* Interface to relax_segment.
fddf5b5b
AM
848 There are 3 major relax states for 386 jump insns because the
849 different types of jumps add different sizes to frags when we're
e379e5f3
L
850 figuring out what sort of jump to choose to reach a given label.
851
852 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
853 branches which are handled by md_estimate_size_before_relax() and
854 i386_generic_table_relax_frag(). */
252b5132 855
47926f60 856/* Types. */
93c2a809
AM
857#define UNCOND_JUMP 0
858#define COND_JUMP 1
859#define COND_JUMP86 2
e379e5f3
L
860#define BRANCH_PADDING 3
861#define BRANCH_PREFIX 4
862#define FUSED_JCC_PADDING 5
fddf5b5b 863
47926f60 864/* Sizes. */
252b5132
RH
865#define CODE16 1
866#define SMALL 0
29b0f896 867#define SMALL16 (SMALL | CODE16)
252b5132 868#define BIG 2
29b0f896 869#define BIG16 (BIG | CODE16)
252b5132
RH
870
871#ifndef INLINE
872#ifdef __GNUC__
873#define INLINE __inline__
874#else
875#define INLINE
876#endif
877#endif
878
fddf5b5b
AM
879#define ENCODE_RELAX_STATE(type, size) \
880 ((relax_substateT) (((type) << 2) | (size)))
881#define TYPE_FROM_RELAX_STATE(s) \
882 ((s) >> 2)
883#define DISP_SIZE_FROM_RELAX_STATE(s) \
884 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
252b5132
RH
885
886/* This table is used by relax_frag to promote short jumps to long
887 ones where necessary. SMALL (short) jumps may be promoted to BIG
888 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
889 don't allow a short jump in a 32 bit code segment to be promoted to
890 a 16 bit offset jump because it's slower (requires data size
891 prefix), and doesn't work, unless the destination is in the bottom
892 64k of the code segment (The top 16 bits of eip are zeroed). */
893
894const relax_typeS md_relax_table[] =
895{
24eab124
AM
896 /* The fields are:
897 1) most positive reach of this state,
898 2) most negative reach of this state,
93c2a809 899 3) how many bytes this mode will have in the variable part of the frag
ce8a8b2f 900 4) which index into the table to try if we can't fit into this one. */
252b5132 901
fddf5b5b 902 /* UNCOND_JUMP states. */
93c2a809
AM
903 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
904 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
905 /* dword jmp adds 4 bytes to frag:
906 0 extra opcode bytes, 4 displacement bytes. */
252b5132 907 {0, 0, 4, 0},
93c2a809
AM
908 /* word jmp adds 2 byte2 to frag:
909 0 extra opcode bytes, 2 displacement bytes. */
252b5132
RH
910 {0, 0, 2, 0},
911
93c2a809
AM
912 /* COND_JUMP states. */
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
914 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
915 /* dword conditionals adds 5 bytes to frag:
916 1 extra opcode byte, 4 displacement bytes. */
917 {0, 0, 5, 0},
fddf5b5b 918 /* word conditionals add 3 bytes to frag:
93c2a809
AM
919 1 extra opcode byte, 2 displacement bytes. */
920 {0, 0, 3, 0},
921
922 /* COND_JUMP86 states. */
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
924 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
925 /* dword conditionals adds 5 bytes to frag:
926 1 extra opcode byte, 4 displacement bytes. */
927 {0, 0, 5, 0},
928 /* word conditionals add 4 bytes to frag:
929 1 displacement byte and a 3 byte long branch insn. */
930 {0, 0, 4, 0}
252b5132
RH
931};
932
9103f4f4
L
933static const arch_entry cpu_arch[] =
934{
89507696
JB
935 /* Do not replace the first two entries - i386_target_format()
936 relies on them being there in this order. */
8a2c8fef 937 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
293f5f65 938 CPU_GENERIC32_FLAGS, 0 },
8a2c8fef 939 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
293f5f65 940 CPU_GENERIC64_FLAGS, 0 },
8a2c8fef 941 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
293f5f65 942 CPU_NONE_FLAGS, 0 },
8a2c8fef 943 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
293f5f65 944 CPU_I186_FLAGS, 0 },
8a2c8fef 945 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
293f5f65 946 CPU_I286_FLAGS, 0 },
8a2c8fef 947 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
293f5f65 948 CPU_I386_FLAGS, 0 },
8a2c8fef 949 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
293f5f65 950 CPU_I486_FLAGS, 0 },
8a2c8fef 951 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
293f5f65 952 CPU_I586_FLAGS, 0 },
8a2c8fef 953 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
293f5f65 954 CPU_I686_FLAGS, 0 },
8a2c8fef 955 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
293f5f65 956 CPU_I586_FLAGS, 0 },
8a2c8fef 957 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
293f5f65 958 CPU_PENTIUMPRO_FLAGS, 0 },
8a2c8fef 959 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
293f5f65 960 CPU_P2_FLAGS, 0 },
8a2c8fef 961 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
293f5f65 962 CPU_P3_FLAGS, 0 },
8a2c8fef 963 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
293f5f65 964 CPU_P4_FLAGS, 0 },
8a2c8fef 965 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
293f5f65 966 CPU_CORE_FLAGS, 0 },
8a2c8fef 967 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
293f5f65 968 CPU_NOCONA_FLAGS, 0 },
8a2c8fef 969 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
293f5f65 970 CPU_CORE_FLAGS, 1 },
8a2c8fef 971 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
293f5f65 972 CPU_CORE_FLAGS, 0 },
8a2c8fef 973 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
293f5f65 974 CPU_CORE2_FLAGS, 1 },
8a2c8fef 975 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
293f5f65 976 CPU_CORE2_FLAGS, 0 },
8a2c8fef 977 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
293f5f65 978 CPU_COREI7_FLAGS, 0 },
8a2c8fef 979 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
293f5f65 980 CPU_L1OM_FLAGS, 0 },
7a9068fe 981 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
293f5f65 982 CPU_K1OM_FLAGS, 0 },
81486035 983 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
293f5f65 984 CPU_IAMCU_FLAGS, 0 },
8a2c8fef 985 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
293f5f65 986 CPU_K6_FLAGS, 0 },
8a2c8fef 987 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
293f5f65 988 CPU_K6_2_FLAGS, 0 },
8a2c8fef 989 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
293f5f65 990 CPU_ATHLON_FLAGS, 0 },
8a2c8fef 991 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
293f5f65 992 CPU_K8_FLAGS, 1 },
8a2c8fef 993 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
293f5f65 994 CPU_K8_FLAGS, 0 },
8a2c8fef 995 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
293f5f65 996 CPU_K8_FLAGS, 0 },
8a2c8fef 997 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
293f5f65 998 CPU_AMDFAM10_FLAGS, 0 },
8aedb9fe 999 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
293f5f65 1000 CPU_BDVER1_FLAGS, 0 },
8aedb9fe 1001 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
293f5f65 1002 CPU_BDVER2_FLAGS, 0 },
5e5c50d3 1003 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
293f5f65 1004 CPU_BDVER3_FLAGS, 0 },
c7b0bd56 1005 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
293f5f65 1006 CPU_BDVER4_FLAGS, 0 },
029f3522 1007 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
293f5f65 1008 CPU_ZNVER1_FLAGS, 0 },
a9660a6f
AP
1009 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1010 CPU_ZNVER2_FLAGS, 0 },
7b458c12 1011 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
293f5f65 1012 CPU_BTVER1_FLAGS, 0 },
7b458c12 1013 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
293f5f65 1014 CPU_BTVER2_FLAGS, 0 },
8a2c8fef 1015 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
293f5f65 1016 CPU_8087_FLAGS, 0 },
8a2c8fef 1017 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
293f5f65 1018 CPU_287_FLAGS, 0 },
8a2c8fef 1019 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
293f5f65 1020 CPU_387_FLAGS, 0 },
1848e567
L
1021 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1022 CPU_687_FLAGS, 0 },
d871f3f4
L
1023 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1024 CPU_CMOV_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1026 CPU_FXSR_FLAGS, 0 },
8a2c8fef 1027 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
293f5f65 1028 CPU_MMX_FLAGS, 0 },
8a2c8fef 1029 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
293f5f65 1030 CPU_SSE_FLAGS, 0 },
8a2c8fef 1031 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
293f5f65 1032 CPU_SSE2_FLAGS, 0 },
8a2c8fef 1033 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
293f5f65 1034 CPU_SSE3_FLAGS, 0 },
af5c13b0
L
1035 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1036 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1037 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
293f5f65 1038 CPU_SSSE3_FLAGS, 0 },
8a2c8fef 1039 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
293f5f65 1040 CPU_SSE4_1_FLAGS, 0 },
8a2c8fef 1041 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
293f5f65 1042 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1043 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
293f5f65 1044 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1045 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
293f5f65 1046 CPU_AVX_FLAGS, 0 },
6c30d220 1047 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
293f5f65 1048 CPU_AVX2_FLAGS, 0 },
43234a1e 1049 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
293f5f65 1050 CPU_AVX512F_FLAGS, 0 },
43234a1e 1051 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
293f5f65 1052 CPU_AVX512CD_FLAGS, 0 },
43234a1e 1053 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
293f5f65 1054 CPU_AVX512ER_FLAGS, 0 },
43234a1e 1055 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
293f5f65 1056 CPU_AVX512PF_FLAGS, 0 },
1dfc6506 1057 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
293f5f65 1058 CPU_AVX512DQ_FLAGS, 0 },
1dfc6506 1059 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
293f5f65 1060 CPU_AVX512BW_FLAGS, 0 },
1dfc6506 1061 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
293f5f65 1062 CPU_AVX512VL_FLAGS, 0 },
8a2c8fef 1063 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
293f5f65 1064 CPU_VMX_FLAGS, 0 },
8729a6f6 1065 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
293f5f65 1066 CPU_VMFUNC_FLAGS, 0 },
8a2c8fef 1067 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
293f5f65 1068 CPU_SMX_FLAGS, 0 },
8a2c8fef 1069 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
293f5f65 1070 CPU_XSAVE_FLAGS, 0 },
c7b8aa3a 1071 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
293f5f65 1072 CPU_XSAVEOPT_FLAGS, 0 },
1dfc6506 1073 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
293f5f65 1074 CPU_XSAVEC_FLAGS, 0 },
1dfc6506 1075 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
293f5f65 1076 CPU_XSAVES_FLAGS, 0 },
8a2c8fef 1077 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
293f5f65 1078 CPU_AES_FLAGS, 0 },
8a2c8fef 1079 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
293f5f65 1080 CPU_PCLMUL_FLAGS, 0 },
8a2c8fef 1081 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
293f5f65 1082 CPU_PCLMUL_FLAGS, 1 },
c7b8aa3a 1083 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
293f5f65 1084 CPU_FSGSBASE_FLAGS, 0 },
c7b8aa3a 1085 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
293f5f65 1086 CPU_RDRND_FLAGS, 0 },
c7b8aa3a 1087 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
293f5f65 1088 CPU_F16C_FLAGS, 0 },
6c30d220 1089 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
293f5f65 1090 CPU_BMI2_FLAGS, 0 },
8a2c8fef 1091 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
293f5f65 1092 CPU_FMA_FLAGS, 0 },
8a2c8fef 1093 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
293f5f65 1094 CPU_FMA4_FLAGS, 0 },
8a2c8fef 1095 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
293f5f65 1096 CPU_XOP_FLAGS, 0 },
8a2c8fef 1097 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
293f5f65 1098 CPU_LWP_FLAGS, 0 },
8a2c8fef 1099 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
293f5f65 1100 CPU_MOVBE_FLAGS, 0 },
60aa667e 1101 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
293f5f65 1102 CPU_CX16_FLAGS, 0 },
8a2c8fef 1103 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
293f5f65 1104 CPU_EPT_FLAGS, 0 },
6c30d220 1105 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
293f5f65 1106 CPU_LZCNT_FLAGS, 0 },
272a84b1
L
1107 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1108 CPU_POPCNT_FLAGS, 0 },
42164a71 1109 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
293f5f65 1110 CPU_HLE_FLAGS, 0 },
42164a71 1111 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
293f5f65 1112 CPU_RTM_FLAGS, 0 },
6c30d220 1113 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
293f5f65 1114 CPU_INVPCID_FLAGS, 0 },
8a2c8fef 1115 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
293f5f65 1116 CPU_CLFLUSH_FLAGS, 0 },
22109423 1117 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
293f5f65 1118 CPU_NOP_FLAGS, 0 },
8a2c8fef 1119 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
293f5f65 1120 CPU_SYSCALL_FLAGS, 0 },
8a2c8fef 1121 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
293f5f65 1122 CPU_RDTSCP_FLAGS, 0 },
8a2c8fef 1123 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
293f5f65 1124 CPU_3DNOW_FLAGS, 0 },
8a2c8fef 1125 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
293f5f65 1126 CPU_3DNOWA_FLAGS, 0 },
8a2c8fef 1127 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
293f5f65 1128 CPU_PADLOCK_FLAGS, 0 },
8a2c8fef 1129 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
293f5f65 1130 CPU_SVME_FLAGS, 1 },
8a2c8fef 1131 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
293f5f65 1132 CPU_SVME_FLAGS, 0 },
8a2c8fef 1133 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
293f5f65 1134 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1135 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
293f5f65 1136 CPU_ABM_FLAGS, 0 },
87973e9f 1137 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
293f5f65 1138 CPU_BMI_FLAGS, 0 },
2a2a0f38 1139 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
293f5f65 1140 CPU_TBM_FLAGS, 0 },
e2e1fcde 1141 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
293f5f65 1142 CPU_ADX_FLAGS, 0 },
e2e1fcde 1143 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
293f5f65 1144 CPU_RDSEED_FLAGS, 0 },
e2e1fcde 1145 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
293f5f65 1146 CPU_PRFCHW_FLAGS, 0 },
5c111e37 1147 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
293f5f65 1148 CPU_SMAP_FLAGS, 0 },
7e8b059b 1149 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
293f5f65 1150 CPU_MPX_FLAGS, 0 },
a0046408 1151 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
293f5f65 1152 CPU_SHA_FLAGS, 0 },
963f3586 1153 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
293f5f65 1154 CPU_CLFLUSHOPT_FLAGS, 0 },
dcf893b5 1155 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
293f5f65 1156 CPU_PREFETCHWT1_FLAGS, 0 },
2cf200a4 1157 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
293f5f65 1158 CPU_SE1_FLAGS, 0 },
c5e7287a 1159 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
293f5f65 1160 CPU_CLWB_FLAGS, 0 },
2cc1b5aa 1161 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
293f5f65 1162 CPU_AVX512IFMA_FLAGS, 0 },
14f195c9 1163 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
293f5f65 1164 CPU_AVX512VBMI_FLAGS, 0 },
920d2ddc
IT
1165 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512_4FMAPS_FLAGS, 0 },
47acf0bd
IT
1167 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512_4VNNIW_FLAGS, 0 },
620214f7
IT
1169 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
53467f57
IT
1171 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_VBMI2_FLAGS, 0 },
8cfcb765
IT
1173 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VNNI_FLAGS, 0 },
ee6872be
IT
1175 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_BITALG_FLAGS, 0 },
029f3522 1177 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
293f5f65 1178 CPU_CLZERO_FLAGS, 0 },
9916071f 1179 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
293f5f65 1180 CPU_MWAITX_FLAGS, 0 },
8eab4136 1181 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
293f5f65 1182 CPU_OSPKE_FLAGS, 0 },
8bc52696 1183 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
293f5f65 1184 CPU_RDPID_FLAGS, 0 },
6b40c462
L
1185 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1186 CPU_PTWRITE_FLAGS, 0 },
d777820b
IT
1187 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1188 CPU_IBT_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1190 CPU_SHSTK_FLAGS, 0 },
48521003
IT
1191 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1192 CPU_GFNI_FLAGS, 0 },
8dcf1fad
IT
1193 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1194 CPU_VAES_FLAGS, 0 },
ff1982d5
IT
1195 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1196 CPU_VPCLMULQDQ_FLAGS, 0 },
3233d7d0
IT
1197 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1198 CPU_WBNOINVD_FLAGS, 0 },
be3a8dca
IT
1199 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1200 CPU_PCONFIG_FLAGS, 0 },
de89d0a3
IT
1201 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1202 CPU_WAITPKG_FLAGS, 0 },
c48935d7
IT
1203 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1204 CPU_CLDEMOTE_FLAGS, 0 },
c0a30a9f
L
1205 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1206 CPU_MOVDIRI_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1208 CPU_MOVDIR64B_FLAGS, 0 },
d6aab7a1
XG
1209 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1210 CPU_AVX512_BF16_FLAGS, 0 },
9186c494
L
1211 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1212 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
dd455cf5
L
1213 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1214 CPU_ENQCMD_FLAGS, 0 },
4b27d27c
L
1215 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1216 CPU_SERIALIZE_FLAGS, 0 },
142861df
JB
1217 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1218 CPU_RDPRU_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1220 CPU_MCOMMIT_FLAGS, 0 },
a847e322
JB
1221 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1222 CPU_SEV_ES_FLAGS, 0 },
bb651e8b
CL
1223 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1224 CPU_TSXLDTRK_FLAGS, 0 },
293f5f65
L
1225};
1226
1227static const noarch_entry cpu_noarch[] =
1228{
1229 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1848e567
L
1230 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1231 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1232 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
d871f3f4
L
1233 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1234 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
293f5f65
L
1235 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1236 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1848e567
L
1237 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1238 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
af5c13b0 1239 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1848e567
L
1240 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1241 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1242 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
af5c13b0 1243 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
293f5f65 1244 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1848e567 1245 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
144b71e2
L
1246 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1247 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1248 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1249 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1250 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1251 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1252 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1253 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1254 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
920d2ddc 1255 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
47acf0bd 1256 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
620214f7 1257 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
53467f57 1258 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
8cfcb765 1259 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
ee6872be 1260 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
d777820b
IT
1261 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1262 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
c0a30a9f
L
1263 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1264 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
d6aab7a1 1265 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
708a2fff
CL
1266 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1267 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
dd455cf5 1268 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
4b27d27c 1269 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
bb651e8b 1270 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
e413e4e9
AM
1271};
1272
704209c0 1273#ifdef I386COFF
a6c24e68
NC
1274/* Like s_lcomm_internal in gas/read.c but the alignment string
1275 is allowed to be optional. */
1276
1277static symbolS *
1278pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1279{
1280 addressT align = 0;
1281
1282 SKIP_WHITESPACE ();
1283
7ab9ffdd 1284 if (needs_align
a6c24e68
NC
1285 && *input_line_pointer == ',')
1286 {
1287 align = parse_align (needs_align - 1);
7ab9ffdd 1288
a6c24e68
NC
1289 if (align == (addressT) -1)
1290 return NULL;
1291 }
1292 else
1293 {
1294 if (size >= 8)
1295 align = 3;
1296 else if (size >= 4)
1297 align = 2;
1298 else if (size >= 2)
1299 align = 1;
1300 else
1301 align = 0;
1302 }
1303
1304 bss_alloc (symbolP, size, align);
1305 return symbolP;
1306}
1307
704209c0 1308static void
a6c24e68
NC
1309pe_lcomm (int needs_align)
1310{
1311 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1312}
704209c0 1313#endif
a6c24e68 1314
29b0f896
AM
1315const pseudo_typeS md_pseudo_table[] =
1316{
1317#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1318 {"align", s_align_bytes, 0},
1319#else
1320 {"align", s_align_ptwo, 0},
1321#endif
1322 {"arch", set_cpu_arch, 0},
1323#ifndef I386COFF
1324 {"bss", s_bss, 0},
a6c24e68
NC
1325#else
1326 {"lcomm", pe_lcomm, 1},
29b0f896
AM
1327#endif
1328 {"ffloat", float_cons, 'f'},
1329 {"dfloat", float_cons, 'd'},
1330 {"tfloat", float_cons, 'x'},
1331 {"value", cons, 2},
d182319b 1332 {"slong", signed_cons, 4},
29b0f896
AM
1333 {"noopt", s_ignore, 0},
1334 {"optim", s_ignore, 0},
1335 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1336 {"code16", set_code_flag, CODE_16BIT},
1337 {"code32", set_code_flag, CODE_32BIT},
da5f19a2 1338#ifdef BFD64
29b0f896 1339 {"code64", set_code_flag, CODE_64BIT},
da5f19a2 1340#endif
29b0f896
AM
1341 {"intel_syntax", set_intel_syntax, 1},
1342 {"att_syntax", set_intel_syntax, 0},
1efbbeb4
L
1343 {"intel_mnemonic", set_intel_mnemonic, 1},
1344 {"att_mnemonic", set_intel_mnemonic, 0},
db51cc60
L
1345 {"allow_index_reg", set_allow_index_reg, 1},
1346 {"disallow_index_reg", set_allow_index_reg, 0},
7bab8ab5
JB
1347 {"sse_check", set_check, 0},
1348 {"operand_check", set_check, 1},
3b22753a
L
1349#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1350 {"largecomm", handle_large_common, 0},
07a53e5c 1351#else
68d20676 1352 {"file", dwarf2_directive_file, 0},
07a53e5c
RH
1353 {"loc", dwarf2_directive_loc, 0},
1354 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
3b22753a 1355#endif
6482c264
NC
1356#ifdef TE_PE
1357 {"secrel32", pe_directive_secrel, 0},
1358#endif
29b0f896
AM
1359 {0, 0, 0}
1360};
1361
1362/* For interface with expression (). */
1363extern char *input_line_pointer;
1364
1365/* Hash table for instruction mnemonic lookup. */
1366static struct hash_control *op_hash;
1367
1368/* Hash table for register lookup. */
1369static struct hash_control *reg_hash;
1370\f
ce8a8b2f
AM
1371 /* Various efficient no-op patterns for aligning code labels.
1372 Note: Don't try to assemble the instructions in the comments.
1373 0L and 0w are not legal. */
62a02d25
L
1374static const unsigned char f32_1[] =
1375 {0x90}; /* nop */
1376static const unsigned char f32_2[] =
1377 {0x66,0x90}; /* xchg %ax,%ax */
1378static const unsigned char f32_3[] =
1379 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1380static const unsigned char f32_4[] =
1381 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
62a02d25
L
1382static const unsigned char f32_6[] =
1383 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1384static const unsigned char f32_7[] =
1385 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
62a02d25 1386static const unsigned char f16_3[] =
3ae729d5 1387 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
62a02d25 1388static const unsigned char f16_4[] =
3ae729d5
L
1389 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1390static const unsigned char jump_disp8[] =
1391 {0xeb}; /* jmp disp8 */
1392static const unsigned char jump32_disp32[] =
1393 {0xe9}; /* jmp disp32 */
1394static const unsigned char jump16_disp32[] =
1395 {0x66,0xe9}; /* jmp disp32 */
62a02d25
L
1396/* 32-bit NOPs patterns. */
1397static const unsigned char *const f32_patt[] = {
3ae729d5 1398 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
62a02d25
L
1399};
1400/* 16-bit NOPs patterns. */
1401static const unsigned char *const f16_patt[] = {
3ae729d5 1402 f32_1, f32_2, f16_3, f16_4
62a02d25
L
1403};
1404/* nopl (%[re]ax) */
1405static const unsigned char alt_3[] =
1406 {0x0f,0x1f,0x00};
1407/* nopl 0(%[re]ax) */
1408static const unsigned char alt_4[] =
1409 {0x0f,0x1f,0x40,0x00};
1410/* nopl 0(%[re]ax,%[re]ax,1) */
1411static const unsigned char alt_5[] =
1412 {0x0f,0x1f,0x44,0x00,0x00};
1413/* nopw 0(%[re]ax,%[re]ax,1) */
1414static const unsigned char alt_6[] =
1415 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1416/* nopl 0L(%[re]ax) */
1417static const unsigned char alt_7[] =
1418 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1419/* nopl 0L(%[re]ax,%[re]ax,1) */
1420static const unsigned char alt_8[] =
1421 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1422/* nopw 0L(%[re]ax,%[re]ax,1) */
1423static const unsigned char alt_9[] =
1424 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1425/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1426static const unsigned char alt_10[] =
1427 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
3ae729d5
L
1428/* data16 nopw %cs:0L(%eax,%eax,1) */
1429static const unsigned char alt_11[] =
1430 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
62a02d25
L
1431/* 32-bit and 64-bit NOPs patterns. */
1432static const unsigned char *const alt_patt[] = {
1433 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
3ae729d5 1434 alt_9, alt_10, alt_11
62a02d25
L
1435};
1436
1437/* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1438 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1439
1440static void
1441i386_output_nops (char *where, const unsigned char *const *patt,
1442 int count, int max_single_nop_size)
1443
1444{
3ae729d5
L
1445 /* Place the longer NOP first. */
1446 int last;
1447 int offset;
3076e594
NC
1448 const unsigned char *nops;
1449
1450 if (max_single_nop_size < 1)
1451 {
1452 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1453 max_single_nop_size);
1454 return;
1455 }
1456
1457 nops = patt[max_single_nop_size - 1];
3ae729d5
L
1458
1459 /* Use the smaller one if the requsted one isn't available. */
1460 if (nops == NULL)
62a02d25 1461 {
3ae729d5
L
1462 max_single_nop_size--;
1463 nops = patt[max_single_nop_size - 1];
62a02d25
L
1464 }
1465
3ae729d5
L
1466 last = count % max_single_nop_size;
1467
1468 count -= last;
1469 for (offset = 0; offset < count; offset += max_single_nop_size)
1470 memcpy (where + offset, nops, max_single_nop_size);
1471
1472 if (last)
1473 {
1474 nops = patt[last - 1];
1475 if (nops == NULL)
1476 {
1477 /* Use the smaller one plus one-byte NOP if the needed one
1478 isn't available. */
1479 last--;
1480 nops = patt[last - 1];
1481 memcpy (where + offset, nops, last);
1482 where[offset + last] = *patt[0];
1483 }
1484 else
1485 memcpy (where + offset, nops, last);
1486 }
62a02d25
L
1487}
1488
3ae729d5
L
1489static INLINE int
1490fits_in_imm7 (offsetT num)
1491{
1492 return (num & 0x7f) == num;
1493}
1494
1495static INLINE int
1496fits_in_imm31 (offsetT num)
1497{
1498 return (num & 0x7fffffff) == num;
1499}
62a02d25
L
1500
1501/* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1502 single NOP instruction LIMIT. */
1503
1504void
3ae729d5 1505i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
62a02d25 1506{
3ae729d5 1507 const unsigned char *const *patt = NULL;
62a02d25 1508 int max_single_nop_size;
3ae729d5
L
1509 /* Maximum number of NOPs before switching to jump over NOPs. */
1510 int max_number_of_nops;
62a02d25 1511
3ae729d5 1512 switch (fragP->fr_type)
62a02d25 1513 {
3ae729d5
L
1514 case rs_fill_nop:
1515 case rs_align_code:
1516 break;
e379e5f3
L
1517 case rs_machine_dependent:
1518 /* Allow NOP padding for jumps and calls. */
1519 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1520 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1521 break;
1522 /* Fall through. */
3ae729d5 1523 default:
62a02d25
L
1524 return;
1525 }
1526
ccc9c027
L
1527 /* We need to decide which NOP sequence to use for 32bit and
1528 64bit. When -mtune= is used:
4eed87de 1529
76bc74dc
L
1530 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1531 PROCESSOR_GENERIC32, f32_patt will be used.
80b8656c
L
1532 2. For the rest, alt_patt will be used.
1533
1534 When -mtune= isn't used, alt_patt will be used if
22109423 1535 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
76bc74dc 1536 be used.
ccc9c027
L
1537
1538 When -march= or .arch is used, we can't use anything beyond
1539 cpu_arch_isa_flags. */
1540
1541 if (flag_code == CODE_16BIT)
1542 {
3ae729d5
L
1543 patt = f16_patt;
1544 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1545 /* Limit number of NOPs to 2 in 16-bit mode. */
1546 max_number_of_nops = 2;
252b5132 1547 }
33fef721 1548 else
ccc9c027 1549 {
fbf3f584 1550 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
ccc9c027
L
1551 {
1552 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1553 switch (cpu_arch_tune)
1554 {
1555 case PROCESSOR_UNKNOWN:
1556 /* We use cpu_arch_isa_flags to check if we SHOULD
22109423
L
1557 optimize with nops. */
1558 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1559 patt = alt_patt;
ccc9c027
L
1560 else
1561 patt = f32_patt;
1562 break;
ccc9c027
L
1563 case PROCESSOR_PENTIUM4:
1564 case PROCESSOR_NOCONA:
ef05d495 1565 case PROCESSOR_CORE:
76bc74dc 1566 case PROCESSOR_CORE2:
bd5295b2 1567 case PROCESSOR_COREI7:
3632d14b 1568 case PROCESSOR_L1OM:
7a9068fe 1569 case PROCESSOR_K1OM:
76bc74dc 1570 case PROCESSOR_GENERIC64:
ccc9c027
L
1571 case PROCESSOR_K6:
1572 case PROCESSOR_ATHLON:
1573 case PROCESSOR_K8:
4eed87de 1574 case PROCESSOR_AMDFAM10:
8aedb9fe 1575 case PROCESSOR_BD:
029f3522 1576 case PROCESSOR_ZNVER:
7b458c12 1577 case PROCESSOR_BT:
80b8656c 1578 patt = alt_patt;
ccc9c027 1579 break;
76bc74dc 1580 case PROCESSOR_I386:
ccc9c027
L
1581 case PROCESSOR_I486:
1582 case PROCESSOR_PENTIUM:
2dde1948 1583 case PROCESSOR_PENTIUMPRO:
81486035 1584 case PROCESSOR_IAMCU:
ccc9c027
L
1585 case PROCESSOR_GENERIC32:
1586 patt = f32_patt;
1587 break;
4eed87de 1588 }
ccc9c027
L
1589 }
1590 else
1591 {
fbf3f584 1592 switch (fragP->tc_frag_data.tune)
ccc9c027
L
1593 {
1594 case PROCESSOR_UNKNOWN:
e6a14101 1595 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
ccc9c027
L
1596 PROCESSOR_UNKNOWN. */
1597 abort ();
1598 break;
1599
76bc74dc 1600 case PROCESSOR_I386:
ccc9c027
L
1601 case PROCESSOR_I486:
1602 case PROCESSOR_PENTIUM:
81486035 1603 case PROCESSOR_IAMCU:
ccc9c027
L
1604 case PROCESSOR_K6:
1605 case PROCESSOR_ATHLON:
1606 case PROCESSOR_K8:
4eed87de 1607 case PROCESSOR_AMDFAM10:
8aedb9fe 1608 case PROCESSOR_BD:
029f3522 1609 case PROCESSOR_ZNVER:
7b458c12 1610 case PROCESSOR_BT:
ccc9c027
L
1611 case PROCESSOR_GENERIC32:
1612 /* We use cpu_arch_isa_flags to check if we CAN optimize
22109423
L
1613 with nops. */
1614 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1615 patt = alt_patt;
ccc9c027
L
1616 else
1617 patt = f32_patt;
1618 break;
76bc74dc
L
1619 case PROCESSOR_PENTIUMPRO:
1620 case PROCESSOR_PENTIUM4:
1621 case PROCESSOR_NOCONA:
1622 case PROCESSOR_CORE:
ef05d495 1623 case PROCESSOR_CORE2:
bd5295b2 1624 case PROCESSOR_COREI7:
3632d14b 1625 case PROCESSOR_L1OM:
7a9068fe 1626 case PROCESSOR_K1OM:
22109423 1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1628 patt = alt_patt;
ccc9c027
L
1629 else
1630 patt = f32_patt;
1631 break;
1632 case PROCESSOR_GENERIC64:
80b8656c 1633 patt = alt_patt;
ccc9c027 1634 break;
4eed87de 1635 }
ccc9c027
L
1636 }
1637
76bc74dc
L
1638 if (patt == f32_patt)
1639 {
3ae729d5
L
1640 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1641 /* Limit number of NOPs to 2 for older processors. */
1642 max_number_of_nops = 2;
76bc74dc
L
1643 }
1644 else
1645 {
3ae729d5
L
1646 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1647 /* Limit number of NOPs to 7 for newer processors. */
1648 max_number_of_nops = 7;
1649 }
1650 }
1651
1652 if (limit == 0)
1653 limit = max_single_nop_size;
1654
1655 if (fragP->fr_type == rs_fill_nop)
1656 {
1657 /* Output NOPs for .nop directive. */
1658 if (limit > max_single_nop_size)
1659 {
1660 as_bad_where (fragP->fr_file, fragP->fr_line,
1661 _("invalid single nop size: %d "
1662 "(expect within [0, %d])"),
1663 limit, max_single_nop_size);
1664 return;
1665 }
1666 }
e379e5f3 1667 else if (fragP->fr_type != rs_machine_dependent)
3ae729d5
L
1668 fragP->fr_var = count;
1669
1670 if ((count / max_single_nop_size) > max_number_of_nops)
1671 {
1672 /* Generate jump over NOPs. */
1673 offsetT disp = count - 2;
1674 if (fits_in_imm7 (disp))
1675 {
1676 /* Use "jmp disp8" if possible. */
1677 count = disp;
1678 where[0] = jump_disp8[0];
1679 where[1] = count;
1680 where += 2;
1681 }
1682 else
1683 {
1684 unsigned int size_of_jump;
1685
1686 if (flag_code == CODE_16BIT)
1687 {
1688 where[0] = jump16_disp32[0];
1689 where[1] = jump16_disp32[1];
1690 size_of_jump = 2;
1691 }
1692 else
1693 {
1694 where[0] = jump32_disp32[0];
1695 size_of_jump = 1;
1696 }
1697
1698 count -= size_of_jump + 4;
1699 if (!fits_in_imm31 (count))
1700 {
1701 as_bad_where (fragP->fr_file, fragP->fr_line,
1702 _("jump over nop padding out of range"));
1703 return;
1704 }
1705
1706 md_number_to_chars (where + size_of_jump, count, 4);
1707 where += size_of_jump + 4;
76bc74dc 1708 }
ccc9c027 1709 }
3ae729d5
L
1710
1711 /* Generate multiple NOPs. */
1712 i386_output_nops (where, patt, count, limit);
252b5132
RH
1713}
1714
c6fb90c8 1715static INLINE int
0dfbf9d7 1716operand_type_all_zero (const union i386_operand_type *x)
40fb9820 1717{
0dfbf9d7 1718 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1719 {
1720 case 3:
0dfbf9d7 1721 if (x->array[2])
c6fb90c8 1722 return 0;
1a0670f3 1723 /* Fall through. */
c6fb90c8 1724 case 2:
0dfbf9d7 1725 if (x->array[1])
c6fb90c8 1726 return 0;
1a0670f3 1727 /* Fall through. */
c6fb90c8 1728 case 1:
0dfbf9d7 1729 return !x->array[0];
c6fb90c8
L
1730 default:
1731 abort ();
1732 }
40fb9820
L
1733}
1734
c6fb90c8 1735static INLINE void
0dfbf9d7 1736operand_type_set (union i386_operand_type *x, unsigned int v)
40fb9820 1737{
0dfbf9d7 1738 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1739 {
1740 case 3:
0dfbf9d7 1741 x->array[2] = v;
1a0670f3 1742 /* Fall through. */
c6fb90c8 1743 case 2:
0dfbf9d7 1744 x->array[1] = v;
1a0670f3 1745 /* Fall through. */
c6fb90c8 1746 case 1:
0dfbf9d7 1747 x->array[0] = v;
1a0670f3 1748 /* Fall through. */
c6fb90c8
L
1749 break;
1750 default:
1751 abort ();
1752 }
bab6aec1
JB
1753
1754 x->bitfield.class = ClassNone;
75e5731b 1755 x->bitfield.instance = InstanceNone;
c6fb90c8 1756}
40fb9820 1757
c6fb90c8 1758static INLINE int
0dfbf9d7
L
1759operand_type_equal (const union i386_operand_type *x,
1760 const union i386_operand_type *y)
c6fb90c8 1761{
0dfbf9d7 1762 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1763 {
1764 case 3:
0dfbf9d7 1765 if (x->array[2] != y->array[2])
c6fb90c8 1766 return 0;
1a0670f3 1767 /* Fall through. */
c6fb90c8 1768 case 2:
0dfbf9d7 1769 if (x->array[1] != y->array[1])
c6fb90c8 1770 return 0;
1a0670f3 1771 /* Fall through. */
c6fb90c8 1772 case 1:
0dfbf9d7 1773 return x->array[0] == y->array[0];
c6fb90c8
L
1774 break;
1775 default:
1776 abort ();
1777 }
1778}
40fb9820 1779
0dfbf9d7
L
1780static INLINE int
1781cpu_flags_all_zero (const union i386_cpu_flags *x)
1782{
1783 switch (ARRAY_SIZE(x->array))
1784 {
53467f57
IT
1785 case 4:
1786 if (x->array[3])
1787 return 0;
1788 /* Fall through. */
0dfbf9d7
L
1789 case 3:
1790 if (x->array[2])
1791 return 0;
1a0670f3 1792 /* Fall through. */
0dfbf9d7
L
1793 case 2:
1794 if (x->array[1])
1795 return 0;
1a0670f3 1796 /* Fall through. */
0dfbf9d7
L
1797 case 1:
1798 return !x->array[0];
1799 default:
1800 abort ();
1801 }
1802}
1803
0dfbf9d7
L
1804static INLINE int
1805cpu_flags_equal (const union i386_cpu_flags *x,
1806 const union i386_cpu_flags *y)
1807{
1808 switch (ARRAY_SIZE(x->array))
1809 {
53467f57
IT
1810 case 4:
1811 if (x->array[3] != y->array[3])
1812 return 0;
1813 /* Fall through. */
0dfbf9d7
L
1814 case 3:
1815 if (x->array[2] != y->array[2])
1816 return 0;
1a0670f3 1817 /* Fall through. */
0dfbf9d7
L
1818 case 2:
1819 if (x->array[1] != y->array[1])
1820 return 0;
1a0670f3 1821 /* Fall through. */
0dfbf9d7
L
1822 case 1:
1823 return x->array[0] == y->array[0];
1824 break;
1825 default:
1826 abort ();
1827 }
1828}
c6fb90c8
L
1829
1830static INLINE int
1831cpu_flags_check_cpu64 (i386_cpu_flags f)
1832{
1833 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1834 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
40fb9820
L
1835}
1836
c6fb90c8
L
1837static INLINE i386_cpu_flags
1838cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1839{
c6fb90c8
L
1840 switch (ARRAY_SIZE (x.array))
1841 {
53467f57
IT
1842 case 4:
1843 x.array [3] &= y.array [3];
1844 /* Fall through. */
c6fb90c8
L
1845 case 3:
1846 x.array [2] &= y.array [2];
1a0670f3 1847 /* Fall through. */
c6fb90c8
L
1848 case 2:
1849 x.array [1] &= y.array [1];
1a0670f3 1850 /* Fall through. */
c6fb90c8
L
1851 case 1:
1852 x.array [0] &= y.array [0];
1853 break;
1854 default:
1855 abort ();
1856 }
1857 return x;
1858}
40fb9820 1859
c6fb90c8
L
1860static INLINE i386_cpu_flags
1861cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1862{
c6fb90c8 1863 switch (ARRAY_SIZE (x.array))
40fb9820 1864 {
53467f57
IT
1865 case 4:
1866 x.array [3] |= y.array [3];
1867 /* Fall through. */
c6fb90c8
L
1868 case 3:
1869 x.array [2] |= y.array [2];
1a0670f3 1870 /* Fall through. */
c6fb90c8
L
1871 case 2:
1872 x.array [1] |= y.array [1];
1a0670f3 1873 /* Fall through. */
c6fb90c8
L
1874 case 1:
1875 x.array [0] |= y.array [0];
40fb9820
L
1876 break;
1877 default:
1878 abort ();
1879 }
40fb9820
L
1880 return x;
1881}
1882
309d3373
JB
1883static INLINE i386_cpu_flags
1884cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1885{
1886 switch (ARRAY_SIZE (x.array))
1887 {
53467f57
IT
1888 case 4:
1889 x.array [3] &= ~y.array [3];
1890 /* Fall through. */
309d3373
JB
1891 case 3:
1892 x.array [2] &= ~y.array [2];
1a0670f3 1893 /* Fall through. */
309d3373
JB
1894 case 2:
1895 x.array [1] &= ~y.array [1];
1a0670f3 1896 /* Fall through. */
309d3373
JB
1897 case 1:
1898 x.array [0] &= ~y.array [0];
1899 break;
1900 default:
1901 abort ();
1902 }
1903 return x;
1904}
1905
6c0946d0
JB
1906static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1907
c0f3af97
L
1908#define CPU_FLAGS_ARCH_MATCH 0x1
1909#define CPU_FLAGS_64BIT_MATCH 0x2
1910
c0f3af97 1911#define CPU_FLAGS_PERFECT_MATCH \
db12e14e 1912 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
c0f3af97
L
1913
1914/* Return CPU flags match bits. */
3629bb00 1915
40fb9820 1916static int
d3ce72d0 1917cpu_flags_match (const insn_template *t)
40fb9820 1918{
c0f3af97
L
1919 i386_cpu_flags x = t->cpu_flags;
1920 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
40fb9820
L
1921
1922 x.bitfield.cpu64 = 0;
1923 x.bitfield.cpuno64 = 0;
1924
0dfbf9d7 1925 if (cpu_flags_all_zero (&x))
c0f3af97
L
1926 {
1927 /* This instruction is available on all archs. */
db12e14e 1928 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1929 }
3629bb00
L
1930 else
1931 {
c0f3af97 1932 /* This instruction is available only on some archs. */
3629bb00
L
1933 i386_cpu_flags cpu = cpu_arch_flags;
1934
ab592e75
JB
1935 /* AVX512VL is no standalone feature - match it and then strip it. */
1936 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1937 return match;
1938 x.bitfield.cpuavx512vl = 0;
1939
3629bb00 1940 cpu = cpu_flags_and (x, cpu);
c0f3af97
L
1941 if (!cpu_flags_all_zero (&cpu))
1942 {
a5ff0eb2
L
1943 if (x.bitfield.cpuavx)
1944 {
929f69fa 1945 /* We need to check a few extra flags with AVX. */
b9d49817 1946 if (cpu.bitfield.cpuavx
40d231b4
JB
1947 && (!t->opcode_modifier.sse2avx
1948 || (sse2avx && !i.prefix[DATA_PREFIX]))
b9d49817 1949 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
929f69fa 1950 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
b9d49817
JB
1951 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1952 match |= CPU_FLAGS_ARCH_MATCH;
a5ff0eb2 1953 }
929f69fa
JB
1954 else if (x.bitfield.cpuavx512f)
1955 {
1956 /* We need to check a few extra flags with AVX512F. */
1957 if (cpu.bitfield.cpuavx512f
1958 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1959 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1960 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
a5ff0eb2 1963 else
db12e14e 1964 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1965 }
3629bb00 1966 }
c0f3af97 1967 return match;
40fb9820
L
1968}
1969
c6fb90c8
L
1970static INLINE i386_operand_type
1971operand_type_and (i386_operand_type x, i386_operand_type y)
40fb9820 1972{
bab6aec1
JB
1973 if (x.bitfield.class != y.bitfield.class)
1974 x.bitfield.class = ClassNone;
75e5731b
JB
1975 if (x.bitfield.instance != y.bitfield.instance)
1976 x.bitfield.instance = InstanceNone;
bab6aec1 1977
c6fb90c8
L
1978 switch (ARRAY_SIZE (x.array))
1979 {
1980 case 3:
1981 x.array [2] &= y.array [2];
1a0670f3 1982 /* Fall through. */
c6fb90c8
L
1983 case 2:
1984 x.array [1] &= y.array [1];
1a0670f3 1985 /* Fall through. */
c6fb90c8
L
1986 case 1:
1987 x.array [0] &= y.array [0];
1988 break;
1989 default:
1990 abort ();
1991 }
1992 return x;
40fb9820
L
1993}
1994
73053c1f
JB
1995static INLINE i386_operand_type
1996operand_type_and_not (i386_operand_type x, i386_operand_type y)
1997{
bab6aec1 1998 gas_assert (y.bitfield.class == ClassNone);
75e5731b 1999 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2000
73053c1f
JB
2001 switch (ARRAY_SIZE (x.array))
2002 {
2003 case 3:
2004 x.array [2] &= ~y.array [2];
2005 /* Fall through. */
2006 case 2:
2007 x.array [1] &= ~y.array [1];
2008 /* Fall through. */
2009 case 1:
2010 x.array [0] &= ~y.array [0];
2011 break;
2012 default:
2013 abort ();
2014 }
2015 return x;
2016}
2017
c6fb90c8
L
2018static INLINE i386_operand_type
2019operand_type_or (i386_operand_type x, i386_operand_type y)
40fb9820 2020{
bab6aec1
JB
2021 gas_assert (x.bitfield.class == ClassNone ||
2022 y.bitfield.class == ClassNone ||
2023 x.bitfield.class == y.bitfield.class);
75e5731b
JB
2024 gas_assert (x.bitfield.instance == InstanceNone ||
2025 y.bitfield.instance == InstanceNone ||
2026 x.bitfield.instance == y.bitfield.instance);
bab6aec1 2027
c6fb90c8 2028 switch (ARRAY_SIZE (x.array))
40fb9820 2029 {
c6fb90c8
L
2030 case 3:
2031 x.array [2] |= y.array [2];
1a0670f3 2032 /* Fall through. */
c6fb90c8
L
2033 case 2:
2034 x.array [1] |= y.array [1];
1a0670f3 2035 /* Fall through. */
c6fb90c8
L
2036 case 1:
2037 x.array [0] |= y.array [0];
40fb9820
L
2038 break;
2039 default:
2040 abort ();
2041 }
c6fb90c8
L
2042 return x;
2043}
40fb9820 2044
c6fb90c8
L
2045static INLINE i386_operand_type
2046operand_type_xor (i386_operand_type x, i386_operand_type y)
2047{
bab6aec1 2048 gas_assert (y.bitfield.class == ClassNone);
75e5731b 2049 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2050
c6fb90c8
L
2051 switch (ARRAY_SIZE (x.array))
2052 {
2053 case 3:
2054 x.array [2] ^= y.array [2];
1a0670f3 2055 /* Fall through. */
c6fb90c8
L
2056 case 2:
2057 x.array [1] ^= y.array [1];
1a0670f3 2058 /* Fall through. */
c6fb90c8
L
2059 case 1:
2060 x.array [0] ^= y.array [0];
2061 break;
2062 default:
2063 abort ();
2064 }
40fb9820
L
2065 return x;
2066}
2067
40fb9820
L
2068static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2069static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2070static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2071static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
bab6aec1
JB
2072static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2073static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
40fb9820 2074static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
43234a1e 2075static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
40fb9820
L
2076static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2077static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2078static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2079static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2080static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2081static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2082static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2083static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2084static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2085
2086enum operand_type
2087{
2088 reg,
40fb9820
L
2089 imm,
2090 disp,
2091 anymem
2092};
2093
c6fb90c8 2094static INLINE int
40fb9820
L
2095operand_type_check (i386_operand_type t, enum operand_type c)
2096{
2097 switch (c)
2098 {
2099 case reg:
bab6aec1 2100 return t.bitfield.class == Reg;
40fb9820 2101
40fb9820
L
2102 case imm:
2103 return (t.bitfield.imm8
2104 || t.bitfield.imm8s
2105 || t.bitfield.imm16
2106 || t.bitfield.imm32
2107 || t.bitfield.imm32s
2108 || t.bitfield.imm64);
2109
2110 case disp:
2111 return (t.bitfield.disp8
2112 || t.bitfield.disp16
2113 || t.bitfield.disp32
2114 || t.bitfield.disp32s
2115 || t.bitfield.disp64);
2116
2117 case anymem:
2118 return (t.bitfield.disp8
2119 || t.bitfield.disp16
2120 || t.bitfield.disp32
2121 || t.bitfield.disp32s
2122 || t.bitfield.disp64
2123 || t.bitfield.baseindex);
2124
2125 default:
2126 abort ();
2127 }
2cfe26b6
AM
2128
2129 return 0;
40fb9820
L
2130}
2131
7a54636a
L
2132/* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133 between operand GIVEN and opeand WANTED for instruction template T. */
5c07affc
L
2134
2135static INLINE int
7a54636a
L
2136match_operand_size (const insn_template *t, unsigned int wanted,
2137 unsigned int given)
5c07affc 2138{
3ac21baa
JB
2139 return !((i.types[given].bitfield.byte
2140 && !t->operand_types[wanted].bitfield.byte)
2141 || (i.types[given].bitfield.word
2142 && !t->operand_types[wanted].bitfield.word)
2143 || (i.types[given].bitfield.dword
2144 && !t->operand_types[wanted].bitfield.dword)
2145 || (i.types[given].bitfield.qword
2146 && !t->operand_types[wanted].bitfield.qword)
2147 || (i.types[given].bitfield.tbyte
2148 && !t->operand_types[wanted].bitfield.tbyte));
5c07affc
L
2149}
2150
dd40ce22
L
2151/* Return 1 if there is no conflict in SIMD register between operand
2152 GIVEN and opeand WANTED for instruction template T. */
1b54b8d7
JB
2153
2154static INLINE int
dd40ce22
L
2155match_simd_size (const insn_template *t, unsigned int wanted,
2156 unsigned int given)
1b54b8d7 2157{
3ac21baa
JB
2158 return !((i.types[given].bitfield.xmmword
2159 && !t->operand_types[wanted].bitfield.xmmword)
2160 || (i.types[given].bitfield.ymmword
2161 && !t->operand_types[wanted].bitfield.ymmword)
2162 || (i.types[given].bitfield.zmmword
2163 && !t->operand_types[wanted].bitfield.zmmword));
1b54b8d7
JB
2164}
2165
7a54636a
L
2166/* Return 1 if there is no conflict in any size between operand GIVEN
2167 and opeand WANTED for instruction template T. */
5c07affc
L
2168
2169static INLINE int
dd40ce22
L
2170match_mem_size (const insn_template *t, unsigned int wanted,
2171 unsigned int given)
5c07affc 2172{
7a54636a 2173 return (match_operand_size (t, wanted, given)
3ac21baa 2174 && !((i.types[given].bitfield.unspecified
af508cb9 2175 && !i.broadcast
3ac21baa
JB
2176 && !t->operand_types[wanted].bitfield.unspecified)
2177 || (i.types[given].bitfield.fword
2178 && !t->operand_types[wanted].bitfield.fword)
1b54b8d7
JB
2179 /* For scalar opcode templates to allow register and memory
2180 operands at the same time, some special casing is needed
d6793fa1
JB
2181 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2182 down-conversion vpmov*. */
3528c362 2183 || ((t->operand_types[wanted].bitfield.class == RegSIMD
bc49bfd8
JB
2184 && t->operand_types[wanted].bitfield.byte
2185 + t->operand_types[wanted].bitfield.word
2186 + t->operand_types[wanted].bitfield.dword
2187 + t->operand_types[wanted].bitfield.qword
2188 > !!t->opcode_modifier.broadcast)
3ac21baa
JB
2189 ? (i.types[given].bitfield.xmmword
2190 || i.types[given].bitfield.ymmword
2191 || i.types[given].bitfield.zmmword)
2192 : !match_simd_size(t, wanted, given))));
5c07affc
L
2193}
2194
3ac21baa
JB
2195/* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2196 operands for instruction template T, and it has MATCH_REVERSE set if there
2197 is no size conflict on any operands for the template with operands reversed
2198 (and the template allows for reversing in the first place). */
5c07affc 2199
3ac21baa
JB
2200#define MATCH_STRAIGHT 1
2201#define MATCH_REVERSE 2
2202
2203static INLINE unsigned int
d3ce72d0 2204operand_size_match (const insn_template *t)
5c07affc 2205{
3ac21baa 2206 unsigned int j, match = MATCH_STRAIGHT;
5c07affc 2207
0cfa3eb3 2208 /* Don't check non-absolute jump instructions. */
5c07affc 2209 if (t->opcode_modifier.jump
0cfa3eb3 2210 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5c07affc
L
2211 return match;
2212
2213 /* Check memory and accumulator operand size. */
2214 for (j = 0; j < i.operands; j++)
2215 {
3528c362
JB
2216 if (i.types[j].bitfield.class != Reg
2217 && i.types[j].bitfield.class != RegSIMD
601e8564 2218 && t->opcode_modifier.anysize)
5c07affc
L
2219 continue;
2220
bab6aec1 2221 if (t->operand_types[j].bitfield.class == Reg
7a54636a 2222 && !match_operand_size (t, j, j))
5c07affc
L
2223 {
2224 match = 0;
2225 break;
2226 }
2227
3528c362 2228 if (t->operand_types[j].bitfield.class == RegSIMD
3ac21baa 2229 && !match_simd_size (t, j, j))
1b54b8d7
JB
2230 {
2231 match = 0;
2232 break;
2233 }
2234
75e5731b 2235 if (t->operand_types[j].bitfield.instance == Accum
7a54636a 2236 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
1b54b8d7
JB
2237 {
2238 match = 0;
2239 break;
2240 }
2241
c48dadc9 2242 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
5c07affc
L
2243 {
2244 match = 0;
2245 break;
2246 }
2247 }
2248
3ac21baa 2249 if (!t->opcode_modifier.d)
891edac4 2250 {
dc1e8a47 2251 mismatch:
3ac21baa
JB
2252 if (!match)
2253 i.error = operand_size_mismatch;
2254 return match;
891edac4 2255 }
5c07affc
L
2256
2257 /* Check reverse. */
f5eb1d70 2258 gas_assert (i.operands >= 2 && i.operands <= 3);
5c07affc 2259
f5eb1d70 2260 for (j = 0; j < i.operands; j++)
5c07affc 2261 {
f5eb1d70
JB
2262 unsigned int given = i.operands - j - 1;
2263
bab6aec1 2264 if (t->operand_types[j].bitfield.class == Reg
f5eb1d70 2265 && !match_operand_size (t, j, given))
891edac4 2266 goto mismatch;
5c07affc 2267
3528c362 2268 if (t->operand_types[j].bitfield.class == RegSIMD
f5eb1d70 2269 && !match_simd_size (t, j, given))
dbbc8b7e
JB
2270 goto mismatch;
2271
75e5731b 2272 if (t->operand_types[j].bitfield.instance == Accum
f5eb1d70
JB
2273 && (!match_operand_size (t, j, given)
2274 || !match_simd_size (t, j, given)))
dbbc8b7e
JB
2275 goto mismatch;
2276
f5eb1d70 2277 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
891edac4 2278 goto mismatch;
5c07affc
L
2279 }
2280
3ac21baa 2281 return match | MATCH_REVERSE;
5c07affc
L
2282}
2283
c6fb90c8 2284static INLINE int
40fb9820
L
2285operand_type_match (i386_operand_type overlap,
2286 i386_operand_type given)
2287{
2288 i386_operand_type temp = overlap;
2289
7d5e4556 2290 temp.bitfield.unspecified = 0;
5c07affc
L
2291 temp.bitfield.byte = 0;
2292 temp.bitfield.word = 0;
2293 temp.bitfield.dword = 0;
2294 temp.bitfield.fword = 0;
2295 temp.bitfield.qword = 0;
2296 temp.bitfield.tbyte = 0;
2297 temp.bitfield.xmmword = 0;
c0f3af97 2298 temp.bitfield.ymmword = 0;
43234a1e 2299 temp.bitfield.zmmword = 0;
0dfbf9d7 2300 if (operand_type_all_zero (&temp))
891edac4 2301 goto mismatch;
40fb9820 2302
6f2f06be 2303 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
891edac4
L
2304 return 1;
2305
dc1e8a47 2306 mismatch:
a65babc9 2307 i.error = operand_type_mismatch;
891edac4 2308 return 0;
40fb9820
L
2309}
2310
7d5e4556 2311/* If given types g0 and g1 are registers they must be of the same type
10c17abd 2312 unless the expected operand type register overlap is null.
5de4d9ef 2313 Some Intel syntax memory operand size checking also happens here. */
40fb9820 2314
c6fb90c8 2315static INLINE int
dc821c5f 2316operand_type_register_match (i386_operand_type g0,
40fb9820 2317 i386_operand_type t0,
40fb9820
L
2318 i386_operand_type g1,
2319 i386_operand_type t1)
2320{
bab6aec1 2321 if (g0.bitfield.class != Reg
3528c362 2322 && g0.bitfield.class != RegSIMD
10c17abd
JB
2323 && (!operand_type_check (g0, anymem)
2324 || g0.bitfield.unspecified
5de4d9ef
JB
2325 || (t0.bitfield.class != Reg
2326 && t0.bitfield.class != RegSIMD)))
40fb9820
L
2327 return 1;
2328
bab6aec1 2329 if (g1.bitfield.class != Reg
3528c362 2330 && g1.bitfield.class != RegSIMD
10c17abd
JB
2331 && (!operand_type_check (g1, anymem)
2332 || g1.bitfield.unspecified
5de4d9ef
JB
2333 || (t1.bitfield.class != Reg
2334 && t1.bitfield.class != RegSIMD)))
40fb9820
L
2335 return 1;
2336
dc821c5f
JB
2337 if (g0.bitfield.byte == g1.bitfield.byte
2338 && g0.bitfield.word == g1.bitfield.word
2339 && g0.bitfield.dword == g1.bitfield.dword
10c17abd
JB
2340 && g0.bitfield.qword == g1.bitfield.qword
2341 && g0.bitfield.xmmword == g1.bitfield.xmmword
2342 && g0.bitfield.ymmword == g1.bitfield.ymmword
2343 && g0.bitfield.zmmword == g1.bitfield.zmmword)
40fb9820
L
2344 return 1;
2345
dc821c5f
JB
2346 if (!(t0.bitfield.byte & t1.bitfield.byte)
2347 && !(t0.bitfield.word & t1.bitfield.word)
2348 && !(t0.bitfield.dword & t1.bitfield.dword)
10c17abd
JB
2349 && !(t0.bitfield.qword & t1.bitfield.qword)
2350 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2351 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2352 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
891edac4
L
2353 return 1;
2354
a65babc9 2355 i.error = register_type_mismatch;
891edac4
L
2356
2357 return 0;
40fb9820
L
2358}
2359
4c692bc7
JB
2360static INLINE unsigned int
2361register_number (const reg_entry *r)
2362{
2363 unsigned int nr = r->reg_num;
2364
2365 if (r->reg_flags & RegRex)
2366 nr += 8;
2367
200cbe0f
L
2368 if (r->reg_flags & RegVRex)
2369 nr += 16;
2370
4c692bc7
JB
2371 return nr;
2372}
2373
252b5132 2374static INLINE unsigned int
40fb9820 2375mode_from_disp_size (i386_operand_type t)
252b5132 2376{
b5014f7a 2377 if (t.bitfield.disp8)
40fb9820
L
2378 return 1;
2379 else if (t.bitfield.disp16
2380 || t.bitfield.disp32
2381 || t.bitfield.disp32s)
2382 return 2;
2383 else
2384 return 0;
252b5132
RH
2385}
2386
2387static INLINE int
65879393 2388fits_in_signed_byte (addressT num)
252b5132 2389{
65879393 2390 return num + 0x80 <= 0xff;
47926f60 2391}
252b5132
RH
2392
2393static INLINE int
65879393 2394fits_in_unsigned_byte (addressT num)
252b5132 2395{
65879393 2396 return num <= 0xff;
47926f60 2397}
252b5132
RH
2398
2399static INLINE int
65879393 2400fits_in_unsigned_word (addressT num)
252b5132 2401{
65879393 2402 return num <= 0xffff;
47926f60 2403}
252b5132
RH
2404
2405static INLINE int
65879393 2406fits_in_signed_word (addressT num)
252b5132 2407{
65879393 2408 return num + 0x8000 <= 0xffff;
47926f60 2409}
2a962e6d 2410
3e73aa7c 2411static INLINE int
65879393 2412fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2413{
2414#ifndef BFD64
2415 return 1;
2416#else
65879393 2417 return num + 0x80000000 <= 0xffffffff;
3e73aa7c
JH
2418#endif
2419} /* fits_in_signed_long() */
2a962e6d 2420
3e73aa7c 2421static INLINE int
65879393 2422fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2423{
2424#ifndef BFD64
2425 return 1;
2426#else
65879393 2427 return num <= 0xffffffff;
3e73aa7c
JH
2428#endif
2429} /* fits_in_unsigned_long() */
252b5132 2430
43234a1e 2431static INLINE int
b5014f7a 2432fits_in_disp8 (offsetT num)
43234a1e
L
2433{
2434 int shift = i.memshift;
2435 unsigned int mask;
2436
2437 if (shift == -1)
2438 abort ();
2439
2440 mask = (1 << shift) - 1;
2441
2442 /* Return 0 if NUM isn't properly aligned. */
2443 if ((num & mask))
2444 return 0;
2445
2446 /* Check if NUM will fit in 8bit after shift. */
2447 return fits_in_signed_byte (num >> shift);
2448}
2449
a683cc34
SP
2450static INLINE int
2451fits_in_imm4 (offsetT num)
2452{
2453 return (num & 0xf) == num;
2454}
2455
40fb9820 2456static i386_operand_type
e3bb37b5 2457smallest_imm_type (offsetT num)
252b5132 2458{
40fb9820 2459 i386_operand_type t;
7ab9ffdd 2460
0dfbf9d7 2461 operand_type_set (&t, 0);
40fb9820
L
2462 t.bitfield.imm64 = 1;
2463
2464 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
e413e4e9
AM
2465 {
2466 /* This code is disabled on the 486 because all the Imm1 forms
2467 in the opcode table are slower on the i486. They're the
2468 versions with the implicitly specified single-position
2469 displacement, which has another syntax if you really want to
2470 use that form. */
40fb9820
L
2471 t.bitfield.imm1 = 1;
2472 t.bitfield.imm8 = 1;
2473 t.bitfield.imm8s = 1;
2474 t.bitfield.imm16 = 1;
2475 t.bitfield.imm32 = 1;
2476 t.bitfield.imm32s = 1;
2477 }
2478 else if (fits_in_signed_byte (num))
2479 {
2480 t.bitfield.imm8 = 1;
2481 t.bitfield.imm8s = 1;
2482 t.bitfield.imm16 = 1;
2483 t.bitfield.imm32 = 1;
2484 t.bitfield.imm32s = 1;
2485 }
2486 else if (fits_in_unsigned_byte (num))
2487 {
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm16 = 1;
2490 t.bitfield.imm32 = 1;
2491 t.bitfield.imm32s = 1;
2492 }
2493 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2494 {
2495 t.bitfield.imm16 = 1;
2496 t.bitfield.imm32 = 1;
2497 t.bitfield.imm32s = 1;
2498 }
2499 else if (fits_in_signed_long (num))
2500 {
2501 t.bitfield.imm32 = 1;
2502 t.bitfield.imm32s = 1;
2503 }
2504 else if (fits_in_unsigned_long (num))
2505 t.bitfield.imm32 = 1;
2506
2507 return t;
47926f60 2508}
252b5132 2509
847f7ad4 2510static offsetT
e3bb37b5 2511offset_in_range (offsetT val, int size)
847f7ad4 2512{
508866be 2513 addressT mask;
ba2adb93 2514
847f7ad4
AM
2515 switch (size)
2516 {
508866be
L
2517 case 1: mask = ((addressT) 1 << 8) - 1; break;
2518 case 2: mask = ((addressT) 1 << 16) - 1; break;
3b0ec529 2519 case 4: mask = ((addressT) 2 << 31) - 1; break;
3e73aa7c
JH
2520#ifdef BFD64
2521 case 8: mask = ((addressT) 2 << 63) - 1; break;
2522#endif
47926f60 2523 default: abort ();
847f7ad4
AM
2524 }
2525
9de868bf
L
2526#ifdef BFD64
2527 /* If BFD64, sign extend val for 32bit address mode. */
2528 if (flag_code != CODE_64BIT
2529 || i.prefix[ADDR_PREFIX])
3e73aa7c
JH
2530 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2531 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
fa289fb8 2532#endif
ba2adb93 2533
47926f60 2534 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
847f7ad4
AM
2535 {
2536 char buf1[40], buf2[40];
2537
2538 sprint_value (buf1, val);
2539 sprint_value (buf2, val & mask);
2540 as_warn (_("%s shortened to %s"), buf1, buf2);
2541 }
2542 return val & mask;
2543}
2544
c32fa91d
L
2545enum PREFIX_GROUP
2546{
2547 PREFIX_EXIST = 0,
2548 PREFIX_LOCK,
2549 PREFIX_REP,
04ef582a 2550 PREFIX_DS,
c32fa91d
L
2551 PREFIX_OTHER
2552};
2553
2554/* Returns
2555 a. PREFIX_EXIST if attempting to add a prefix where one from the
2556 same class already exists.
2557 b. PREFIX_LOCK if lock prefix is added.
2558 c. PREFIX_REP if rep/repne prefix is added.
04ef582a
L
2559 d. PREFIX_DS if ds prefix is added.
2560 e. PREFIX_OTHER if other prefix is added.
c32fa91d
L
2561 */
2562
2563static enum PREFIX_GROUP
e3bb37b5 2564add_prefix (unsigned int prefix)
252b5132 2565{
c32fa91d 2566 enum PREFIX_GROUP ret = PREFIX_OTHER;
b1905489 2567 unsigned int q;
252b5132 2568
29b0f896
AM
2569 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2570 && flag_code == CODE_64BIT)
b1905489 2571 {
161a04f6 2572 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
44846f29
JB
2573 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2574 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2575 || (i.prefix[REX_PREFIX] & prefix & REX_B))
c32fa91d 2576 ret = PREFIX_EXIST;
b1905489
JB
2577 q = REX_PREFIX;
2578 }
3e73aa7c 2579 else
b1905489
JB
2580 {
2581 switch (prefix)
2582 {
2583 default:
2584 abort ();
2585
b1905489 2586 case DS_PREFIX_OPCODE:
04ef582a
L
2587 ret = PREFIX_DS;
2588 /* Fall through. */
2589 case CS_PREFIX_OPCODE:
b1905489
JB
2590 case ES_PREFIX_OPCODE:
2591 case FS_PREFIX_OPCODE:
2592 case GS_PREFIX_OPCODE:
2593 case SS_PREFIX_OPCODE:
2594 q = SEG_PREFIX;
2595 break;
2596
2597 case REPNE_PREFIX_OPCODE:
2598 case REPE_PREFIX_OPCODE:
c32fa91d
L
2599 q = REP_PREFIX;
2600 ret = PREFIX_REP;
2601 break;
2602
b1905489 2603 case LOCK_PREFIX_OPCODE:
c32fa91d
L
2604 q = LOCK_PREFIX;
2605 ret = PREFIX_LOCK;
b1905489
JB
2606 break;
2607
2608 case FWAIT_OPCODE:
2609 q = WAIT_PREFIX;
2610 break;
2611
2612 case ADDR_PREFIX_OPCODE:
2613 q = ADDR_PREFIX;
2614 break;
2615
2616 case DATA_PREFIX_OPCODE:
2617 q = DATA_PREFIX;
2618 break;
2619 }
2620 if (i.prefix[q] != 0)
c32fa91d 2621 ret = PREFIX_EXIST;
b1905489 2622 }
252b5132 2623
b1905489 2624 if (ret)
252b5132 2625 {
b1905489
JB
2626 if (!i.prefix[q])
2627 ++i.prefixes;
2628 i.prefix[q] |= prefix;
252b5132 2629 }
b1905489
JB
2630 else
2631 as_bad (_("same type of prefix used twice"));
252b5132 2632
252b5132
RH
2633 return ret;
2634}
2635
2636static void
78f12dd3 2637update_code_flag (int value, int check)
eecb386c 2638{
78f12dd3
L
2639 PRINTF_LIKE ((*as_error));
2640
1e9cc1c2 2641 flag_code = (enum flag_code) value;
40fb9820
L
2642 if (flag_code == CODE_64BIT)
2643 {
2644 cpu_arch_flags.bitfield.cpu64 = 1;
2645 cpu_arch_flags.bitfield.cpuno64 = 0;
40fb9820
L
2646 }
2647 else
2648 {
2649 cpu_arch_flags.bitfield.cpu64 = 0;
2650 cpu_arch_flags.bitfield.cpuno64 = 1;
40fb9820
L
2651 }
2652 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
3e73aa7c 2653 {
78f12dd3
L
2654 if (check)
2655 as_error = as_fatal;
2656 else
2657 as_error = as_bad;
2658 (*as_error) (_("64bit mode not supported on `%s'."),
2659 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2660 }
40fb9820 2661 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
3e73aa7c 2662 {
78f12dd3
L
2663 if (check)
2664 as_error = as_fatal;
2665 else
2666 as_error = as_bad;
2667 (*as_error) (_("32bit mode not supported on `%s'."),
2668 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2669 }
eecb386c
AM
2670 stackop_size = '\0';
2671}
2672
78f12dd3
L
2673static void
2674set_code_flag (int value)
2675{
2676 update_code_flag (value, 0);
2677}
2678
eecb386c 2679static void
e3bb37b5 2680set_16bit_gcc_code_flag (int new_code_flag)
252b5132 2681{
1e9cc1c2 2682 flag_code = (enum flag_code) new_code_flag;
40fb9820
L
2683 if (flag_code != CODE_16BIT)
2684 abort ();
2685 cpu_arch_flags.bitfield.cpu64 = 0;
2686 cpu_arch_flags.bitfield.cpuno64 = 1;
9306ca4a 2687 stackop_size = LONG_MNEM_SUFFIX;
252b5132
RH
2688}
2689
2690static void
e3bb37b5 2691set_intel_syntax (int syntax_flag)
252b5132
RH
2692{
2693 /* Find out if register prefixing is specified. */
2694 int ask_naked_reg = 0;
2695
2696 SKIP_WHITESPACE ();
29b0f896 2697 if (!is_end_of_line[(unsigned char) *input_line_pointer])
252b5132 2698 {
d02603dc
NC
2699 char *string;
2700 int e = get_symbol_name (&string);
252b5132 2701
47926f60 2702 if (strcmp (string, "prefix") == 0)
252b5132 2703 ask_naked_reg = 1;
47926f60 2704 else if (strcmp (string, "noprefix") == 0)
252b5132
RH
2705 ask_naked_reg = -1;
2706 else
d0b47220 2707 as_bad (_("bad argument to syntax directive."));
d02603dc 2708 (void) restore_line_pointer (e);
252b5132
RH
2709 }
2710 demand_empty_rest_of_line ();
c3332e24 2711
252b5132
RH
2712 intel_syntax = syntax_flag;
2713
2714 if (ask_naked_reg == 0)
f86103b7
AM
2715 allow_naked_reg = (intel_syntax
2716 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
252b5132
RH
2717 else
2718 allow_naked_reg = (ask_naked_reg < 0);
9306ca4a 2719
ee86248c 2720 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
7ab9ffdd 2721
e4a3b5a4 2722 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
9306ca4a 2723 identifier_chars['$'] = intel_syntax ? '$' : 0;
e4a3b5a4 2724 register_prefix = allow_naked_reg ? "" : "%";
252b5132
RH
2725}
2726
1efbbeb4
L
2727static void
2728set_intel_mnemonic (int mnemonic_flag)
2729{
e1d4d893 2730 intel_mnemonic = mnemonic_flag;
1efbbeb4
L
2731}
2732
db51cc60
L
2733static void
2734set_allow_index_reg (int flag)
2735{
2736 allow_index_reg = flag;
2737}
2738
cb19c032 2739static void
7bab8ab5 2740set_check (int what)
cb19c032 2741{
7bab8ab5
JB
2742 enum check_kind *kind;
2743 const char *str;
2744
2745 if (what)
2746 {
2747 kind = &operand_check;
2748 str = "operand";
2749 }
2750 else
2751 {
2752 kind = &sse_check;
2753 str = "sse";
2754 }
2755
cb19c032
L
2756 SKIP_WHITESPACE ();
2757
2758 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759 {
d02603dc
NC
2760 char *string;
2761 int e = get_symbol_name (&string);
cb19c032
L
2762
2763 if (strcmp (string, "none") == 0)
7bab8ab5 2764 *kind = check_none;
cb19c032 2765 else if (strcmp (string, "warning") == 0)
7bab8ab5 2766 *kind = check_warning;
cb19c032 2767 else if (strcmp (string, "error") == 0)
7bab8ab5 2768 *kind = check_error;
cb19c032 2769 else
7bab8ab5 2770 as_bad (_("bad argument to %s_check directive."), str);
d02603dc 2771 (void) restore_line_pointer (e);
cb19c032
L
2772 }
2773 else
7bab8ab5 2774 as_bad (_("missing argument for %s_check directive"), str);
cb19c032
L
2775
2776 demand_empty_rest_of_line ();
2777}
2778
8a9036a4
L
2779static void
2780check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
1e9cc1c2 2781 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
8a9036a4
L
2782{
2783#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784 static const char *arch;
2785
2786 /* Intel LIOM is only supported on ELF. */
2787 if (!IS_ELF)
2788 return;
2789
2790 if (!arch)
2791 {
2792 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2793 use default_arch. */
2794 arch = cpu_arch_name;
2795 if (!arch)
2796 arch = default_arch;
2797 }
2798
81486035
L
2799 /* If we are targeting Intel MCU, we must enable it. */
2800 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2801 || new_flag.bitfield.cpuiamcu)
2802 return;
2803
3632d14b 2804 /* If we are targeting Intel L1OM, we must enable it. */
8a9036a4 2805 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
1e9cc1c2 2806 || new_flag.bitfield.cpul1om)
8a9036a4 2807 return;
76ba9986 2808
7a9068fe
L
2809 /* If we are targeting Intel K1OM, we must enable it. */
2810 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2811 || new_flag.bitfield.cpuk1om)
2812 return;
2813
8a9036a4
L
2814 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2815#endif
2816}
2817
e413e4e9 2818static void
e3bb37b5 2819set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
e413e4e9 2820{
47926f60 2821 SKIP_WHITESPACE ();
e413e4e9 2822
29b0f896 2823 if (!is_end_of_line[(unsigned char) *input_line_pointer])
e413e4e9 2824 {
d02603dc
NC
2825 char *string;
2826 int e = get_symbol_name (&string);
91d6fa6a 2827 unsigned int j;
40fb9820 2828 i386_cpu_flags flags;
e413e4e9 2829
91d6fa6a 2830 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
e413e4e9 2831 {
91d6fa6a 2832 if (strcmp (string, cpu_arch[j].name) == 0)
e413e4e9 2833 {
91d6fa6a 2834 check_cpu_arch_compatible (string, cpu_arch[j].flags);
8a9036a4 2835
5c6af06e
JB
2836 if (*string != '.')
2837 {
91d6fa6a 2838 cpu_arch_name = cpu_arch[j].name;
5c6af06e 2839 cpu_sub_arch_name = NULL;
91d6fa6a 2840 cpu_arch_flags = cpu_arch[j].flags;
40fb9820
L
2841 if (flag_code == CODE_64BIT)
2842 {
2843 cpu_arch_flags.bitfield.cpu64 = 1;
2844 cpu_arch_flags.bitfield.cpuno64 = 0;
2845 }
2846 else
2847 {
2848 cpu_arch_flags.bitfield.cpu64 = 0;
2849 cpu_arch_flags.bitfield.cpuno64 = 1;
2850 }
91d6fa6a
NC
2851 cpu_arch_isa = cpu_arch[j].type;
2852 cpu_arch_isa_flags = cpu_arch[j].flags;
ccc9c027
L
2853 if (!cpu_arch_tune_set)
2854 {
2855 cpu_arch_tune = cpu_arch_isa;
2856 cpu_arch_tune_flags = cpu_arch_isa_flags;
2857 }
5c6af06e
JB
2858 break;
2859 }
40fb9820 2860
293f5f65
L
2861 flags = cpu_flags_or (cpu_arch_flags,
2862 cpu_arch[j].flags);
81486035 2863
5b64d091 2864 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
5c6af06e 2865 {
6305a203
L
2866 if (cpu_sub_arch_name)
2867 {
2868 char *name = cpu_sub_arch_name;
2869 cpu_sub_arch_name = concat (name,
91d6fa6a 2870 cpu_arch[j].name,
1bf57e9f 2871 (const char *) NULL);
6305a203
L
2872 free (name);
2873 }
2874 else
91d6fa6a 2875 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
40fb9820 2876 cpu_arch_flags = flags;
a586129e 2877 cpu_arch_isa_flags = flags;
5c6af06e 2878 }
0089dace
L
2879 else
2880 cpu_arch_isa_flags
2881 = cpu_flags_or (cpu_arch_isa_flags,
2882 cpu_arch[j].flags);
d02603dc 2883 (void) restore_line_pointer (e);
5c6af06e
JB
2884 demand_empty_rest_of_line ();
2885 return;
e413e4e9
AM
2886 }
2887 }
293f5f65
L
2888
2889 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2890 {
33eaf5de 2891 /* Disable an ISA extension. */
293f5f65
L
2892 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2893 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2894 {
2895 flags = cpu_flags_and_not (cpu_arch_flags,
2896 cpu_noarch[j].flags);
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
2899 if (cpu_sub_arch_name)
2900 {
2901 char *name = cpu_sub_arch_name;
2902 cpu_sub_arch_name = concat (name, string,
2903 (const char *) NULL);
2904 free (name);
2905 }
2906 else
2907 cpu_sub_arch_name = xstrdup (string);
2908 cpu_arch_flags = flags;
2909 cpu_arch_isa_flags = flags;
2910 }
2911 (void) restore_line_pointer (e);
2912 demand_empty_rest_of_line ();
2913 return;
2914 }
2915
2916 j = ARRAY_SIZE (cpu_arch);
2917 }
2918
91d6fa6a 2919 if (j >= ARRAY_SIZE (cpu_arch))
e413e4e9
AM
2920 as_bad (_("no such architecture: `%s'"), string);
2921
2922 *input_line_pointer = e;
2923 }
2924 else
2925 as_bad (_("missing cpu architecture"));
2926
fddf5b5b
AM
2927 no_cond_jump_promotion = 0;
2928 if (*input_line_pointer == ','
29b0f896 2929 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
fddf5b5b 2930 {
d02603dc
NC
2931 char *string;
2932 char e;
2933
2934 ++input_line_pointer;
2935 e = get_symbol_name (&string);
fddf5b5b
AM
2936
2937 if (strcmp (string, "nojumps") == 0)
2938 no_cond_jump_promotion = 1;
2939 else if (strcmp (string, "jumps") == 0)
2940 ;
2941 else
2942 as_bad (_("no such architecture modifier: `%s'"), string);
2943
d02603dc 2944 (void) restore_line_pointer (e);
fddf5b5b
AM
2945 }
2946
e413e4e9
AM
2947 demand_empty_rest_of_line ();
2948}
2949
8a9036a4
L
2950enum bfd_architecture
2951i386_arch (void)
2952{
3632d14b 2953 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4
L
2954 {
2955 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2956 || flag_code != CODE_64BIT)
2957 as_fatal (_("Intel L1OM is 64bit ELF only"));
2958 return bfd_arch_l1om;
2959 }
7a9068fe
L
2960 else if (cpu_arch_isa == PROCESSOR_K1OM)
2961 {
2962 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2963 || flag_code != CODE_64BIT)
2964 as_fatal (_("Intel K1OM is 64bit ELF only"));
2965 return bfd_arch_k1om;
2966 }
81486035
L
2967 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2968 {
2969 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2970 || flag_code == CODE_64BIT)
2971 as_fatal (_("Intel MCU is 32bit ELF only"));
2972 return bfd_arch_iamcu;
2973 }
8a9036a4
L
2974 else
2975 return bfd_arch_i386;
2976}
2977
b9d79e03 2978unsigned long
7016a5d5 2979i386_mach (void)
b9d79e03 2980{
351f65ca 2981 if (!strncmp (default_arch, "x86_64", 6))
8a9036a4 2982 {
3632d14b 2983 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 2984 {
351f65ca
L
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || default_arch[6] != '\0')
8a9036a4
L
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_mach_l1om;
2989 }
7a9068fe
L
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || default_arch[6] != '\0')
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_mach_k1om;
2996 }
351f65ca 2997 else if (default_arch[6] == '\0')
8a9036a4 2998 return bfd_mach_x86_64;
351f65ca
L
2999 else
3000 return bfd_mach_x64_32;
8a9036a4 3001 }
5197d474
L
3002 else if (!strcmp (default_arch, "i386")
3003 || !strcmp (default_arch, "iamcu"))
81486035
L
3004 {
3005 if (cpu_arch_isa == PROCESSOR_IAMCU)
3006 {
3007 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3008 as_fatal (_("Intel MCU is 32bit ELF only"));
3009 return bfd_mach_i386_iamcu;
3010 }
3011 else
3012 return bfd_mach_i386_i386;
3013 }
b9d79e03 3014 else
2b5d6a91 3015 as_fatal (_("unknown architecture"));
b9d79e03 3016}
b9d79e03 3017\f
252b5132 3018void
7016a5d5 3019md_begin (void)
252b5132
RH
3020{
3021 const char *hash_err;
3022
86fa6981
L
3023 /* Support pseudo prefixes like {disp32}. */
3024 lex_type ['{'] = LEX_BEGIN_NAME;
3025
47926f60 3026 /* Initialize op_hash hash table. */
252b5132
RH
3027 op_hash = hash_new ();
3028
3029 {
d3ce72d0 3030 const insn_template *optab;
29b0f896 3031 templates *core_optab;
252b5132 3032
47926f60
KH
3033 /* Setup for loop. */
3034 optab = i386_optab;
add39d23 3035 core_optab = XNEW (templates);
252b5132
RH
3036 core_optab->start = optab;
3037
3038 while (1)
3039 {
3040 ++optab;
3041 if (optab->name == NULL
3042 || strcmp (optab->name, (optab - 1)->name) != 0)
3043 {
3044 /* different name --> ship out current template list;
47926f60 3045 add to hash table; & begin anew. */
252b5132
RH
3046 core_optab->end = optab;
3047 hash_err = hash_insert (op_hash,
3048 (optab - 1)->name,
5a49b8ac 3049 (void *) core_optab);
252b5132
RH
3050 if (hash_err)
3051 {
b37df7c4 3052 as_fatal (_("can't hash %s: %s"),
252b5132
RH
3053 (optab - 1)->name,
3054 hash_err);
3055 }
3056 if (optab->name == NULL)
3057 break;
add39d23 3058 core_optab = XNEW (templates);
252b5132
RH
3059 core_optab->start = optab;
3060 }
3061 }
3062 }
3063
47926f60 3064 /* Initialize reg_hash hash table. */
252b5132
RH
3065 reg_hash = hash_new ();
3066 {
29b0f896 3067 const reg_entry *regtab;
c3fe08fa 3068 unsigned int regtab_size = i386_regtab_size;
252b5132 3069
c3fe08fa 3070 for (regtab = i386_regtab; regtab_size--; regtab++)
252b5132 3071 {
5a49b8ac 3072 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
252b5132 3073 if (hash_err)
b37df7c4 3074 as_fatal (_("can't hash %s: %s"),
3e73aa7c
JH
3075 regtab->reg_name,
3076 hash_err);
252b5132
RH
3077 }
3078 }
3079
47926f60 3080 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
252b5132 3081 {
29b0f896
AM
3082 int c;
3083 char *p;
252b5132
RH
3084
3085 for (c = 0; c < 256; c++)
3086 {
3882b010 3087 if (ISDIGIT (c))
252b5132
RH
3088 {
3089 digit_chars[c] = c;
3090 mnemonic_chars[c] = c;
3091 register_chars[c] = c;
3092 operand_chars[c] = c;
3093 }
3882b010 3094 else if (ISLOWER (c))
252b5132
RH
3095 {
3096 mnemonic_chars[c] = c;
3097 register_chars[c] = c;
3098 operand_chars[c] = c;
3099 }
3882b010 3100 else if (ISUPPER (c))
252b5132 3101 {
3882b010 3102 mnemonic_chars[c] = TOLOWER (c);
252b5132
RH
3103 register_chars[c] = mnemonic_chars[c];
3104 operand_chars[c] = c;
3105 }
43234a1e 3106 else if (c == '{' || c == '}')
86fa6981
L
3107 {
3108 mnemonic_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
252b5132 3111
3882b010 3112 if (ISALPHA (c) || ISDIGIT (c))
252b5132
RH
3113 identifier_chars[c] = c;
3114 else if (c >= 128)
3115 {
3116 identifier_chars[c] = c;
3117 operand_chars[c] = c;
3118 }
3119 }
3120
3121#ifdef LEX_AT
3122 identifier_chars['@'] = '@';
32137342
NC
3123#endif
3124#ifdef LEX_QM
3125 identifier_chars['?'] = '?';
3126 operand_chars['?'] = '?';
252b5132 3127#endif
252b5132 3128 digit_chars['-'] = '-';
c0f3af97 3129 mnemonic_chars['_'] = '_';
791fe849 3130 mnemonic_chars['-'] = '-';
0003779b 3131 mnemonic_chars['.'] = '.';
252b5132
RH
3132 identifier_chars['_'] = '_';
3133 identifier_chars['.'] = '.';
3134
3135 for (p = operand_special_chars; *p != '\0'; p++)
3136 operand_chars[(unsigned char) *p] = *p;
3137 }
3138
a4447b93
RH
3139 if (flag_code == CODE_64BIT)
3140 {
ca19b261
KT
3141#if defined (OBJ_COFF) && defined (TE_PE)
3142 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3143 ? 32 : 16);
3144#else
a4447b93 3145 x86_dwarf2_return_column = 16;
ca19b261 3146#endif
61ff971f 3147 x86_cie_data_alignment = -8;
a4447b93
RH
3148 }
3149 else
3150 {
3151 x86_dwarf2_return_column = 8;
3152 x86_cie_data_alignment = -4;
3153 }
e379e5f3
L
3154
3155 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3156 can be turned into BRANCH_PREFIX frag. */
3157 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3158 abort ();
252b5132
RH
3159}
3160
3161void
e3bb37b5 3162i386_print_statistics (FILE *file)
252b5132
RH
3163{
3164 hash_print_statistics (file, "i386 opcode", op_hash);
3165 hash_print_statistics (file, "i386 register", reg_hash);
3166}
3167\f
252b5132
RH
3168#ifdef DEBUG386
3169
ce8a8b2f 3170/* Debugging routines for md_assemble. */
d3ce72d0 3171static void pte (insn_template *);
40fb9820 3172static void pt (i386_operand_type);
e3bb37b5
L
3173static void pe (expressionS *);
3174static void ps (symbolS *);
252b5132
RH
3175
3176static void
2c703856 3177pi (const char *line, i386_insn *x)
252b5132 3178{
09137c09 3179 unsigned int j;
252b5132
RH
3180
3181 fprintf (stdout, "%s: template ", line);
3182 pte (&x->tm);
09f131f2
JH
3183 fprintf (stdout, " address: base %s index %s scale %x\n",
3184 x->base_reg ? x->base_reg->reg_name : "none",
3185 x->index_reg ? x->index_reg->reg_name : "none",
3186 x->log2_scale_factor);
3187 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
252b5132 3188 x->rm.mode, x->rm.reg, x->rm.regmem);
09f131f2
JH
3189 fprintf (stdout, " sib: base %x index %x scale %x\n",
3190 x->sib.base, x->sib.index, x->sib.scale);
3191 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
161a04f6
L
3192 (x->rex & REX_W) != 0,
3193 (x->rex & REX_R) != 0,
3194 (x->rex & REX_X) != 0,
3195 (x->rex & REX_B) != 0);
09137c09 3196 for (j = 0; j < x->operands; j++)
252b5132 3197 {
09137c09
SP
3198 fprintf (stdout, " #%d: ", j + 1);
3199 pt (x->types[j]);
252b5132 3200 fprintf (stdout, "\n");
bab6aec1 3201 if (x->types[j].bitfield.class == Reg
3528c362
JB
3202 || x->types[j].bitfield.class == RegMMX
3203 || x->types[j].bitfield.class == RegSIMD
dd6b8a0b 3204 || x->types[j].bitfield.class == RegMask
00cee14f 3205 || x->types[j].bitfield.class == SReg
4a5c67ed
JB
3206 || x->types[j].bitfield.class == RegCR
3207 || x->types[j].bitfield.class == RegDR
dd6b8a0b
JB
3208 || x->types[j].bitfield.class == RegTR
3209 || x->types[j].bitfield.class == RegBND)
09137c09
SP
3210 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3211 if (operand_type_check (x->types[j], imm))
3212 pe (x->op[j].imms);
3213 if (operand_type_check (x->types[j], disp))
3214 pe (x->op[j].disps);
252b5132
RH
3215 }
3216}
3217
3218static void
d3ce72d0 3219pte (insn_template *t)
252b5132 3220{
09137c09 3221 unsigned int j;
252b5132 3222 fprintf (stdout, " %d operands ", t->operands);
47926f60 3223 fprintf (stdout, "opcode %x ", t->base_opcode);
252b5132
RH
3224 if (t->extension_opcode != None)
3225 fprintf (stdout, "ext %x ", t->extension_opcode);
40fb9820 3226 if (t->opcode_modifier.d)
252b5132 3227 fprintf (stdout, "D");
40fb9820 3228 if (t->opcode_modifier.w)
252b5132
RH
3229 fprintf (stdout, "W");
3230 fprintf (stdout, "\n");
09137c09 3231 for (j = 0; j < t->operands; j++)
252b5132 3232 {
09137c09
SP
3233 fprintf (stdout, " #%d type ", j + 1);
3234 pt (t->operand_types[j]);
252b5132
RH
3235 fprintf (stdout, "\n");
3236 }
3237}
3238
3239static void
e3bb37b5 3240pe (expressionS *e)
252b5132 3241{
24eab124 3242 fprintf (stdout, " operation %d\n", e->X_op);
b77ad1d4
AM
3243 fprintf (stdout, " add_number %ld (%lx)\n",
3244 (long) e->X_add_number, (long) e->X_add_number);
252b5132
RH
3245 if (e->X_add_symbol)
3246 {
3247 fprintf (stdout, " add_symbol ");
3248 ps (e->X_add_symbol);
3249 fprintf (stdout, "\n");
3250 }
3251 if (e->X_op_symbol)
3252 {
3253 fprintf (stdout, " op_symbol ");
3254 ps (e->X_op_symbol);
3255 fprintf (stdout, "\n");
3256 }
3257}
3258
3259static void
e3bb37b5 3260ps (symbolS *s)
252b5132
RH
3261{
3262 fprintf (stdout, "%s type %s%s",
3263 S_GET_NAME (s),
3264 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3265 segment_name (S_GET_SEGMENT (s)));
3266}
3267
7b81dfbb 3268static struct type_name
252b5132 3269 {
40fb9820
L
3270 i386_operand_type mask;
3271 const char *name;
252b5132 3272 }
7b81dfbb 3273const type_names[] =
252b5132 3274{
40fb9820
L
3275 { OPERAND_TYPE_REG8, "r8" },
3276 { OPERAND_TYPE_REG16, "r16" },
3277 { OPERAND_TYPE_REG32, "r32" },
3278 { OPERAND_TYPE_REG64, "r64" },
2c703856
JB
3279 { OPERAND_TYPE_ACC8, "acc8" },
3280 { OPERAND_TYPE_ACC16, "acc16" },
3281 { OPERAND_TYPE_ACC32, "acc32" },
3282 { OPERAND_TYPE_ACC64, "acc64" },
40fb9820
L
3283 { OPERAND_TYPE_IMM8, "i8" },
3284 { OPERAND_TYPE_IMM8, "i8s" },
3285 { OPERAND_TYPE_IMM16, "i16" },
3286 { OPERAND_TYPE_IMM32, "i32" },
3287 { OPERAND_TYPE_IMM32S, "i32s" },
3288 { OPERAND_TYPE_IMM64, "i64" },
3289 { OPERAND_TYPE_IMM1, "i1" },
3290 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3291 { OPERAND_TYPE_DISP8, "d8" },
3292 { OPERAND_TYPE_DISP16, "d16" },
3293 { OPERAND_TYPE_DISP32, "d32" },
3294 { OPERAND_TYPE_DISP32S, "d32s" },
3295 { OPERAND_TYPE_DISP64, "d64" },
3296 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3297 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3298 { OPERAND_TYPE_CONTROL, "control reg" },
3299 { OPERAND_TYPE_TEST, "test reg" },
3300 { OPERAND_TYPE_DEBUG, "debug reg" },
3301 { OPERAND_TYPE_FLOATREG, "FReg" },
3302 { OPERAND_TYPE_FLOATACC, "FAcc" },
21df382b 3303 { OPERAND_TYPE_SREG, "SReg" },
40fb9820
L
3304 { OPERAND_TYPE_REGMMX, "rMMX" },
3305 { OPERAND_TYPE_REGXMM, "rXMM" },
0349dc08 3306 { OPERAND_TYPE_REGYMM, "rYMM" },
43234a1e
L
3307 { OPERAND_TYPE_REGZMM, "rZMM" },
3308 { OPERAND_TYPE_REGMASK, "Mask reg" },
252b5132
RH
3309};
3310
3311static void
40fb9820 3312pt (i386_operand_type t)
252b5132 3313{
40fb9820 3314 unsigned int j;
c6fb90c8 3315 i386_operand_type a;
252b5132 3316
40fb9820 3317 for (j = 0; j < ARRAY_SIZE (type_names); j++)
c6fb90c8
L
3318 {
3319 a = operand_type_and (t, type_names[j].mask);
2c703856 3320 if (operand_type_equal (&a, &type_names[j].mask))
c6fb90c8
L
3321 fprintf (stdout, "%s, ", type_names[j].name);
3322 }
252b5132
RH
3323 fflush (stdout);
3324}
3325
3326#endif /* DEBUG386 */
3327\f
252b5132 3328static bfd_reloc_code_real_type
3956db08 3329reloc (unsigned int size,
64e74474
AM
3330 int pcrel,
3331 int sign,
3332 bfd_reloc_code_real_type other)
252b5132 3333{
47926f60 3334 if (other != NO_RELOC)
3956db08 3335 {
91d6fa6a 3336 reloc_howto_type *rel;
3956db08
JB
3337
3338 if (size == 8)
3339 switch (other)
3340 {
64e74474
AM
3341 case BFD_RELOC_X86_64_GOT32:
3342 return BFD_RELOC_X86_64_GOT64;
3343 break;
553d1284
L
3344 case BFD_RELOC_X86_64_GOTPLT64:
3345 return BFD_RELOC_X86_64_GOTPLT64;
3346 break;
64e74474
AM
3347 case BFD_RELOC_X86_64_PLTOFF64:
3348 return BFD_RELOC_X86_64_PLTOFF64;
3349 break;
3350 case BFD_RELOC_X86_64_GOTPC32:
3351 other = BFD_RELOC_X86_64_GOTPC64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPCREL:
3354 other = BFD_RELOC_X86_64_GOTPCREL64;
3355 break;
3356 case BFD_RELOC_X86_64_TPOFF32:
3357 other = BFD_RELOC_X86_64_TPOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_DTPOFF32:
3360 other = BFD_RELOC_X86_64_DTPOFF64;
3361 break;
3362 default:
3363 break;
3956db08 3364 }
e05278af 3365
8ce3d284 3366#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
3367 if (other == BFD_RELOC_SIZE32)
3368 {
3369 if (size == 8)
1ab668bf 3370 other = BFD_RELOC_SIZE64;
8fd4256d 3371 if (pcrel)
1ab668bf
AM
3372 {
3373 as_bad (_("there are no pc-relative size relocations"));
3374 return NO_RELOC;
3375 }
8fd4256d 3376 }
8ce3d284 3377#endif
8fd4256d 3378
e05278af 3379 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
f2d8a97c 3380 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
e05278af
JB
3381 sign = -1;
3382
91d6fa6a
NC
3383 rel = bfd_reloc_type_lookup (stdoutput, other);
3384 if (!rel)
3956db08 3385 as_bad (_("unknown relocation (%u)"), other);
91d6fa6a 3386 else if (size != bfd_get_reloc_size (rel))
3956db08 3387 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
91d6fa6a 3388 bfd_get_reloc_size (rel),
3956db08 3389 size);
91d6fa6a 3390 else if (pcrel && !rel->pc_relative)
3956db08 3391 as_bad (_("non-pc-relative relocation for pc-relative field"));
91d6fa6a 3392 else if ((rel->complain_on_overflow == complain_overflow_signed
3956db08 3393 && !sign)
91d6fa6a 3394 || (rel->complain_on_overflow == complain_overflow_unsigned
64e74474 3395 && sign > 0))
3956db08
JB
3396 as_bad (_("relocated field and relocation type differ in signedness"));
3397 else
3398 return other;
3399 return NO_RELOC;
3400 }
252b5132
RH
3401
3402 if (pcrel)
3403 {
3e73aa7c 3404 if (!sign)
3956db08 3405 as_bad (_("there are no unsigned pc-relative relocations"));
252b5132
RH
3406 switch (size)
3407 {
3408 case 1: return BFD_RELOC_8_PCREL;
3409 case 2: return BFD_RELOC_16_PCREL;
d258b828 3410 case 4: return BFD_RELOC_32_PCREL;
d6ab8113 3411 case 8: return BFD_RELOC_64_PCREL;
252b5132 3412 }
3956db08 3413 as_bad (_("cannot do %u byte pc-relative relocation"), size);
252b5132
RH
3414 }
3415 else
3416 {
3956db08 3417 if (sign > 0)
e5cb08ac 3418 switch (size)
3e73aa7c
JH
3419 {
3420 case 4: return BFD_RELOC_X86_64_32S;
3421 }
3422 else
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8;
3426 case 2: return BFD_RELOC_16;
3427 case 4: return BFD_RELOC_32;
3428 case 8: return BFD_RELOC_64;
3429 }
3956db08
JB
3430 as_bad (_("cannot do %s %u byte relocation"),
3431 sign > 0 ? "signed" : "unsigned", size);
252b5132
RH
3432 }
3433
0cc9e1d3 3434 return NO_RELOC;
252b5132
RH
3435}
3436
47926f60
KH
3437/* Here we decide which fixups can be adjusted to make them relative to
3438 the beginning of the section instead of the symbol. Basically we need
3439 to make sure that the dynamic relocations are done correctly, so in
3440 some cases we force the original symbol to be used. */
3441
252b5132 3442int
e3bb37b5 3443tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
252b5132 3444{
6d249963 3445#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 3446 if (!IS_ELF)
31312f95
AM
3447 return 1;
3448
a161fe53
AM
3449 /* Don't adjust pc-relative references to merge sections in 64-bit
3450 mode. */
3451 if (use_rela_relocations
3452 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453 && fixP->fx_pcrel)
252b5132 3454 return 0;
31312f95 3455
8d01d9a9
AJ
3456 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3457 and changed later by validate_fix. */
3458 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460 return 0;
3461
8fd4256d
L
3462 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3463 for size relocations. */
3464 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465 || fixP->fx_r_type == BFD_RELOC_SIZE64
3466 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
252b5132 3467 || fixP->fx_r_type == BFD_RELOC_386_GOT32
02a86693 3468 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
13ae64f3
JJ
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
37e55690
JJ
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
13ae64f3
JJ
3475 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
67a4f2b7
AO
3477 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3e73aa7c 3479 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
80b3ee89 3480 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
56ceb5b5
L
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
bffbf940
JJ
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
d6ab8113 3486 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
bffbf940
JJ
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
d6ab8113
JB
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
67a4f2b7
AO
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
252b5132
RH
3493 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495 return 0;
31312f95 3496#endif
252b5132
RH
3497 return 1;
3498}
252b5132 3499
b4cac588 3500static int
e3bb37b5 3501intel_float_operand (const char *mnemonic)
252b5132 3502{
9306ca4a
JB
3503 /* Note that the value returned is meaningful only for opcodes with (memory)
3504 operands, hence the code here is free to improperly handle opcodes that
3505 have no operands (for better performance and smaller code). */
3506
3507 if (mnemonic[0] != 'f')
3508 return 0; /* non-math */
3509
3510 switch (mnemonic[1])
3511 {
3512 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513 the fs segment override prefix not currently handled because no
3514 call path can make opcodes without operands get here */
3515 case 'i':
3516 return 2 /* integer op */;
3517 case 'l':
3518 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519 return 3; /* fldcw/fldenv */
3520 break;
3521 case 'n':
3522 if (mnemonic[2] != 'o' /* fnop */)
3523 return 3; /* non-waiting control op */
3524 break;
3525 case 'r':
3526 if (mnemonic[2] == 's')
3527 return 3; /* frstor/frstpm */
3528 break;
3529 case 's':
3530 if (mnemonic[2] == 'a')
3531 return 3; /* fsave */
3532 if (mnemonic[2] == 't')
3533 {
3534 switch (mnemonic[3])
3535 {
3536 case 'c': /* fstcw */
3537 case 'd': /* fstdw */
3538 case 'e': /* fstenv */
3539 case 's': /* fsts[gw] */
3540 return 3;
3541 }
3542 }
3543 break;
3544 case 'x':
3545 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546 return 0; /* fxsave/fxrstor are not really math ops */
3547 break;
3548 }
252b5132 3549
9306ca4a 3550 return 1;
252b5132
RH
3551}
3552
c0f3af97
L
3553/* Build the VEX prefix. */
3554
3555static void
d3ce72d0 3556build_vex_prefix (const insn_template *t)
c0f3af97
L
3557{
3558 unsigned int register_specifier;
3559 unsigned int implied_prefix;
3560 unsigned int vector_length;
03751133 3561 unsigned int w;
c0f3af97
L
3562
3563 /* Check register specifier. */
3564 if (i.vex.register_specifier)
43234a1e
L
3565 {
3566 register_specifier =
3567 ~register_number (i.vex.register_specifier) & 0xf;
3568 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569 }
c0f3af97
L
3570 else
3571 register_specifier = 0xf;
3572
79f0fa25
L
3573 /* Use 2-byte VEX prefix by swapping destination and source operand
3574 if there are more than 1 register operand. */
3575 if (i.reg_operands > 1
3576 && i.vec_encoding != vex_encoding_vex3
86fa6981 3577 && i.dir_encoding == dir_encoding_default
fa99fab2 3578 && i.operands == i.reg_operands
dbbc8b7e 3579 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
7f399153 3580 && i.tm.opcode_modifier.vexopcode == VEX0F
dbbc8b7e 3581 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
fa99fab2
L
3582 && i.rex == REX_B)
3583 {
3584 unsigned int xchg = i.operands - 1;
3585 union i386_op temp_op;
3586 i386_operand_type temp_type;
3587
3588 temp_type = i.types[xchg];
3589 i.types[xchg] = i.types[0];
3590 i.types[0] = temp_type;
3591 temp_op = i.op[xchg];
3592 i.op[xchg] = i.op[0];
3593 i.op[0] = temp_op;
3594
9c2799c2 3595 gas_assert (i.rm.mode == 3);
fa99fab2
L
3596
3597 i.rex = REX_R;
3598 xchg = i.rm.regmem;
3599 i.rm.regmem = i.rm.reg;
3600 i.rm.reg = xchg;
3601
dbbc8b7e
JB
3602 if (i.tm.opcode_modifier.d)
3603 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605 else /* Use the next insn. */
3606 i.tm = t[1];
fa99fab2
L
3607 }
3608
79dec6b7
JB
3609 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610 are no memory operands and at least 3 register ones. */
3611 if (i.reg_operands >= 3
3612 && i.vec_encoding != vex_encoding_vex3
3613 && i.reg_operands == i.operands - i.imm_operands
3614 && i.tm.opcode_modifier.vex
3615 && i.tm.opcode_modifier.commutative
3616 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617 && i.rex == REX_B
3618 && i.vex.register_specifier
3619 && !(i.vex.register_specifier->reg_flags & RegRex))
3620 {
3621 unsigned int xchg = i.operands - i.reg_operands;
3622 union i386_op temp_op;
3623 i386_operand_type temp_type;
3624
3625 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626 gas_assert (!i.tm.opcode_modifier.sae);
3627 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628 &i.types[i.operands - 3]));
3629 gas_assert (i.rm.mode == 3);
3630
3631 temp_type = i.types[xchg];
3632 i.types[xchg] = i.types[xchg + 1];
3633 i.types[xchg + 1] = temp_type;
3634 temp_op = i.op[xchg];
3635 i.op[xchg] = i.op[xchg + 1];
3636 i.op[xchg + 1] = temp_op;
3637
3638 i.rex = 0;
3639 xchg = i.rm.regmem | 8;
3640 i.rm.regmem = ~register_specifier & 0xf;
3641 gas_assert (!(i.rm.regmem & 8));
3642 i.vex.register_specifier += xchg - i.rm.regmem;
3643 register_specifier = ~xchg & 0xf;
3644 }
3645
539f890d
L
3646 if (i.tm.opcode_modifier.vex == VEXScalar)
3647 vector_length = avxscalar;
10c17abd
JB
3648 else if (i.tm.opcode_modifier.vex == VEX256)
3649 vector_length = 1;
539f890d 3650 else
10c17abd 3651 {
56522fc5 3652 unsigned int op;
10c17abd 3653
c7213af9
L
3654 /* Determine vector length from the last multi-length vector
3655 operand. */
10c17abd 3656 vector_length = 0;
56522fc5 3657 for (op = t->operands; op--;)
10c17abd
JB
3658 if (t->operand_types[op].bitfield.xmmword
3659 && t->operand_types[op].bitfield.ymmword
3660 && i.types[op].bitfield.ymmword)
3661 {
3662 vector_length = 1;
3663 break;
3664 }
3665 }
c0f3af97 3666
8c190ce0 3667 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
c0f3af97
L
3668 {
3669 case 0:
3670 implied_prefix = 0;
3671 break;
3672 case DATA_PREFIX_OPCODE:
3673 implied_prefix = 1;
3674 break;
3675 case REPE_PREFIX_OPCODE:
3676 implied_prefix = 2;
3677 break;
3678 case REPNE_PREFIX_OPCODE:
3679 implied_prefix = 3;
3680 break;
3681 default:
3682 abort ();
3683 }
3684
03751133
L
3685 /* Check the REX.W bit and VEXW. */
3686 if (i.tm.opcode_modifier.vexw == VEXWIG)
3687 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688 else if (i.tm.opcode_modifier.vexw)
3689 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690 else
931d03b7 3691 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
03751133 3692
c0f3af97 3693 /* Use 2-byte VEX prefix if possible. */
03751133
L
3694 if (w == 0
3695 && i.vec_encoding != vex_encoding_vex3
86fa6981 3696 && i.tm.opcode_modifier.vexopcode == VEX0F
c0f3af97
L
3697 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698 {
3699 /* 2-byte VEX prefix. */
3700 unsigned int r;
3701
3702 i.vex.length = 2;
3703 i.vex.bytes[0] = 0xc5;
3704
3705 /* Check the REX.R bit. */
3706 r = (i.rex & REX_R) ? 0 : 1;
3707 i.vex.bytes[1] = (r << 7
3708 | register_specifier << 3
3709 | vector_length << 2
3710 | implied_prefix);
3711 }
3712 else
3713 {
3714 /* 3-byte VEX prefix. */
03751133 3715 unsigned int m;
c0f3af97 3716
f88c9eb0 3717 i.vex.length = 3;
f88c9eb0 3718
7f399153 3719 switch (i.tm.opcode_modifier.vexopcode)
5dd85c99 3720 {
7f399153
L
3721 case VEX0F:
3722 m = 0x1;
80de6e00 3723 i.vex.bytes[0] = 0xc4;
7f399153
L
3724 break;
3725 case VEX0F38:
3726 m = 0x2;
80de6e00 3727 i.vex.bytes[0] = 0xc4;
7f399153
L
3728 break;
3729 case VEX0F3A:
3730 m = 0x3;
80de6e00 3731 i.vex.bytes[0] = 0xc4;
7f399153
L
3732 break;
3733 case XOP08:
5dd85c99
SP
3734 m = 0x8;
3735 i.vex.bytes[0] = 0x8f;
7f399153
L
3736 break;
3737 case XOP09:
f88c9eb0
SP
3738 m = 0x9;
3739 i.vex.bytes[0] = 0x8f;
7f399153
L
3740 break;
3741 case XOP0A:
f88c9eb0
SP
3742 m = 0xa;
3743 i.vex.bytes[0] = 0x8f;
7f399153
L
3744 break;
3745 default:
3746 abort ();
f88c9eb0 3747 }
c0f3af97 3748
c0f3af97
L
3749 /* The high 3 bits of the second VEX byte are 1's compliment
3750 of RXB bits from REX. */
3751 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
c0f3af97
L
3753 i.vex.bytes[2] = (w << 7
3754 | register_specifier << 3
3755 | vector_length << 2
3756 | implied_prefix);
3757 }
3758}
3759
e771e7c9
JB
3760static INLINE bfd_boolean
3761is_evex_encoding (const insn_template *t)
3762{
7091c612 3763 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
e771e7c9 3764 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
a80195f1 3765 || t->opcode_modifier.sae;
e771e7c9
JB
3766}
3767
7a8655d2
JB
3768static INLINE bfd_boolean
3769is_any_vex_encoding (const insn_template *t)
3770{
3771 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772 || is_evex_encoding (t);
3773}
3774
43234a1e
L
3775/* Build the EVEX prefix. */
3776
3777static void
3778build_evex_prefix (void)
3779{
3780 unsigned int register_specifier;
3781 unsigned int implied_prefix;
3782 unsigned int m, w;
3783 rex_byte vrex_used = 0;
3784
3785 /* Check register specifier. */
3786 if (i.vex.register_specifier)
3787 {
3788 gas_assert ((i.vrex & REX_X) == 0);
3789
3790 register_specifier = i.vex.register_specifier->reg_num;
3791 if ((i.vex.register_specifier->reg_flags & RegRex))
3792 register_specifier += 8;
3793 /* The upper 16 registers are encoded in the fourth byte of the
3794 EVEX prefix. */
3795 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796 i.vex.bytes[3] = 0x8;
3797 register_specifier = ~register_specifier & 0xf;
3798 }
3799 else
3800 {
3801 register_specifier = 0xf;
3802
3803 /* Encode upper 16 vector index register in the fourth byte of
3804 the EVEX prefix. */
3805 if (!(i.vrex & REX_X))
3806 i.vex.bytes[3] = 0x8;
3807 else
3808 vrex_used |= REX_X;
3809 }
3810
3811 switch ((i.tm.base_opcode >> 8) & 0xff)
3812 {
3813 case 0:
3814 implied_prefix = 0;
3815 break;
3816 case DATA_PREFIX_OPCODE:
3817 implied_prefix = 1;
3818 break;
3819 case REPE_PREFIX_OPCODE:
3820 implied_prefix = 2;
3821 break;
3822 case REPNE_PREFIX_OPCODE:
3823 implied_prefix = 3;
3824 break;
3825 default:
3826 abort ();
3827 }
3828
3829 /* 4 byte EVEX prefix. */
3830 i.vex.length = 4;
3831 i.vex.bytes[0] = 0x62;
3832
3833 /* mmmm bits. */
3834 switch (i.tm.opcode_modifier.vexopcode)
3835 {
3836 case VEX0F:
3837 m = 1;
3838 break;
3839 case VEX0F38:
3840 m = 2;
3841 break;
3842 case VEX0F3A:
3843 m = 3;
3844 break;
3845 default:
3846 abort ();
3847 break;
3848 }
3849
3850 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3851 bits from REX. */
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854 /* The fifth bit of the second EVEX byte is 1's compliment of the
3855 REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as 1's compliment. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
6865c043
L
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
931d03b7 3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
43234a1e
L
3885
3886 /* Encode the U bit. */
3887 implied_prefix |= 0x4;
3888
3889 /* The third byte of the EVEX prefix. */
3890 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
3894 if (i.mask && i.mask->zeroing)
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Don't always set the broadcast bit if there is no RC. */
3898 if (!i.rounding)
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
e771e7c9
JB
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
56522fc5 3906 unsigned int op;
e771e7c9 3907
c7213af9
L
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
56522fc5 3910 for (op = i.operands; op--;)
e771e7c9
JB
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
c7213af9
L
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
e771e7c9 3920 else if (i.types[op].bitfield.ymmword)
c7213af9
L
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
e771e7c9 3925 else if (i.types[op].bitfield.xmmword)
c7213af9
L
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
625cbd7a
JB
3930 else if (i.broadcast && (int) op == i.broadcast->operand)
3931 {
4a1b91ea 3932 switch (i.broadcast->bytes)
625cbd7a
JB
3933 {
3934 case 64:
3935 i.tm.opcode_modifier.evex = EVEX512;
3936 break;
3937 case 32:
3938 i.tm.opcode_modifier.evex = EVEX256;
3939 break;
3940 case 16:
3941 i.tm.opcode_modifier.evex = EVEX128;
3942 break;
3943 default:
c7213af9 3944 abort ();
625cbd7a 3945 }
c7213af9 3946 break;
625cbd7a 3947 }
e771e7c9 3948 }
c7213af9 3949
56522fc5 3950 if (op >= MAX_OPERANDS)
c7213af9 3951 abort ();
e771e7c9
JB
3952 }
3953
43234a1e
L
3954 switch (i.tm.opcode_modifier.evex)
3955 {
3956 case EVEXLIG: /* LL' is ignored */
3957 vec_length = evexlig << 5;
3958 break;
3959 case EVEX128:
3960 vec_length = 0 << 5;
3961 break;
3962 case EVEX256:
3963 vec_length = 1 << 5;
3964 break;
3965 case EVEX512:
3966 vec_length = 2 << 5;
3967 break;
3968 default:
3969 abort ();
3970 break;
3971 }
3972 i.vex.bytes[3] |= vec_length;
3973 /* Encode the broadcast bit. */
3974 if (i.broadcast)
3975 i.vex.bytes[3] |= 0x10;
3976 }
3977 else
3978 {
3979 if (i.rounding->type != saeonly)
3980 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981 else
d3d3c6db 3982 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
43234a1e
L
3983 }
3984
3985 if (i.mask && i.mask->mask)
3986 i.vex.bytes[3] |= i.mask->mask->reg_num;
3987}
3988
65da13b5
L
3989static void
3990process_immext (void)
3991{
3992 expressionS *exp;
3993
c0f3af97 3994 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
65da13b5
L
3995 which is coded in the same place as an 8-bit immediate field
3996 would be. Here we fake an 8-bit immediate operand from the
3997 opcode suffix stored in tm.extension_opcode.
3998
c1e679ec 3999 AVX instructions also use this encoding, for some of
c0f3af97 4000 3 argument instructions. */
65da13b5 4001
43234a1e 4002 gas_assert (i.imm_operands <= 1
7ab9ffdd 4003 && (i.operands <= 2
7a8655d2 4004 || (is_any_vex_encoding (&i.tm)
7ab9ffdd 4005 && i.operands <= 4)));
65da13b5
L
4006
4007 exp = &im_expressions[i.imm_operands++];
4008 i.op[i.operands].imms = exp;
4009 i.types[i.operands] = imm8;
4010 i.operands++;
4011 exp->X_op = O_constant;
4012 exp->X_add_number = i.tm.extension_opcode;
4013 i.tm.extension_opcode = None;
4014}
4015
42164a71
L
4016
4017static int
4018check_hle (void)
4019{
4020 switch (i.tm.opcode_modifier.hleprefixok)
4021 {
4022 default:
4023 abort ();
82c2def5 4024 case HLEPrefixNone:
165de32a
L
4025 as_bad (_("invalid instruction `%s' after `%s'"),
4026 i.tm.name, i.hle_prefix);
42164a71 4027 return 0;
82c2def5 4028 case HLEPrefixLock:
42164a71
L
4029 if (i.prefix[LOCK_PREFIX])
4030 return 1;
165de32a 4031 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
42164a71 4032 return 0;
82c2def5 4033 case HLEPrefixAny:
42164a71 4034 return 1;
82c2def5 4035 case HLEPrefixRelease:
42164a71
L
4036 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037 {
4038 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039 i.tm.name);
4040 return 0;
4041 }
8dc0818e 4042 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
42164a71
L
4043 {
4044 as_bad (_("memory destination needed for instruction `%s'"
4045 " after `xrelease'"), i.tm.name);
4046 return 0;
4047 }
4048 return 1;
4049 }
4050}
4051
b6f8c7c4
L
4052/* Try the shortest encoding by shortening operand size. */
4053
4054static void
4055optimize_encoding (void)
4056{
a0a1771e 4057 unsigned int j;
b6f8c7c4
L
4058
4059 if (optimize_for_space
72aea328 4060 && !is_any_vex_encoding (&i.tm)
b6f8c7c4
L
4061 && i.reg_operands == 1
4062 && i.imm_operands == 1
4063 && !i.types[1].bitfield.byte
4064 && i.op[0].imms->X_op == O_constant
4065 && fits_in_imm7 (i.op[0].imms->X_add_number)
72aea328 4066 && (i.tm.base_opcode == 0xa8
b6f8c7c4
L
4067 || (i.tm.base_opcode == 0xf6
4068 && i.tm.extension_opcode == 0x0)))
4069 {
4070 /* Optimize: -Os:
4071 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4072 */
4073 unsigned int base_regnum = i.op[1].regs->reg_num;
4074 if (flag_code == CODE_64BIT || base_regnum < 4)
4075 {
4076 i.types[1].bitfield.byte = 1;
4077 /* Ignore the suffix. */
4078 i.suffix = 0;
7697afb6
JB
4079 /* Convert to byte registers. */
4080 if (i.types[1].bitfield.word)
4081 j = 16;
4082 else if (i.types[1].bitfield.dword)
4083 j = 32;
4084 else
4085 j = 48;
4086 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087 j += 8;
4088 i.op[1].regs -= j;
b6f8c7c4
L
4089 }
4090 }
4091 else if (flag_code == CODE_64BIT
72aea328 4092 && !is_any_vex_encoding (&i.tm)
d3d50934
L
4093 && ((i.types[1].bitfield.qword
4094 && i.reg_operands == 1
b6f8c7c4
L
4095 && i.imm_operands == 1
4096 && i.op[0].imms->X_op == O_constant
507916b8 4097 && ((i.tm.base_opcode == 0xb8
b6f8c7c4
L
4098 && i.tm.extension_opcode == None
4099 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100 || (fits_in_imm31 (i.op[0].imms->X_add_number)
72aea328
JB
4101 && ((i.tm.base_opcode == 0x24
4102 || i.tm.base_opcode == 0xa8)
b6f8c7c4
L
4103 || (i.tm.base_opcode == 0x80
4104 && i.tm.extension_opcode == 0x4)
4105 || ((i.tm.base_opcode == 0xf6
507916b8 4106 || (i.tm.base_opcode | 1) == 0xc7)
b8364fa7
JB
4107 && i.tm.extension_opcode == 0x0)))
4108 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109 && i.tm.base_opcode == 0x83
4110 && i.tm.extension_opcode == 0x4)))
d3d50934
L
4111 || (i.types[0].bitfield.qword
4112 && ((i.reg_operands == 2
4113 && i.op[0].regs == i.op[1].regs
72aea328
JB
4114 && (i.tm.base_opcode == 0x30
4115 || i.tm.base_opcode == 0x28))
d3d50934
L
4116 || (i.reg_operands == 1
4117 && i.operands == 1
72aea328 4118 && i.tm.base_opcode == 0x30)))))
b6f8c7c4
L
4119 {
4120 /* Optimize: -O:
4121 andq $imm31, %r64 -> andl $imm31, %r32
b8364fa7 4122 andq $imm7, %r64 -> andl $imm7, %r32
b6f8c7c4
L
4123 testq $imm31, %r64 -> testl $imm31, %r32
4124 xorq %r64, %r64 -> xorl %r32, %r32
4125 subq %r64, %r64 -> subl %r32, %r32
4126 movq $imm31, %r64 -> movl $imm31, %r32
4127 movq $imm32, %r64 -> movl $imm32, %r32
4128 */
4129 i.tm.opcode_modifier.norex64 = 1;
507916b8 4130 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4131 {
4132 /* Handle
4133 movq $imm31, %r64 -> movl $imm31, %r32
4134 movq $imm32, %r64 -> movl $imm32, %r32
4135 */
4136 i.tm.operand_types[0].bitfield.imm32 = 1;
4137 i.tm.operand_types[0].bitfield.imm32s = 0;
4138 i.tm.operand_types[0].bitfield.imm64 = 0;
4139 i.types[0].bitfield.imm32 = 1;
4140 i.types[0].bitfield.imm32s = 0;
4141 i.types[0].bitfield.imm64 = 0;
4142 i.types[1].bitfield.dword = 1;
4143 i.types[1].bitfield.qword = 0;
507916b8 4144 if ((i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4145 {
4146 /* Handle
4147 movq $imm31, %r64 -> movl $imm31, %r32
4148 */
507916b8 4149 i.tm.base_opcode = 0xb8;
b6f8c7c4 4150 i.tm.extension_opcode = None;
507916b8 4151 i.tm.opcode_modifier.w = 0;
b6f8c7c4
L
4152 i.tm.opcode_modifier.modrm = 0;
4153 }
4154 }
4155 }
5641ec01
JB
4156 else if (optimize > 1
4157 && !optimize_for_space
72aea328 4158 && !is_any_vex_encoding (&i.tm)
5641ec01
JB
4159 && i.reg_operands == 2
4160 && i.op[0].regs == i.op[1].regs
4161 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164 {
4165 /* Optimize: -O2:
4166 andb %rN, %rN -> testb %rN, %rN
4167 andw %rN, %rN -> testw %rN, %rN
4168 andq %rN, %rN -> testq %rN, %rN
4169 orb %rN, %rN -> testb %rN, %rN
4170 orw %rN, %rN -> testw %rN, %rN
4171 orq %rN, %rN -> testq %rN, %rN
4172
4173 and outside of 64-bit mode
4174
4175 andl %rN, %rN -> testl %rN, %rN
4176 orl %rN, %rN -> testl %rN, %rN
4177 */
4178 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179 }
99112332 4180 else if (i.reg_operands == 3
b6f8c7c4
L
4181 && i.op[0].regs == i.op[1].regs
4182 && !i.types[2].bitfield.xmmword
4183 && (i.tm.opcode_modifier.vex
7a69eac3 4184 || ((!i.mask || i.mask->zeroing)
b6f8c7c4 4185 && !i.rounding
e771e7c9 4186 && is_evex_encoding (&i.tm)
80c34c38 4187 && (i.vec_encoding != vex_encoding_evex
dd22218c 4188 || cpu_arch_isa_flags.bitfield.cpuavx512vl
80c34c38 4189 || i.tm.cpu_flags.bitfield.cpuavx512vl
7091c612 4190 || (i.tm.operand_types[2].bitfield.zmmword
dd22218c 4191 && i.types[2].bitfield.ymmword))))
b6f8c7c4
L
4192 && ((i.tm.base_opcode == 0x55
4193 || i.tm.base_opcode == 0x6655
4194 || i.tm.base_opcode == 0x66df
4195 || i.tm.base_opcode == 0x57
4196 || i.tm.base_opcode == 0x6657
8305403a
L
4197 || i.tm.base_opcode == 0x66ef
4198 || i.tm.base_opcode == 0x66f8
4199 || i.tm.base_opcode == 0x66f9
4200 || i.tm.base_opcode == 0x66fa
1424ad86
JB
4201 || i.tm.base_opcode == 0x66fb
4202 || i.tm.base_opcode == 0x42
4203 || i.tm.base_opcode == 0x6642
4204 || i.tm.base_opcode == 0x47
4205 || i.tm.base_opcode == 0x6647)
b6f8c7c4
L
4206 && i.tm.extension_opcode == None))
4207 {
99112332 4208 /* Optimize: -O1:
8305403a
L
4209 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210 vpsubq and vpsubw:
b6f8c7c4
L
4211 EVEX VOP %zmmM, %zmmM, %zmmN
4212 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4213 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4214 EVEX VOP %ymmM, %ymmM, %ymmN
4215 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4216 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4217 VEX VOP %ymmM, %ymmM, %ymmN
4218 -> VEX VOP %xmmM, %xmmM, %xmmN
4219 VOP, one of vpandn and vpxor:
4220 VEX VOP %ymmM, %ymmM, %ymmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN
4222 VOP, one of vpandnd and vpandnq:
4223 EVEX VOP %zmmM, %zmmM, %zmmN
4224 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4226 EVEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4229 VOP, one of vpxord and vpxorq:
4230 EVEX VOP %zmmM, %zmmM, %zmmN
4231 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4232 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4233 EVEX VOP %ymmM, %ymmM, %ymmN
4234 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4235 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
1424ad86
JB
4236 VOP, one of kxord and kxorq:
4237 VEX VOP %kM, %kM, %kN
4238 -> VEX kxorw %kM, %kM, %kN
4239 VOP, one of kandnd and kandnq:
4240 VEX VOP %kM, %kM, %kN
4241 -> VEX kandnw %kM, %kM, %kN
b6f8c7c4 4242 */
e771e7c9 4243 if (is_evex_encoding (&i.tm))
b6f8c7c4 4244 {
7b1d7ca1 4245 if (i.vec_encoding != vex_encoding_evex)
b6f8c7c4
L
4246 {
4247 i.tm.opcode_modifier.vex = VEX128;
4248 i.tm.opcode_modifier.vexw = VEXW0;
4249 i.tm.opcode_modifier.evex = 0;
4250 }
7b1d7ca1 4251 else if (optimize > 1)
dd22218c
L
4252 i.tm.opcode_modifier.evex = EVEX128;
4253 else
4254 return;
b6f8c7c4 4255 }
f74a6307 4256 else if (i.tm.operand_types[0].bitfield.class == RegMask)
1424ad86
JB
4257 {
4258 i.tm.base_opcode &= 0xff;
4259 i.tm.opcode_modifier.vexw = VEXW0;
4260 }
b6f8c7c4
L
4261 else
4262 i.tm.opcode_modifier.vex = VEX128;
4263
4264 if (i.tm.opcode_modifier.vex)
4265 for (j = 0; j < 3; j++)
4266 {
4267 i.types[j].bitfield.xmmword = 1;
4268 i.types[j].bitfield.ymmword = 0;
4269 }
4270 }
392a5972 4271 else if (i.vec_encoding != vex_encoding_evex
97ed31ae 4272 && !i.types[0].bitfield.zmmword
392a5972 4273 && !i.types[1].bitfield.zmmword
97ed31ae 4274 && !i.mask
a0a1771e 4275 && !i.broadcast
97ed31ae 4276 && is_evex_encoding (&i.tm)
392a5972
L
4277 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
a0a1771e
JB
4279 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280 || (i.tm.base_opcode & ~4) == 0x66db
4281 || (i.tm.base_opcode & ~4) == 0x66eb)
97ed31ae
L
4282 && i.tm.extension_opcode == None)
4283 {
4284 /* Optimize: -O1:
4285 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286 vmovdqu32 and vmovdqu64:
4287 EVEX VOP %xmmM, %xmmN
4288 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289 EVEX VOP %ymmM, %ymmN
4290 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291 EVEX VOP %xmmM, mem
4292 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293 EVEX VOP %ymmM, mem
4294 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295 EVEX VOP mem, %xmmN
4296 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4297 EVEX VOP mem, %ymmN
4298 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
a0a1771e
JB
4299 VOP, one of vpand, vpandn, vpor, vpxor:
4300 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304 EVEX VOP{d,q} mem, %xmmM, %xmmN
4305 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP{d,q} mem, %ymmM, %ymmN
4307 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
97ed31ae 4308 */
a0a1771e 4309 for (j = 0; j < i.operands; j++)
392a5972
L
4310 if (operand_type_check (i.types[j], disp)
4311 && i.op[j].disps->X_op == O_constant)
4312 {
4313 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315 bytes, we choose EVEX Disp8 over VEX Disp32. */
4316 int evex_disp8, vex_disp8;
4317 unsigned int memshift = i.memshift;
4318 offsetT n = i.op[j].disps->X_add_number;
4319
4320 evex_disp8 = fits_in_disp8 (n);
4321 i.memshift = 0;
4322 vex_disp8 = fits_in_disp8 (n);
4323 if (evex_disp8 != vex_disp8)
4324 {
4325 i.memshift = memshift;
4326 return;
4327 }
4328
4329 i.types[j].bitfield.disp8 = vex_disp8;
4330 break;
4331 }
4332 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
97ed31ae
L
4334 i.tm.opcode_modifier.vex
4335 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336 i.tm.opcode_modifier.vexw = VEXW0;
79dec6b7
JB
4337 /* VPAND, VPOR, and VPXOR are commutative. */
4338 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339 i.tm.opcode_modifier.commutative = 1;
97ed31ae
L
4340 i.tm.opcode_modifier.evex = 0;
4341 i.tm.opcode_modifier.masking = 0;
a0a1771e 4342 i.tm.opcode_modifier.broadcast = 0;
97ed31ae
L
4343 i.tm.opcode_modifier.disp8memshift = 0;
4344 i.memshift = 0;
a0a1771e
JB
4345 if (j < i.operands)
4346 i.types[j].bitfield.disp8
4347 = fits_in_disp8 (i.op[j].disps->X_add_number);
97ed31ae 4348 }
b6f8c7c4
L
4349}
4350
ae531041
L
4351/* Return non-zero for load instruction. */
4352
4353static int
4354load_insn_p (void)
4355{
4356 unsigned int dest;
4357 int any_vex_p = is_any_vex_encoding (&i.tm);
4358 unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360 if (!any_vex_p)
4361 {
a09f656b 4362 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363 prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4364 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4365 if (i.tm.opcode_modifier.anysize)
ae531041
L
4366 return 0;
4367
a09f656b 4368 /* pop, popf, popa. */
4369 if (strcmp (i.tm.name, "pop") == 0
4370 || i.tm.base_opcode == 0x9d
4371 || i.tm.base_opcode == 0x61)
ae531041
L
4372 return 1;
4373
4374 /* movs, cmps, lods, scas. */
4375 if ((i.tm.base_opcode | 0xb) == 0xaf)
4376 return 1;
4377
a09f656b 4378 /* outs, xlatb. */
4379 if (base_opcode == 0x6f
4380 || i.tm.base_opcode == 0xd7)
ae531041 4381 return 1;
a09f656b 4382 /* NB: For AMD-specific insns with implicit memory operands,
4383 they're intentionally not covered. */
ae531041
L
4384 }
4385
4386 /* No memory operand. */
4387 if (!i.mem_operands)
4388 return 0;
4389
4390 if (any_vex_p)
4391 {
4392 /* vldmxcsr. */
4393 if (i.tm.base_opcode == 0xae
4394 && i.tm.opcode_modifier.vex
4395 && i.tm.opcode_modifier.vexopcode == VEX0F
4396 && i.tm.extension_opcode == 2)
4397 return 1;
4398 }
4399 else
4400 {
4401 /* test, not, neg, mul, imul, div, idiv. */
4402 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403 && i.tm.extension_opcode != 1)
4404 return 1;
4405
4406 /* inc, dec. */
4407 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408 return 1;
4409
4410 /* add, or, adc, sbb, and, sub, xor, cmp. */
4411 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412 return 1;
4413
4414 /* bt, bts, btr, btc. */
4415 if (i.tm.base_opcode == 0xfba
4416 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417 return 1;
4418
4419 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420 if ((base_opcode == 0xc1
4421 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422 && i.tm.extension_opcode != 6)
4423 return 1;
4424
4425 /* cmpxchg8b, cmpxchg16b, xrstors. */
4426 if (i.tm.base_opcode == 0xfc7
4427 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428 return 1;
4429
4430 /* fxrstor, ldmxcsr, xrstor. */
4431 if (i.tm.base_opcode == 0xfae
4432 && (i.tm.extension_opcode == 1
4433 || i.tm.extension_opcode == 2
4434 || i.tm.extension_opcode == 5))
4435 return 1;
4436
4437 /* lgdt, lidt, lmsw. */
4438 if (i.tm.base_opcode == 0xf01
4439 && (i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 6))
4442 return 1;
4443
4444 /* vmptrld */
4445 if (i.tm.base_opcode == 0xfc7
4446 && i.tm.extension_opcode == 6)
4447 return 1;
4448
4449 /* Check for x87 instructions. */
4450 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451 {
4452 /* Skip fst, fstp, fstenv, fstcw. */
4453 if (i.tm.base_opcode == 0xd9
4454 && (i.tm.extension_opcode == 2
4455 || i.tm.extension_opcode == 3
4456 || i.tm.extension_opcode == 6
4457 || i.tm.extension_opcode == 7))
4458 return 0;
4459
4460 /* Skip fisttp, fist, fistp, fstp. */
4461 if (i.tm.base_opcode == 0xdb
4462 && (i.tm.extension_opcode == 1
4463 || i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 7))
4466 return 0;
4467
4468 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4469 if (i.tm.base_opcode == 0xdd
4470 && (i.tm.extension_opcode == 1
4471 || i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4478 if (i.tm.base_opcode == 0xdf
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 return 1;
4487 }
4488 }
4489
4490 dest = i.operands - 1;
4491
4492 /* Check fake imm8 operand and 3 source operands. */
4493 if ((i.tm.opcode_modifier.immext
4494 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495 && i.types[dest].bitfield.imm8)
4496 dest--;
4497
4498 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4499 if (!any_vex_p
4500 && (base_opcode == 0x1
4501 || base_opcode == 0x9
4502 || base_opcode == 0x11
4503 || base_opcode == 0x19
4504 || base_opcode == 0x21
4505 || base_opcode == 0x29
4506 || base_opcode == 0x31
4507 || base_opcode == 0x39
4508 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509 || base_opcode == 0xfc1))
4510 return 1;
4511
4512 /* Check for load instruction. */
4513 return (i.types[dest].bitfield.class != ClassNone
4514 || i.types[dest].bitfield.instance == Accum);
4515}
4516
4517/* Output lfence, 0xfaee8, after instruction. */
4518
4519static void
4520insert_lfence_after (void)
4521{
4522 if (lfence_after_load && load_insn_p ())
4523 {
a09f656b 4524 /* There are also two REP string instructions that require
4525 special treatment. Specifically, the compare string (CMPS)
4526 and scan string (SCAS) instructions set EFLAGS in a manner
4527 that depends on the data being compared/scanned. When used
4528 with a REP prefix, the number of iterations may therefore
4529 vary depending on this data. If the data is a program secret
4530 chosen by the adversary using an LVI method,
4531 then this data-dependent behavior may leak some aspect
4532 of the secret. */
4533 if (((i.tm.base_opcode | 0x1) == 0xa7
4534 || (i.tm.base_opcode | 0x1) == 0xaf)
4535 && i.prefix[REP_PREFIX])
4536 {
4537 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538 i.tm.name);
4539 }
ae531041
L
4540 char *p = frag_more (3);
4541 *p++ = 0xf;
4542 *p++ = 0xae;
4543 *p = 0xe8;
4544 }
4545}
4546
4547/* Output lfence, 0xfaee8, before instruction. */
4548
4549static void
4550insert_lfence_before (void)
4551{
4552 char *p;
4553
4554 if (is_any_vex_encoding (&i.tm))
4555 return;
4556
4557 if (i.tm.base_opcode == 0xff
4558 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559 {
4560 /* Insert lfence before indirect branch if needed. */
4561
4562 if (lfence_before_indirect_branch == lfence_branch_none)
4563 return;
4564
4565 if (i.operands != 1)
4566 abort ();
4567
4568 if (i.reg_operands == 1)
4569 {
4570 /* Indirect branch via register. Don't insert lfence with
4571 -mlfence-after-load=yes. */
4572 if (lfence_after_load
4573 || lfence_before_indirect_branch == lfence_branch_memory)
4574 return;
4575 }
4576 else if (i.mem_operands == 1
4577 && lfence_before_indirect_branch != lfence_branch_register)
4578 {
4579 as_warn (_("indirect `%s` with memory operand should be avoided"),
4580 i.tm.name);
4581 return;
4582 }
4583 else
4584 return;
4585
4586 if (last_insn.kind != last_insn_other
4587 && last_insn.seg == now_seg)
4588 {
4589 as_warn_where (last_insn.file, last_insn.line,
4590 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591 last_insn.name, i.tm.name);
4592 return;
4593 }
4594
4595 p = frag_more (3);
4596 *p++ = 0xf;
4597 *p++ = 0xae;
4598 *p = 0xe8;
4599 return;
4600 }
4601
503648e4 4602 /* Output or/not/shl and lfence before near ret. */
ae531041
L
4603 if (lfence_before_ret != lfence_before_ret_none
4604 && (i.tm.base_opcode == 0xc2
503648e4 4605 || i.tm.base_opcode == 0xc3))
ae531041
L
4606 {
4607 if (last_insn.kind != last_insn_other
4608 && last_insn.seg == now_seg)
4609 {
4610 as_warn_where (last_insn.file, last_insn.line,
4611 _("`%s` skips -mlfence-before-ret on `%s`"),
4612 last_insn.name, i.tm.name);
4613 return;
4614 }
a09f656b 4615
a09f656b 4616 /* Near ret ingore operand size override under CPU64. */
503648e4 4617 char prefix = flag_code == CODE_64BIT
4618 ? 0x48
4619 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
a09f656b 4620
4621 if (lfence_before_ret == lfence_before_ret_not)
4622 {
4623 /* not: 0xf71424, may add prefix
4624 for operand size override or 64-bit code. */
4625 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626 if (prefix)
4627 *p++ = prefix;
ae531041
L
4628 *p++ = 0xf7;
4629 *p++ = 0x14;
4630 *p++ = 0x24;
a09f656b 4631 if (prefix)
4632 *p++ = prefix;
ae531041
L
4633 *p++ = 0xf7;
4634 *p++ = 0x14;
4635 *p++ = 0x24;
4636 }
a09f656b 4637 else
4638 {
4639 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640 if (prefix)
4641 *p++ = prefix;
4642 if (lfence_before_ret == lfence_before_ret_or)
4643 {
4644 /* or: 0x830c2400, may add prefix
4645 for operand size override or 64-bit code. */
4646 *p++ = 0x83;
4647 *p++ = 0x0c;
4648 }
4649 else
4650 {
4651 /* shl: 0xc1242400, may add prefix
4652 for operand size override or 64-bit code. */
4653 *p++ = 0xc1;
4654 *p++ = 0x24;
4655 }
4656
4657 *p++ = 0x24;
4658 *p++ = 0x0;
4659 }
4660
ae531041
L
4661 *p++ = 0xf;
4662 *p++ = 0xae;
4663 *p = 0xe8;
4664 }
4665}
4666
252b5132
RH
4667/* This is the guts of the machine-dependent assembler. LINE points to a
4668 machine dependent instruction. This function is supposed to emit
4669 the frags/bytes it assembles to. */
4670
4671void
65da13b5 4672md_assemble (char *line)
252b5132 4673{
40fb9820 4674 unsigned int j;
83b16ac6 4675 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
d3ce72d0 4676 const insn_template *t;
252b5132 4677
47926f60 4678 /* Initialize globals. */
252b5132
RH
4679 memset (&i, '\0', sizeof (i));
4680 for (j = 0; j < MAX_OPERANDS; j++)
1ae12ab7 4681 i.reloc[j] = NO_RELOC;
252b5132
RH
4682 memset (disp_expressions, '\0', sizeof (disp_expressions));
4683 memset (im_expressions, '\0', sizeof (im_expressions));
ce8a8b2f 4684 save_stack_p = save_stack;
252b5132
RH
4685
4686 /* First parse an instruction mnemonic & call i386_operand for the operands.
4687 We assume that the scrubber has arranged it so that line[0] is the valid
47926f60 4688 start of a (possibly prefixed) mnemonic. */
252b5132 4689
29b0f896
AM
4690 line = parse_insn (line, mnemonic);
4691 if (line == NULL)
4692 return;
83b16ac6 4693 mnem_suffix = i.suffix;
252b5132 4694
29b0f896 4695 line = parse_operands (line, mnemonic);
ee86248c 4696 this_operand = -1;
8325cc63
JB
4697 xfree (i.memop1_string);
4698 i.memop1_string = NULL;
29b0f896
AM
4699 if (line == NULL)
4700 return;
252b5132 4701
29b0f896
AM
4702 /* Now we've parsed the mnemonic into a set of templates, and have the
4703 operands at hand. */
4704
b630c145
JB
4705 /* All Intel opcodes have reversed operands except for "bound", "enter",
4706 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4707 intersegment "jmp" and "call" instructions with 2 immediate operands so
4708 that the immediate segment precedes the offset, as it does when in AT&T
4709 mode. */
4d456e3d
L
4710 if (intel_syntax
4711 && i.operands > 1
29b0f896 4712 && (strcmp (mnemonic, "bound") != 0)
30123838 4713 && (strcmp (mnemonic, "invlpga") != 0)
eedb0f2c
JB
4714 && (strncmp (mnemonic, "monitor", 7) != 0)
4715 && (strncmp (mnemonic, "mwait", 5) != 0)
b630c145
JB
4716 && (strcmp (mnemonic, "tpause") != 0)
4717 && (strcmp (mnemonic, "umwait") != 0)
40fb9820
L
4718 && !(operand_type_check (i.types[0], imm)
4719 && operand_type_check (i.types[1], imm)))
29b0f896
AM
4720 swap_operands ();
4721
ec56d5c0
JB
4722 /* The order of the immediates should be reversed
4723 for 2 immediates extrq and insertq instructions */
4724 if (i.imm_operands == 2
4725 && (strcmp (mnemonic, "extrq") == 0
4726 || strcmp (mnemonic, "insertq") == 0))
4727 swap_2_operands (0, 1);
4728
29b0f896
AM
4729 if (i.imm_operands)
4730 optimize_imm ();
4731
b300c311
L
4732 /* Don't optimize displacement for movabs since it only takes 64bit
4733 displacement. */
4734 if (i.disp_operands
a501d77e 4735 && i.disp_encoding != disp_encoding_32bit
862be3fb
L
4736 && (flag_code != CODE_64BIT
4737 || strcmp (mnemonic, "movabs") != 0))
4738 optimize_disp ();
29b0f896
AM
4739
4740 /* Next, we find a template that matches the given insn,
4741 making sure the overlap of the given operands types is consistent
4742 with the template operand types. */
252b5132 4743
83b16ac6 4744 if (!(t = match_template (mnem_suffix)))
29b0f896 4745 return;
252b5132 4746
7bab8ab5 4747 if (sse_check != check_none
81f8a913 4748 && !i.tm.opcode_modifier.noavx
6e3e5c9e 4749 && !i.tm.cpu_flags.bitfield.cpuavx
569d50f1 4750 && !i.tm.cpu_flags.bitfield.cpuavx512f
daf50ae7
L
4751 && (i.tm.cpu_flags.bitfield.cpusse
4752 || i.tm.cpu_flags.bitfield.cpusse2
4753 || i.tm.cpu_flags.bitfield.cpusse3
4754 || i.tm.cpu_flags.bitfield.cpussse3
4755 || i.tm.cpu_flags.bitfield.cpusse4_1
6e3e5c9e
JB
4756 || i.tm.cpu_flags.bitfield.cpusse4_2
4757 || i.tm.cpu_flags.bitfield.cpupclmul
4758 || i.tm.cpu_flags.bitfield.cpuaes
569d50f1 4759 || i.tm.cpu_flags.bitfield.cpusha
6e3e5c9e 4760 || i.tm.cpu_flags.bitfield.cpugfni))
daf50ae7 4761 {
7bab8ab5 4762 (sse_check == check_warning
daf50ae7
L
4763 ? as_warn
4764 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765 }
4766
40fb9820 4767 if (i.tm.opcode_modifier.fwait)
29b0f896
AM
4768 if (!add_prefix (FWAIT_OPCODE))
4769 return;
252b5132 4770
d5de92cf
L
4771 /* Check if REP prefix is OK. */
4772 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773 {
4774 as_bad (_("invalid instruction `%s' after `%s'"),
4775 i.tm.name, i.rep_prefix);
4776 return;
4777 }
4778
c1ba0266
L
4779 /* Check for lock without a lockable instruction. Destination operand
4780 must be memory unless it is xchg (0x86). */
c32fa91d
L
4781 if (i.prefix[LOCK_PREFIX]
4782 && (!i.tm.opcode_modifier.islockable
c1ba0266
L
4783 || i.mem_operands == 0
4784 || (i.tm.base_opcode != 0x86
8dc0818e 4785 && !(i.flags[i.operands - 1] & Operand_Mem))))
c32fa91d
L
4786 {
4787 as_bad (_("expecting lockable instruction after `lock'"));
4788 return;
4789 }
4790
40d231b4
JB
4791 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4792 if (i.prefix[DATA_PREFIX]
4793 && (is_any_vex_encoding (&i.tm)
4794 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
7a8655d2
JB
4796 {
4797 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798 return;
4799 }
4800
42164a71 4801 /* Check if HLE prefix is OK. */
165de32a 4802 if (i.hle_prefix && !check_hle ())
42164a71
L
4803 return;
4804
7e8b059b
L
4805 /* Check BND prefix. */
4806 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807 as_bad (_("expecting valid branch instruction after `bnd'"));
4808
04ef582a 4809 /* Check NOTRACK prefix. */
9fef80d6
L
4810 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811 as_bad (_("expecting indirect branch instruction after `notrack'"));
04ef582a 4812
327e8c42
JB
4813 if (i.tm.cpu_flags.bitfield.cpumpx)
4814 {
4815 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817 else if (flag_code != CODE_16BIT
4818 ? i.prefix[ADDR_PREFIX]
4819 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821 }
7e8b059b
L
4822
4823 /* Insert BND prefix. */
76d3a78a
JB
4824 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825 {
4826 if (!i.prefix[BND_PREFIX])
4827 add_prefix (BND_PREFIX_OPCODE);
4828 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829 {
4830 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832 }
4833 }
7e8b059b 4834
29b0f896 4835 /* Check string instruction segment overrides. */
51c8edf6 4836 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
29b0f896 4837 {
51c8edf6 4838 gas_assert (i.mem_operands);
29b0f896 4839 if (!check_string ())
5dd0794d 4840 return;
fc0763e6 4841 i.disp_operands = 0;
29b0f896 4842 }
5dd0794d 4843
b6f8c7c4
L
4844 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845 optimize_encoding ();
4846
29b0f896
AM
4847 if (!process_suffix ())
4848 return;
e413e4e9 4849
bc0844ae
L
4850 /* Update operand types. */
4851 for (j = 0; j < i.operands; j++)
4852 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853
29b0f896
AM
4854 /* Make still unresolved immediate matches conform to size of immediate
4855 given in i.suffix. */
4856 if (!finalize_imm ())
4857 return;
252b5132 4858
40fb9820 4859 if (i.types[0].bitfield.imm1)
29b0f896 4860 i.imm_operands = 0; /* kludge for shift insns. */
252b5132 4861
9afe6eb8
L
4862 /* We only need to check those implicit registers for instructions
4863 with 3 operands or less. */
4864 if (i.operands <= 3)
4865 for (j = 0; j < i.operands; j++)
75e5731b
JB
4866 if (i.types[j].bitfield.instance != InstanceNone
4867 && !i.types[j].bitfield.xmmword)
9afe6eb8 4868 i.reg_operands--;
40fb9820 4869
29b0f896
AM
4870 /* For insns with operands there are more diddles to do to the opcode. */
4871 if (i.operands)
4872 {
4873 if (!process_operands ())
4874 return;
4875 }
8c190ce0 4876 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
29b0f896
AM
4877 {
4878 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4879 as_warn (_("translating to `%sp'"), i.tm.name);
4880 }
252b5132 4881
7a8655d2 4882 if (is_any_vex_encoding (&i.tm))
9e5e5283 4883 {
c1dc7af5 4884 if (!cpu_arch_flags.bitfield.cpui286)
9e5e5283 4885 {
c1dc7af5 4886 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
9e5e5283
L
4887 i.tm.name);
4888 return;
4889 }
c0f3af97 4890
0b9404fd
JB
4891 /* Check for explicit REX prefix. */
4892 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4893 {
4894 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4895 return;
4896 }
4897
9e5e5283
L
4898 if (i.tm.opcode_modifier.vex)
4899 build_vex_prefix (t);
4900 else
4901 build_evex_prefix ();
0b9404fd
JB
4902
4903 /* The individual REX.RXBW bits got consumed. */
4904 i.rex &= REX_OPCODE;
9e5e5283 4905 }
43234a1e 4906
5dd85c99
SP
4907 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4908 instructions may define INT_OPCODE as well, so avoid this corner
4909 case for those instructions that use MODRM. */
4910 if (i.tm.base_opcode == INT_OPCODE
a6461c02
SP
4911 && !i.tm.opcode_modifier.modrm
4912 && i.op[0].imms->X_add_number == 3)
29b0f896
AM
4913 {
4914 i.tm.base_opcode = INT3_OPCODE;
4915 i.imm_operands = 0;
4916 }
252b5132 4917
0cfa3eb3
JB
4918 if ((i.tm.opcode_modifier.jump == JUMP
4919 || i.tm.opcode_modifier.jump == JUMP_BYTE
4920 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896
AM
4921 && i.op[0].disps->X_op == O_constant)
4922 {
4923 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4924 the absolute address given by the constant. Since ix86 jumps and
4925 calls are pc relative, we need to generate a reloc. */
4926 i.op[0].disps->X_add_symbol = &abs_symbol;
4927 i.op[0].disps->X_op = O_symbol;
4928 }
252b5132 4929
29b0f896
AM
4930 /* For 8 bit registers we need an empty rex prefix. Also if the
4931 instruction already has a prefix, we need to convert old
4932 registers to new ones. */
773f551c 4933
bab6aec1 4934 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
29b0f896 4935 && (i.op[0].regs->reg_flags & RegRex64) != 0)
bab6aec1 4936 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
29b0f896 4937 && (i.op[1].regs->reg_flags & RegRex64) != 0)
bab6aec1
JB
4938 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4939 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
29b0f896
AM
4940 && i.rex != 0))
4941 {
4942 int x;
726c5dcd 4943
29b0f896
AM
4944 i.rex |= REX_OPCODE;
4945 for (x = 0; x < 2; x++)
4946 {
4947 /* Look for 8 bit operand that uses old registers. */
bab6aec1 4948 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
29b0f896 4949 && (i.op[x].regs->reg_flags & RegRex64) == 0)
773f551c 4950 {
3f93af61 4951 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
29b0f896
AM
4952 /* In case it is "hi" register, give up. */
4953 if (i.op[x].regs->reg_num > 3)
a540244d 4954 as_bad (_("can't encode register '%s%s' in an "
4eed87de 4955 "instruction requiring REX prefix."),
a540244d 4956 register_prefix, i.op[x].regs->reg_name);
773f551c 4957
29b0f896
AM
4958 /* Otherwise it is equivalent to the extended register.
4959 Since the encoding doesn't change this is merely
4960 cosmetic cleanup for debug output. */
4961
4962 i.op[x].regs = i.op[x].regs + 8;
773f551c 4963 }
29b0f896
AM
4964 }
4965 }
773f551c 4966
6b6b6807
L
4967 if (i.rex == 0 && i.rex_encoding)
4968 {
4969 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
3f93af61 4970 that uses legacy register. If it is "hi" register, don't add
6b6b6807
L
4971 the REX_OPCODE byte. */
4972 int x;
4973 for (x = 0; x < 2; x++)
bab6aec1 4974 if (i.types[x].bitfield.class == Reg
6b6b6807
L
4975 && i.types[x].bitfield.byte
4976 && (i.op[x].regs->reg_flags & RegRex64) == 0
4977 && i.op[x].regs->reg_num > 3)
4978 {
3f93af61 4979 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
6b6b6807
L
4980 i.rex_encoding = FALSE;
4981 break;
4982 }
4983
4984 if (i.rex_encoding)
4985 i.rex = REX_OPCODE;
4986 }
4987
7ab9ffdd 4988 if (i.rex != 0)
29b0f896
AM
4989 add_prefix (REX_OPCODE | i.rex);
4990
ae531041
L
4991 insert_lfence_before ();
4992
29b0f896
AM
4993 /* We are ready to output the insn. */
4994 output_insn ();
e379e5f3 4995
ae531041
L
4996 insert_lfence_after ();
4997
e379e5f3
L
4998 last_insn.seg = now_seg;
4999
5000 if (i.tm.opcode_modifier.isprefix)
5001 {
5002 last_insn.kind = last_insn_prefix;
5003 last_insn.name = i.tm.name;
5004 last_insn.file = as_where (&last_insn.line);
5005 }
5006 else
5007 last_insn.kind = last_insn_other;
29b0f896
AM
5008}
5009
5010static char *
e3bb37b5 5011parse_insn (char *line, char *mnemonic)
29b0f896
AM
5012{
5013 char *l = line;
5014 char *token_start = l;
5015 char *mnem_p;
5c6af06e 5016 int supported;
d3ce72d0 5017 const insn_template *t;
b6169b20 5018 char *dot_p = NULL;
29b0f896 5019
29b0f896
AM
5020 while (1)
5021 {
5022 mnem_p = mnemonic;
5023 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5024 {
b6169b20
L
5025 if (*mnem_p == '.')
5026 dot_p = mnem_p;
29b0f896
AM
5027 mnem_p++;
5028 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
45288df1 5029 {
29b0f896
AM
5030 as_bad (_("no such instruction: `%s'"), token_start);
5031 return NULL;
5032 }
5033 l++;
5034 }
5035 if (!is_space_char (*l)
5036 && *l != END_OF_INSN
e44823cf
JB
5037 && (intel_syntax
5038 || (*l != PREFIX_SEPARATOR
5039 && *l != ',')))
29b0f896
AM
5040 {
5041 as_bad (_("invalid character %s in mnemonic"),
5042 output_invalid (*l));
5043 return NULL;
5044 }
5045 if (token_start == l)
5046 {
e44823cf 5047 if (!intel_syntax && *l == PREFIX_SEPARATOR)
29b0f896
AM
5048 as_bad (_("expecting prefix; got nothing"));
5049 else
5050 as_bad (_("expecting mnemonic; got nothing"));
5051 return NULL;
5052 }
45288df1 5053
29b0f896 5054 /* Look up instruction (or prefix) via hash table. */
d3ce72d0 5055 current_templates = (const templates *) hash_find (op_hash, mnemonic);
47926f60 5056
29b0f896
AM
5057 if (*l != END_OF_INSN
5058 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5059 && current_templates
40fb9820 5060 && current_templates->start->opcode_modifier.isprefix)
29b0f896 5061 {
c6fb90c8 5062 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
2dd88dca
JB
5063 {
5064 as_bad ((flag_code != CODE_64BIT
5065 ? _("`%s' is only supported in 64-bit mode")
5066 : _("`%s' is not supported in 64-bit mode")),
5067 current_templates->start->name);
5068 return NULL;
5069 }
29b0f896
AM
5070 /* If we are in 16-bit mode, do not allow addr16 or data16.
5071 Similarly, in 32-bit mode, do not allow addr32 or data32. */
673fe0f0
JB
5072 if ((current_templates->start->opcode_modifier.size == SIZE16
5073 || current_templates->start->opcode_modifier.size == SIZE32)
29b0f896 5074 && flag_code != CODE_64BIT
673fe0f0 5075 && ((current_templates->start->opcode_modifier.size == SIZE32)
29b0f896
AM
5076 ^ (flag_code == CODE_16BIT)))
5077 {
5078 as_bad (_("redundant %s prefix"),
5079 current_templates->start->name);
5080 return NULL;
45288df1 5081 }
86fa6981 5082 if (current_templates->start->opcode_length == 0)
29b0f896 5083 {
86fa6981
L
5084 /* Handle pseudo prefixes. */
5085 switch (current_templates->start->base_opcode)
5086 {
5087 case 0x0:
5088 /* {disp8} */
5089 i.disp_encoding = disp_encoding_8bit;
5090 break;
5091 case 0x1:
5092 /* {disp32} */
5093 i.disp_encoding = disp_encoding_32bit;
5094 break;
5095 case 0x2:
5096 /* {load} */
5097 i.dir_encoding = dir_encoding_load;
5098 break;
5099 case 0x3:
5100 /* {store} */
5101 i.dir_encoding = dir_encoding_store;
5102 break;
5103 case 0x4:
42e04b36
L
5104 /* {vex} */
5105 i.vec_encoding = vex_encoding_vex;
86fa6981
L
5106 break;
5107 case 0x5:
5108 /* {vex3} */
5109 i.vec_encoding = vex_encoding_vex3;
5110 break;
5111 case 0x6:
5112 /* {evex} */
5113 i.vec_encoding = vex_encoding_evex;
5114 break;
6b6b6807
L
5115 case 0x7:
5116 /* {rex} */
5117 i.rex_encoding = TRUE;
5118 break;
b6f8c7c4
L
5119 case 0x8:
5120 /* {nooptimize} */
5121 i.no_optimize = TRUE;
5122 break;
86fa6981
L
5123 default:
5124 abort ();
5125 }
5126 }
5127 else
5128 {
5129 /* Add prefix, checking for repeated prefixes. */
4e9ac44a 5130 switch (add_prefix (current_templates->start->base_opcode))
86fa6981 5131 {
4e9ac44a
L
5132 case PREFIX_EXIST:
5133 return NULL;
5134 case PREFIX_DS:
d777820b 5135 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4e9ac44a
L
5136 i.notrack_prefix = current_templates->start->name;
5137 break;
5138 case PREFIX_REP:
5139 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5140 i.hle_prefix = current_templates->start->name;
5141 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5142 i.bnd_prefix = current_templates->start->name;
5143 else
5144 i.rep_prefix = current_templates->start->name;
5145 break;
5146 default:
5147 break;
86fa6981 5148 }
29b0f896
AM
5149 }
5150 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5151 token_start = ++l;
5152 }
5153 else
5154 break;
5155 }
45288df1 5156
30a55f88 5157 if (!current_templates)
b6169b20 5158 {
07d5e953
JB
5159 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5160 Check if we should swap operand or force 32bit displacement in
f8a5c266 5161 encoding. */
30a55f88 5162 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
64c49ab3 5163 i.dir_encoding = dir_encoding_swap;
8d63c93e 5164 else if (mnem_p - 3 == dot_p
a501d77e
L
5165 && dot_p[1] == 'd'
5166 && dot_p[2] == '8')
5167 i.disp_encoding = disp_encoding_8bit;
8d63c93e 5168 else if (mnem_p - 4 == dot_p
f8a5c266
L
5169 && dot_p[1] == 'd'
5170 && dot_p[2] == '3'
5171 && dot_p[3] == '2')
a501d77e 5172 i.disp_encoding = disp_encoding_32bit;
30a55f88
L
5173 else
5174 goto check_suffix;
5175 mnem_p = dot_p;
5176 *dot_p = '\0';
d3ce72d0 5177 current_templates = (const templates *) hash_find (op_hash, mnemonic);
b6169b20
L
5178 }
5179
29b0f896
AM
5180 if (!current_templates)
5181 {
dc1e8a47 5182 check_suffix:
1c529385 5183 if (mnem_p > mnemonic)
29b0f896 5184 {
1c529385
LH
5185 /* See if we can get a match by trimming off a suffix. */
5186 switch (mnem_p[-1])
29b0f896 5187 {
1c529385
LH
5188 case WORD_MNEM_SUFFIX:
5189 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
29b0f896
AM
5190 i.suffix = SHORT_MNEM_SUFFIX;
5191 else
1c529385
LH
5192 /* Fall through. */
5193 case BYTE_MNEM_SUFFIX:
5194 case QWORD_MNEM_SUFFIX:
5195 i.suffix = mnem_p[-1];
29b0f896 5196 mnem_p[-1] = '\0';
d3ce72d0 5197 current_templates = (const templates *) hash_find (op_hash,
1c529385
LH
5198 mnemonic);
5199 break;
5200 case SHORT_MNEM_SUFFIX:
5201 case LONG_MNEM_SUFFIX:
5202 if (!intel_syntax)
5203 {
5204 i.suffix = mnem_p[-1];
5205 mnem_p[-1] = '\0';
5206 current_templates = (const templates *) hash_find (op_hash,
5207 mnemonic);
5208 }
5209 break;
5210
5211 /* Intel Syntax. */
5212 case 'd':
5213 if (intel_syntax)
5214 {
5215 if (intel_float_operand (mnemonic) == 1)
5216 i.suffix = SHORT_MNEM_SUFFIX;
5217 else
5218 i.suffix = LONG_MNEM_SUFFIX;
5219 mnem_p[-1] = '\0';
5220 current_templates = (const templates *) hash_find (op_hash,
5221 mnemonic);
5222 }
5223 break;
29b0f896 5224 }
29b0f896 5225 }
1c529385 5226
29b0f896
AM
5227 if (!current_templates)
5228 {
5229 as_bad (_("no such instruction: `%s'"), token_start);
5230 return NULL;
5231 }
5232 }
252b5132 5233
0cfa3eb3
JB
5234 if (current_templates->start->opcode_modifier.jump == JUMP
5235 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
5236 {
5237 /* Check for a branch hint. We allow ",pt" and ",pn" for
5238 predict taken and predict not taken respectively.
5239 I'm not sure that branch hints actually do anything on loop
5240 and jcxz insns (JumpByte) for current Pentium4 chips. They
5241 may work in the future and it doesn't hurt to accept them
5242 now. */
5243 if (l[0] == ',' && l[1] == 'p')
5244 {
5245 if (l[2] == 't')
5246 {
5247 if (!add_prefix (DS_PREFIX_OPCODE))
5248 return NULL;
5249 l += 3;
5250 }
5251 else if (l[2] == 'n')
5252 {
5253 if (!add_prefix (CS_PREFIX_OPCODE))
5254 return NULL;
5255 l += 3;
5256 }
5257 }
5258 }
5259 /* Any other comma loses. */
5260 if (*l == ',')
5261 {
5262 as_bad (_("invalid character %s in mnemonic"),
5263 output_invalid (*l));
5264 return NULL;
5265 }
252b5132 5266
29b0f896 5267 /* Check if instruction is supported on specified architecture. */
5c6af06e
JB
5268 supported = 0;
5269 for (t = current_templates->start; t < current_templates->end; ++t)
5270 {
c0f3af97
L
5271 supported |= cpu_flags_match (t);
5272 if (supported == CPU_FLAGS_PERFECT_MATCH)
548d0ee6
JB
5273 {
5274 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5275 as_warn (_("use .code16 to ensure correct addressing mode"));
3629bb00 5276
548d0ee6
JB
5277 return l;
5278 }
29b0f896 5279 }
3629bb00 5280
548d0ee6
JB
5281 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5282 as_bad (flag_code == CODE_64BIT
5283 ? _("`%s' is not supported in 64-bit mode")
5284 : _("`%s' is only supported in 64-bit mode"),
5285 current_templates->start->name);
5286 else
5287 as_bad (_("`%s' is not supported on `%s%s'"),
5288 current_templates->start->name,
5289 cpu_arch_name ? cpu_arch_name : default_arch,
5290 cpu_sub_arch_name ? cpu_sub_arch_name : "");
252b5132 5291
548d0ee6 5292 return NULL;
29b0f896 5293}
252b5132 5294
29b0f896 5295static char *
e3bb37b5 5296parse_operands (char *l, const char *mnemonic)
29b0f896
AM
5297{
5298 char *token_start;
3138f287 5299
29b0f896
AM
5300 /* 1 if operand is pending after ','. */
5301 unsigned int expecting_operand = 0;
252b5132 5302
29b0f896
AM
5303 /* Non-zero if operand parens not balanced. */
5304 unsigned int paren_not_balanced;
5305
5306 while (*l != END_OF_INSN)
5307 {
5308 /* Skip optional white space before operand. */
5309 if (is_space_char (*l))
5310 ++l;
d02603dc 5311 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
29b0f896
AM
5312 {
5313 as_bad (_("invalid character %s before operand %d"),
5314 output_invalid (*l),
5315 i.operands + 1);
5316 return NULL;
5317 }
d02603dc 5318 token_start = l; /* After white space. */
29b0f896
AM
5319 paren_not_balanced = 0;
5320 while (paren_not_balanced || *l != ',')
5321 {
5322 if (*l == END_OF_INSN)
5323 {
5324 if (paren_not_balanced)
5325 {
5326 if (!intel_syntax)
5327 as_bad (_("unbalanced parenthesis in operand %d."),
5328 i.operands + 1);
5329 else
5330 as_bad (_("unbalanced brackets in operand %d."),
5331 i.operands + 1);
5332 return NULL;
5333 }
5334 else
5335 break; /* we are done */
5336 }
d02603dc 5337 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
29b0f896
AM
5338 {
5339 as_bad (_("invalid character %s in operand %d"),
5340 output_invalid (*l),
5341 i.operands + 1);
5342 return NULL;
5343 }
5344 if (!intel_syntax)
5345 {
5346 if (*l == '(')
5347 ++paren_not_balanced;
5348 if (*l == ')')
5349 --paren_not_balanced;
5350 }
5351 else
5352 {
5353 if (*l == '[')
5354 ++paren_not_balanced;
5355 if (*l == ']')
5356 --paren_not_balanced;
5357 }
5358 l++;
5359 }
5360 if (l != token_start)
5361 { /* Yes, we've read in another operand. */
5362 unsigned int operand_ok;
5363 this_operand = i.operands++;
5364 if (i.operands > MAX_OPERANDS)
5365 {
5366 as_bad (_("spurious operands; (%d operands/instruction max)"),
5367 MAX_OPERANDS);
5368 return NULL;
5369 }
9d46ce34 5370 i.types[this_operand].bitfield.unspecified = 1;
29b0f896
AM
5371 /* Now parse operand adding info to 'i' as we go along. */
5372 END_STRING_AND_SAVE (l);
5373
1286ab78
L
5374 if (i.mem_operands > 1)
5375 {
5376 as_bad (_("too many memory references for `%s'"),
5377 mnemonic);
5378 return 0;
5379 }
5380
29b0f896
AM
5381 if (intel_syntax)
5382 operand_ok =
5383 i386_intel_operand (token_start,
5384 intel_float_operand (mnemonic));
5385 else
a7619375 5386 operand_ok = i386_att_operand (token_start);
29b0f896
AM
5387
5388 RESTORE_END_STRING (l);
5389 if (!operand_ok)
5390 return NULL;
5391 }
5392 else
5393 {
5394 if (expecting_operand)
5395 {
5396 expecting_operand_after_comma:
5397 as_bad (_("expecting operand after ','; got nothing"));
5398 return NULL;
5399 }
5400 if (*l == ',')
5401 {
5402 as_bad (_("expecting operand before ','; got nothing"));
5403 return NULL;
5404 }
5405 }
7f3f1ea2 5406
29b0f896
AM
5407 /* Now *l must be either ',' or END_OF_INSN. */
5408 if (*l == ',')
5409 {
5410 if (*++l == END_OF_INSN)
5411 {
5412 /* Just skip it, if it's \n complain. */
5413 goto expecting_operand_after_comma;
5414 }
5415 expecting_operand = 1;
5416 }
5417 }
5418 return l;
5419}
7f3f1ea2 5420
050dfa73 5421static void
4d456e3d 5422swap_2_operands (int xchg1, int xchg2)
050dfa73
MM
5423{
5424 union i386_op temp_op;
40fb9820 5425 i386_operand_type temp_type;
c48dadc9 5426 unsigned int temp_flags;
050dfa73 5427 enum bfd_reloc_code_real temp_reloc;
4eed87de 5428
050dfa73
MM
5429 temp_type = i.types[xchg2];
5430 i.types[xchg2] = i.types[xchg1];
5431 i.types[xchg1] = temp_type;
c48dadc9
JB
5432
5433 temp_flags = i.flags[xchg2];
5434 i.flags[xchg2] = i.flags[xchg1];
5435 i.flags[xchg1] = temp_flags;
5436
050dfa73
MM
5437 temp_op = i.op[xchg2];
5438 i.op[xchg2] = i.op[xchg1];
5439 i.op[xchg1] = temp_op;
c48dadc9 5440
050dfa73
MM
5441 temp_reloc = i.reloc[xchg2];
5442 i.reloc[xchg2] = i.reloc[xchg1];
5443 i.reloc[xchg1] = temp_reloc;
43234a1e
L
5444
5445 if (i.mask)
5446 {
5447 if (i.mask->operand == xchg1)
5448 i.mask->operand = xchg2;
5449 else if (i.mask->operand == xchg2)
5450 i.mask->operand = xchg1;
5451 }
5452 if (i.broadcast)
5453 {
5454 if (i.broadcast->operand == xchg1)
5455 i.broadcast->operand = xchg2;
5456 else if (i.broadcast->operand == xchg2)
5457 i.broadcast->operand = xchg1;
5458 }
5459 if (i.rounding)
5460 {
5461 if (i.rounding->operand == xchg1)
5462 i.rounding->operand = xchg2;
5463 else if (i.rounding->operand == xchg2)
5464 i.rounding->operand = xchg1;
5465 }
050dfa73
MM
5466}
5467
29b0f896 5468static void
e3bb37b5 5469swap_operands (void)
29b0f896 5470{
b7c61d9a 5471 switch (i.operands)
050dfa73 5472 {
c0f3af97 5473 case 5:
b7c61d9a 5474 case 4:
4d456e3d 5475 swap_2_operands (1, i.operands - 2);
1a0670f3 5476 /* Fall through. */
b7c61d9a
L
5477 case 3:
5478 case 2:
4d456e3d 5479 swap_2_operands (0, i.operands - 1);
b7c61d9a
L
5480 break;
5481 default:
5482 abort ();
29b0f896 5483 }
29b0f896
AM
5484
5485 if (i.mem_operands == 2)
5486 {
5487 const seg_entry *temp_seg;
5488 temp_seg = i.seg[0];
5489 i.seg[0] = i.seg[1];
5490 i.seg[1] = temp_seg;
5491 }
5492}
252b5132 5493
29b0f896
AM
5494/* Try to ensure constant immediates are represented in the smallest
5495 opcode possible. */
5496static void
e3bb37b5 5497optimize_imm (void)
29b0f896
AM
5498{
5499 char guess_suffix = 0;
5500 int op;
252b5132 5501
29b0f896
AM
5502 if (i.suffix)
5503 guess_suffix = i.suffix;
5504 else if (i.reg_operands)
5505 {
5506 /* Figure out a suffix from the last register operand specified.
75e5731b
JB
5507 We can't do this properly yet, i.e. excluding special register
5508 instances, but the following works for instructions with
5509 immediates. In any case, we can't set i.suffix yet. */
29b0f896 5510 for (op = i.operands; --op >= 0;)
bab6aec1
JB
5511 if (i.types[op].bitfield.class != Reg)
5512 continue;
5513 else if (i.types[op].bitfield.byte)
7ab9ffdd 5514 {
40fb9820
L
5515 guess_suffix = BYTE_MNEM_SUFFIX;
5516 break;
5517 }
bab6aec1 5518 else if (i.types[op].bitfield.word)
252b5132 5519 {
40fb9820
L
5520 guess_suffix = WORD_MNEM_SUFFIX;
5521 break;
5522 }
bab6aec1 5523 else if (i.types[op].bitfield.dword)
40fb9820
L
5524 {
5525 guess_suffix = LONG_MNEM_SUFFIX;
5526 break;
5527 }
bab6aec1 5528 else if (i.types[op].bitfield.qword)
40fb9820
L
5529 {
5530 guess_suffix = QWORD_MNEM_SUFFIX;
29b0f896 5531 break;
252b5132 5532 }
29b0f896
AM
5533 }
5534 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5535 guess_suffix = WORD_MNEM_SUFFIX;
5536
5537 for (op = i.operands; --op >= 0;)
40fb9820 5538 if (operand_type_check (i.types[op], imm))
29b0f896
AM
5539 {
5540 switch (i.op[op].imms->X_op)
252b5132 5541 {
29b0f896
AM
5542 case O_constant:
5543 /* If a suffix is given, this operand may be shortened. */
5544 switch (guess_suffix)
252b5132 5545 {
29b0f896 5546 case LONG_MNEM_SUFFIX:
40fb9820
L
5547 i.types[op].bitfield.imm32 = 1;
5548 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5549 break;
5550 case WORD_MNEM_SUFFIX:
40fb9820
L
5551 i.types[op].bitfield.imm16 = 1;
5552 i.types[op].bitfield.imm32 = 1;
5553 i.types[op].bitfield.imm32s = 1;
5554 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5555 break;
5556 case BYTE_MNEM_SUFFIX:
40fb9820
L
5557 i.types[op].bitfield.imm8 = 1;
5558 i.types[op].bitfield.imm8s = 1;
5559 i.types[op].bitfield.imm16 = 1;
5560 i.types[op].bitfield.imm32 = 1;
5561 i.types[op].bitfield.imm32s = 1;
5562 i.types[op].bitfield.imm64 = 1;
29b0f896 5563 break;
252b5132 5564 }
252b5132 5565
29b0f896
AM
5566 /* If this operand is at most 16 bits, convert it
5567 to a signed 16 bit number before trying to see
5568 whether it will fit in an even smaller size.
5569 This allows a 16-bit operand such as $0xffe0 to
5570 be recognised as within Imm8S range. */
40fb9820 5571 if ((i.types[op].bitfield.imm16)
29b0f896 5572 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
252b5132 5573 {
29b0f896
AM
5574 i.op[op].imms->X_add_number =
5575 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5576 }
a28def75
L
5577#ifdef BFD64
5578 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
40fb9820 5579 if ((i.types[op].bitfield.imm32)
29b0f896
AM
5580 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5581 == 0))
5582 {
5583 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5584 ^ ((offsetT) 1 << 31))
5585 - ((offsetT) 1 << 31));
5586 }
a28def75 5587#endif
40fb9820 5588 i.types[op]
c6fb90c8
L
5589 = operand_type_or (i.types[op],
5590 smallest_imm_type (i.op[op].imms->X_add_number));
252b5132 5591
29b0f896
AM
5592 /* We must avoid matching of Imm32 templates when 64bit
5593 only immediate is available. */
5594 if (guess_suffix == QWORD_MNEM_SUFFIX)
40fb9820 5595 i.types[op].bitfield.imm32 = 0;
29b0f896 5596 break;
252b5132 5597
29b0f896
AM
5598 case O_absent:
5599 case O_register:
5600 abort ();
5601
5602 /* Symbols and expressions. */
5603 default:
9cd96992
JB
5604 /* Convert symbolic operand to proper sizes for matching, but don't
5605 prevent matching a set of insns that only supports sizes other
5606 than those matching the insn suffix. */
5607 {
40fb9820 5608 i386_operand_type mask, allowed;
d3ce72d0 5609 const insn_template *t;
9cd96992 5610
0dfbf9d7
L
5611 operand_type_set (&mask, 0);
5612 operand_type_set (&allowed, 0);
40fb9820 5613
4eed87de
AM
5614 for (t = current_templates->start;
5615 t < current_templates->end;
5616 ++t)
bab6aec1
JB
5617 {
5618 allowed = operand_type_or (allowed, t->operand_types[op]);
5619 allowed = operand_type_and (allowed, anyimm);
5620 }
9cd96992
JB
5621 switch (guess_suffix)
5622 {
5623 case QWORD_MNEM_SUFFIX:
40fb9820
L
5624 mask.bitfield.imm64 = 1;
5625 mask.bitfield.imm32s = 1;
9cd96992
JB
5626 break;
5627 case LONG_MNEM_SUFFIX:
40fb9820 5628 mask.bitfield.imm32 = 1;
9cd96992
JB
5629 break;
5630 case WORD_MNEM_SUFFIX:
40fb9820 5631 mask.bitfield.imm16 = 1;
9cd96992
JB
5632 break;
5633 case BYTE_MNEM_SUFFIX:
40fb9820 5634 mask.bitfield.imm8 = 1;
9cd96992
JB
5635 break;
5636 default:
9cd96992
JB
5637 break;
5638 }
c6fb90c8 5639 allowed = operand_type_and (mask, allowed);
0dfbf9d7 5640 if (!operand_type_all_zero (&allowed))
c6fb90c8 5641 i.types[op] = operand_type_and (i.types[op], mask);
9cd96992 5642 }
29b0f896 5643 break;
252b5132 5644 }
29b0f896
AM
5645 }
5646}
47926f60 5647
29b0f896
AM
5648/* Try to use the smallest displacement type too. */
5649static void
e3bb37b5 5650optimize_disp (void)
29b0f896
AM
5651{
5652 int op;
3e73aa7c 5653
29b0f896 5654 for (op = i.operands; --op >= 0;)
40fb9820 5655 if (operand_type_check (i.types[op], disp))
252b5132 5656 {
b300c311 5657 if (i.op[op].disps->X_op == O_constant)
252b5132 5658 {
91d6fa6a 5659 offsetT op_disp = i.op[op].disps->X_add_number;
29b0f896 5660
40fb9820 5661 if (i.types[op].bitfield.disp16
91d6fa6a 5662 && (op_disp & ~(offsetT) 0xffff) == 0)
b300c311
L
5663 {
5664 /* If this operand is at most 16 bits, convert
5665 to a signed 16 bit number and don't use 64bit
5666 displacement. */
91d6fa6a 5667 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
40fb9820 5668 i.types[op].bitfield.disp64 = 0;
b300c311 5669 }
a28def75
L
5670#ifdef BFD64
5671 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
40fb9820 5672 if (i.types[op].bitfield.disp32
91d6fa6a 5673 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
b300c311
L
5674 {
5675 /* If this operand is at most 32 bits, convert
5676 to a signed 32 bit number and don't use 64bit
5677 displacement. */
91d6fa6a
NC
5678 op_disp &= (((offsetT) 2 << 31) - 1);
5679 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
40fb9820 5680 i.types[op].bitfield.disp64 = 0;
b300c311 5681 }
a28def75 5682#endif
91d6fa6a 5683 if (!op_disp && i.types[op].bitfield.baseindex)
b300c311 5684 {
40fb9820
L
5685 i.types[op].bitfield.disp8 = 0;
5686 i.types[op].bitfield.disp16 = 0;
5687 i.types[op].bitfield.disp32 = 0;
5688 i.types[op].bitfield.disp32s = 0;
5689 i.types[op].bitfield.disp64 = 0;
b300c311
L
5690 i.op[op].disps = 0;
5691 i.disp_operands--;
5692 }
5693 else if (flag_code == CODE_64BIT)
5694 {
91d6fa6a 5695 if (fits_in_signed_long (op_disp))
28a9d8f5 5696 {
40fb9820
L
5697 i.types[op].bitfield.disp64 = 0;
5698 i.types[op].bitfield.disp32s = 1;
28a9d8f5 5699 }
0e1147d9 5700 if (i.prefix[ADDR_PREFIX]
91d6fa6a 5701 && fits_in_unsigned_long (op_disp))
40fb9820 5702 i.types[op].bitfield.disp32 = 1;
b300c311 5703 }
40fb9820
L
5704 if ((i.types[op].bitfield.disp32
5705 || i.types[op].bitfield.disp32s
5706 || i.types[op].bitfield.disp16)
b5014f7a 5707 && fits_in_disp8 (op_disp))
40fb9820 5708 i.types[op].bitfield.disp8 = 1;
252b5132 5709 }
67a4f2b7
AO
5710 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5711 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5712 {
5713 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5714 i.op[op].disps, 0, i.reloc[op]);
40fb9820
L
5715 i.types[op].bitfield.disp8 = 0;
5716 i.types[op].bitfield.disp16 = 0;
5717 i.types[op].bitfield.disp32 = 0;
5718 i.types[op].bitfield.disp32s = 0;
5719 i.types[op].bitfield.disp64 = 0;
67a4f2b7
AO
5720 }
5721 else
b300c311 5722 /* We only support 64bit displacement on constants. */
40fb9820 5723 i.types[op].bitfield.disp64 = 0;
252b5132 5724 }
29b0f896
AM
5725}
5726
4a1b91ea
L
5727/* Return 1 if there is a match in broadcast bytes between operand
5728 GIVEN and instruction template T. */
5729
5730static INLINE int
5731match_broadcast_size (const insn_template *t, unsigned int given)
5732{
5733 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5734 && i.types[given].bitfield.byte)
5735 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5736 && i.types[given].bitfield.word)
5737 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5738 && i.types[given].bitfield.dword)
5739 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5740 && i.types[given].bitfield.qword));
5741}
5742
6c30d220
L
5743/* Check if operands are valid for the instruction. */
5744
5745static int
5746check_VecOperands (const insn_template *t)
5747{
43234a1e 5748 unsigned int op;
e2195274 5749 i386_cpu_flags cpu;
e2195274
JB
5750
5751 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5752 any one operand are implicity requiring AVX512VL support if the actual
5753 operand size is YMMword or XMMword. Since this function runs after
5754 template matching, there's no need to check for YMMword/XMMword in
5755 the template. */
5756 cpu = cpu_flags_and (t->cpu_flags, avx512);
5757 if (!cpu_flags_all_zero (&cpu)
5758 && !t->cpu_flags.bitfield.cpuavx512vl
5759 && !cpu_arch_flags.bitfield.cpuavx512vl)
5760 {
5761 for (op = 0; op < t->operands; ++op)
5762 {
5763 if (t->operand_types[op].bitfield.zmmword
5764 && (i.types[op].bitfield.ymmword
5765 || i.types[op].bitfield.xmmword))
5766 {
5767 i.error = unsupported;
5768 return 1;
5769 }
5770 }
5771 }
43234a1e 5772
6c30d220 5773 /* Without VSIB byte, we can't have a vector register for index. */
63112cd6 5774 if (!t->opcode_modifier.sib
6c30d220 5775 && i.index_reg
1b54b8d7
JB
5776 && (i.index_reg->reg_type.bitfield.xmmword
5777 || i.index_reg->reg_type.bitfield.ymmword
5778 || i.index_reg->reg_type.bitfield.zmmword))
6c30d220
L
5779 {
5780 i.error = unsupported_vector_index_register;
5781 return 1;
5782 }
5783
ad8ecc81
MZ
5784 /* Check if default mask is allowed. */
5785 if (t->opcode_modifier.nodefmask
5786 && (!i.mask || i.mask->mask->reg_num == 0))
5787 {
5788 i.error = no_default_mask;
5789 return 1;
5790 }
5791
7bab8ab5
JB
5792 /* For VSIB byte, we need a vector register for index, and all vector
5793 registers must be distinct. */
63112cd6 5794 if (t->opcode_modifier.sib)
7bab8ab5
JB
5795 {
5796 if (!i.index_reg
63112cd6 5797 || !((t->opcode_modifier.sib == VECSIB128
1b54b8d7 5798 && i.index_reg->reg_type.bitfield.xmmword)
63112cd6 5799 || (t->opcode_modifier.sib == VECSIB256
1b54b8d7 5800 && i.index_reg->reg_type.bitfield.ymmword)
63112cd6 5801 || (t->opcode_modifier.sib == VECSIB512
1b54b8d7 5802 && i.index_reg->reg_type.bitfield.zmmword)))
7bab8ab5
JB
5803 {
5804 i.error = invalid_vsib_address;
5805 return 1;
5806 }
5807
43234a1e
L
5808 gas_assert (i.reg_operands == 2 || i.mask);
5809 if (i.reg_operands == 2 && !i.mask)
5810 {
3528c362 5811 gas_assert (i.types[0].bitfield.class == RegSIMD);
1b54b8d7
JB
5812 gas_assert (i.types[0].bitfield.xmmword
5813 || i.types[0].bitfield.ymmword);
3528c362 5814 gas_assert (i.types[2].bitfield.class == RegSIMD);
1b54b8d7
JB
5815 gas_assert (i.types[2].bitfield.xmmword
5816 || i.types[2].bitfield.ymmword);
43234a1e
L
5817 if (operand_check == check_none)
5818 return 0;
5819 if (register_number (i.op[0].regs)
5820 != register_number (i.index_reg)
5821 && register_number (i.op[2].regs)
5822 != register_number (i.index_reg)
5823 && register_number (i.op[0].regs)
5824 != register_number (i.op[2].regs))
5825 return 0;
5826 if (operand_check == check_error)
5827 {
5828 i.error = invalid_vector_register_set;
5829 return 1;
5830 }
5831 as_warn (_("mask, index, and destination registers should be distinct"));
5832 }
8444f82a
MZ
5833 else if (i.reg_operands == 1 && i.mask)
5834 {
3528c362 5835 if (i.types[1].bitfield.class == RegSIMD
1b54b8d7
JB
5836 && (i.types[1].bitfield.xmmword
5837 || i.types[1].bitfield.ymmword
5838 || i.types[1].bitfield.zmmword)
8444f82a
MZ
5839 && (register_number (i.op[1].regs)
5840 == register_number (i.index_reg)))
5841 {
5842 if (operand_check == check_error)
5843 {
5844 i.error = invalid_vector_register_set;
5845 return 1;
5846 }
5847 if (operand_check != check_none)
5848 as_warn (_("index and destination registers should be distinct"));
5849 }
5850 }
43234a1e 5851 }
7bab8ab5 5852
43234a1e
L
5853 /* Check if broadcast is supported by the instruction and is applied
5854 to the memory operand. */
5855 if (i.broadcast)
5856 {
8e6e0792 5857 i386_operand_type type, overlap;
43234a1e
L
5858
5859 /* Check if specified broadcast is supported in this instruction,
4a1b91ea 5860 and its broadcast bytes match the memory operand. */
32546502 5861 op = i.broadcast->operand;
8e6e0792 5862 if (!t->opcode_modifier.broadcast
c48dadc9 5863 || !(i.flags[op] & Operand_Mem)
c39e5b26 5864 || (!i.types[op].bitfield.unspecified
4a1b91ea 5865 && !match_broadcast_size (t, op)))
43234a1e
L
5866 {
5867 bad_broadcast:
5868 i.error = unsupported_broadcast;
5869 return 1;
5870 }
8e6e0792 5871
4a1b91ea
L
5872 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5873 * i.broadcast->type);
8e6e0792 5874 operand_type_set (&type, 0);
4a1b91ea 5875 switch (i.broadcast->bytes)
8e6e0792 5876 {
4a1b91ea
L
5877 case 2:
5878 type.bitfield.word = 1;
5879 break;
5880 case 4:
5881 type.bitfield.dword = 1;
5882 break;
8e6e0792
JB
5883 case 8:
5884 type.bitfield.qword = 1;
5885 break;
5886 case 16:
5887 type.bitfield.xmmword = 1;
5888 break;
5889 case 32:
5890 type.bitfield.ymmword = 1;
5891 break;
5892 case 64:
5893 type.bitfield.zmmword = 1;
5894 break;
5895 default:
5896 goto bad_broadcast;
5897 }
5898
5899 overlap = operand_type_and (type, t->operand_types[op]);
bc49bfd8
JB
5900 if (t->operand_types[op].bitfield.class == RegSIMD
5901 && t->operand_types[op].bitfield.byte
5902 + t->operand_types[op].bitfield.word
5903 + t->operand_types[op].bitfield.dword
5904 + t->operand_types[op].bitfield.qword > 1)
5905 {
5906 overlap.bitfield.xmmword = 0;
5907 overlap.bitfield.ymmword = 0;
5908 overlap.bitfield.zmmword = 0;
5909 }
8e6e0792
JB
5910 if (operand_type_all_zero (&overlap))
5911 goto bad_broadcast;
5912
5913 if (t->opcode_modifier.checkregsize)
5914 {
5915 unsigned int j;
5916
e2195274 5917 type.bitfield.baseindex = 1;
8e6e0792
JB
5918 for (j = 0; j < i.operands; ++j)
5919 {
5920 if (j != op
5921 && !operand_type_register_match(i.types[j],
5922 t->operand_types[j],
5923 type,
5924 t->operand_types[op]))
5925 goto bad_broadcast;
5926 }
5927 }
43234a1e
L
5928 }
5929 /* If broadcast is supported in this instruction, we need to check if
5930 operand of one-element size isn't specified without broadcast. */
5931 else if (t->opcode_modifier.broadcast && i.mem_operands)
5932 {
5933 /* Find memory operand. */
5934 for (op = 0; op < i.operands; op++)
8dc0818e 5935 if (i.flags[op] & Operand_Mem)
43234a1e
L
5936 break;
5937 gas_assert (op < i.operands);
5938 /* Check size of the memory operand. */
4a1b91ea 5939 if (match_broadcast_size (t, op))
43234a1e
L
5940 {
5941 i.error = broadcast_needed;
5942 return 1;
5943 }
5944 }
c39e5b26
JB
5945 else
5946 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
43234a1e
L
5947
5948 /* Check if requested masking is supported. */
ae2387fe 5949 if (i.mask)
43234a1e 5950 {
ae2387fe
JB
5951 switch (t->opcode_modifier.masking)
5952 {
5953 case BOTH_MASKING:
5954 break;
5955 case MERGING_MASKING:
5956 if (i.mask->zeroing)
5957 {
5958 case 0:
5959 i.error = unsupported_masking;
5960 return 1;
5961 }
5962 break;
5963 case DYNAMIC_MASKING:
5964 /* Memory destinations allow only merging masking. */
5965 if (i.mask->zeroing && i.mem_operands)
5966 {
5967 /* Find memory operand. */
5968 for (op = 0; op < i.operands; op++)
c48dadc9 5969 if (i.flags[op] & Operand_Mem)
ae2387fe
JB
5970 break;
5971 gas_assert (op < i.operands);
5972 if (op == i.operands - 1)
5973 {
5974 i.error = unsupported_masking;
5975 return 1;
5976 }
5977 }
5978 break;
5979 default:
5980 abort ();
5981 }
43234a1e
L
5982 }
5983
5984 /* Check if masking is applied to dest operand. */
5985 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5986 {
5987 i.error = mask_not_on_destination;
5988 return 1;
5989 }
5990
43234a1e
L
5991 /* Check RC/SAE. */
5992 if (i.rounding)
5993 {
a80195f1
JB
5994 if (!t->opcode_modifier.sae
5995 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
43234a1e
L
5996 {
5997 i.error = unsupported_rc_sae;
5998 return 1;
5999 }
6000 /* If the instruction has several immediate operands and one of
6001 them is rounding, the rounding operand should be the last
6002 immediate operand. */
6003 if (i.imm_operands > 1
6004 && i.rounding->operand != (int) (i.imm_operands - 1))
7bab8ab5 6005 {
43234a1e 6006 i.error = rc_sae_operand_not_last_imm;
7bab8ab5
JB
6007 return 1;
6008 }
6c30d220
L
6009 }
6010
da4977e0
JB
6011 /* Check the special Imm4 cases; must be the first operand. */
6012 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6013 {
6014 if (i.op[0].imms->X_op != O_constant
6015 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6016 {
6017 i.error = bad_imm4;
6018 return 1;
6019 }
6020
6021 /* Turn off Imm<N> so that update_imm won't complain. */
6022 operand_type_set (&i.types[0], 0);
6023 }
6024
43234a1e 6025 /* Check vector Disp8 operand. */
b5014f7a
JB
6026 if (t->opcode_modifier.disp8memshift
6027 && i.disp_encoding != disp_encoding_32bit)
43234a1e
L
6028 {
6029 if (i.broadcast)
4a1b91ea 6030 i.memshift = t->opcode_modifier.broadcast - 1;
7091c612 6031 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
43234a1e 6032 i.memshift = t->opcode_modifier.disp8memshift;
7091c612
JB
6033 else
6034 {
6035 const i386_operand_type *type = NULL;
6036
6037 i.memshift = 0;
6038 for (op = 0; op < i.operands; op++)
8dc0818e 6039 if (i.flags[op] & Operand_Mem)
7091c612 6040 {
4174bfff
JB
6041 if (t->opcode_modifier.evex == EVEXLIG)
6042 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6043 else if (t->operand_types[op].bitfield.xmmword
6044 + t->operand_types[op].bitfield.ymmword
6045 + t->operand_types[op].bitfield.zmmword <= 1)
7091c612
JB
6046 type = &t->operand_types[op];
6047 else if (!i.types[op].bitfield.unspecified)
6048 type = &i.types[op];
6049 }
3528c362 6050 else if (i.types[op].bitfield.class == RegSIMD
4174bfff 6051 && t->opcode_modifier.evex != EVEXLIG)
7091c612
JB
6052 {
6053 if (i.types[op].bitfield.zmmword)
6054 i.memshift = 6;
6055 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6056 i.memshift = 5;
6057 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6058 i.memshift = 4;
6059 }
6060
6061 if (type)
6062 {
6063 if (type->bitfield.zmmword)
6064 i.memshift = 6;
6065 else if (type->bitfield.ymmword)
6066 i.memshift = 5;
6067 else if (type->bitfield.xmmword)
6068 i.memshift = 4;
6069 }
6070
6071 /* For the check in fits_in_disp8(). */
6072 if (i.memshift == 0)
6073 i.memshift = -1;
6074 }
43234a1e
L
6075
6076 for (op = 0; op < i.operands; op++)
6077 if (operand_type_check (i.types[op], disp)
6078 && i.op[op].disps->X_op == O_constant)
6079 {
b5014f7a 6080 if (fits_in_disp8 (i.op[op].disps->X_add_number))
43234a1e 6081 {
b5014f7a
JB
6082 i.types[op].bitfield.disp8 = 1;
6083 return 0;
43234a1e 6084 }
b5014f7a 6085 i.types[op].bitfield.disp8 = 0;
43234a1e
L
6086 }
6087 }
b5014f7a
JB
6088
6089 i.memshift = 0;
43234a1e 6090
6c30d220
L
6091 return 0;
6092}
6093
da4977e0 6094/* Check if encoding requirements are met by the instruction. */
a683cc34
SP
6095
6096static int
da4977e0 6097VEX_check_encoding (const insn_template *t)
a683cc34 6098{
da4977e0
JB
6099 if (i.vec_encoding == vex_encoding_error)
6100 {
6101 i.error = unsupported;
6102 return 1;
6103 }
6104
86fa6981 6105 if (i.vec_encoding == vex_encoding_evex)
43234a1e 6106 {
86fa6981 6107 /* This instruction must be encoded with EVEX prefix. */
e771e7c9 6108 if (!is_evex_encoding (t))
86fa6981
L
6109 {
6110 i.error = unsupported;
6111 return 1;
6112 }
6113 return 0;
43234a1e
L
6114 }
6115
a683cc34 6116 if (!t->opcode_modifier.vex)
86fa6981
L
6117 {
6118 /* This instruction template doesn't have VEX prefix. */
6119 if (i.vec_encoding != vex_encoding_default)
6120 {
6121 i.error = unsupported;
6122 return 1;
6123 }
6124 return 0;
6125 }
a683cc34 6126
a683cc34
SP
6127 return 0;
6128}
6129
d3ce72d0 6130static const insn_template *
83b16ac6 6131match_template (char mnem_suffix)
29b0f896
AM
6132{
6133 /* Points to template once we've found it. */
d3ce72d0 6134 const insn_template *t;
40fb9820 6135 i386_operand_type overlap0, overlap1, overlap2, overlap3;
c0f3af97 6136 i386_operand_type overlap4;
29b0f896 6137 unsigned int found_reverse_match;
dc2be329 6138 i386_opcode_modifier suffix_check;
40fb9820 6139 i386_operand_type operand_types [MAX_OPERANDS];
539e75ad 6140 int addr_prefix_disp;
45a4bb20 6141 unsigned int j, size_match, check_register;
5614d22c 6142 enum i386_error specific_error = 0;
29b0f896 6143
c0f3af97
L
6144#if MAX_OPERANDS != 5
6145# error "MAX_OPERANDS must be 5."
f48ff2ae
L
6146#endif
6147
29b0f896 6148 found_reverse_match = 0;
539e75ad 6149 addr_prefix_disp = -1;
40fb9820 6150
dc2be329 6151 /* Prepare for mnemonic suffix check. */
40fb9820 6152 memset (&suffix_check, 0, sizeof (suffix_check));
dc2be329
L
6153 switch (mnem_suffix)
6154 {
6155 case BYTE_MNEM_SUFFIX:
6156 suffix_check.no_bsuf = 1;
6157 break;
6158 case WORD_MNEM_SUFFIX:
6159 suffix_check.no_wsuf = 1;
6160 break;
6161 case SHORT_MNEM_SUFFIX:
6162 suffix_check.no_ssuf = 1;
6163 break;
6164 case LONG_MNEM_SUFFIX:
6165 suffix_check.no_lsuf = 1;
6166 break;
6167 case QWORD_MNEM_SUFFIX:
6168 suffix_check.no_qsuf = 1;
6169 break;
6170 default:
6171 /* NB: In Intel syntax, normally we can check for memory operand
6172 size when there is no mnemonic suffix. But jmp and call have
6173 2 different encodings with Dword memory operand size, one with
6174 No_ldSuf and the other without. i.suffix is set to
6175 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6176 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6177 suffix_check.no_ldsuf = 1;
83b16ac6
JB
6178 }
6179
01559ecc
L
6180 /* Must have right number of operands. */
6181 i.error = number_of_operands_mismatch;
6182
45aa61fe 6183 for (t = current_templates->start; t < current_templates->end; t++)
29b0f896 6184 {
539e75ad 6185 addr_prefix_disp = -1;
dbbc8b7e 6186 found_reverse_match = 0;
539e75ad 6187
29b0f896
AM
6188 if (i.operands != t->operands)
6189 continue;
6190
50aecf8c 6191 /* Check processor support. */
a65babc9 6192 i.error = unsupported;
45a4bb20 6193 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
50aecf8c
L
6194 continue;
6195
e1d4d893 6196 /* Check AT&T mnemonic. */
a65babc9 6197 i.error = unsupported_with_intel_mnemonic;
e1d4d893 6198 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
1efbbeb4
L
6199 continue;
6200
4b5aaf5f 6201 /* Check AT&T/Intel syntax. */
a65babc9 6202 i.error = unsupported_syntax;
5c07affc 6203 if ((intel_syntax && t->opcode_modifier.attsyntax)
4b5aaf5f 6204 || (!intel_syntax && t->opcode_modifier.intelsyntax))
1efbbeb4
L
6205 continue;
6206
4b5aaf5f
L
6207 /* Check Intel64/AMD64 ISA. */
6208 switch (isa64)
6209 {
6210 default:
6211 /* Default: Don't accept Intel64. */
6212 if (t->opcode_modifier.isa64 == INTEL64)
6213 continue;
6214 break;
6215 case amd64:
6216 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6217 if (t->opcode_modifier.isa64 >= INTEL64)
6218 continue;
6219 break;
6220 case intel64:
6221 /* -mintel64: Don't accept AMD64. */
5990e377 6222 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
4b5aaf5f
L
6223 continue;
6224 break;
6225 }
6226
dc2be329 6227 /* Check the suffix. */
a65babc9 6228 i.error = invalid_instruction_suffix;
dc2be329
L
6229 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6230 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6231 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6232 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6233 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6234 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
83b16ac6 6235 continue;
29b0f896 6236
3ac21baa
JB
6237 size_match = operand_size_match (t);
6238 if (!size_match)
7d5e4556 6239 continue;
539e75ad 6240
6f2f06be
JB
6241 /* This is intentionally not
6242
0cfa3eb3 6243 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6f2f06be
JB
6244
6245 as the case of a missing * on the operand is accepted (perhaps with
6246 a warning, issued further down). */
0cfa3eb3 6247 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6f2f06be
JB
6248 {
6249 i.error = operand_type_mismatch;
6250 continue;
6251 }
6252
5c07affc
L
6253 for (j = 0; j < MAX_OPERANDS; j++)
6254 operand_types[j] = t->operand_types[j];
6255
e365e234
JB
6256 /* In general, don't allow
6257 - 64-bit operands outside of 64-bit mode,
6258 - 32-bit operands on pre-386. */
4873e243 6259 j = i.imm_operands + (t->operands > i.imm_operands + 1);
e365e234
JB
6260 if (((i.suffix == QWORD_MNEM_SUFFIX
6261 && flag_code != CODE_64BIT
6262 && (t->base_opcode != 0x0fc7
6263 || t->extension_opcode != 1 /* cmpxchg8b */))
6264 || (i.suffix == LONG_MNEM_SUFFIX
6265 && !cpu_arch_flags.bitfield.cpui386))
45aa61fe 6266 && (intel_syntax
3cd7f3e3 6267 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
45aa61fe
AM
6268 && !intel_float_operand (t->name))
6269 : intel_float_operand (t->name) != 2)
4873e243
JB
6270 && (t->operands == i.imm_operands
6271 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6272 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6273 && operand_types[i.imm_operands].bitfield.class != RegMask)
6274 || (operand_types[j].bitfield.class != RegMMX
6275 && operand_types[j].bitfield.class != RegSIMD
6276 && operand_types[j].bitfield.class != RegMask))
63112cd6 6277 && !t->opcode_modifier.sib)
192dc9c6
JB
6278 continue;
6279
29b0f896 6280 /* Do not verify operands when there are none. */
e365e234 6281 if (!t->operands)
da4977e0
JB
6282 {
6283 if (VEX_check_encoding (t))
6284 {
6285 specific_error = i.error;
6286 continue;
6287 }
6288
6289 /* We've found a match; break out of loop. */
6290 break;
6291 }
252b5132 6292
48bcea9f
JB
6293 if (!t->opcode_modifier.jump
6294 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6295 {
6296 /* There should be only one Disp operand. */
6297 for (j = 0; j < MAX_OPERANDS; j++)
6298 if (operand_type_check (operand_types[j], disp))
539e75ad 6299 break;
48bcea9f
JB
6300 if (j < MAX_OPERANDS)
6301 {
6302 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6303
6304 addr_prefix_disp = j;
6305
6306 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6307 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6308 switch (flag_code)
40fb9820 6309 {
48bcea9f
JB
6310 case CODE_16BIT:
6311 override = !override;
6312 /* Fall through. */
6313 case CODE_32BIT:
6314 if (operand_types[j].bitfield.disp32
6315 && operand_types[j].bitfield.disp16)
40fb9820 6316 {
48bcea9f
JB
6317 operand_types[j].bitfield.disp16 = override;
6318 operand_types[j].bitfield.disp32 = !override;
40fb9820 6319 }
48bcea9f
JB
6320 operand_types[j].bitfield.disp32s = 0;
6321 operand_types[j].bitfield.disp64 = 0;
6322 break;
6323
6324 case CODE_64BIT:
6325 if (operand_types[j].bitfield.disp32s
6326 || operand_types[j].bitfield.disp64)
40fb9820 6327 {
48bcea9f
JB
6328 operand_types[j].bitfield.disp64 &= !override;
6329 operand_types[j].bitfield.disp32s &= !override;
6330 operand_types[j].bitfield.disp32 = override;
40fb9820 6331 }
48bcea9f
JB
6332 operand_types[j].bitfield.disp16 = 0;
6333 break;
40fb9820 6334 }
539e75ad 6335 }
48bcea9f 6336 }
539e75ad 6337
02a86693
L
6338 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6339 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6340 continue;
6341
56ffb741 6342 /* We check register size if needed. */
e2195274
JB
6343 if (t->opcode_modifier.checkregsize)
6344 {
6345 check_register = (1 << t->operands) - 1;
6346 if (i.broadcast)
6347 check_register &= ~(1 << i.broadcast->operand);
6348 }
6349 else
6350 check_register = 0;
6351
c6fb90c8 6352 overlap0 = operand_type_and (i.types[0], operand_types[0]);
29b0f896
AM
6353 switch (t->operands)
6354 {
6355 case 1:
40fb9820 6356 if (!operand_type_match (overlap0, i.types[0]))
29b0f896
AM
6357 continue;
6358 break;
6359 case 2:
33eaf5de 6360 /* xchg %eax, %eax is a special case. It is an alias for nop
8b38ad71
L
6361 only in 32bit mode and we can use opcode 0x90. In 64bit
6362 mode, we can't use 0x90 for xchg %eax, %eax since it should
6363 zero-extend %eax to %rax. */
6364 if (flag_code == CODE_64BIT
6365 && t->base_opcode == 0x90
75e5731b
JB
6366 && i.types[0].bitfield.instance == Accum
6367 && i.types[0].bitfield.dword
6368 && i.types[1].bitfield.instance == Accum
6369 && i.types[1].bitfield.dword)
8b38ad71 6370 continue;
1212781b
JB
6371 /* xrelease mov %eax, <disp> is another special case. It must not
6372 match the accumulator-only encoding of mov. */
6373 if (flag_code != CODE_64BIT
6374 && i.hle_prefix
6375 && t->base_opcode == 0xa0
75e5731b 6376 && i.types[0].bitfield.instance == Accum
8dc0818e 6377 && (i.flags[1] & Operand_Mem))
1212781b 6378 continue;
f5eb1d70
JB
6379 /* Fall through. */
6380
6381 case 3:
3ac21baa
JB
6382 if (!(size_match & MATCH_STRAIGHT))
6383 goto check_reverse;
64c49ab3
JB
6384 /* Reverse direction of operands if swapping is possible in the first
6385 place (operands need to be symmetric) and
6386 - the load form is requested, and the template is a store form,
6387 - the store form is requested, and the template is a load form,
6388 - the non-default (swapped) form is requested. */
6389 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
f5eb1d70 6390 if (t->opcode_modifier.d && i.reg_operands == i.operands
64c49ab3
JB
6391 && !operand_type_all_zero (&overlap1))
6392 switch (i.dir_encoding)
6393 {
6394 case dir_encoding_load:
6395 if (operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6396 || t->opcode_modifier.regmem)
64c49ab3
JB
6397 goto check_reverse;
6398 break;
6399
6400 case dir_encoding_store:
6401 if (!operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6402 && !t->opcode_modifier.regmem)
64c49ab3
JB
6403 goto check_reverse;
6404 break;
6405
6406 case dir_encoding_swap:
6407 goto check_reverse;
6408
6409 case dir_encoding_default:
6410 break;
6411 }
86fa6981 6412 /* If we want store form, we skip the current load. */
64c49ab3
JB
6413 if ((i.dir_encoding == dir_encoding_store
6414 || i.dir_encoding == dir_encoding_swap)
86fa6981
L
6415 && i.mem_operands == 0
6416 && t->opcode_modifier.load)
fa99fab2 6417 continue;
1a0670f3 6418 /* Fall through. */
f48ff2ae 6419 case 4:
c0f3af97 6420 case 5:
c6fb90c8 6421 overlap1 = operand_type_and (i.types[1], operand_types[1]);
40fb9820
L
6422 if (!operand_type_match (overlap0, i.types[0])
6423 || !operand_type_match (overlap1, i.types[1])
e2195274 6424 || ((check_register & 3) == 3
dc821c5f 6425 && !operand_type_register_match (i.types[0],
40fb9820 6426 operand_types[0],
dc821c5f 6427 i.types[1],
40fb9820 6428 operand_types[1])))
29b0f896
AM
6429 {
6430 /* Check if other direction is valid ... */
38e314eb 6431 if (!t->opcode_modifier.d)
29b0f896
AM
6432 continue;
6433
dc1e8a47 6434 check_reverse:
3ac21baa
JB
6435 if (!(size_match & MATCH_REVERSE))
6436 continue;
29b0f896 6437 /* Try reversing direction of operands. */
f5eb1d70
JB
6438 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6439 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
40fb9820 6440 if (!operand_type_match (overlap0, i.types[0])
f5eb1d70 6441 || !operand_type_match (overlap1, i.types[i.operands - 1])
45664ddb 6442 || (check_register
dc821c5f 6443 && !operand_type_register_match (i.types[0],
f5eb1d70
JB
6444 operand_types[i.operands - 1],
6445 i.types[i.operands - 1],
45664ddb 6446 operand_types[0])))
29b0f896
AM
6447 {
6448 /* Does not match either direction. */
6449 continue;
6450 }
38e314eb 6451 /* found_reverse_match holds which of D or FloatR
29b0f896 6452 we've found. */
38e314eb
JB
6453 if (!t->opcode_modifier.d)
6454 found_reverse_match = 0;
6455 else if (operand_types[0].bitfield.tbyte)
8a2ed489 6456 found_reverse_match = Opcode_FloatD;
dbbc8b7e 6457 else if (operand_types[0].bitfield.xmmword
f5eb1d70 6458 || operand_types[i.operands - 1].bitfield.xmmword
3528c362
JB
6459 || operand_types[0].bitfield.class == RegMMX
6460 || operand_types[i.operands - 1].bitfield.class == RegMMX
dbbc8b7e
JB
6461 || is_any_vex_encoding(t))
6462 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6463 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
8a2ed489 6464 else
38e314eb 6465 found_reverse_match = Opcode_D;
40fb9820 6466 if (t->opcode_modifier.floatr)
8a2ed489 6467 found_reverse_match |= Opcode_FloatR;
29b0f896 6468 }
f48ff2ae 6469 else
29b0f896 6470 {
f48ff2ae 6471 /* Found a forward 2 operand match here. */
d1cbb4db
L
6472 switch (t->operands)
6473 {
c0f3af97
L
6474 case 5:
6475 overlap4 = operand_type_and (i.types[4],
6476 operand_types[4]);
1a0670f3 6477 /* Fall through. */
d1cbb4db 6478 case 4:
c6fb90c8
L
6479 overlap3 = operand_type_and (i.types[3],
6480 operand_types[3]);
1a0670f3 6481 /* Fall through. */
d1cbb4db 6482 case 3:
c6fb90c8
L
6483 overlap2 = operand_type_and (i.types[2],
6484 operand_types[2]);
d1cbb4db
L
6485 break;
6486 }
29b0f896 6487
f48ff2ae
L
6488 switch (t->operands)
6489 {
c0f3af97
L
6490 case 5:
6491 if (!operand_type_match (overlap4, i.types[4])
dc821c5f 6492 || !operand_type_register_match (i.types[3],
c0f3af97 6493 operand_types[3],
c0f3af97
L
6494 i.types[4],
6495 operand_types[4]))
6496 continue;
1a0670f3 6497 /* Fall through. */
f48ff2ae 6498 case 4:
40fb9820 6499 if (!operand_type_match (overlap3, i.types[3])
e2195274
JB
6500 || ((check_register & 0xa) == 0xa
6501 && !operand_type_register_match (i.types[1],
f7768225
JB
6502 operand_types[1],
6503 i.types[3],
e2195274
JB
6504 operand_types[3]))
6505 || ((check_register & 0xc) == 0xc
6506 && !operand_type_register_match (i.types[2],
6507 operand_types[2],
6508 i.types[3],
6509 operand_types[3])))
f48ff2ae 6510 continue;
1a0670f3 6511 /* Fall through. */
f48ff2ae
L
6512 case 3:
6513 /* Here we make use of the fact that there are no
23e42951 6514 reverse match 3 operand instructions. */
40fb9820 6515 if (!operand_type_match (overlap2, i.types[2])
e2195274
JB
6516 || ((check_register & 5) == 5
6517 && !operand_type_register_match (i.types[0],
23e42951
JB
6518 operand_types[0],
6519 i.types[2],
e2195274
JB
6520 operand_types[2]))
6521 || ((check_register & 6) == 6
6522 && !operand_type_register_match (i.types[1],
6523 operand_types[1],
6524 i.types[2],
6525 operand_types[2])))
f48ff2ae
L
6526 continue;
6527 break;
6528 }
29b0f896 6529 }
f48ff2ae 6530 /* Found either forward/reverse 2, 3 or 4 operand match here:
29b0f896
AM
6531 slip through to break. */
6532 }
c0f3af97 6533
da4977e0
JB
6534 /* Check if vector operands are valid. */
6535 if (check_VecOperands (t))
6536 {
6537 specific_error = i.error;
6538 continue;
6539 }
6540
6541 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6542 if (VEX_check_encoding (t))
5614d22c
JB
6543 {
6544 specific_error = i.error;
6545 continue;
6546 }
a683cc34 6547
29b0f896
AM
6548 /* We've found a match; break out of loop. */
6549 break;
6550 }
6551
6552 if (t == current_templates->end)
6553 {
6554 /* We found no match. */
a65babc9 6555 const char *err_msg;
5614d22c 6556 switch (specific_error ? specific_error : i.error)
a65babc9
L
6557 {
6558 default:
6559 abort ();
86e026a4 6560 case operand_size_mismatch:
a65babc9
L
6561 err_msg = _("operand size mismatch");
6562 break;
6563 case operand_type_mismatch:
6564 err_msg = _("operand type mismatch");
6565 break;
6566 case register_type_mismatch:
6567 err_msg = _("register type mismatch");
6568 break;
6569 case number_of_operands_mismatch:
6570 err_msg = _("number of operands mismatch");
6571 break;
6572 case invalid_instruction_suffix:
6573 err_msg = _("invalid instruction suffix");
6574 break;
6575 case bad_imm4:
4a2608e3 6576 err_msg = _("constant doesn't fit in 4 bits");
a65babc9 6577 break;
a65babc9
L
6578 case unsupported_with_intel_mnemonic:
6579 err_msg = _("unsupported with Intel mnemonic");
6580 break;
6581 case unsupported_syntax:
6582 err_msg = _("unsupported syntax");
6583 break;
6584 case unsupported:
35262a23 6585 as_bad (_("unsupported instruction `%s'"),
10efe3f6
L
6586 current_templates->start->name);
6587 return NULL;
6c30d220
L
6588 case invalid_vsib_address:
6589 err_msg = _("invalid VSIB address");
6590 break;
7bab8ab5
JB
6591 case invalid_vector_register_set:
6592 err_msg = _("mask, index, and destination registers must be distinct");
6593 break;
6c30d220
L
6594 case unsupported_vector_index_register:
6595 err_msg = _("unsupported vector index register");
6596 break;
43234a1e
L
6597 case unsupported_broadcast:
6598 err_msg = _("unsupported broadcast");
6599 break;
43234a1e
L
6600 case broadcast_needed:
6601 err_msg = _("broadcast is needed for operand of such type");
6602 break;
6603 case unsupported_masking:
6604 err_msg = _("unsupported masking");
6605 break;
6606 case mask_not_on_destination:
6607 err_msg = _("mask not on destination operand");
6608 break;
6609 case no_default_mask:
6610 err_msg = _("default mask isn't allowed");
6611 break;
6612 case unsupported_rc_sae:
6613 err_msg = _("unsupported static rounding/sae");
6614 break;
6615 case rc_sae_operand_not_last_imm:
6616 if (intel_syntax)
6617 err_msg = _("RC/SAE operand must precede immediate operands");
6618 else
6619 err_msg = _("RC/SAE operand must follow immediate operands");
6620 break;
6621 case invalid_register_operand:
6622 err_msg = _("invalid register operand");
6623 break;
a65babc9
L
6624 }
6625 as_bad (_("%s for `%s'"), err_msg,
891edac4 6626 current_templates->start->name);
fa99fab2 6627 return NULL;
29b0f896 6628 }
252b5132 6629
29b0f896
AM
6630 if (!quiet_warnings)
6631 {
6632 if (!intel_syntax
0cfa3eb3 6633 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6f2f06be 6634 as_warn (_("indirect %s without `*'"), t->name);
29b0f896 6635
40fb9820 6636 if (t->opcode_modifier.isprefix
3cd7f3e3 6637 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6638 {
6639 /* Warn them that a data or address size prefix doesn't
6640 affect assembly of the next line of code. */
6641 as_warn (_("stand-alone `%s' prefix"), t->name);
6642 }
6643 }
6644
6645 /* Copy the template we found. */
6646 i.tm = *t;
539e75ad
L
6647
6648 if (addr_prefix_disp != -1)
6649 i.tm.operand_types[addr_prefix_disp]
6650 = operand_types[addr_prefix_disp];
6651
29b0f896
AM
6652 if (found_reverse_match)
6653 {
dfd69174
JB
6654 /* If we found a reverse match we must alter the opcode direction
6655 bit and clear/flip the regmem modifier one. found_reverse_match
6656 holds bits to change (different for int & float insns). */
29b0f896
AM
6657
6658 i.tm.base_opcode ^= found_reverse_match;
6659
f5eb1d70
JB
6660 i.tm.operand_types[0] = operand_types[i.operands - 1];
6661 i.tm.operand_types[i.operands - 1] = operand_types[0];
dfd69174
JB
6662
6663 /* Certain SIMD insns have their load forms specified in the opcode
6664 table, and hence we need to _set_ RegMem instead of clearing it.
6665 We need to avoid setting the bit though on insns like KMOVW. */
6666 i.tm.opcode_modifier.regmem
6667 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6668 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6669 && !i.tm.opcode_modifier.regmem;
29b0f896
AM
6670 }
6671
fa99fab2 6672 return t;
29b0f896
AM
6673}
6674
6675static int
e3bb37b5 6676check_string (void)
29b0f896 6677{
51c8edf6
JB
6678 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6679 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
8dc0818e 6680
51c8edf6 6681 if (i.seg[op] != NULL && i.seg[op] != &es)
29b0f896 6682 {
51c8edf6
JB
6683 as_bad (_("`%s' operand %u must use `%ses' segment"),
6684 i.tm.name,
6685 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6686 register_prefix);
6687 return 0;
29b0f896 6688 }
51c8edf6
JB
6689
6690 /* There's only ever one segment override allowed per instruction.
6691 This instruction possibly has a legal segment override on the
6692 second operand, so copy the segment to where non-string
6693 instructions store it, allowing common code. */
6694 i.seg[op] = i.seg[1];
6695
29b0f896
AM
6696 return 1;
6697}
6698
6699static int
543613e9 6700process_suffix (void)
29b0f896
AM
6701{
6702 /* If matched instruction specifies an explicit instruction mnemonic
6703 suffix, use it. */
673fe0f0 6704 if (i.tm.opcode_modifier.size == SIZE16)
40fb9820 6705 i.suffix = WORD_MNEM_SUFFIX;
673fe0f0 6706 else if (i.tm.opcode_modifier.size == SIZE32)
40fb9820 6707 i.suffix = LONG_MNEM_SUFFIX;
673fe0f0 6708 else if (i.tm.opcode_modifier.size == SIZE64)
40fb9820 6709 i.suffix = QWORD_MNEM_SUFFIX;
13e600d0 6710 else if (i.reg_operands
c8f8eebc
JB
6711 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6712 && !i.tm.opcode_modifier.addrprefixopreg)
29b0f896 6713 {
65fca059
JB
6714 unsigned int numop = i.operands;
6715
6716 /* movsx/movzx want only their source operand considered here, for the
6717 ambiguity checking below. The suffix will be replaced afterwards
6718 to represent the destination (register). */
6719 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6720 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6721 --i.operands;
6722
643bb870
JB
6723 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6724 if (i.tm.base_opcode == 0xf20f38f0
6725 && i.tm.operand_types[1].bitfield.qword)
6726 i.rex |= REX_W;
6727
29b0f896 6728 /* If there's no instruction mnemonic suffix we try to invent one
13e600d0 6729 based on GPR operands. */
29b0f896
AM
6730 if (!i.suffix)
6731 {
6732 /* We take i.suffix from the last register operand specified,
6733 Destination register type is more significant than source
381d071f
L
6734 register type. crc32 in SSE4.2 prefers source register
6735 type. */
1a035124 6736 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
20592a94 6737
1a035124
JB
6738 while (op--)
6739 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6740 || i.tm.operand_types[op].bitfield.instance == Accum)
6741 {
6742 if (i.types[op].bitfield.class != Reg)
6743 continue;
6744 if (i.types[op].bitfield.byte)
6745 i.suffix = BYTE_MNEM_SUFFIX;
6746 else if (i.types[op].bitfield.word)
6747 i.suffix = WORD_MNEM_SUFFIX;
6748 else if (i.types[op].bitfield.dword)
6749 i.suffix = LONG_MNEM_SUFFIX;
6750 else if (i.types[op].bitfield.qword)
6751 i.suffix = QWORD_MNEM_SUFFIX;
6752 else
6753 continue;
6754 break;
6755 }
65fca059
JB
6756
6757 /* As an exception, movsx/movzx silently default to a byte source
6758 in AT&T mode. */
6759 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6760 && !i.suffix && !intel_syntax)
6761 i.suffix = BYTE_MNEM_SUFFIX;
29b0f896
AM
6762 }
6763 else if (i.suffix == BYTE_MNEM_SUFFIX)
6764 {
2eb952a4 6765 if (intel_syntax
3cd7f3e3 6766 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6767 && i.tm.opcode_modifier.no_bsuf)
6768 i.suffix = 0;
6769 else if (!check_byte_reg ())
29b0f896
AM
6770 return 0;
6771 }
6772 else if (i.suffix == LONG_MNEM_SUFFIX)
6773 {
2eb952a4 6774 if (intel_syntax
3cd7f3e3 6775 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6776 && i.tm.opcode_modifier.no_lsuf
6777 && !i.tm.opcode_modifier.todword
6778 && !i.tm.opcode_modifier.toqword)
2eb952a4
L
6779 i.suffix = 0;
6780 else if (!check_long_reg ())
29b0f896
AM
6781 return 0;
6782 }
6783 else if (i.suffix == QWORD_MNEM_SUFFIX)
6784 {
955e1e6a 6785 if (intel_syntax
3cd7f3e3 6786 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6787 && i.tm.opcode_modifier.no_qsuf
6788 && !i.tm.opcode_modifier.todword
6789 && !i.tm.opcode_modifier.toqword)
955e1e6a
L
6790 i.suffix = 0;
6791 else if (!check_qword_reg ())
29b0f896
AM
6792 return 0;
6793 }
6794 else if (i.suffix == WORD_MNEM_SUFFIX)
6795 {
2eb952a4 6796 if (intel_syntax
3cd7f3e3 6797 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6798 && i.tm.opcode_modifier.no_wsuf)
6799 i.suffix = 0;
6800 else if (!check_word_reg ())
29b0f896
AM
6801 return 0;
6802 }
3cd7f3e3
L
6803 else if (intel_syntax
6804 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6805 /* Do nothing if the instruction is going to ignore the prefix. */
6806 ;
6807 else
6808 abort ();
65fca059
JB
6809
6810 /* Undo the movsx/movzx change done above. */
6811 i.operands = numop;
29b0f896 6812 }
3cd7f3e3
L
6813 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6814 && !i.suffix)
29b0f896 6815 {
13e600d0
JB
6816 i.suffix = stackop_size;
6817 if (stackop_size == LONG_MNEM_SUFFIX)
06f74c5c
L
6818 {
6819 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6820 .code16gcc directive to support 16-bit mode with
6821 32-bit address. For IRET without a suffix, generate
6822 16-bit IRET (opcode 0xcf) to return from an interrupt
6823 handler. */
13e600d0
JB
6824 if (i.tm.base_opcode == 0xcf)
6825 {
6826 i.suffix = WORD_MNEM_SUFFIX;
6827 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6828 }
6829 /* Warn about changed behavior for segment register push/pop. */
6830 else if ((i.tm.base_opcode | 1) == 0x07)
6831 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6832 i.tm.name);
06f74c5c 6833 }
29b0f896 6834 }
c006a730 6835 else if (!i.suffix
0cfa3eb3
JB
6836 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6837 || i.tm.opcode_modifier.jump == JUMP_BYTE
6838 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
64e74474
AM
6839 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6840 && i.tm.extension_opcode <= 3)))
9306ca4a
JB
6841 {
6842 switch (flag_code)
6843 {
6844 case CODE_64BIT:
40fb9820 6845 if (!i.tm.opcode_modifier.no_qsuf)
9306ca4a 6846 {
828c2a25
JB
6847 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6848 || i.tm.opcode_modifier.no_lsuf)
6849 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a
JB
6850 break;
6851 }
1a0670f3 6852 /* Fall through. */
9306ca4a 6853 case CODE_32BIT:
40fb9820 6854 if (!i.tm.opcode_modifier.no_lsuf)
9306ca4a
JB
6855 i.suffix = LONG_MNEM_SUFFIX;
6856 break;
6857 case CODE_16BIT:
40fb9820 6858 if (!i.tm.opcode_modifier.no_wsuf)
9306ca4a
JB
6859 i.suffix = WORD_MNEM_SUFFIX;
6860 break;
6861 }
6862 }
252b5132 6863
c006a730 6864 if (!i.suffix
3cd7f3e3 6865 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8
JB
6866 /* Also cover lret/retf/iret in 64-bit mode. */
6867 || (flag_code == CODE_64BIT
6868 && !i.tm.opcode_modifier.no_lsuf
6869 && !i.tm.opcode_modifier.no_qsuf))
3cd7f3e3 6870 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
8bbb3ad8
JB
6871 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6872 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
62b3f548
JB
6873 /* Accept FLDENV et al without suffix. */
6874 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
29b0f896 6875 {
6c0946d0 6876 unsigned int suffixes, evex = 0;
c006a730
JB
6877
6878 suffixes = !i.tm.opcode_modifier.no_bsuf;
6879 if (!i.tm.opcode_modifier.no_wsuf)
6880 suffixes |= 1 << 1;
6881 if (!i.tm.opcode_modifier.no_lsuf)
6882 suffixes |= 1 << 2;
6883 if (!i.tm.opcode_modifier.no_ldsuf)
6884 suffixes |= 1 << 3;
6885 if (!i.tm.opcode_modifier.no_ssuf)
6886 suffixes |= 1 << 4;
6887 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6888 suffixes |= 1 << 5;
6889
6c0946d0
JB
6890 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6891 also suitable for AT&T syntax mode, it was requested that this be
6892 restricted to just Intel syntax. */
b9915cbc 6893 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6c0946d0 6894 {
b9915cbc 6895 unsigned int op;
6c0946d0 6896
b9915cbc 6897 for (op = 0; op < i.tm.operands; ++op)
6c0946d0 6898 {
b9915cbc
JB
6899 if (is_evex_encoding (&i.tm)
6900 && !cpu_arch_flags.bitfield.cpuavx512vl)
6c0946d0 6901 {
b9915cbc
JB
6902 if (i.tm.operand_types[op].bitfield.ymmword)
6903 i.tm.operand_types[op].bitfield.xmmword = 0;
6904 if (i.tm.operand_types[op].bitfield.zmmword)
6905 i.tm.operand_types[op].bitfield.ymmword = 0;
6906 if (!i.tm.opcode_modifier.evex
6907 || i.tm.opcode_modifier.evex == EVEXDYN)
6908 i.tm.opcode_modifier.evex = EVEX512;
6909 }
6c0946d0 6910
b9915cbc
JB
6911 if (i.tm.operand_types[op].bitfield.xmmword
6912 + i.tm.operand_types[op].bitfield.ymmword
6913 + i.tm.operand_types[op].bitfield.zmmword < 2)
6914 continue;
6c0946d0 6915
b9915cbc
JB
6916 /* Any properly sized operand disambiguates the insn. */
6917 if (i.types[op].bitfield.xmmword
6918 || i.types[op].bitfield.ymmword
6919 || i.types[op].bitfield.zmmword)
6920 {
6921 suffixes &= ~(7 << 6);
6922 evex = 0;
6923 break;
6924 }
6c0946d0 6925
b9915cbc
JB
6926 if ((i.flags[op] & Operand_Mem)
6927 && i.tm.operand_types[op].bitfield.unspecified)
6928 {
6929 if (i.tm.operand_types[op].bitfield.xmmword)
6930 suffixes |= 1 << 6;
6931 if (i.tm.operand_types[op].bitfield.ymmword)
6932 suffixes |= 1 << 7;
6933 if (i.tm.operand_types[op].bitfield.zmmword)
6934 suffixes |= 1 << 8;
6935 if (is_evex_encoding (&i.tm))
6936 evex = EVEX512;
6c0946d0
JB
6937 }
6938 }
6939 }
6940
6941 /* Are multiple suffixes / operand sizes allowed? */
c006a730 6942 if (suffixes & (suffixes - 1))
9306ca4a 6943 {
873494c8 6944 if (intel_syntax
3cd7f3e3 6945 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8 6946 || operand_check == check_error))
9306ca4a 6947 {
c006a730 6948 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
9306ca4a
JB
6949 return 0;
6950 }
c006a730 6951 if (operand_check == check_error)
9306ca4a 6952 {
c006a730
JB
6953 as_bad (_("no instruction mnemonic suffix given and "
6954 "no register operands; can't size `%s'"), i.tm.name);
9306ca4a
JB
6955 return 0;
6956 }
c006a730 6957 if (operand_check == check_warning)
873494c8
JB
6958 as_warn (_("%s; using default for `%s'"),
6959 intel_syntax
6960 ? _("ambiguous operand size")
6961 : _("no instruction mnemonic suffix given and "
6962 "no register operands"),
6963 i.tm.name);
c006a730
JB
6964
6965 if (i.tm.opcode_modifier.floatmf)
6966 i.suffix = SHORT_MNEM_SUFFIX;
65fca059
JB
6967 else if ((i.tm.base_opcode | 8) == 0xfbe
6968 || (i.tm.base_opcode == 0x63
6969 && i.tm.cpu_flags.bitfield.cpu64))
6970 /* handled below */;
6c0946d0
JB
6971 else if (evex)
6972 i.tm.opcode_modifier.evex = evex;
c006a730
JB
6973 else if (flag_code == CODE_16BIT)
6974 i.suffix = WORD_MNEM_SUFFIX;
1a035124 6975 else if (!i.tm.opcode_modifier.no_lsuf)
c006a730 6976 i.suffix = LONG_MNEM_SUFFIX;
1a035124
JB
6977 else
6978 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a 6979 }
29b0f896 6980 }
252b5132 6981
65fca059
JB
6982 if ((i.tm.base_opcode | 8) == 0xfbe
6983 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6984 {
6985 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6986 In AT&T syntax, if there is no suffix (warned about above), the default
6987 will be byte extension. */
6988 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6989 i.tm.base_opcode |= 1;
6990
6991 /* For further processing, the suffix should represent the destination
6992 (register). This is already the case when one was used with
6993 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6994 no suffix to begin with. */
6995 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
6996 {
6997 if (i.types[1].bitfield.word)
6998 i.suffix = WORD_MNEM_SUFFIX;
6999 else if (i.types[1].bitfield.qword)
7000 i.suffix = QWORD_MNEM_SUFFIX;
7001 else
7002 i.suffix = LONG_MNEM_SUFFIX;
7003
7004 i.tm.opcode_modifier.w = 0;
7005 }
7006 }
7007
50128d0c
JB
7008 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7009 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7010 != (i.tm.operand_types[1].bitfield.class == Reg);
7011
d2224064
JB
7012 /* Change the opcode based on the operand size given by i.suffix. */
7013 switch (i.suffix)
29b0f896 7014 {
d2224064
JB
7015 /* Size floating point instruction. */
7016 case LONG_MNEM_SUFFIX:
7017 if (i.tm.opcode_modifier.floatmf)
7018 {
7019 i.tm.base_opcode ^= 4;
7020 break;
7021 }
7022 /* fall through */
7023 case WORD_MNEM_SUFFIX:
7024 case QWORD_MNEM_SUFFIX:
29b0f896 7025 /* It's not a byte, select word/dword operation. */
40fb9820 7026 if (i.tm.opcode_modifier.w)
29b0f896 7027 {
50128d0c 7028 if (i.short_form)
29b0f896
AM
7029 i.tm.base_opcode |= 8;
7030 else
7031 i.tm.base_opcode |= 1;
7032 }
d2224064
JB
7033 /* fall through */
7034 case SHORT_MNEM_SUFFIX:
29b0f896
AM
7035 /* Now select between word & dword operations via the operand
7036 size prefix, except for instructions that will ignore this
7037 prefix anyway. */
c8f8eebc 7038 if (i.suffix != QWORD_MNEM_SUFFIX
3cd7f3e3 7039 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
c8f8eebc
JB
7040 && !i.tm.opcode_modifier.floatmf
7041 && !is_any_vex_encoding (&i.tm)
7042 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7043 || (flag_code == CODE_64BIT
7044 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
24eab124
AM
7045 {
7046 unsigned int prefix = DATA_PREFIX_OPCODE;
543613e9 7047
0cfa3eb3 7048 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
29b0f896 7049 prefix = ADDR_PREFIX_OPCODE;
252b5132 7050
29b0f896
AM
7051 if (!add_prefix (prefix))
7052 return 0;
24eab124 7053 }
252b5132 7054
29b0f896
AM
7055 /* Set mode64 for an operand. */
7056 if (i.suffix == QWORD_MNEM_SUFFIX
9146926a 7057 && flag_code == CODE_64BIT
d2224064 7058 && !i.tm.opcode_modifier.norex64
4ed21b58 7059 && !i.tm.opcode_modifier.vexw
46e883c5 7060 /* Special case for xchg %rax,%rax. It is NOP and doesn't
d2224064
JB
7061 need rex64. */
7062 && ! (i.operands == 2
7063 && i.tm.base_opcode == 0x90
7064 && i.tm.extension_opcode == None
75e5731b
JB
7065 && i.types[0].bitfield.instance == Accum
7066 && i.types[0].bitfield.qword
7067 && i.types[1].bitfield.instance == Accum
7068 && i.types[1].bitfield.qword))
d2224064 7069 i.rex |= REX_W;
3e73aa7c 7070
d2224064 7071 break;
8bbb3ad8
JB
7072
7073 case 0:
7074 /* Select word/dword/qword operation with explict data sizing prefix
7075 when there are no suitable register operands. */
7076 if (i.tm.opcode_modifier.w
7077 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7078 && (!i.reg_operands
7079 || (i.reg_operands == 1
7080 /* ShiftCount */
7081 && (i.tm.operand_types[0].bitfield.instance == RegC
7082 /* InOutPortReg */
7083 || i.tm.operand_types[0].bitfield.instance == RegD
7084 || i.tm.operand_types[1].bitfield.instance == RegD
7085 /* CRC32 */
7086 || i.tm.base_opcode == 0xf20f38f0))))
7087 i.tm.base_opcode |= 1;
7088 break;
29b0f896 7089 }
7ecd2f8b 7090
c8f8eebc 7091 if (i.tm.opcode_modifier.addrprefixopreg)
c0a30a9f 7092 {
c8f8eebc
JB
7093 gas_assert (!i.suffix);
7094 gas_assert (i.reg_operands);
c0a30a9f 7095
c8f8eebc
JB
7096 if (i.tm.operand_types[0].bitfield.instance == Accum
7097 || i.operands == 1)
7098 {
7099 /* The address size override prefix changes the size of the
7100 first operand. */
7101 if (flag_code == CODE_64BIT
7102 && i.op[0].regs->reg_type.bitfield.word)
7103 {
7104 as_bad (_("16-bit addressing unavailable for `%s'"),
7105 i.tm.name);
7106 return 0;
7107 }
7108
7109 if ((flag_code == CODE_32BIT
7110 ? i.op[0].regs->reg_type.bitfield.word
7111 : i.op[0].regs->reg_type.bitfield.dword)
7112 && !add_prefix (ADDR_PREFIX_OPCODE))
7113 return 0;
7114 }
c0a30a9f
L
7115 else
7116 {
c8f8eebc
JB
7117 /* Check invalid register operand when the address size override
7118 prefix changes the size of register operands. */
7119 unsigned int op;
7120 enum { need_word, need_dword, need_qword } need;
7121
7122 if (flag_code == CODE_32BIT)
7123 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7124 else if (i.prefix[ADDR_PREFIX])
c0a30a9f
L
7125 need = need_dword;
7126 else
7127 need = flag_code == CODE_64BIT ? need_qword : need_word;
c0a30a9f 7128
c8f8eebc
JB
7129 for (op = 0; op < i.operands; op++)
7130 {
7131 if (i.types[op].bitfield.class != Reg)
7132 continue;
7133
7134 switch (need)
7135 {
7136 case need_word:
7137 if (i.op[op].regs->reg_type.bitfield.word)
7138 continue;
7139 break;
7140 case need_dword:
7141 if (i.op[op].regs->reg_type.bitfield.dword)
7142 continue;
7143 break;
7144 case need_qword:
7145 if (i.op[op].regs->reg_type.bitfield.qword)
7146 continue;
7147 break;
7148 }
7149
7150 as_bad (_("invalid register operand size for `%s'"),
7151 i.tm.name);
7152 return 0;
7153 }
7154 }
c0a30a9f
L
7155 }
7156
29b0f896
AM
7157 return 1;
7158}
3e73aa7c 7159
29b0f896 7160static int
543613e9 7161check_byte_reg (void)
29b0f896
AM
7162{
7163 int op;
543613e9 7164
29b0f896
AM
7165 for (op = i.operands; --op >= 0;)
7166 {
dc821c5f 7167 /* Skip non-register operands. */
bab6aec1 7168 if (i.types[op].bitfield.class != Reg)
dc821c5f
JB
7169 continue;
7170
29b0f896
AM
7171 /* If this is an eight bit register, it's OK. If it's the 16 or
7172 32 bit version of an eight bit register, we will just use the
7173 low portion, and that's OK too. */
dc821c5f 7174 if (i.types[op].bitfield.byte)
29b0f896
AM
7175 continue;
7176
5a819eb9 7177 /* I/O port address operands are OK too. */
75e5731b
JB
7178 if (i.tm.operand_types[op].bitfield.instance == RegD
7179 && i.tm.operand_types[op].bitfield.word)
5a819eb9
JB
7180 continue;
7181
9706160a
JB
7182 /* crc32 only wants its source operand checked here. */
7183 if (i.tm.base_opcode == 0xf20f38f0 && op)
9344ff29
L
7184 continue;
7185
29b0f896 7186 /* Any other register is bad. */
73c76375
JB
7187 as_bad (_("`%s%s' not allowed with `%s%c'"),
7188 register_prefix, i.op[op].regs->reg_name,
7189 i.tm.name, i.suffix);
7190 return 0;
29b0f896
AM
7191 }
7192 return 1;
7193}
7194
7195static int
e3bb37b5 7196check_long_reg (void)
29b0f896
AM
7197{
7198 int op;
7199
7200 for (op = i.operands; --op >= 0;)
dc821c5f 7201 /* Skip non-register operands. */
bab6aec1 7202 if (i.types[op].bitfield.class != Reg)
dc821c5f 7203 continue;
29b0f896
AM
7204 /* Reject eight bit registers, except where the template requires
7205 them. (eg. movzb) */
dc821c5f 7206 else if (i.types[op].bitfield.byte
bab6aec1 7207 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7208 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7209 && (i.tm.operand_types[op].bitfield.word
7210 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7211 {
a540244d
L
7212 as_bad (_("`%s%s' not allowed with `%s%c'"),
7213 register_prefix,
29b0f896
AM
7214 i.op[op].regs->reg_name,
7215 i.tm.name,
7216 i.suffix);
7217 return 0;
7218 }
be4c5e58
L
7219 /* Error if the e prefix on a general reg is missing. */
7220 else if (i.types[op].bitfield.word
bab6aec1 7221 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7222 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7223 && i.tm.operand_types[op].bitfield.dword)
29b0f896 7224 {
be4c5e58
L
7225 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7226 register_prefix, i.op[op].regs->reg_name,
7227 i.suffix);
7228 return 0;
252b5132 7229 }
e4630f71 7230 /* Warn if the r prefix on a general reg is present. */
dc821c5f 7231 else if (i.types[op].bitfield.qword
bab6aec1 7232 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7233 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7234 && i.tm.operand_types[op].bitfield.dword)
252b5132 7235 {
34828aad 7236 if (intel_syntax
65fca059 7237 && i.tm.opcode_modifier.toqword
3528c362 7238 && i.types[0].bitfield.class != RegSIMD)
34828aad 7239 {
ca61edf2 7240 /* Convert to QWORD. We want REX byte. */
34828aad
L
7241 i.suffix = QWORD_MNEM_SUFFIX;
7242 }
7243 else
7244 {
2b5d6a91 7245 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7246 register_prefix, i.op[op].regs->reg_name,
7247 i.suffix);
7248 return 0;
7249 }
29b0f896
AM
7250 }
7251 return 1;
7252}
252b5132 7253
29b0f896 7254static int
e3bb37b5 7255check_qword_reg (void)
29b0f896
AM
7256{
7257 int op;
252b5132 7258
29b0f896 7259 for (op = i.operands; --op >= 0; )
dc821c5f 7260 /* Skip non-register operands. */
bab6aec1 7261 if (i.types[op].bitfield.class != Reg)
dc821c5f 7262 continue;
29b0f896
AM
7263 /* Reject eight bit registers, except where the template requires
7264 them. (eg. movzb) */
dc821c5f 7265 else if (i.types[op].bitfield.byte
bab6aec1 7266 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7267 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7268 && (i.tm.operand_types[op].bitfield.word
7269 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7270 {
a540244d
L
7271 as_bad (_("`%s%s' not allowed with `%s%c'"),
7272 register_prefix,
29b0f896
AM
7273 i.op[op].regs->reg_name,
7274 i.tm.name,
7275 i.suffix);
7276 return 0;
7277 }
e4630f71 7278 /* Warn if the r prefix on a general reg is missing. */
dc821c5f
JB
7279 else if ((i.types[op].bitfield.word
7280 || i.types[op].bitfield.dword)
bab6aec1 7281 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7282 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7283 && i.tm.operand_types[op].bitfield.qword)
29b0f896
AM
7284 {
7285 /* Prohibit these changes in the 64bit mode, since the
7286 lowering is more complicated. */
34828aad 7287 if (intel_syntax
ca61edf2 7288 && i.tm.opcode_modifier.todword
3528c362 7289 && i.types[0].bitfield.class != RegSIMD)
34828aad 7290 {
ca61edf2 7291 /* Convert to DWORD. We don't want REX byte. */
34828aad
L
7292 i.suffix = LONG_MNEM_SUFFIX;
7293 }
7294 else
7295 {
2b5d6a91 7296 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7297 register_prefix, i.op[op].regs->reg_name,
7298 i.suffix);
7299 return 0;
7300 }
252b5132 7301 }
29b0f896
AM
7302 return 1;
7303}
252b5132 7304
29b0f896 7305static int
e3bb37b5 7306check_word_reg (void)
29b0f896
AM
7307{
7308 int op;
7309 for (op = i.operands; --op >= 0;)
dc821c5f 7310 /* Skip non-register operands. */
bab6aec1 7311 if (i.types[op].bitfield.class != Reg)
dc821c5f 7312 continue;
29b0f896
AM
7313 /* Reject eight bit registers, except where the template requires
7314 them. (eg. movzb) */
dc821c5f 7315 else if (i.types[op].bitfield.byte
bab6aec1 7316 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7317 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7318 && (i.tm.operand_types[op].bitfield.word
7319 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7320 {
a540244d
L
7321 as_bad (_("`%s%s' not allowed with `%s%c'"),
7322 register_prefix,
29b0f896
AM
7323 i.op[op].regs->reg_name,
7324 i.tm.name,
7325 i.suffix);
7326 return 0;
7327 }
9706160a
JB
7328 /* Error if the e or r prefix on a general reg is present. */
7329 else if ((i.types[op].bitfield.dword
dc821c5f 7330 || i.types[op].bitfield.qword)
bab6aec1 7331 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7332 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7333 && i.tm.operand_types[op].bitfield.word)
252b5132 7334 {
9706160a
JB
7335 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7336 register_prefix, i.op[op].regs->reg_name,
7337 i.suffix);
7338 return 0;
29b0f896
AM
7339 }
7340 return 1;
7341}
252b5132 7342
29b0f896 7343static int
40fb9820 7344update_imm (unsigned int j)
29b0f896 7345{
bc0844ae 7346 i386_operand_type overlap = i.types[j];
40fb9820
L
7347 if ((overlap.bitfield.imm8
7348 || overlap.bitfield.imm8s
7349 || overlap.bitfield.imm16
7350 || overlap.bitfield.imm32
7351 || overlap.bitfield.imm32s
7352 || overlap.bitfield.imm64)
0dfbf9d7
L
7353 && !operand_type_equal (&overlap, &imm8)
7354 && !operand_type_equal (&overlap, &imm8s)
7355 && !operand_type_equal (&overlap, &imm16)
7356 && !operand_type_equal (&overlap, &imm32)
7357 && !operand_type_equal (&overlap, &imm32s)
7358 && !operand_type_equal (&overlap, &imm64))
29b0f896
AM
7359 {
7360 if (i.suffix)
7361 {
40fb9820
L
7362 i386_operand_type temp;
7363
0dfbf9d7 7364 operand_type_set (&temp, 0);
7ab9ffdd 7365 if (i.suffix == BYTE_MNEM_SUFFIX)
40fb9820
L
7366 {
7367 temp.bitfield.imm8 = overlap.bitfield.imm8;
7368 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7369 }
7370 else if (i.suffix == WORD_MNEM_SUFFIX)
7371 temp.bitfield.imm16 = overlap.bitfield.imm16;
7372 else if (i.suffix == QWORD_MNEM_SUFFIX)
7373 {
7374 temp.bitfield.imm64 = overlap.bitfield.imm64;
7375 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7376 }
7377 else
7378 temp.bitfield.imm32 = overlap.bitfield.imm32;
7379 overlap = temp;
29b0f896 7380 }
0dfbf9d7
L
7381 else if (operand_type_equal (&overlap, &imm16_32_32s)
7382 || operand_type_equal (&overlap, &imm16_32)
7383 || operand_type_equal (&overlap, &imm16_32s))
29b0f896 7384 {
40fb9820 7385 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
65da13b5 7386 overlap = imm16;
40fb9820 7387 else
65da13b5 7388 overlap = imm32s;
29b0f896 7389 }
8bbb3ad8
JB
7390 else if (i.prefix[REX_PREFIX] & REX_W)
7391 overlap = operand_type_and (overlap, imm32s);
7392 else if (i.prefix[DATA_PREFIX])
7393 overlap = operand_type_and (overlap,
7394 flag_code != CODE_16BIT ? imm16 : imm32);
0dfbf9d7
L
7395 if (!operand_type_equal (&overlap, &imm8)
7396 && !operand_type_equal (&overlap, &imm8s)
7397 && !operand_type_equal (&overlap, &imm16)
7398 && !operand_type_equal (&overlap, &imm32)
7399 && !operand_type_equal (&overlap, &imm32s)
7400 && !operand_type_equal (&overlap, &imm64))
29b0f896 7401 {
4eed87de
AM
7402 as_bad (_("no instruction mnemonic suffix given; "
7403 "can't determine immediate size"));
29b0f896
AM
7404 return 0;
7405 }
7406 }
40fb9820 7407 i.types[j] = overlap;
29b0f896 7408
40fb9820
L
7409 return 1;
7410}
7411
7412static int
7413finalize_imm (void)
7414{
bc0844ae 7415 unsigned int j, n;
29b0f896 7416
bc0844ae
L
7417 /* Update the first 2 immediate operands. */
7418 n = i.operands > 2 ? 2 : i.operands;
7419 if (n)
7420 {
7421 for (j = 0; j < n; j++)
7422 if (update_imm (j) == 0)
7423 return 0;
40fb9820 7424
bc0844ae
L
7425 /* The 3rd operand can't be immediate operand. */
7426 gas_assert (operand_type_check (i.types[2], imm) == 0);
7427 }
29b0f896
AM
7428
7429 return 1;
7430}
7431
7432static int
e3bb37b5 7433process_operands (void)
29b0f896
AM
7434{
7435 /* Default segment register this instruction will use for memory
7436 accesses. 0 means unknown. This is only for optimizing out
7437 unnecessary segment overrides. */
7438 const seg_entry *default_seg = 0;
7439
a5aeccd9
JB
7440 if (i.tm.opcode_modifier.sse2avx)
7441 {
7442 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7443 need converting. */
7444 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7445 i.prefix[REX_PREFIX] = 0;
7446 i.rex_encoding = 0;
7447 }
c423d21a
JB
7448 /* ImmExt should be processed after SSE2AVX. */
7449 else if (i.tm.opcode_modifier.immext)
7450 process_immext ();
a5aeccd9 7451
2426c15f 7452 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
29b0f896 7453 {
91d6fa6a
NC
7454 unsigned int dupl = i.operands;
7455 unsigned int dest = dupl - 1;
9fcfb3d7
L
7456 unsigned int j;
7457
c0f3af97 7458 /* The destination must be an xmm register. */
9c2799c2 7459 gas_assert (i.reg_operands
91d6fa6a 7460 && MAX_OPERANDS > dupl
7ab9ffdd 7461 && operand_type_equal (&i.types[dest], &regxmm));
c0f3af97 7462
75e5731b 7463 if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7464 && i.tm.operand_types[0].bitfield.xmmword)
e2ec9d29 7465 {
8cd7925b 7466 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
c0f3af97
L
7467 {
7468 /* Keep xmm0 for instructions with VEX prefix and 3
7469 sources. */
75e5731b 7470 i.tm.operand_types[0].bitfield.instance = InstanceNone;
3528c362 7471 i.tm.operand_types[0].bitfield.class = RegSIMD;
c0f3af97
L
7472 goto duplicate;
7473 }
e2ec9d29 7474 else
c0f3af97
L
7475 {
7476 /* We remove the first xmm0 and keep the number of
7477 operands unchanged, which in fact duplicates the
7478 destination. */
7479 for (j = 1; j < i.operands; j++)
7480 {
7481 i.op[j - 1] = i.op[j];
7482 i.types[j - 1] = i.types[j];
7483 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
8dc0818e 7484 i.flags[j - 1] = i.flags[j];
c0f3af97
L
7485 }
7486 }
7487 }
7488 else if (i.tm.opcode_modifier.implicit1stxmm0)
7ab9ffdd 7489 {
91d6fa6a 7490 gas_assert ((MAX_OPERANDS - 1) > dupl
8cd7925b
L
7491 && (i.tm.opcode_modifier.vexsources
7492 == VEX3SOURCES));
c0f3af97
L
7493
7494 /* Add the implicit xmm0 for instructions with VEX prefix
7495 and 3 sources. */
7496 for (j = i.operands; j > 0; j--)
7497 {
7498 i.op[j] = i.op[j - 1];
7499 i.types[j] = i.types[j - 1];
7500 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
8dc0818e 7501 i.flags[j] = i.flags[j - 1];
c0f3af97
L
7502 }
7503 i.op[0].regs
7504 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7ab9ffdd 7505 i.types[0] = regxmm;
c0f3af97
L
7506 i.tm.operand_types[0] = regxmm;
7507
7508 i.operands += 2;
7509 i.reg_operands += 2;
7510 i.tm.operands += 2;
7511
91d6fa6a 7512 dupl++;
c0f3af97 7513 dest++;
91d6fa6a
NC
7514 i.op[dupl] = i.op[dest];
7515 i.types[dupl] = i.types[dest];
7516 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7517 i.flags[dupl] = i.flags[dest];
e2ec9d29 7518 }
c0f3af97
L
7519 else
7520 {
dc1e8a47 7521 duplicate:
c0f3af97
L
7522 i.operands++;
7523 i.reg_operands++;
7524 i.tm.operands++;
7525
91d6fa6a
NC
7526 i.op[dupl] = i.op[dest];
7527 i.types[dupl] = i.types[dest];
7528 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7529 i.flags[dupl] = i.flags[dest];
c0f3af97
L
7530 }
7531
7532 if (i.tm.opcode_modifier.immext)
7533 process_immext ();
7534 }
75e5731b 7535 else if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7536 && i.tm.operand_types[0].bitfield.xmmword)
c0f3af97
L
7537 {
7538 unsigned int j;
7539
9fcfb3d7
L
7540 for (j = 1; j < i.operands; j++)
7541 {
7542 i.op[j - 1] = i.op[j];
7543 i.types[j - 1] = i.types[j];
7544
7545 /* We need to adjust fields in i.tm since they are used by
7546 build_modrm_byte. */
7547 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
8dc0818e
JB
7548
7549 i.flags[j - 1] = i.flags[j];
9fcfb3d7
L
7550 }
7551
e2ec9d29
L
7552 i.operands--;
7553 i.reg_operands--;
e2ec9d29
L
7554 i.tm.operands--;
7555 }
920d2ddc
IT
7556 else if (i.tm.opcode_modifier.implicitquadgroup)
7557 {
a477a8c4
JB
7558 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7559
920d2ddc 7560 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
3528c362 7561 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
a477a8c4
JB
7562 regnum = register_number (i.op[1].regs);
7563 first_reg_in_group = regnum & ~3;
7564 last_reg_in_group = first_reg_in_group + 3;
7565 if (regnum != first_reg_in_group)
7566 as_warn (_("source register `%s%s' implicitly denotes"
7567 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7568 register_prefix, i.op[1].regs->reg_name,
7569 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7570 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7571 i.tm.name);
7572 }
e2ec9d29
L
7573 else if (i.tm.opcode_modifier.regkludge)
7574 {
7575 /* The imul $imm, %reg instruction is converted into
7576 imul $imm, %reg, %reg, and the clr %reg instruction
7577 is converted into xor %reg, %reg. */
7578
7579 unsigned int first_reg_op;
7580
7581 if (operand_type_check (i.types[0], reg))
7582 first_reg_op = 0;
7583 else
7584 first_reg_op = 1;
7585 /* Pretend we saw the extra register operand. */
9c2799c2 7586 gas_assert (i.reg_operands == 1
7ab9ffdd 7587 && i.op[first_reg_op + 1].regs == 0);
e2ec9d29
L
7588 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7589 i.types[first_reg_op + 1] = i.types[first_reg_op];
7590 i.operands++;
7591 i.reg_operands++;
29b0f896
AM
7592 }
7593
85b80b0f 7594 if (i.tm.opcode_modifier.modrm)
29b0f896
AM
7595 {
7596 /* The opcode is completed (modulo i.tm.extension_opcode which
52271982
AM
7597 must be put into the modrm byte). Now, we make the modrm and
7598 index base bytes based on all the info we've collected. */
29b0f896
AM
7599
7600 default_seg = build_modrm_byte ();
7601 }
00cee14f 7602 else if (i.types[0].bitfield.class == SReg)
85b80b0f
JB
7603 {
7604 if (flag_code != CODE_64BIT
7605 ? i.tm.base_opcode == POP_SEG_SHORT
7606 && i.op[0].regs->reg_num == 1
7607 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7608 && i.op[0].regs->reg_num < 4)
7609 {
7610 as_bad (_("you can't `%s %s%s'"),
7611 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7612 return 0;
7613 }
7614 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7615 {
7616 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7617 i.tm.opcode_length = 2;
7618 }
7619 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7620 }
8a2ed489 7621 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
29b0f896
AM
7622 {
7623 default_seg = &ds;
7624 }
40fb9820 7625 else if (i.tm.opcode_modifier.isstring)
29b0f896
AM
7626 {
7627 /* For the string instructions that allow a segment override
7628 on one of their operands, the default segment is ds. */
7629 default_seg = &ds;
7630 }
50128d0c 7631 else if (i.short_form)
85b80b0f
JB
7632 {
7633 /* The register or float register operand is in operand
7634 0 or 1. */
bab6aec1 7635 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
85b80b0f
JB
7636
7637 /* Register goes in low 3 bits of opcode. */
7638 i.tm.base_opcode |= i.op[op].regs->reg_num;
7639 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7640 i.rex |= REX_B;
7641 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7642 {
7643 /* Warn about some common errors, but press on regardless.
7644 The first case can be generated by gcc (<= 2.8.1). */
7645 if (i.operands == 2)
7646 {
7647 /* Reversed arguments on faddp, fsubp, etc. */
7648 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7649 register_prefix, i.op[!intel_syntax].regs->reg_name,
7650 register_prefix, i.op[intel_syntax].regs->reg_name);
7651 }
7652 else
7653 {
7654 /* Extraneous `l' suffix on fp insn. */
7655 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7656 register_prefix, i.op[0].regs->reg_name);
7657 }
7658 }
7659 }
29b0f896 7660
514a8bb0 7661 if ((i.seg[0] || i.prefix[SEG_PREFIX])
514a8bb0
JB
7662 && i.tm.base_opcode == 0x8d /* lea */
7663 && !is_any_vex_encoding(&i.tm))
92334ad2
JB
7664 {
7665 if (!quiet_warnings)
7666 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7667 if (optimize)
7668 {
7669 i.seg[0] = NULL;
7670 i.prefix[SEG_PREFIX] = 0;
7671 }
7672 }
52271982
AM
7673
7674 /* If a segment was explicitly specified, and the specified segment
b6773884
JB
7675 is neither the default nor the one already recorded from a prefix,
7676 use an opcode prefix to select it. If we never figured out what
7677 the default segment is, then default_seg will be zero at this
7678 point, and the specified segment prefix will always be used. */
7679 if (i.seg[0]
7680 && i.seg[0] != default_seg
7681 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
29b0f896
AM
7682 {
7683 if (!add_prefix (i.seg[0]->seg_prefix))
7684 return 0;
7685 }
7686 return 1;
7687}
7688
a5aeccd9
JB
7689static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7690 bfd_boolean do_sse2avx)
7691{
7692 if (r->reg_flags & RegRex)
7693 {
7694 if (i.rex & rex_bit)
7695 as_bad (_("same type of prefix used twice"));
7696 i.rex |= rex_bit;
7697 }
7698 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7699 {
7700 gas_assert (i.vex.register_specifier == r);
7701 i.vex.register_specifier += 8;
7702 }
7703
7704 if (r->reg_flags & RegVRex)
7705 i.vrex |= rex_bit;
7706}
7707
29b0f896 7708static const seg_entry *
e3bb37b5 7709build_modrm_byte (void)
29b0f896
AM
7710{
7711 const seg_entry *default_seg = 0;
c0f3af97 7712 unsigned int source, dest;
8cd7925b 7713 int vex_3_sources;
c0f3af97 7714
8cd7925b 7715 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
c0f3af97
L
7716 if (vex_3_sources)
7717 {
91d6fa6a 7718 unsigned int nds, reg_slot;
4c2c6516 7719 expressionS *exp;
c0f3af97 7720
6b8d3588 7721 dest = i.operands - 1;
c0f3af97 7722 nds = dest - 1;
922d8de8 7723
a683cc34 7724 /* There are 2 kinds of instructions:
bed3d976 7725 1. 5 operands: 4 register operands or 3 register operands
9d3bf266 7726 plus 1 memory operand plus one Imm4 operand, VexXDS, and
bed3d976 7727 VexW0 or VexW1. The destination must be either XMM, YMM or
43234a1e 7728 ZMM register.
bed3d976 7729 2. 4 operands: 4 register operands or 3 register operands
2f1bada2 7730 plus 1 memory operand, with VexXDS. */
922d8de8 7731 gas_assert ((i.reg_operands == 4
bed3d976
JB
7732 || (i.reg_operands == 3 && i.mem_operands == 1))
7733 && i.tm.opcode_modifier.vexvvvv == VEXXDS
dcd7e323 7734 && i.tm.opcode_modifier.vexw
3528c362 7735 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
a683cc34 7736
48db9223
JB
7737 /* If VexW1 is set, the first non-immediate operand is the source and
7738 the second non-immediate one is encoded in the immediate operand. */
7739 if (i.tm.opcode_modifier.vexw == VEXW1)
7740 {
7741 source = i.imm_operands;
7742 reg_slot = i.imm_operands + 1;
7743 }
7744 else
7745 {
7746 source = i.imm_operands + 1;
7747 reg_slot = i.imm_operands;
7748 }
7749
a683cc34 7750 if (i.imm_operands == 0)
bed3d976
JB
7751 {
7752 /* When there is no immediate operand, generate an 8bit
7753 immediate operand to encode the first operand. */
7754 exp = &im_expressions[i.imm_operands++];
7755 i.op[i.operands].imms = exp;
7756 i.types[i.operands] = imm8;
7757 i.operands++;
7758
3528c362 7759 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
bed3d976
JB
7760 exp->X_op = O_constant;
7761 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
43234a1e
L
7762 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7763 }
922d8de8 7764 else
bed3d976 7765 {
9d3bf266
JB
7766 gas_assert (i.imm_operands == 1);
7767 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7768 gas_assert (!i.tm.opcode_modifier.immext);
a683cc34 7769
9d3bf266
JB
7770 /* Turn on Imm8 again so that output_imm will generate it. */
7771 i.types[0].bitfield.imm8 = 1;
bed3d976 7772
3528c362 7773 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
9d3bf266 7774 i.op[0].imms->X_add_number
bed3d976 7775 |= register_number (i.op[reg_slot].regs) << 4;
43234a1e 7776 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
bed3d976 7777 }
a683cc34 7778
3528c362 7779 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
dae39acc 7780 i.vex.register_specifier = i.op[nds].regs;
c0f3af97
L
7781 }
7782 else
7783 source = dest = 0;
29b0f896
AM
7784
7785 /* i.reg_operands MUST be the number of real register operands;
c0f3af97
L
7786 implicit registers do not count. If there are 3 register
7787 operands, it must be a instruction with VexNDS. For a
7788 instruction with VexNDD, the destination register is encoded
7789 in VEX prefix. If there are 4 register operands, it must be
7790 a instruction with VEX prefix and 3 sources. */
7ab9ffdd
L
7791 if (i.mem_operands == 0
7792 && ((i.reg_operands == 2
2426c15f 7793 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7ab9ffdd 7794 || (i.reg_operands == 3
2426c15f 7795 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd 7796 || (i.reg_operands == 4 && vex_3_sources)))
29b0f896 7797 {
cab737b9
L
7798 switch (i.operands)
7799 {
7800 case 2:
7801 source = 0;
7802 break;
7803 case 3:
c81128dc
L
7804 /* When there are 3 operands, one of them may be immediate,
7805 which may be the first or the last operand. Otherwise,
c0f3af97
L
7806 the first operand must be shift count register (cl) or it
7807 is an instruction with VexNDS. */
9c2799c2 7808 gas_assert (i.imm_operands == 1
7ab9ffdd 7809 || (i.imm_operands == 0
2426c15f 7810 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
75e5731b
JB
7811 || (i.types[0].bitfield.instance == RegC
7812 && i.types[0].bitfield.byte))));
40fb9820 7813 if (operand_type_check (i.types[0], imm)
75e5731b
JB
7814 || (i.types[0].bitfield.instance == RegC
7815 && i.types[0].bitfield.byte))
40fb9820
L
7816 source = 1;
7817 else
7818 source = 0;
cab737b9
L
7819 break;
7820 case 4:
368d64cc
L
7821 /* When there are 4 operands, the first two must be 8bit
7822 immediate operands. The source operand will be the 3rd
c0f3af97
L
7823 one.
7824
7825 For instructions with VexNDS, if the first operand
7826 an imm8, the source operand is the 2nd one. If the last
7827 operand is imm8, the source operand is the first one. */
9c2799c2 7828 gas_assert ((i.imm_operands == 2
7ab9ffdd
L
7829 && i.types[0].bitfield.imm8
7830 && i.types[1].bitfield.imm8)
2426c15f 7831 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7ab9ffdd
L
7832 && i.imm_operands == 1
7833 && (i.types[0].bitfield.imm8
43234a1e
L
7834 || i.types[i.operands - 1].bitfield.imm8
7835 || i.rounding)));
9f2670f2
L
7836 if (i.imm_operands == 2)
7837 source = 2;
7838 else
c0f3af97
L
7839 {
7840 if (i.types[0].bitfield.imm8)
7841 source = 1;
7842 else
7843 source = 0;
7844 }
c0f3af97
L
7845 break;
7846 case 5:
e771e7c9 7847 if (is_evex_encoding (&i.tm))
43234a1e
L
7848 {
7849 /* For EVEX instructions, when there are 5 operands, the
7850 first one must be immediate operand. If the second one
7851 is immediate operand, the source operand is the 3th
7852 one. If the last one is immediate operand, the source
7853 operand is the 2nd one. */
7854 gas_assert (i.imm_operands == 2
7855 && i.tm.opcode_modifier.sae
7856 && operand_type_check (i.types[0], imm));
7857 if (operand_type_check (i.types[1], imm))
7858 source = 2;
7859 else if (operand_type_check (i.types[4], imm))
7860 source = 1;
7861 else
7862 abort ();
7863 }
cab737b9
L
7864 break;
7865 default:
7866 abort ();
7867 }
7868
c0f3af97
L
7869 if (!vex_3_sources)
7870 {
7871 dest = source + 1;
7872
43234a1e
L
7873 /* RC/SAE operand could be between DEST and SRC. That happens
7874 when one operand is GPR and the other one is XMM/YMM/ZMM
7875 register. */
7876 if (i.rounding && i.rounding->operand == (int) dest)
7877 dest++;
7878
2426c15f 7879 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
c0f3af97 7880 {
43234a1e 7881 /* For instructions with VexNDS, the register-only source
c5d0745b 7882 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
dfd69174 7883 register. It is encoded in VEX prefix. */
f12dc422
L
7884
7885 i386_operand_type op;
7886 unsigned int vvvv;
7887
7888 /* Check register-only source operand when two source
7889 operands are swapped. */
7890 if (!i.tm.operand_types[source].bitfield.baseindex
7891 && i.tm.operand_types[dest].bitfield.baseindex)
7892 {
7893 vvvv = source;
7894 source = dest;
7895 }
7896 else
7897 vvvv = dest;
7898
7899 op = i.tm.operand_types[vvvv];
c0f3af97 7900 if ((dest + 1) >= i.operands
bab6aec1 7901 || ((op.bitfield.class != Reg
dc821c5f 7902 || (!op.bitfield.dword && !op.bitfield.qword))
3528c362 7903 && op.bitfield.class != RegSIMD
43234a1e 7904 && !operand_type_equal (&op, &regmask)))
c0f3af97 7905 abort ();
f12dc422 7906 i.vex.register_specifier = i.op[vvvv].regs;
c0f3af97
L
7907 dest++;
7908 }
7909 }
29b0f896
AM
7910
7911 i.rm.mode = 3;
dfd69174
JB
7912 /* One of the register operands will be encoded in the i.rm.reg
7913 field, the other in the combined i.rm.mode and i.rm.regmem
29b0f896
AM
7914 fields. If no form of this instruction supports a memory
7915 destination operand, then we assume the source operand may
7916 sometimes be a memory operand and so we need to store the
7917 destination in the i.rm.reg field. */
dfd69174 7918 if (!i.tm.opcode_modifier.regmem
40fb9820 7919 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
29b0f896
AM
7920 {
7921 i.rm.reg = i.op[dest].regs->reg_num;
7922 i.rm.regmem = i.op[source].regs->reg_num;
3528c362
JB
7923 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7924 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
b4a3a7b4 7925 i.has_regmmx = TRUE;
3528c362
JB
7926 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7927 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
b4a3a7b4
L
7928 {
7929 if (i.types[dest].bitfield.zmmword
7930 || i.types[source].bitfield.zmmword)
7931 i.has_regzmm = TRUE;
7932 else if (i.types[dest].bitfield.ymmword
7933 || i.types[source].bitfield.ymmword)
7934 i.has_regymm = TRUE;
7935 else
7936 i.has_regxmm = TRUE;
7937 }
a5aeccd9
JB
7938 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7939 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
29b0f896
AM
7940 }
7941 else
7942 {
7943 i.rm.reg = i.op[source].regs->reg_num;
7944 i.rm.regmem = i.op[dest].regs->reg_num;
a5aeccd9
JB
7945 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7946 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
29b0f896 7947 }
e0c7f900 7948 if (flag_code != CODE_64BIT && (i.rex & REX_R))
c4a530c5 7949 {
4a5c67ed 7950 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
c4a530c5 7951 abort ();
e0c7f900 7952 i.rex &= ~REX_R;
c4a530c5
JB
7953 add_prefix (LOCK_PREFIX_OPCODE);
7954 }
29b0f896
AM
7955 }
7956 else
7957 { /* If it's not 2 reg operands... */
c0f3af97
L
7958 unsigned int mem;
7959
29b0f896
AM
7960 if (i.mem_operands)
7961 {
7962 unsigned int fake_zero_displacement = 0;
99018f42 7963 unsigned int op;
4eed87de 7964
7ab9ffdd 7965 for (op = 0; op < i.operands; op++)
8dc0818e 7966 if (i.flags[op] & Operand_Mem)
7ab9ffdd 7967 break;
7ab9ffdd 7968 gas_assert (op < i.operands);
29b0f896 7969
63112cd6 7970 if (i.tm.opcode_modifier.sib)
6c30d220 7971 {
e968fc9b 7972 if (i.index_reg->reg_num == RegIZ)
6c30d220
L
7973 abort ();
7974
7975 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7976 if (!i.base_reg)
7977 {
7978 i.sib.base = NO_BASE_REGISTER;
7979 i.sib.scale = i.log2_scale_factor;
7980 i.types[op].bitfield.disp8 = 0;
7981 i.types[op].bitfield.disp16 = 0;
7982 i.types[op].bitfield.disp64 = 0;
43083a50 7983 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
6c30d220
L
7984 {
7985 /* Must be 32 bit */
7986 i.types[op].bitfield.disp32 = 1;
7987 i.types[op].bitfield.disp32s = 0;
7988 }
7989 else
7990 {
7991 i.types[op].bitfield.disp32 = 0;
7992 i.types[op].bitfield.disp32s = 1;
7993 }
7994 }
7995 i.sib.index = i.index_reg->reg_num;
a5aeccd9 7996 set_rex_vrex (i.index_reg, REX_X, FALSE);
6c30d220
L
7997 }
7998
29b0f896
AM
7999 default_seg = &ds;
8000
8001 if (i.base_reg == 0)
8002 {
8003 i.rm.mode = 0;
8004 if (!i.disp_operands)
9bb129e8 8005 fake_zero_displacement = 1;
29b0f896
AM
8006 if (i.index_reg == 0)
8007 {
73053c1f
JB
8008 i386_operand_type newdisp;
8009
63112cd6 8010 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8011 /* Operand is just <disp> */
20f0a1fc 8012 if (flag_code == CODE_64BIT)
29b0f896
AM
8013 {
8014 /* 64bit mode overwrites the 32bit absolute
8015 addressing by RIP relative addressing and
8016 absolute addressing is encoded by one of the
8017 redundant SIB forms. */
8018 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8019 i.sib.base = NO_BASE_REGISTER;
8020 i.sib.index = NO_INDEX_REGISTER;
73053c1f 8021 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
20f0a1fc 8022 }
fc225355
L
8023 else if ((flag_code == CODE_16BIT)
8024 ^ (i.prefix[ADDR_PREFIX] != 0))
20f0a1fc
NC
8025 {
8026 i.rm.regmem = NO_BASE_REGISTER_16;
73053c1f 8027 newdisp = disp16;
20f0a1fc
NC
8028 }
8029 else
8030 {
8031 i.rm.regmem = NO_BASE_REGISTER;
73053c1f 8032 newdisp = disp32;
29b0f896 8033 }
73053c1f
JB
8034 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8035 i.types[op] = operand_type_or (i.types[op], newdisp);
29b0f896 8036 }
63112cd6 8037 else if (!i.tm.opcode_modifier.sib)
29b0f896 8038 {
6c30d220 8039 /* !i.base_reg && i.index_reg */
e968fc9b 8040 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8041 i.sib.index = NO_INDEX_REGISTER;
8042 else
8043 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8044 i.sib.base = NO_BASE_REGISTER;
8045 i.sib.scale = i.log2_scale_factor;
8046 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
40fb9820
L
8047 i.types[op].bitfield.disp8 = 0;
8048 i.types[op].bitfield.disp16 = 0;
8049 i.types[op].bitfield.disp64 = 0;
43083a50 8050 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
40fb9820
L
8051 {
8052 /* Must be 32 bit */
8053 i.types[op].bitfield.disp32 = 1;
8054 i.types[op].bitfield.disp32s = 0;
8055 }
29b0f896 8056 else
40fb9820
L
8057 {
8058 i.types[op].bitfield.disp32 = 0;
8059 i.types[op].bitfield.disp32s = 1;
8060 }
29b0f896 8061 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8062 i.rex |= REX_X;
29b0f896
AM
8063 }
8064 }
8065 /* RIP addressing for 64bit mode. */
e968fc9b 8066 else if (i.base_reg->reg_num == RegIP)
29b0f896 8067 {
63112cd6 8068 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8069 i.rm.regmem = NO_BASE_REGISTER;
40fb9820
L
8070 i.types[op].bitfield.disp8 = 0;
8071 i.types[op].bitfield.disp16 = 0;
8072 i.types[op].bitfield.disp32 = 0;
8073 i.types[op].bitfield.disp32s = 1;
8074 i.types[op].bitfield.disp64 = 0;
71903a11 8075 i.flags[op] |= Operand_PCrel;
20f0a1fc
NC
8076 if (! i.disp_operands)
8077 fake_zero_displacement = 1;
29b0f896 8078 }
dc821c5f 8079 else if (i.base_reg->reg_type.bitfield.word)
29b0f896 8080 {
63112cd6 8081 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8082 switch (i.base_reg->reg_num)
8083 {
8084 case 3: /* (%bx) */
8085 if (i.index_reg == 0)
8086 i.rm.regmem = 7;
8087 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8088 i.rm.regmem = i.index_reg->reg_num - 6;
8089 break;
8090 case 5: /* (%bp) */
8091 default_seg = &ss;
8092 if (i.index_reg == 0)
8093 {
8094 i.rm.regmem = 6;
40fb9820 8095 if (operand_type_check (i.types[op], disp) == 0)
29b0f896
AM
8096 {
8097 /* fake (%bp) into 0(%bp) */
b5014f7a 8098 i.types[op].bitfield.disp8 = 1;
252b5132 8099 fake_zero_displacement = 1;
29b0f896
AM
8100 }
8101 }
8102 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8103 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8104 break;
8105 default: /* (%si) -> 4 or (%di) -> 5 */
8106 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8107 }
8108 i.rm.mode = mode_from_disp_size (i.types[op]);
8109 }
8110 else /* i.base_reg and 32/64 bit mode */
8111 {
8112 if (flag_code == CODE_64BIT
40fb9820
L
8113 && operand_type_check (i.types[op], disp))
8114 {
73053c1f
JB
8115 i.types[op].bitfield.disp16 = 0;
8116 i.types[op].bitfield.disp64 = 0;
40fb9820 8117 if (i.prefix[ADDR_PREFIX] == 0)
73053c1f
JB
8118 {
8119 i.types[op].bitfield.disp32 = 0;
8120 i.types[op].bitfield.disp32s = 1;
8121 }
40fb9820 8122 else
73053c1f
JB
8123 {
8124 i.types[op].bitfield.disp32 = 1;
8125 i.types[op].bitfield.disp32s = 0;
8126 }
40fb9820 8127 }
20f0a1fc 8128
63112cd6 8129 if (!i.tm.opcode_modifier.sib)
6c30d220 8130 i.rm.regmem = i.base_reg->reg_num;
29b0f896 8131 if ((i.base_reg->reg_flags & RegRex) != 0)
161a04f6 8132 i.rex |= REX_B;
29b0f896
AM
8133 i.sib.base = i.base_reg->reg_num;
8134 /* x86-64 ignores REX prefix bit here to avoid decoder
8135 complications. */
848930b2
JB
8136 if (!(i.base_reg->reg_flags & RegRex)
8137 && (i.base_reg->reg_num == EBP_REG_NUM
8138 || i.base_reg->reg_num == ESP_REG_NUM))
29b0f896 8139 default_seg = &ss;
848930b2 8140 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
29b0f896 8141 {
848930b2 8142 fake_zero_displacement = 1;
b5014f7a 8143 i.types[op].bitfield.disp8 = 1;
29b0f896
AM
8144 }
8145 i.sib.scale = i.log2_scale_factor;
8146 if (i.index_reg == 0)
8147 {
63112cd6 8148 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8149 /* <disp>(%esp) becomes two byte modrm with no index
8150 register. We've already stored the code for esp
8151 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8152 Any base register besides %esp will not use the
8153 extra modrm byte. */
8154 i.sib.index = NO_INDEX_REGISTER;
29b0f896 8155 }
63112cd6 8156 else if (!i.tm.opcode_modifier.sib)
29b0f896 8157 {
e968fc9b 8158 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8159 i.sib.index = NO_INDEX_REGISTER;
8160 else
8161 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8162 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8163 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8164 i.rex |= REX_X;
29b0f896 8165 }
67a4f2b7
AO
8166
8167 if (i.disp_operands
8168 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8169 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8170 i.rm.mode = 0;
8171 else
a501d77e
L
8172 {
8173 if (!fake_zero_displacement
8174 && !i.disp_operands
8175 && i.disp_encoding)
8176 {
8177 fake_zero_displacement = 1;
8178 if (i.disp_encoding == disp_encoding_8bit)
8179 i.types[op].bitfield.disp8 = 1;
8180 else
8181 i.types[op].bitfield.disp32 = 1;
8182 }
8183 i.rm.mode = mode_from_disp_size (i.types[op]);
8184 }
29b0f896 8185 }
252b5132 8186
29b0f896
AM
8187 if (fake_zero_displacement)
8188 {
8189 /* Fakes a zero displacement assuming that i.types[op]
8190 holds the correct displacement size. */
8191 expressionS *exp;
8192
9c2799c2 8193 gas_assert (i.op[op].disps == 0);
29b0f896
AM
8194 exp = &disp_expressions[i.disp_operands++];
8195 i.op[op].disps = exp;
8196 exp->X_op = O_constant;
8197 exp->X_add_number = 0;
8198 exp->X_add_symbol = (symbolS *) 0;
8199 exp->X_op_symbol = (symbolS *) 0;
8200 }
c0f3af97
L
8201
8202 mem = op;
29b0f896 8203 }
c0f3af97
L
8204 else
8205 mem = ~0;
252b5132 8206
8c43a48b 8207 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
5dd85c99
SP
8208 {
8209 if (operand_type_check (i.types[0], imm))
8210 i.vex.register_specifier = NULL;
8211 else
8212 {
8213 /* VEX.vvvv encodes one of the sources when the first
8214 operand is not an immediate. */
1ef99a7b 8215 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8216 i.vex.register_specifier = i.op[0].regs;
8217 else
8218 i.vex.register_specifier = i.op[1].regs;
8219 }
8220
8221 /* Destination is a XMM register encoded in the ModRM.reg
8222 and VEX.R bit. */
8223 i.rm.reg = i.op[2].regs->reg_num;
8224 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8225 i.rex |= REX_R;
8226
8227 /* ModRM.rm and VEX.B encodes the other source. */
8228 if (!i.mem_operands)
8229 {
8230 i.rm.mode = 3;
8231
1ef99a7b 8232 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8233 i.rm.regmem = i.op[1].regs->reg_num;
8234 else
8235 i.rm.regmem = i.op[0].regs->reg_num;
8236
8237 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8238 i.rex |= REX_B;
8239 }
8240 }
2426c15f 8241 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
f88c9eb0
SP
8242 {
8243 i.vex.register_specifier = i.op[2].regs;
8244 if (!i.mem_operands)
8245 {
8246 i.rm.mode = 3;
8247 i.rm.regmem = i.op[1].regs->reg_num;
8248 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8249 i.rex |= REX_B;
8250 }
8251 }
29b0f896
AM
8252 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8253 (if any) based on i.tm.extension_opcode. Again, we must be
8254 careful to make sure that segment/control/debug/test/MMX
8255 registers are coded into the i.rm.reg field. */
f88c9eb0 8256 else if (i.reg_operands)
29b0f896 8257 {
99018f42 8258 unsigned int op;
7ab9ffdd
L
8259 unsigned int vex_reg = ~0;
8260
8261 for (op = 0; op < i.operands; op++)
b4a3a7b4 8262 {
bab6aec1 8263 if (i.types[op].bitfield.class == Reg
f74a6307
JB
8264 || i.types[op].bitfield.class == RegBND
8265 || i.types[op].bitfield.class == RegMask
00cee14f 8266 || i.types[op].bitfield.class == SReg
4a5c67ed
JB
8267 || i.types[op].bitfield.class == RegCR
8268 || i.types[op].bitfield.class == RegDR
8269 || i.types[op].bitfield.class == RegTR)
b4a3a7b4 8270 break;
3528c362 8271 if (i.types[op].bitfield.class == RegSIMD)
b4a3a7b4
L
8272 {
8273 if (i.types[op].bitfield.zmmword)
8274 i.has_regzmm = TRUE;
8275 else if (i.types[op].bitfield.ymmword)
8276 i.has_regymm = TRUE;
8277 else
8278 i.has_regxmm = TRUE;
8279 break;
8280 }
3528c362 8281 if (i.types[op].bitfield.class == RegMMX)
b4a3a7b4
L
8282 {
8283 i.has_regmmx = TRUE;
8284 break;
8285 }
8286 }
c0209578 8287
7ab9ffdd
L
8288 if (vex_3_sources)
8289 op = dest;
2426c15f 8290 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd
L
8291 {
8292 /* For instructions with VexNDS, the register-only
8293 source operand is encoded in VEX prefix. */
8294 gas_assert (mem != (unsigned int) ~0);
c0f3af97 8295
7ab9ffdd 8296 if (op > mem)
c0f3af97 8297 {
7ab9ffdd
L
8298 vex_reg = op++;
8299 gas_assert (op < i.operands);
c0f3af97
L
8300 }
8301 else
c0f3af97 8302 {
f12dc422
L
8303 /* Check register-only source operand when two source
8304 operands are swapped. */
8305 if (!i.tm.operand_types[op].bitfield.baseindex
8306 && i.tm.operand_types[op + 1].bitfield.baseindex)
8307 {
8308 vex_reg = op;
8309 op += 2;
8310 gas_assert (mem == (vex_reg + 1)
8311 && op < i.operands);
8312 }
8313 else
8314 {
8315 vex_reg = op + 1;
8316 gas_assert (vex_reg < i.operands);
8317 }
c0f3af97 8318 }
7ab9ffdd 8319 }
2426c15f 8320 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7ab9ffdd 8321 {
f12dc422 8322 /* For instructions with VexNDD, the register destination
7ab9ffdd 8323 is encoded in VEX prefix. */
f12dc422
L
8324 if (i.mem_operands == 0)
8325 {
8326 /* There is no memory operand. */
8327 gas_assert ((op + 2) == i.operands);
8328 vex_reg = op + 1;
8329 }
8330 else
8d63c93e 8331 {
ed438a93
JB
8332 /* There are only 2 non-immediate operands. */
8333 gas_assert (op < i.imm_operands + 2
8334 && i.operands == i.imm_operands + 2);
8335 vex_reg = i.imm_operands + 1;
f12dc422 8336 }
7ab9ffdd
L
8337 }
8338 else
8339 gas_assert (op < i.operands);
99018f42 8340
7ab9ffdd
L
8341 if (vex_reg != (unsigned int) ~0)
8342 {
f12dc422 8343 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7ab9ffdd 8344
bab6aec1 8345 if ((type->bitfield.class != Reg
dc821c5f 8346 || (!type->bitfield.dword && !type->bitfield.qword))
3528c362 8347 && type->bitfield.class != RegSIMD
43234a1e 8348 && !operand_type_equal (type, &regmask))
7ab9ffdd 8349 abort ();
f88c9eb0 8350
7ab9ffdd
L
8351 i.vex.register_specifier = i.op[vex_reg].regs;
8352 }
8353
1b9f0c97
L
8354 /* Don't set OP operand twice. */
8355 if (vex_reg != op)
7ab9ffdd 8356 {
1b9f0c97
L
8357 /* If there is an extension opcode to put here, the
8358 register number must be put into the regmem field. */
8359 if (i.tm.extension_opcode != None)
8360 {
8361 i.rm.regmem = i.op[op].regs->reg_num;
a5aeccd9
JB
8362 set_rex_vrex (i.op[op].regs, REX_B,
8363 i.tm.opcode_modifier.sse2avx);
1b9f0c97
L
8364 }
8365 else
8366 {
8367 i.rm.reg = i.op[op].regs->reg_num;
a5aeccd9
JB
8368 set_rex_vrex (i.op[op].regs, REX_R,
8369 i.tm.opcode_modifier.sse2avx);
1b9f0c97 8370 }
7ab9ffdd 8371 }
252b5132 8372
29b0f896
AM
8373 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8374 must set it to 3 to indicate this is a register operand
8375 in the regmem field. */
8376 if (!i.mem_operands)
8377 i.rm.mode = 3;
8378 }
252b5132 8379
29b0f896 8380 /* Fill in i.rm.reg field with extension opcode (if any). */
c1e679ec 8381 if (i.tm.extension_opcode != None)
29b0f896
AM
8382 i.rm.reg = i.tm.extension_opcode;
8383 }
8384 return default_seg;
8385}
252b5132 8386
376cd056
JB
8387static unsigned int
8388flip_code16 (unsigned int code16)
8389{
8390 gas_assert (i.tm.operands == 1);
8391
8392 return !(i.prefix[REX_PREFIX] & REX_W)
8393 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8394 || i.tm.operand_types[0].bitfield.disp32s
8395 : i.tm.operand_types[0].bitfield.disp16)
8396 ? CODE16 : 0;
8397}
8398
29b0f896 8399static void
e3bb37b5 8400output_branch (void)
29b0f896
AM
8401{
8402 char *p;
f8a5c266 8403 int size;
29b0f896
AM
8404 int code16;
8405 int prefix;
8406 relax_substateT subtype;
8407 symbolS *sym;
8408 offsetT off;
8409
f8a5c266 8410 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
a501d77e 8411 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
29b0f896
AM
8412
8413 prefix = 0;
8414 if (i.prefix[DATA_PREFIX] != 0)
252b5132 8415 {
29b0f896
AM
8416 prefix = 1;
8417 i.prefixes -= 1;
376cd056 8418 code16 ^= flip_code16(code16);
252b5132 8419 }
29b0f896
AM
8420 /* Pentium4 branch hints. */
8421 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8422 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
2f66722d 8423 {
29b0f896
AM
8424 prefix++;
8425 i.prefixes--;
8426 }
8427 if (i.prefix[REX_PREFIX] != 0)
8428 {
8429 prefix++;
8430 i.prefixes--;
2f66722d
AM
8431 }
8432
7e8b059b
L
8433 /* BND prefixed jump. */
8434 if (i.prefix[BND_PREFIX] != 0)
8435 {
6cb0a70e
JB
8436 prefix++;
8437 i.prefixes--;
7e8b059b
L
8438 }
8439
f2810fe0
JB
8440 if (i.prefixes != 0)
8441 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
29b0f896
AM
8442
8443 /* It's always a symbol; End frag & setup for relax.
8444 Make sure there is enough room in this frag for the largest
8445 instruction we may generate in md_convert_frag. This is 2
8446 bytes for the opcode and room for the prefix and largest
8447 displacement. */
8448 frag_grow (prefix + 2 + 4);
8449 /* Prefix and 1 opcode byte go in fr_fix. */
8450 p = frag_more (prefix + 1);
8451 if (i.prefix[DATA_PREFIX] != 0)
8452 *p++ = DATA_PREFIX_OPCODE;
8453 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8454 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8455 *p++ = i.prefix[SEG_PREFIX];
6cb0a70e
JB
8456 if (i.prefix[BND_PREFIX] != 0)
8457 *p++ = BND_PREFIX_OPCODE;
29b0f896
AM
8458 if (i.prefix[REX_PREFIX] != 0)
8459 *p++ = i.prefix[REX_PREFIX];
8460 *p = i.tm.base_opcode;
8461
8462 if ((unsigned char) *p == JUMP_PC_RELATIVE)
f8a5c266 8463 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
40fb9820 8464 else if (cpu_arch_flags.bitfield.cpui386)
f8a5c266 8465 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
29b0f896 8466 else
f8a5c266 8467 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
29b0f896 8468 subtype |= code16;
3e73aa7c 8469
29b0f896
AM
8470 sym = i.op[0].disps->X_add_symbol;
8471 off = i.op[0].disps->X_add_number;
3e73aa7c 8472
29b0f896
AM
8473 if (i.op[0].disps->X_op != O_constant
8474 && i.op[0].disps->X_op != O_symbol)
3e73aa7c 8475 {
29b0f896
AM
8476 /* Handle complex expressions. */
8477 sym = make_expr_symbol (i.op[0].disps);
8478 off = 0;
8479 }
3e73aa7c 8480
29b0f896
AM
8481 /* 1 possible extra opcode + 4 byte displacement go in var part.
8482 Pass reloc in fr_var. */
d258b828 8483 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
29b0f896 8484}
3e73aa7c 8485
bd7ab16b
L
8486#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8487/* Return TRUE iff PLT32 relocation should be used for branching to
8488 symbol S. */
8489
8490static bfd_boolean
8491need_plt32_p (symbolS *s)
8492{
8493 /* PLT32 relocation is ELF only. */
8494 if (!IS_ELF)
8495 return FALSE;
8496
a5def729
RO
8497#ifdef TE_SOLARIS
8498 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8499 krtld support it. */
8500 return FALSE;
8501#endif
8502
bd7ab16b
L
8503 /* Since there is no need to prepare for PLT branch on x86-64, we
8504 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8505 be used as a marker for 32-bit PC-relative branches. */
8506 if (!object_64bit)
8507 return FALSE;
8508
8509 /* Weak or undefined symbol need PLT32 relocation. */
8510 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8511 return TRUE;
8512
8513 /* Non-global symbol doesn't need PLT32 relocation. */
8514 if (! S_IS_EXTERNAL (s))
8515 return FALSE;
8516
8517 /* Other global symbols need PLT32 relocation. NB: Symbol with
8518 non-default visibilities are treated as normal global symbol
8519 so that PLT32 relocation can be used as a marker for 32-bit
8520 PC-relative branches. It is useful for linker relaxation. */
8521 return TRUE;
8522}
8523#endif
8524
29b0f896 8525static void
e3bb37b5 8526output_jump (void)
29b0f896
AM
8527{
8528 char *p;
8529 int size;
3e02c1cc 8530 fixS *fixP;
bd7ab16b 8531 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
29b0f896 8532
0cfa3eb3 8533 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
8534 {
8535 /* This is a loop or jecxz type instruction. */
8536 size = 1;
8537 if (i.prefix[ADDR_PREFIX] != 0)
8538 {
8539 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8540 i.prefixes -= 1;
8541 }
8542 /* Pentium4 branch hints. */
8543 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8544 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8545 {
8546 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8547 i.prefixes--;
3e73aa7c
JH
8548 }
8549 }
29b0f896
AM
8550 else
8551 {
8552 int code16;
3e73aa7c 8553
29b0f896
AM
8554 code16 = 0;
8555 if (flag_code == CODE_16BIT)
8556 code16 = CODE16;
3e73aa7c 8557
29b0f896
AM
8558 if (i.prefix[DATA_PREFIX] != 0)
8559 {
8560 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8561 i.prefixes -= 1;
376cd056 8562 code16 ^= flip_code16(code16);
29b0f896 8563 }
252b5132 8564
29b0f896
AM
8565 size = 4;
8566 if (code16)
8567 size = 2;
8568 }
9fcc94b6 8569
6cb0a70e
JB
8570 /* BND prefixed jump. */
8571 if (i.prefix[BND_PREFIX] != 0)
29b0f896 8572 {
6cb0a70e 8573 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
29b0f896
AM
8574 i.prefixes -= 1;
8575 }
252b5132 8576
6cb0a70e 8577 if (i.prefix[REX_PREFIX] != 0)
7e8b059b 8578 {
6cb0a70e 8579 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7e8b059b
L
8580 i.prefixes -= 1;
8581 }
8582
f2810fe0
JB
8583 if (i.prefixes != 0)
8584 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
e0890092 8585
42164a71
L
8586 p = frag_more (i.tm.opcode_length + size);
8587 switch (i.tm.opcode_length)
8588 {
8589 case 2:
8590 *p++ = i.tm.base_opcode >> 8;
1a0670f3 8591 /* Fall through. */
42164a71
L
8592 case 1:
8593 *p++ = i.tm.base_opcode;
8594 break;
8595 default:
8596 abort ();
8597 }
e0890092 8598
bd7ab16b
L
8599#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8600 if (size == 4
8601 && jump_reloc == NO_RELOC
8602 && need_plt32_p (i.op[0].disps->X_add_symbol))
8603 jump_reloc = BFD_RELOC_X86_64_PLT32;
8604#endif
8605
8606 jump_reloc = reloc (size, 1, 1, jump_reloc);
8607
3e02c1cc 8608 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
bd7ab16b 8609 i.op[0].disps, 1, jump_reloc);
3e02c1cc
AM
8610
8611 /* All jumps handled here are signed, but don't use a signed limit
8612 check for 32 and 16 bit jumps as we want to allow wrap around at
8613 4G and 64k respectively. */
8614 if (size == 1)
8615 fixP->fx_signed = 1;
29b0f896 8616}
e0890092 8617
29b0f896 8618static void
e3bb37b5 8619output_interseg_jump (void)
29b0f896
AM
8620{
8621 char *p;
8622 int size;
8623 int prefix;
8624 int code16;
252b5132 8625
29b0f896
AM
8626 code16 = 0;
8627 if (flag_code == CODE_16BIT)
8628 code16 = CODE16;
a217f122 8629
29b0f896
AM
8630 prefix = 0;
8631 if (i.prefix[DATA_PREFIX] != 0)
8632 {
8633 prefix = 1;
8634 i.prefixes -= 1;
8635 code16 ^= CODE16;
8636 }
6cb0a70e
JB
8637
8638 gas_assert (!i.prefix[REX_PREFIX]);
252b5132 8639
29b0f896
AM
8640 size = 4;
8641 if (code16)
8642 size = 2;
252b5132 8643
f2810fe0
JB
8644 if (i.prefixes != 0)
8645 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
252b5132 8646
29b0f896
AM
8647 /* 1 opcode; 2 segment; offset */
8648 p = frag_more (prefix + 1 + 2 + size);
3e73aa7c 8649
29b0f896
AM
8650 if (i.prefix[DATA_PREFIX] != 0)
8651 *p++ = DATA_PREFIX_OPCODE;
252b5132 8652
29b0f896
AM
8653 if (i.prefix[REX_PREFIX] != 0)
8654 *p++ = i.prefix[REX_PREFIX];
252b5132 8655
29b0f896
AM
8656 *p++ = i.tm.base_opcode;
8657 if (i.op[1].imms->X_op == O_constant)
8658 {
8659 offsetT n = i.op[1].imms->X_add_number;
252b5132 8660
29b0f896
AM
8661 if (size == 2
8662 && !fits_in_unsigned_word (n)
8663 && !fits_in_signed_word (n))
8664 {
8665 as_bad (_("16-bit jump out of range"));
8666 return;
8667 }
8668 md_number_to_chars (p, n, size);
8669 }
8670 else
8671 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
d258b828 8672 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
29b0f896
AM
8673 if (i.op[0].imms->X_op != O_constant)
8674 as_bad (_("can't handle non absolute segment in `%s'"),
8675 i.tm.name);
8676 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8677}
a217f122 8678
b4a3a7b4
L
8679#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8680void
8681x86_cleanup (void)
8682{
8683 char *p;
8684 asection *seg = now_seg;
8685 subsegT subseg = now_subseg;
8686 asection *sec;
8687 unsigned int alignment, align_size_1;
8688 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8689 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8690 unsigned int padding;
8691
8692 if (!IS_ELF || !x86_used_note)
8693 return;
8694
b4a3a7b4
L
8695 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8696
8697 /* The .note.gnu.property section layout:
8698
8699 Field Length Contents
8700 ---- ---- ----
8701 n_namsz 4 4
8702 n_descsz 4 The note descriptor size
8703 n_type 4 NT_GNU_PROPERTY_TYPE_0
8704 n_name 4 "GNU"
8705 n_desc n_descsz The program property array
8706 .... .... ....
8707 */
8708
8709 /* Create the .note.gnu.property section. */
8710 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
fd361982 8711 bfd_set_section_flags (sec,
b4a3a7b4
L
8712 (SEC_ALLOC
8713 | SEC_LOAD
8714 | SEC_DATA
8715 | SEC_HAS_CONTENTS
8716 | SEC_READONLY));
8717
8718 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8719 {
8720 align_size_1 = 7;
8721 alignment = 3;
8722 }
8723 else
8724 {
8725 align_size_1 = 3;
8726 alignment = 2;
8727 }
8728
fd361982 8729 bfd_set_section_alignment (sec, alignment);
b4a3a7b4
L
8730 elf_section_type (sec) = SHT_NOTE;
8731
8732 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8733 + 4-byte data */
8734 isa_1_descsz_raw = 4 + 4 + 4;
8735 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8736 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8737
8738 feature_2_descsz_raw = isa_1_descsz;
8739 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8740 + 4-byte data */
8741 feature_2_descsz_raw += 4 + 4 + 4;
8742 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8743 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8744 & ~align_size_1);
8745
8746 descsz = feature_2_descsz;
8747 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8748 p = frag_more (4 + 4 + 4 + 4 + descsz);
8749
8750 /* Write n_namsz. */
8751 md_number_to_chars (p, (valueT) 4, 4);
8752
8753 /* Write n_descsz. */
8754 md_number_to_chars (p + 4, (valueT) descsz, 4);
8755
8756 /* Write n_type. */
8757 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8758
8759 /* Write n_name. */
8760 memcpy (p + 4 * 3, "GNU", 4);
8761
8762 /* Write 4-byte type. */
8763 md_number_to_chars (p + 4 * 4,
8764 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8765
8766 /* Write 4-byte data size. */
8767 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8768
8769 /* Write 4-byte data. */
8770 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8771
8772 /* Zero out paddings. */
8773 padding = isa_1_descsz - isa_1_descsz_raw;
8774 if (padding)
8775 memset (p + 4 * 7, 0, padding);
8776
8777 /* Write 4-byte type. */
8778 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8779 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8780
8781 /* Write 4-byte data size. */
8782 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8783
8784 /* Write 4-byte data. */
8785 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8786 (valueT) x86_feature_2_used, 4);
8787
8788 /* Zero out paddings. */
8789 padding = feature_2_descsz - feature_2_descsz_raw;
8790 if (padding)
8791 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8792
8793 /* We probably can't restore the current segment, for there likely
8794 isn't one yet... */
8795 if (seg && subseg)
8796 subseg_set (seg, subseg);
8797}
8798#endif
8799
9c33702b
JB
8800static unsigned int
8801encoding_length (const fragS *start_frag, offsetT start_off,
8802 const char *frag_now_ptr)
8803{
8804 unsigned int len = 0;
8805
8806 if (start_frag != frag_now)
8807 {
8808 const fragS *fr = start_frag;
8809
8810 do {
8811 len += fr->fr_fix;
8812 fr = fr->fr_next;
8813 } while (fr && fr != frag_now);
8814 }
8815
8816 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8817}
8818
e379e5f3 8819/* Return 1 for test, and, cmp, add, sub, inc and dec which may
79d72f45
HL
8820 be macro-fused with conditional jumps.
8821 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8822 or is one of the following format:
8823
8824 cmp m, imm
8825 add m, imm
8826 sub m, imm
8827 test m, imm
8828 and m, imm
8829 inc m
8830 dec m
8831
8832 it is unfusible. */
e379e5f3
L
8833
8834static int
79d72f45 8835maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8836{
8837 /* No RIP address. */
8838 if (i.base_reg && i.base_reg->reg_num == RegIP)
8839 return 0;
8840
8841 /* No VEX/EVEX encoding. */
8842 if (is_any_vex_encoding (&i.tm))
8843 return 0;
8844
79d72f45
HL
8845 /* add, sub without add/sub m, imm. */
8846 if (i.tm.base_opcode <= 5
e379e5f3
L
8847 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8848 || ((i.tm.base_opcode | 3) == 0x83
79d72f45 8849 && (i.tm.extension_opcode == 0x5
e379e5f3 8850 || i.tm.extension_opcode == 0x0)))
79d72f45
HL
8851 {
8852 *mf_cmp_p = mf_cmp_alu_cmp;
8853 return !(i.mem_operands && i.imm_operands);
8854 }
e379e5f3 8855
79d72f45
HL
8856 /* and without and m, imm. */
8857 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8858 || ((i.tm.base_opcode | 3) == 0x83
8859 && i.tm.extension_opcode == 0x4))
8860 {
8861 *mf_cmp_p = mf_cmp_test_and;
8862 return !(i.mem_operands && i.imm_operands);
8863 }
8864
8865 /* test without test m imm. */
e379e5f3
L
8866 if ((i.tm.base_opcode | 1) == 0x85
8867 || (i.tm.base_opcode | 1) == 0xa9
8868 || ((i.tm.base_opcode | 1) == 0xf7
79d72f45
HL
8869 && i.tm.extension_opcode == 0))
8870 {
8871 *mf_cmp_p = mf_cmp_test_and;
8872 return !(i.mem_operands && i.imm_operands);
8873 }
8874
8875 /* cmp without cmp m, imm. */
8876 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
e379e5f3
L
8877 || ((i.tm.base_opcode | 3) == 0x83
8878 && (i.tm.extension_opcode == 0x7)))
79d72f45
HL
8879 {
8880 *mf_cmp_p = mf_cmp_alu_cmp;
8881 return !(i.mem_operands && i.imm_operands);
8882 }
e379e5f3 8883
79d72f45 8884 /* inc, dec without inc/dec m. */
e379e5f3
L
8885 if ((i.tm.cpu_flags.bitfield.cpuno64
8886 && (i.tm.base_opcode | 0xf) == 0x4f)
8887 || ((i.tm.base_opcode | 1) == 0xff
8888 && i.tm.extension_opcode <= 0x1))
79d72f45
HL
8889 {
8890 *mf_cmp_p = mf_cmp_incdec;
8891 return !i.mem_operands;
8892 }
e379e5f3
L
8893
8894 return 0;
8895}
8896
8897/* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8898
8899static int
79d72f45 8900add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8901{
8902 /* NB: Don't work with COND_JUMP86 without i386. */
8903 if (!align_branch_power
8904 || now_seg == absolute_section
8905 || !cpu_arch_flags.bitfield.cpui386
8906 || !(align_branch & align_branch_fused_bit))
8907 return 0;
8908
79d72f45 8909 if (maybe_fused_with_jcc_p (mf_cmp_p))
e379e5f3
L
8910 {
8911 if (last_insn.kind == last_insn_other
8912 || last_insn.seg != now_seg)
8913 return 1;
8914 if (flag_debug)
8915 as_warn_where (last_insn.file, last_insn.line,
8916 _("`%s` skips -malign-branch-boundary on `%s`"),
8917 last_insn.name, i.tm.name);
8918 }
8919
8920 return 0;
8921}
8922
8923/* Return 1 if a BRANCH_PREFIX frag should be generated. */
8924
8925static int
8926add_branch_prefix_frag_p (void)
8927{
8928 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8929 to PadLock instructions since they include prefixes in opcode. */
8930 if (!align_branch_power
8931 || !align_branch_prefix_size
8932 || now_seg == absolute_section
8933 || i.tm.cpu_flags.bitfield.cpupadlock
8934 || !cpu_arch_flags.bitfield.cpui386)
8935 return 0;
8936
8937 /* Don't add prefix if it is a prefix or there is no operand in case
8938 that segment prefix is special. */
8939 if (!i.operands || i.tm.opcode_modifier.isprefix)
8940 return 0;
8941
8942 if (last_insn.kind == last_insn_other
8943 || last_insn.seg != now_seg)
8944 return 1;
8945
8946 if (flag_debug)
8947 as_warn_where (last_insn.file, last_insn.line,
8948 _("`%s` skips -malign-branch-boundary on `%s`"),
8949 last_insn.name, i.tm.name);
8950
8951 return 0;
8952}
8953
8954/* Return 1 if a BRANCH_PADDING frag should be generated. */
8955
8956static int
79d72f45
HL
8957add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8958 enum mf_jcc_kind *mf_jcc_p)
e379e5f3
L
8959{
8960 int add_padding;
8961
8962 /* NB: Don't work with COND_JUMP86 without i386. */
8963 if (!align_branch_power
8964 || now_seg == absolute_section
8965 || !cpu_arch_flags.bitfield.cpui386)
8966 return 0;
8967
8968 add_padding = 0;
8969
8970 /* Check for jcc and direct jmp. */
8971 if (i.tm.opcode_modifier.jump == JUMP)
8972 {
8973 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8974 {
8975 *branch_p = align_branch_jmp;
8976 add_padding = align_branch & align_branch_jmp_bit;
8977 }
8978 else
8979 {
79d72f45
HL
8980 /* Because J<cc> and JN<cc> share same group in macro-fusible table,
8981 igore the lowest bit. */
8982 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
e379e5f3
L
8983 *branch_p = align_branch_jcc;
8984 if ((align_branch & align_branch_jcc_bit))
8985 add_padding = 1;
8986 }
8987 }
8988 else if (is_any_vex_encoding (&i.tm))
8989 return 0;
8990 else if ((i.tm.base_opcode | 1) == 0xc3)
8991 {
8992 /* Near ret. */
8993 *branch_p = align_branch_ret;
8994 if ((align_branch & align_branch_ret_bit))
8995 add_padding = 1;
8996 }
8997 else
8998 {
8999 /* Check for indirect jmp, direct and indirect calls. */
9000 if (i.tm.base_opcode == 0xe8)
9001 {
9002 /* Direct call. */
9003 *branch_p = align_branch_call;
9004 if ((align_branch & align_branch_call_bit))
9005 add_padding = 1;
9006 }
9007 else if (i.tm.base_opcode == 0xff
9008 && (i.tm.extension_opcode == 2
9009 || i.tm.extension_opcode == 4))
9010 {
9011 /* Indirect call and jmp. */
9012 *branch_p = align_branch_indirect;
9013 if ((align_branch & align_branch_indirect_bit))
9014 add_padding = 1;
9015 }
9016
9017 if (add_padding
9018 && i.disp_operands
9019 && tls_get_addr
9020 && (i.op[0].disps->X_op == O_symbol
9021 || (i.op[0].disps->X_op == O_subtract
9022 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9023 {
9024 symbolS *s = i.op[0].disps->X_add_symbol;
9025 /* No padding to call to global or undefined tls_get_addr. */
9026 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9027 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9028 return 0;
9029 }
9030 }
9031
9032 if (add_padding
9033 && last_insn.kind != last_insn_other
9034 && last_insn.seg == now_seg)
9035 {
9036 if (flag_debug)
9037 as_warn_where (last_insn.file, last_insn.line,
9038 _("`%s` skips -malign-branch-boundary on `%s`"),
9039 last_insn.name, i.tm.name);
9040 return 0;
9041 }
9042
9043 return add_padding;
9044}
9045
29b0f896 9046static void
e3bb37b5 9047output_insn (void)
29b0f896 9048{
2bbd9c25
JJ
9049 fragS *insn_start_frag;
9050 offsetT insn_start_off;
e379e5f3
L
9051 fragS *fragP = NULL;
9052 enum align_branch_kind branch = align_branch_none;
79d72f45
HL
9053 /* The initializer is arbitrary just to avoid uninitialized error.
9054 it's actually either assigned in add_branch_padding_frag_p
9055 or never be used. */
9056 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
2bbd9c25 9057
b4a3a7b4
L
9058#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9059 if (IS_ELF && x86_used_note)
9060 {
9061 if (i.tm.cpu_flags.bitfield.cpucmov)
9062 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9063 if (i.tm.cpu_flags.bitfield.cpusse)
9064 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9065 if (i.tm.cpu_flags.bitfield.cpusse2)
9066 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9067 if (i.tm.cpu_flags.bitfield.cpusse3)
9068 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9069 if (i.tm.cpu_flags.bitfield.cpussse3)
9070 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9071 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9072 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9073 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9074 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9075 if (i.tm.cpu_flags.bitfield.cpuavx)
9076 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9077 if (i.tm.cpu_flags.bitfield.cpuavx2)
9078 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9079 if (i.tm.cpu_flags.bitfield.cpufma)
9080 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9081 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9082 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9083 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9084 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9085 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9086 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9087 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9088 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9089 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9090 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9091 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9092 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9093 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9094 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9095 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9096 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9097 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9098 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9099 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9100 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9101 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9102 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9103 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9104 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9105 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9106 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9107 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9108 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
462cac58
L
9109 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9110 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
b4a3a7b4
L
9111
9112 if (i.tm.cpu_flags.bitfield.cpu8087
9113 || i.tm.cpu_flags.bitfield.cpu287
9114 || i.tm.cpu_flags.bitfield.cpu387
9115 || i.tm.cpu_flags.bitfield.cpu687
9116 || i.tm.cpu_flags.bitfield.cpufisttp)
9117 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
319ff62c
JB
9118 if (i.has_regmmx
9119 || i.tm.base_opcode == 0xf77 /* emms */
a7e12755
L
9120 || i.tm.base_opcode == 0xf0e /* femms */
9121 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9122 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
b4a3a7b4
L
9123 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9124 if (i.has_regxmm)
9125 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9126 if (i.has_regymm)
9127 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9128 if (i.has_regzmm)
9129 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9130 if (i.tm.cpu_flags.bitfield.cpufxsr)
9131 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9132 if (i.tm.cpu_flags.bitfield.cpuxsave)
9133 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9134 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9135 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9136 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9137 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9138 }
9139#endif
9140
29b0f896
AM
9141 /* Tie dwarf2 debug info to the address at the start of the insn.
9142 We can't do this after the insn has been output as the current
9143 frag may have been closed off. eg. by frag_var. */
9144 dwarf2_emit_insn (0);
9145
2bbd9c25
JJ
9146 insn_start_frag = frag_now;
9147 insn_start_off = frag_now_fix ();
9148
79d72f45 9149 if (add_branch_padding_frag_p (&branch, &mf_jcc))
e379e5f3
L
9150 {
9151 char *p;
9152 /* Branch can be 8 bytes. Leave some room for prefixes. */
9153 unsigned int max_branch_padding_size = 14;
9154
9155 /* Align section to boundary. */
9156 record_alignment (now_seg, align_branch_power);
9157
9158 /* Make room for padding. */
9159 frag_grow (max_branch_padding_size);
9160
9161 /* Start of the padding. */
9162 p = frag_more (0);
9163
9164 fragP = frag_now;
9165
9166 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9167 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9168 NULL, 0, p);
9169
79d72f45 9170 fragP->tc_frag_data.mf_type = mf_jcc;
e379e5f3
L
9171 fragP->tc_frag_data.branch_type = branch;
9172 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9173 }
9174
29b0f896 9175 /* Output jumps. */
0cfa3eb3 9176 if (i.tm.opcode_modifier.jump == JUMP)
29b0f896 9177 output_branch ();
0cfa3eb3
JB
9178 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9179 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896 9180 output_jump ();
0cfa3eb3 9181 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
29b0f896
AM
9182 output_interseg_jump ();
9183 else
9184 {
9185 /* Output normal instructions here. */
9186 char *p;
9187 unsigned char *q;
47465058 9188 unsigned int j;
331d2d0d 9189 unsigned int prefix;
79d72f45 9190 enum mf_cmp_kind mf_cmp;
4dffcebc 9191
e4e00185 9192 if (avoid_fence
c3949f43
JB
9193 && (i.tm.base_opcode == 0xfaee8
9194 || i.tm.base_opcode == 0xfaef0
9195 || i.tm.base_opcode == 0xfaef8))
e4e00185
AS
9196 {
9197 /* Encode lfence, mfence, and sfence as
9198 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9199 offsetT val = 0x240483f0ULL;
9200 p = frag_more (5);
9201 md_number_to_chars (p, val, 5);
9202 return;
9203 }
9204
d022bddd
IT
9205 /* Some processors fail on LOCK prefix. This options makes
9206 assembler ignore LOCK prefix and serves as a workaround. */
9207 if (omit_lock_prefix)
9208 {
9209 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9210 return;
9211 i.prefix[LOCK_PREFIX] = 0;
9212 }
9213
e379e5f3
L
9214 if (branch)
9215 /* Skip if this is a branch. */
9216 ;
79d72f45 9217 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
e379e5f3
L
9218 {
9219 /* Make room for padding. */
9220 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9221 p = frag_more (0);
9222
9223 fragP = frag_now;
9224
9225 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9226 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9227 NULL, 0, p);
9228
79d72f45 9229 fragP->tc_frag_data.mf_type = mf_cmp;
e379e5f3
L
9230 fragP->tc_frag_data.branch_type = align_branch_fused;
9231 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9232 }
9233 else if (add_branch_prefix_frag_p ())
9234 {
9235 unsigned int max_prefix_size = align_branch_prefix_size;
9236
9237 /* Make room for padding. */
9238 frag_grow (max_prefix_size);
9239 p = frag_more (0);
9240
9241 fragP = frag_now;
9242
9243 frag_var (rs_machine_dependent, max_prefix_size, 0,
9244 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9245 NULL, 0, p);
9246
9247 fragP->tc_frag_data.max_bytes = max_prefix_size;
9248 }
9249
43234a1e
L
9250 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9251 don't need the explicit prefix. */
9252 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
bc4bd9ab 9253 {
c0f3af97 9254 switch (i.tm.opcode_length)
bc4bd9ab 9255 {
c0f3af97
L
9256 case 3:
9257 if (i.tm.base_opcode & 0xff000000)
4dffcebc 9258 {
c0f3af97 9259 prefix = (i.tm.base_opcode >> 24) & 0xff;
c3949f43
JB
9260 if (!i.tm.cpu_flags.bitfield.cpupadlock
9261 || prefix != REPE_PREFIX_OPCODE
9262 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9263 add_prefix (prefix);
c0f3af97
L
9264 }
9265 break;
9266 case 2:
9267 if ((i.tm.base_opcode & 0xff0000) != 0)
9268 {
9269 prefix = (i.tm.base_opcode >> 16) & 0xff;
c3949f43 9270 add_prefix (prefix);
4dffcebc 9271 }
c0f3af97
L
9272 break;
9273 case 1:
9274 break;
390c91cf
L
9275 case 0:
9276 /* Check for pseudo prefixes. */
9277 as_bad_where (insn_start_frag->fr_file,
9278 insn_start_frag->fr_line,
9279 _("pseudo prefix without instruction"));
9280 return;
c0f3af97
L
9281 default:
9282 abort ();
bc4bd9ab 9283 }
c0f3af97 9284
6d19a37a 9285#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
cf61b747
L
9286 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9287 R_X86_64_GOTTPOFF relocation so that linker can safely
14470f07
L
9288 perform IE->LE optimization. A dummy REX_OPCODE prefix
9289 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9290 relocation for GDesc -> IE/LE optimization. */
cf61b747
L
9291 if (x86_elf_abi == X86_64_X32_ABI
9292 && i.operands == 2
14470f07
L
9293 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9294 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
cf61b747
L
9295 && i.prefix[REX_PREFIX] == 0)
9296 add_prefix (REX_OPCODE);
6d19a37a 9297#endif
cf61b747 9298
c0f3af97
L
9299 /* The prefix bytes. */
9300 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9301 if (*q)
9302 FRAG_APPEND_1_CHAR (*q);
0f10071e 9303 }
ae5c1c7b 9304 else
c0f3af97
L
9305 {
9306 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9307 if (*q)
9308 switch (j)
9309 {
c0f3af97
L
9310 case SEG_PREFIX:
9311 case ADDR_PREFIX:
9312 FRAG_APPEND_1_CHAR (*q);
9313 break;
9314 default:
9315 /* There should be no other prefixes for instructions
9316 with VEX prefix. */
9317 abort ();
9318 }
9319
43234a1e
L
9320 /* For EVEX instructions i.vrex should become 0 after
9321 build_evex_prefix. For VEX instructions upper 16 registers
9322 aren't available, so VREX should be 0. */
9323 if (i.vrex)
9324 abort ();
c0f3af97
L
9325 /* Now the VEX prefix. */
9326 p = frag_more (i.vex.length);
9327 for (j = 0; j < i.vex.length; j++)
9328 p[j] = i.vex.bytes[j];
9329 }
252b5132 9330
29b0f896 9331 /* Now the opcode; be careful about word order here! */
4dffcebc 9332 if (i.tm.opcode_length == 1)
29b0f896
AM
9333 {
9334 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9335 }
9336 else
9337 {
4dffcebc 9338 switch (i.tm.opcode_length)
331d2d0d 9339 {
43234a1e
L
9340 case 4:
9341 p = frag_more (4);
9342 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9343 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9344 break;
4dffcebc 9345 case 3:
331d2d0d
L
9346 p = frag_more (3);
9347 *p++ = (i.tm.base_opcode >> 16) & 0xff;
4dffcebc
L
9348 break;
9349 case 2:
9350 p = frag_more (2);
9351 break;
9352 default:
9353 abort ();
9354 break;
331d2d0d 9355 }
0f10071e 9356
29b0f896
AM
9357 /* Put out high byte first: can't use md_number_to_chars! */
9358 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9359 *p = i.tm.base_opcode & 0xff;
9360 }
3e73aa7c 9361
29b0f896 9362 /* Now the modrm byte and sib byte (if present). */
40fb9820 9363 if (i.tm.opcode_modifier.modrm)
29b0f896 9364 {
4a3523fa
L
9365 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9366 | i.rm.reg << 3
9367 | i.rm.mode << 6));
29b0f896
AM
9368 /* If i.rm.regmem == ESP (4)
9369 && i.rm.mode != (Register mode)
9370 && not 16 bit
9371 ==> need second modrm byte. */
9372 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9373 && i.rm.mode != 3
dc821c5f 9374 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
4a3523fa
L
9375 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9376 | i.sib.index << 3
9377 | i.sib.scale << 6));
29b0f896 9378 }
3e73aa7c 9379
29b0f896 9380 if (i.disp_operands)
2bbd9c25 9381 output_disp (insn_start_frag, insn_start_off);
3e73aa7c 9382
29b0f896 9383 if (i.imm_operands)
2bbd9c25 9384 output_imm (insn_start_frag, insn_start_off);
9c33702b
JB
9385
9386 /*
9387 * frag_now_fix () returning plain abs_section_offset when we're in the
9388 * absolute section, and abs_section_offset not getting updated as data
9389 * gets added to the frag breaks the logic below.
9390 */
9391 if (now_seg != absolute_section)
9392 {
9393 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9394 if (j > 15)
9395 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9396 j);
e379e5f3
L
9397 else if (fragP)
9398 {
9399 /* NB: Don't add prefix with GOTPC relocation since
9400 output_disp() above depends on the fixed encoding
9401 length. Can't add prefix with TLS relocation since
9402 it breaks TLS linker optimization. */
9403 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9404 /* Prefix count on the current instruction. */
9405 unsigned int count = i.vex.length;
9406 unsigned int k;
9407 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9408 /* REX byte is encoded in VEX/EVEX prefix. */
9409 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9410 count++;
9411
9412 /* Count prefixes for extended opcode maps. */
9413 if (!i.vex.length)
9414 switch (i.tm.opcode_length)
9415 {
9416 case 3:
9417 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9418 {
9419 count++;
9420 switch ((i.tm.base_opcode >> 8) & 0xff)
9421 {
9422 case 0x38:
9423 case 0x3a:
9424 count++;
9425 break;
9426 default:
9427 break;
9428 }
9429 }
9430 break;
9431 case 2:
9432 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9433 count++;
9434 break;
9435 case 1:
9436 break;
9437 default:
9438 abort ();
9439 }
9440
9441 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9442 == BRANCH_PREFIX)
9443 {
9444 /* Set the maximum prefix size in BRANCH_PREFIX
9445 frag. */
9446 if (fragP->tc_frag_data.max_bytes > max)
9447 fragP->tc_frag_data.max_bytes = max;
9448 if (fragP->tc_frag_data.max_bytes > count)
9449 fragP->tc_frag_data.max_bytes -= count;
9450 else
9451 fragP->tc_frag_data.max_bytes = 0;
9452 }
9453 else
9454 {
9455 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9456 frag. */
9457 unsigned int max_prefix_size;
9458 if (align_branch_prefix_size > max)
9459 max_prefix_size = max;
9460 else
9461 max_prefix_size = align_branch_prefix_size;
9462 if (max_prefix_size > count)
9463 fragP->tc_frag_data.max_prefix_length
9464 = max_prefix_size - count;
9465 }
9466
9467 /* Use existing segment prefix if possible. Use CS
9468 segment prefix in 64-bit mode. In 32-bit mode, use SS
9469 segment prefix with ESP/EBP base register and use DS
9470 segment prefix without ESP/EBP base register. */
9471 if (i.prefix[SEG_PREFIX])
9472 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9473 else if (flag_code == CODE_64BIT)
9474 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9475 else if (i.base_reg
9476 && (i.base_reg->reg_num == 4
9477 || i.base_reg->reg_num == 5))
9478 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9479 else
9480 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9481 }
9c33702b 9482 }
29b0f896 9483 }
252b5132 9484
e379e5f3
L
9485 /* NB: Don't work with COND_JUMP86 without i386. */
9486 if (align_branch_power
9487 && now_seg != absolute_section
9488 && cpu_arch_flags.bitfield.cpui386)
9489 {
9490 /* Terminate each frag so that we can add prefix and check for
9491 fused jcc. */
9492 frag_wane (frag_now);
9493 frag_new (0);
9494 }
9495
29b0f896
AM
9496#ifdef DEBUG386
9497 if (flag_debug)
9498 {
7b81dfbb 9499 pi ("" /*line*/, &i);
29b0f896
AM
9500 }
9501#endif /* DEBUG386 */
9502}
252b5132 9503
e205caa7
L
9504/* Return the size of the displacement operand N. */
9505
9506static int
9507disp_size (unsigned int n)
9508{
9509 int size = 4;
43234a1e 9510
b5014f7a 9511 if (i.types[n].bitfield.disp64)
40fb9820
L
9512 size = 8;
9513 else if (i.types[n].bitfield.disp8)
9514 size = 1;
9515 else if (i.types[n].bitfield.disp16)
9516 size = 2;
e205caa7
L
9517 return size;
9518}
9519
9520/* Return the size of the immediate operand N. */
9521
9522static int
9523imm_size (unsigned int n)
9524{
9525 int size = 4;
40fb9820
L
9526 if (i.types[n].bitfield.imm64)
9527 size = 8;
9528 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9529 size = 1;
9530 else if (i.types[n].bitfield.imm16)
9531 size = 2;
e205caa7
L
9532 return size;
9533}
9534
29b0f896 9535static void
64e74474 9536output_disp (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9537{
9538 char *p;
9539 unsigned int n;
252b5132 9540
29b0f896
AM
9541 for (n = 0; n < i.operands; n++)
9542 {
b5014f7a 9543 if (operand_type_check (i.types[n], disp))
29b0f896
AM
9544 {
9545 if (i.op[n].disps->X_op == O_constant)
9546 {
e205caa7 9547 int size = disp_size (n);
43234a1e 9548 offsetT val = i.op[n].disps->X_add_number;
252b5132 9549
629cfaf1
JB
9550 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9551 size);
29b0f896
AM
9552 p = frag_more (size);
9553 md_number_to_chars (p, val, size);
9554 }
9555 else
9556 {
f86103b7 9557 enum bfd_reloc_code_real reloc_type;
e205caa7 9558 int size = disp_size (n);
40fb9820 9559 int sign = i.types[n].bitfield.disp32s;
29b0f896 9560 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
02a86693 9561 fixS *fixP;
29b0f896 9562
e205caa7 9563 /* We can't have 8 bit displacement here. */
9c2799c2 9564 gas_assert (!i.types[n].bitfield.disp8);
e205caa7 9565
29b0f896
AM
9566 /* The PC relative address is computed relative
9567 to the instruction boundary, so in case immediate
9568 fields follows, we need to adjust the value. */
9569 if (pcrel && i.imm_operands)
9570 {
29b0f896 9571 unsigned int n1;
e205caa7 9572 int sz = 0;
252b5132 9573
29b0f896 9574 for (n1 = 0; n1 < i.operands; n1++)
40fb9820 9575 if (operand_type_check (i.types[n1], imm))
252b5132 9576 {
e205caa7
L
9577 /* Only one immediate is allowed for PC
9578 relative address. */
9c2799c2 9579 gas_assert (sz == 0);
e205caa7
L
9580 sz = imm_size (n1);
9581 i.op[n].disps->X_add_number -= sz;
252b5132 9582 }
29b0f896 9583 /* We should find the immediate. */
9c2799c2 9584 gas_assert (sz != 0);
29b0f896 9585 }
520dc8e8 9586
29b0f896 9587 p = frag_more (size);
d258b828 9588 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
d6ab8113 9589 if (GOT_symbol
2bbd9c25 9590 && GOT_symbol == i.op[n].disps->X_add_symbol
d6ab8113 9591 && (((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9592 || reloc_type == BFD_RELOC_X86_64_32S
9593 || (reloc_type == BFD_RELOC_64
9594 && object_64bit))
d6ab8113
JB
9595 && (i.op[n].disps->X_op == O_symbol
9596 || (i.op[n].disps->X_op == O_add
9597 && ((symbol_get_value_expression
9598 (i.op[n].disps->X_op_symbol)->X_op)
9599 == O_subtract))))
9600 || reloc_type == BFD_RELOC_32_PCREL))
2bbd9c25 9601 {
4fa24527 9602 if (!object_64bit)
7b81dfbb
AJ
9603 {
9604 reloc_type = BFD_RELOC_386_GOTPC;
e379e5f3 9605 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9606 i.op[n].imms->X_add_number +=
9607 encoding_length (insn_start_frag, insn_start_off, p);
7b81dfbb
AJ
9608 }
9609 else if (reloc_type == BFD_RELOC_64)
9610 reloc_type = BFD_RELOC_X86_64_GOTPC64;
d6ab8113 9611 else
7b81dfbb
AJ
9612 /* Don't do the adjustment for x86-64, as there
9613 the pcrel addressing is relative to the _next_
9614 insn, and that is taken care of in other code. */
d6ab8113 9615 reloc_type = BFD_RELOC_X86_64_GOTPC32;
2bbd9c25 9616 }
e379e5f3
L
9617 else if (align_branch_power)
9618 {
9619 switch (reloc_type)
9620 {
9621 case BFD_RELOC_386_TLS_GD:
9622 case BFD_RELOC_386_TLS_LDM:
9623 case BFD_RELOC_386_TLS_IE:
9624 case BFD_RELOC_386_TLS_IE_32:
9625 case BFD_RELOC_386_TLS_GOTIE:
9626 case BFD_RELOC_386_TLS_GOTDESC:
9627 case BFD_RELOC_386_TLS_DESC_CALL:
9628 case BFD_RELOC_X86_64_TLSGD:
9629 case BFD_RELOC_X86_64_TLSLD:
9630 case BFD_RELOC_X86_64_GOTTPOFF:
9631 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9632 case BFD_RELOC_X86_64_TLSDESC_CALL:
9633 i.has_gotpc_tls_reloc = TRUE;
9634 default:
9635 break;
9636 }
9637 }
02a86693
L
9638 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9639 size, i.op[n].disps, pcrel,
9640 reloc_type);
9641 /* Check for "call/jmp *mem", "mov mem, %reg",
9642 "test %reg, mem" and "binop mem, %reg" where binop
9643 is one of adc, add, and, cmp, or, sbb, sub, xor
e60f4d3b
L
9644 instructions without data prefix. Always generate
9645 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9646 if (i.prefix[DATA_PREFIX] == 0
9647 && (generate_relax_relocations
9648 || (!object_64bit
9649 && i.rm.mode == 0
9650 && i.rm.regmem == 5))
0cb4071e
L
9651 && (i.rm.mode == 2
9652 || (i.rm.mode == 0 && i.rm.regmem == 5))
2ae4c703 9653 && !is_any_vex_encoding(&i.tm)
02a86693
L
9654 && ((i.operands == 1
9655 && i.tm.base_opcode == 0xff
9656 && (i.rm.reg == 2 || i.rm.reg == 4))
9657 || (i.operands == 2
9658 && (i.tm.base_opcode == 0x8b
9659 || i.tm.base_opcode == 0x85
2ae4c703 9660 || (i.tm.base_opcode & ~0x38) == 0x03))))
02a86693
L
9661 {
9662 if (object_64bit)
9663 {
9664 fixP->fx_tcbit = i.rex != 0;
9665 if (i.base_reg
e968fc9b 9666 && (i.base_reg->reg_num == RegIP))
02a86693
L
9667 fixP->fx_tcbit2 = 1;
9668 }
9669 else
9670 fixP->fx_tcbit2 = 1;
9671 }
29b0f896
AM
9672 }
9673 }
9674 }
9675}
252b5132 9676
29b0f896 9677static void
64e74474 9678output_imm (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9679{
9680 char *p;
9681 unsigned int n;
252b5132 9682
29b0f896
AM
9683 for (n = 0; n < i.operands; n++)
9684 {
43234a1e
L
9685 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9686 if (i.rounding && (int) n == i.rounding->operand)
9687 continue;
9688
40fb9820 9689 if (operand_type_check (i.types[n], imm))
29b0f896
AM
9690 {
9691 if (i.op[n].imms->X_op == O_constant)
9692 {
e205caa7 9693 int size = imm_size (n);
29b0f896 9694 offsetT val;
b4cac588 9695
29b0f896
AM
9696 val = offset_in_range (i.op[n].imms->X_add_number,
9697 size);
9698 p = frag_more (size);
9699 md_number_to_chars (p, val, size);
9700 }
9701 else
9702 {
9703 /* Not absolute_section.
9704 Need a 32-bit fixup (don't support 8bit
9705 non-absolute imms). Try to support other
9706 sizes ... */
f86103b7 9707 enum bfd_reloc_code_real reloc_type;
e205caa7
L
9708 int size = imm_size (n);
9709 int sign;
29b0f896 9710
40fb9820 9711 if (i.types[n].bitfield.imm32s
a7d61044 9712 && (i.suffix == QWORD_MNEM_SUFFIX
40fb9820 9713 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
29b0f896 9714 sign = 1;
e205caa7
L
9715 else
9716 sign = 0;
520dc8e8 9717
29b0f896 9718 p = frag_more (size);
d258b828 9719 reloc_type = reloc (size, 0, sign, i.reloc[n]);
f86103b7 9720
2bbd9c25
JJ
9721 /* This is tough to explain. We end up with this one if we
9722 * have operands that look like
9723 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9724 * obtain the absolute address of the GOT, and it is strongly
9725 * preferable from a performance point of view to avoid using
9726 * a runtime relocation for this. The actual sequence of
9727 * instructions often look something like:
9728 *
9729 * call .L66
9730 * .L66:
9731 * popl %ebx
9732 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9733 *
9734 * The call and pop essentially return the absolute address
9735 * of the label .L66 and store it in %ebx. The linker itself
9736 * will ultimately change the first operand of the addl so
9737 * that %ebx points to the GOT, but to keep things simple, the
9738 * .o file must have this operand set so that it generates not
9739 * the absolute address of .L66, but the absolute address of
9740 * itself. This allows the linker itself simply treat a GOTPC
9741 * relocation as asking for a pcrel offset to the GOT to be
9742 * added in, and the addend of the relocation is stored in the
9743 * operand field for the instruction itself.
9744 *
9745 * Our job here is to fix the operand so that it would add
9746 * the correct offset so that %ebx would point to itself. The
9747 * thing that is tricky is that .-.L66 will point to the
9748 * beginning of the instruction, so we need to further modify
9749 * the operand so that it will point to itself. There are
9750 * other cases where you have something like:
9751 *
9752 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9753 *
9754 * and here no correction would be required. Internally in
9755 * the assembler we treat operands of this form as not being
9756 * pcrel since the '.' is explicitly mentioned, and I wonder
9757 * whether it would simplify matters to do it this way. Who
9758 * knows. In earlier versions of the PIC patches, the
9759 * pcrel_adjust field was used to store the correction, but
9760 * since the expression is not pcrel, I felt it would be
9761 * confusing to do it this way. */
9762
d6ab8113 9763 if ((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9764 || reloc_type == BFD_RELOC_X86_64_32S
9765 || reloc_type == BFD_RELOC_64)
29b0f896
AM
9766 && GOT_symbol
9767 && GOT_symbol == i.op[n].imms->X_add_symbol
9768 && (i.op[n].imms->X_op == O_symbol
9769 || (i.op[n].imms->X_op == O_add
9770 && ((symbol_get_value_expression
9771 (i.op[n].imms->X_op_symbol)->X_op)
9772 == O_subtract))))
9773 {
4fa24527 9774 if (!object_64bit)
d6ab8113 9775 reloc_type = BFD_RELOC_386_GOTPC;
7b81dfbb 9776 else if (size == 4)
d6ab8113 9777 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7b81dfbb
AJ
9778 else if (size == 8)
9779 reloc_type = BFD_RELOC_X86_64_GOTPC64;
e379e5f3 9780 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9781 i.op[n].imms->X_add_number +=
9782 encoding_length (insn_start_frag, insn_start_off, p);
29b0f896 9783 }
29b0f896
AM
9784 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9785 i.op[n].imms, 0, reloc_type);
9786 }
9787 }
9788 }
252b5132
RH
9789}
9790\f
d182319b
JB
9791/* x86_cons_fix_new is called via the expression parsing code when a
9792 reloc is needed. We use this hook to get the correct .got reloc. */
d182319b
JB
9793static int cons_sign = -1;
9794
9795void
e3bb37b5 9796x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
62ebcb5c 9797 expressionS *exp, bfd_reloc_code_real_type r)
d182319b 9798{
d258b828 9799 r = reloc (len, 0, cons_sign, r);
d182319b
JB
9800
9801#ifdef TE_PE
9802 if (exp->X_op == O_secrel)
9803 {
9804 exp->X_op = O_symbol;
9805 r = BFD_RELOC_32_SECREL;
9806 }
9807#endif
9808
9809 fix_new_exp (frag, off, len, exp, 0, r);
9810}
9811
357d1bd8
L
9812/* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9813 purpose of the `.dc.a' internal pseudo-op. */
9814
9815int
9816x86_address_bytes (void)
9817{
9818 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9819 return 4;
9820 return stdoutput->arch_info->bits_per_address / 8;
9821}
9822
d382c579
TG
9823#if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9824 || defined (LEX_AT)
d258b828 9825# define lex_got(reloc, adjust, types) NULL
718ddfc0 9826#else
f3c180ae
AM
9827/* Parse operands of the form
9828 <symbol>@GOTOFF+<nnn>
9829 and similar .plt or .got references.
9830
9831 If we find one, set up the correct relocation in RELOC and copy the
9832 input string, minus the `@GOTOFF' into a malloc'd buffer for
9833 parsing by the calling routine. Return this buffer, and if ADJUST
9834 is non-null set it to the length of the string we removed from the
9835 input line. Otherwise return NULL. */
9836static char *
91d6fa6a 9837lex_got (enum bfd_reloc_code_real *rel,
64e74474 9838 int *adjust,
d258b828 9839 i386_operand_type *types)
f3c180ae 9840{
7b81dfbb
AJ
9841 /* Some of the relocations depend on the size of what field is to
9842 be relocated. But in our callers i386_immediate and i386_displacement
9843 we don't yet know the operand size (this will be set by insn
9844 matching). Hence we record the word32 relocation here,
9845 and adjust the reloc according to the real size in reloc(). */
f3c180ae
AM
9846 static const struct {
9847 const char *str;
cff8d58a 9848 int len;
4fa24527 9849 const enum bfd_reloc_code_real rel[2];
40fb9820 9850 const i386_operand_type types64;
f3c180ae 9851 } gotrel[] = {
8ce3d284 9852#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
9853 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9854 BFD_RELOC_SIZE32 },
9855 OPERAND_TYPE_IMM32_64 },
8ce3d284 9856#endif
cff8d58a
L
9857 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9858 BFD_RELOC_X86_64_PLTOFF64 },
40fb9820 9859 OPERAND_TYPE_IMM64 },
cff8d58a
L
9860 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9861 BFD_RELOC_X86_64_PLT32 },
40fb9820 9862 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9863 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9864 BFD_RELOC_X86_64_GOTPLT64 },
40fb9820 9865 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9866 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9867 BFD_RELOC_X86_64_GOTOFF64 },
40fb9820 9868 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9869 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9870 BFD_RELOC_X86_64_GOTPCREL },
40fb9820 9871 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9872 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9873 BFD_RELOC_X86_64_TLSGD },
40fb9820 9874 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9875 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9876 _dummy_first_bfd_reloc_code_real },
40fb9820 9877 OPERAND_TYPE_NONE },
cff8d58a
L
9878 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9879 BFD_RELOC_X86_64_TLSLD },
40fb9820 9880 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9881 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9882 BFD_RELOC_X86_64_GOTTPOFF },
40fb9820 9883 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9884 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9885 BFD_RELOC_X86_64_TPOFF32 },
40fb9820 9886 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9887 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9888 _dummy_first_bfd_reloc_code_real },
40fb9820 9889 OPERAND_TYPE_NONE },
cff8d58a
L
9890 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9891 BFD_RELOC_X86_64_DTPOFF32 },
40fb9820 9892 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9893 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9894 _dummy_first_bfd_reloc_code_real },
40fb9820 9895 OPERAND_TYPE_NONE },
cff8d58a
L
9896 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9897 _dummy_first_bfd_reloc_code_real },
40fb9820 9898 OPERAND_TYPE_NONE },
cff8d58a
L
9899 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9900 BFD_RELOC_X86_64_GOT32 },
40fb9820 9901 OPERAND_TYPE_IMM32_32S_64_DISP32 },
cff8d58a
L
9902 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9903 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
40fb9820 9904 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9905 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9906 BFD_RELOC_X86_64_TLSDESC_CALL },
40fb9820 9907 OPERAND_TYPE_IMM32_32S_DISP32 },
f3c180ae
AM
9908 };
9909 char *cp;
9910 unsigned int j;
9911
d382c579 9912#if defined (OBJ_MAYBE_ELF)
718ddfc0
JB
9913 if (!IS_ELF)
9914 return NULL;
d382c579 9915#endif
718ddfc0 9916
f3c180ae 9917 for (cp = input_line_pointer; *cp != '@'; cp++)
67c11a9b 9918 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
f3c180ae
AM
9919 return NULL;
9920
47465058 9921 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
f3c180ae 9922 {
cff8d58a 9923 int len = gotrel[j].len;
28f81592 9924 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
f3c180ae 9925 {
4fa24527 9926 if (gotrel[j].rel[object_64bit] != 0)
f3c180ae 9927 {
28f81592
AM
9928 int first, second;
9929 char *tmpbuf, *past_reloc;
f3c180ae 9930
91d6fa6a 9931 *rel = gotrel[j].rel[object_64bit];
f3c180ae 9932
3956db08
JB
9933 if (types)
9934 {
9935 if (flag_code != CODE_64BIT)
40fb9820
L
9936 {
9937 types->bitfield.imm32 = 1;
9938 types->bitfield.disp32 = 1;
9939 }
3956db08
JB
9940 else
9941 *types = gotrel[j].types64;
9942 }
9943
8fd4256d 9944 if (j != 0 && GOT_symbol == NULL)
f3c180ae
AM
9945 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9946
28f81592 9947 /* The length of the first part of our input line. */
f3c180ae 9948 first = cp - input_line_pointer;
28f81592
AM
9949
9950 /* The second part goes from after the reloc token until
67c11a9b 9951 (and including) an end_of_line char or comma. */
28f81592 9952 past_reloc = cp + 1 + len;
67c11a9b
AM
9953 cp = past_reloc;
9954 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9955 ++cp;
9956 second = cp + 1 - past_reloc;
28f81592
AM
9957
9958 /* Allocate and copy string. The trailing NUL shouldn't
9959 be necessary, but be safe. */
add39d23 9960 tmpbuf = XNEWVEC (char, first + second + 2);
f3c180ae 9961 memcpy (tmpbuf, input_line_pointer, first);
0787a12d
AM
9962 if (second != 0 && *past_reloc != ' ')
9963 /* Replace the relocation token with ' ', so that
9964 errors like foo@GOTOFF1 will be detected. */
9965 tmpbuf[first++] = ' ';
af89796a
L
9966 else
9967 /* Increment length by 1 if the relocation token is
9968 removed. */
9969 len++;
9970 if (adjust)
9971 *adjust = len;
0787a12d
AM
9972 memcpy (tmpbuf + first, past_reloc, second);
9973 tmpbuf[first + second] = '\0';
f3c180ae
AM
9974 return tmpbuf;
9975 }
9976
4fa24527
JB
9977 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9978 gotrel[j].str, 1 << (5 + object_64bit));
f3c180ae
AM
9979 return NULL;
9980 }
9981 }
9982
9983 /* Might be a symbol version string. Don't as_bad here. */
9984 return NULL;
9985}
4e4f7c87 9986#endif
f3c180ae 9987
a988325c
NC
9988#ifdef TE_PE
9989#ifdef lex_got
9990#undef lex_got
9991#endif
9992/* Parse operands of the form
9993 <symbol>@SECREL32+<nnn>
9994
9995 If we find one, set up the correct relocation in RELOC and copy the
9996 input string, minus the `@SECREL32' into a malloc'd buffer for
9997 parsing by the calling routine. Return this buffer, and if ADJUST
9998 is non-null set it to the length of the string we removed from the
34bca508
L
9999 input line. Otherwise return NULL.
10000
a988325c
NC
10001 This function is copied from the ELF version above adjusted for PE targets. */
10002
10003static char *
10004lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10005 int *adjust ATTRIBUTE_UNUSED,
d258b828 10006 i386_operand_type *types)
a988325c
NC
10007{
10008 static const struct
10009 {
10010 const char *str;
10011 int len;
10012 const enum bfd_reloc_code_real rel[2];
10013 const i386_operand_type types64;
10014 }
10015 gotrel[] =
10016 {
10017 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10018 BFD_RELOC_32_SECREL },
10019 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10020 };
10021
10022 char *cp;
10023 unsigned j;
10024
10025 for (cp = input_line_pointer; *cp != '@'; cp++)
10026 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10027 return NULL;
10028
10029 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10030 {
10031 int len = gotrel[j].len;
10032
10033 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10034 {
10035 if (gotrel[j].rel[object_64bit] != 0)
10036 {
10037 int first, second;
10038 char *tmpbuf, *past_reloc;
10039
10040 *rel = gotrel[j].rel[object_64bit];
10041 if (adjust)
10042 *adjust = len;
10043
10044 if (types)
10045 {
10046 if (flag_code != CODE_64BIT)
10047 {
10048 types->bitfield.imm32 = 1;
10049 types->bitfield.disp32 = 1;
10050 }
10051 else
10052 *types = gotrel[j].types64;
10053 }
10054
10055 /* The length of the first part of our input line. */
10056 first = cp - input_line_pointer;
10057
10058 /* The second part goes from after the reloc token until
10059 (and including) an end_of_line char or comma. */
10060 past_reloc = cp + 1 + len;
10061 cp = past_reloc;
10062 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10063 ++cp;
10064 second = cp + 1 - past_reloc;
10065
10066 /* Allocate and copy string. The trailing NUL shouldn't
10067 be necessary, but be safe. */
add39d23 10068 tmpbuf = XNEWVEC (char, first + second + 2);
a988325c
NC
10069 memcpy (tmpbuf, input_line_pointer, first);
10070 if (second != 0 && *past_reloc != ' ')
10071 /* Replace the relocation token with ' ', so that
10072 errors like foo@SECLREL321 will be detected. */
10073 tmpbuf[first++] = ' ';
10074 memcpy (tmpbuf + first, past_reloc, second);
10075 tmpbuf[first + second] = '\0';
10076 return tmpbuf;
10077 }
10078
10079 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10080 gotrel[j].str, 1 << (5 + object_64bit));
10081 return NULL;
10082 }
10083 }
10084
10085 /* Might be a symbol version string. Don't as_bad here. */
10086 return NULL;
10087}
10088
10089#endif /* TE_PE */
10090
62ebcb5c 10091bfd_reloc_code_real_type
e3bb37b5 10092x86_cons (expressionS *exp, int size)
f3c180ae 10093{
62ebcb5c
AM
10094 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10095
ee86248c
JB
10096 intel_syntax = -intel_syntax;
10097
3c7b9c2c 10098 exp->X_md = 0;
4fa24527 10099 if (size == 4 || (object_64bit && size == 8))
f3c180ae
AM
10100 {
10101 /* Handle @GOTOFF and the like in an expression. */
10102 char *save;
10103 char *gotfree_input_line;
4a57f2cf 10104 int adjust = 0;
f3c180ae
AM
10105
10106 save = input_line_pointer;
d258b828 10107 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
f3c180ae
AM
10108 if (gotfree_input_line)
10109 input_line_pointer = gotfree_input_line;
10110
10111 expression (exp);
10112
10113 if (gotfree_input_line)
10114 {
10115 /* expression () has merrily parsed up to the end of line,
10116 or a comma - in the wrong buffer. Transfer how far
10117 input_line_pointer has moved to the right buffer. */
10118 input_line_pointer = (save
10119 + (input_line_pointer - gotfree_input_line)
10120 + adjust);
10121 free (gotfree_input_line);
3992d3b7
AM
10122 if (exp->X_op == O_constant
10123 || exp->X_op == O_absent
10124 || exp->X_op == O_illegal
0398aac5 10125 || exp->X_op == O_register
3992d3b7
AM
10126 || exp->X_op == O_big)
10127 {
10128 char c = *input_line_pointer;
10129 *input_line_pointer = 0;
10130 as_bad (_("missing or invalid expression `%s'"), save);
10131 *input_line_pointer = c;
10132 }
b9519cfe
L
10133 else if ((got_reloc == BFD_RELOC_386_PLT32
10134 || got_reloc == BFD_RELOC_X86_64_PLT32)
10135 && exp->X_op != O_symbol)
10136 {
10137 char c = *input_line_pointer;
10138 *input_line_pointer = 0;
10139 as_bad (_("invalid PLT expression `%s'"), save);
10140 *input_line_pointer = c;
10141 }
f3c180ae
AM
10142 }
10143 }
10144 else
10145 expression (exp);
ee86248c
JB
10146
10147 intel_syntax = -intel_syntax;
10148
10149 if (intel_syntax)
10150 i386_intel_simplify (exp);
62ebcb5c
AM
10151
10152 return got_reloc;
f3c180ae 10153}
f3c180ae 10154
9f32dd5b
L
10155static void
10156signed_cons (int size)
6482c264 10157{
d182319b
JB
10158 if (flag_code == CODE_64BIT)
10159 cons_sign = 1;
10160 cons (size);
10161 cons_sign = -1;
6482c264
NC
10162}
10163
d182319b 10164#ifdef TE_PE
6482c264 10165static void
7016a5d5 10166pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
6482c264
NC
10167{
10168 expressionS exp;
10169
10170 do
10171 {
10172 expression (&exp);
10173 if (exp.X_op == O_symbol)
10174 exp.X_op = O_secrel;
10175
10176 emit_expr (&exp, 4);
10177 }
10178 while (*input_line_pointer++ == ',');
10179
10180 input_line_pointer--;
10181 demand_empty_rest_of_line ();
10182}
6482c264
NC
10183#endif
10184
43234a1e
L
10185/* Handle Vector operations. */
10186
10187static char *
10188check_VecOperations (char *op_string, char *op_end)
10189{
10190 const reg_entry *mask;
10191 const char *saved;
10192 char *end_op;
10193
10194 while (*op_string
10195 && (op_end == NULL || op_string < op_end))
10196 {
10197 saved = op_string;
10198 if (*op_string == '{')
10199 {
10200 op_string++;
10201
10202 /* Check broadcasts. */
10203 if (strncmp (op_string, "1to", 3) == 0)
10204 {
10205 int bcst_type;
10206
10207 if (i.broadcast)
10208 goto duplicated_vec_op;
10209
10210 op_string += 3;
10211 if (*op_string == '8')
8e6e0792 10212 bcst_type = 8;
b28d1bda 10213 else if (*op_string == '4')
8e6e0792 10214 bcst_type = 4;
b28d1bda 10215 else if (*op_string == '2')
8e6e0792 10216 bcst_type = 2;
43234a1e
L
10217 else if (*op_string == '1'
10218 && *(op_string+1) == '6')
10219 {
8e6e0792 10220 bcst_type = 16;
43234a1e
L
10221 op_string++;
10222 }
10223 else
10224 {
10225 as_bad (_("Unsupported broadcast: `%s'"), saved);
10226 return NULL;
10227 }
10228 op_string++;
10229
10230 broadcast_op.type = bcst_type;
10231 broadcast_op.operand = this_operand;
1f75763a 10232 broadcast_op.bytes = 0;
43234a1e
L
10233 i.broadcast = &broadcast_op;
10234 }
10235 /* Check masking operation. */
10236 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10237 {
8a6fb3f9
JB
10238 if (mask == &bad_reg)
10239 return NULL;
10240
43234a1e 10241 /* k0 can't be used for write mask. */
f74a6307 10242 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
43234a1e 10243 {
6d2cd6b2
JB
10244 as_bad (_("`%s%s' can't be used for write mask"),
10245 register_prefix, mask->reg_name);
43234a1e
L
10246 return NULL;
10247 }
10248
10249 if (!i.mask)
10250 {
10251 mask_op.mask = mask;
10252 mask_op.zeroing = 0;
10253 mask_op.operand = this_operand;
10254 i.mask = &mask_op;
10255 }
10256 else
10257 {
10258 if (i.mask->mask)
10259 goto duplicated_vec_op;
10260
10261 i.mask->mask = mask;
10262
10263 /* Only "{z}" is allowed here. No need to check
10264 zeroing mask explicitly. */
10265 if (i.mask->operand != this_operand)
10266 {
10267 as_bad (_("invalid write mask `%s'"), saved);
10268 return NULL;
10269 }
10270 }
10271
10272 op_string = end_op;
10273 }
10274 /* Check zeroing-flag for masking operation. */
10275 else if (*op_string == 'z')
10276 {
10277 if (!i.mask)
10278 {
10279 mask_op.mask = NULL;
10280 mask_op.zeroing = 1;
10281 mask_op.operand = this_operand;
10282 i.mask = &mask_op;
10283 }
10284 else
10285 {
10286 if (i.mask->zeroing)
10287 {
10288 duplicated_vec_op:
10289 as_bad (_("duplicated `%s'"), saved);
10290 return NULL;
10291 }
10292
10293 i.mask->zeroing = 1;
10294
10295 /* Only "{%k}" is allowed here. No need to check mask
10296 register explicitly. */
10297 if (i.mask->operand != this_operand)
10298 {
10299 as_bad (_("invalid zeroing-masking `%s'"),
10300 saved);
10301 return NULL;
10302 }
10303 }
10304
10305 op_string++;
10306 }
10307 else
10308 goto unknown_vec_op;
10309
10310 if (*op_string != '}')
10311 {
10312 as_bad (_("missing `}' in `%s'"), saved);
10313 return NULL;
10314 }
10315 op_string++;
0ba3a731
L
10316
10317 /* Strip whitespace since the addition of pseudo prefixes
10318 changed how the scrubber treats '{'. */
10319 if (is_space_char (*op_string))
10320 ++op_string;
10321
43234a1e
L
10322 continue;
10323 }
10324 unknown_vec_op:
10325 /* We don't know this one. */
10326 as_bad (_("unknown vector operation: `%s'"), saved);
10327 return NULL;
10328 }
10329
6d2cd6b2
JB
10330 if (i.mask && i.mask->zeroing && !i.mask->mask)
10331 {
10332 as_bad (_("zeroing-masking only allowed with write mask"));
10333 return NULL;
10334 }
10335
43234a1e
L
10336 return op_string;
10337}
10338
252b5132 10339static int
70e41ade 10340i386_immediate (char *imm_start)
252b5132
RH
10341{
10342 char *save_input_line_pointer;
f3c180ae 10343 char *gotfree_input_line;
252b5132 10344 segT exp_seg = 0;
47926f60 10345 expressionS *exp;
40fb9820
L
10346 i386_operand_type types;
10347
0dfbf9d7 10348 operand_type_set (&types, ~0);
252b5132
RH
10349
10350 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10351 {
31b2323c
L
10352 as_bad (_("at most %d immediate operands are allowed"),
10353 MAX_IMMEDIATE_OPERANDS);
252b5132
RH
10354 return 0;
10355 }
10356
10357 exp = &im_expressions[i.imm_operands++];
520dc8e8 10358 i.op[this_operand].imms = exp;
252b5132
RH
10359
10360 if (is_space_char (*imm_start))
10361 ++imm_start;
10362
10363 save_input_line_pointer = input_line_pointer;
10364 input_line_pointer = imm_start;
10365
d258b828 10366 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10367 if (gotfree_input_line)
10368 input_line_pointer = gotfree_input_line;
252b5132
RH
10369
10370 exp_seg = expression (exp);
10371
83183c0c 10372 SKIP_WHITESPACE ();
43234a1e
L
10373
10374 /* Handle vector operations. */
10375 if (*input_line_pointer == '{')
10376 {
10377 input_line_pointer = check_VecOperations (input_line_pointer,
10378 NULL);
10379 if (input_line_pointer == NULL)
10380 return 0;
10381 }
10382
252b5132 10383 if (*input_line_pointer)
f3c180ae 10384 as_bad (_("junk `%s' after expression"), input_line_pointer);
252b5132
RH
10385
10386 input_line_pointer = save_input_line_pointer;
f3c180ae 10387 if (gotfree_input_line)
ee86248c
JB
10388 {
10389 free (gotfree_input_line);
10390
10391 if (exp->X_op == O_constant || exp->X_op == O_register)
10392 exp->X_op = O_illegal;
10393 }
10394
10395 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10396}
252b5132 10397
ee86248c
JB
10398static int
10399i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10400 i386_operand_type types, const char *imm_start)
10401{
10402 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
252b5132 10403 {
313c53d1
L
10404 if (imm_start)
10405 as_bad (_("missing or invalid immediate expression `%s'"),
10406 imm_start);
3992d3b7 10407 return 0;
252b5132 10408 }
3e73aa7c 10409 else if (exp->X_op == O_constant)
252b5132 10410 {
47926f60 10411 /* Size it properly later. */
40fb9820 10412 i.types[this_operand].bitfield.imm64 = 1;
13f864ae
L
10413 /* If not 64bit, sign extend val. */
10414 if (flag_code != CODE_64BIT
4eed87de
AM
10415 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10416 exp->X_add_number
10417 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
252b5132 10418 }
4c63da97 10419#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
f86103b7 10420 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
31312f95 10421 && exp_seg != absolute_section
47926f60 10422 && exp_seg != text_section
24eab124
AM
10423 && exp_seg != data_section
10424 && exp_seg != bss_section
10425 && exp_seg != undefined_section
f86103b7 10426 && !bfd_is_com_section (exp_seg))
252b5132 10427 {
d0b47220 10428 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
252b5132
RH
10429 return 0;
10430 }
10431#endif
a841bdf5 10432 else if (!intel_syntax && exp_seg == reg_section)
bb8f5920 10433 {
313c53d1
L
10434 if (imm_start)
10435 as_bad (_("illegal immediate register operand %s"), imm_start);
bb8f5920
L
10436 return 0;
10437 }
252b5132
RH
10438 else
10439 {
10440 /* This is an address. The size of the address will be
24eab124 10441 determined later, depending on destination register,
3e73aa7c 10442 suffix, or the default for the section. */
40fb9820
L
10443 i.types[this_operand].bitfield.imm8 = 1;
10444 i.types[this_operand].bitfield.imm16 = 1;
10445 i.types[this_operand].bitfield.imm32 = 1;
10446 i.types[this_operand].bitfield.imm32s = 1;
10447 i.types[this_operand].bitfield.imm64 = 1;
c6fb90c8
L
10448 i.types[this_operand] = operand_type_and (i.types[this_operand],
10449 types);
252b5132
RH
10450 }
10451
10452 return 1;
10453}
10454
551c1ca1 10455static char *
e3bb37b5 10456i386_scale (char *scale)
252b5132 10457{
551c1ca1
AM
10458 offsetT val;
10459 char *save = input_line_pointer;
252b5132 10460
551c1ca1
AM
10461 input_line_pointer = scale;
10462 val = get_absolute_expression ();
10463
10464 switch (val)
252b5132 10465 {
551c1ca1 10466 case 1:
252b5132
RH
10467 i.log2_scale_factor = 0;
10468 break;
551c1ca1 10469 case 2:
252b5132
RH
10470 i.log2_scale_factor = 1;
10471 break;
551c1ca1 10472 case 4:
252b5132
RH
10473 i.log2_scale_factor = 2;
10474 break;
551c1ca1 10475 case 8:
252b5132
RH
10476 i.log2_scale_factor = 3;
10477 break;
10478 default:
a724f0f4
JB
10479 {
10480 char sep = *input_line_pointer;
10481
10482 *input_line_pointer = '\0';
10483 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10484 scale);
10485 *input_line_pointer = sep;
10486 input_line_pointer = save;
10487 return NULL;
10488 }
252b5132 10489 }
29b0f896 10490 if (i.log2_scale_factor != 0 && i.index_reg == 0)
252b5132
RH
10491 {
10492 as_warn (_("scale factor of %d without an index register"),
24eab124 10493 1 << i.log2_scale_factor);
252b5132 10494 i.log2_scale_factor = 0;
252b5132 10495 }
551c1ca1
AM
10496 scale = input_line_pointer;
10497 input_line_pointer = save;
10498 return scale;
252b5132
RH
10499}
10500
252b5132 10501static int
e3bb37b5 10502i386_displacement (char *disp_start, char *disp_end)
252b5132 10503{
29b0f896 10504 expressionS *exp;
252b5132
RH
10505 segT exp_seg = 0;
10506 char *save_input_line_pointer;
f3c180ae 10507 char *gotfree_input_line;
40fb9820
L
10508 int override;
10509 i386_operand_type bigdisp, types = anydisp;
3992d3b7 10510 int ret;
252b5132 10511
31b2323c
L
10512 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10513 {
10514 as_bad (_("at most %d displacement operands are allowed"),
10515 MAX_MEMORY_OPERANDS);
10516 return 0;
10517 }
10518
0dfbf9d7 10519 operand_type_set (&bigdisp, 0);
6f2f06be 10520 if (i.jumpabsolute
48bcea9f 10521 || i.types[this_operand].bitfield.baseindex
0cfa3eb3
JB
10522 || (current_templates->start->opcode_modifier.jump != JUMP
10523 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
e05278af 10524 {
48bcea9f 10525 i386_addressing_mode ();
e05278af 10526 override = (i.prefix[ADDR_PREFIX] != 0);
40fb9820
L
10527 if (flag_code == CODE_64BIT)
10528 {
10529 if (!override)
10530 {
10531 bigdisp.bitfield.disp32s = 1;
10532 bigdisp.bitfield.disp64 = 1;
10533 }
48bcea9f
JB
10534 else
10535 bigdisp.bitfield.disp32 = 1;
40fb9820
L
10536 }
10537 else if ((flag_code == CODE_16BIT) ^ override)
40fb9820 10538 bigdisp.bitfield.disp16 = 1;
48bcea9f
JB
10539 else
10540 bigdisp.bitfield.disp32 = 1;
e05278af
JB
10541 }
10542 else
10543 {
376cd056
JB
10544 /* For PC-relative branches, the width of the displacement may be
10545 dependent upon data size, but is never dependent upon address size.
10546 Also make sure to not unintentionally match against a non-PC-relative
10547 branch template. */
10548 static templates aux_templates;
10549 const insn_template *t = current_templates->start;
10550 bfd_boolean has_intel64 = FALSE;
10551
10552 aux_templates.start = t;
10553 while (++t < current_templates->end)
10554 {
10555 if (t->opcode_modifier.jump
10556 != current_templates->start->opcode_modifier.jump)
10557 break;
4b5aaf5f 10558 if ((t->opcode_modifier.isa64 >= INTEL64))
376cd056
JB
10559 has_intel64 = TRUE;
10560 }
10561 if (t < current_templates->end)
10562 {
10563 aux_templates.end = t;
10564 current_templates = &aux_templates;
10565 }
10566
e05278af 10567 override = (i.prefix[DATA_PREFIX] != 0);
40fb9820
L
10568 if (flag_code == CODE_64BIT)
10569 {
376cd056
JB
10570 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10571 && (!intel64 || !has_intel64))
40fb9820
L
10572 bigdisp.bitfield.disp16 = 1;
10573 else
48bcea9f 10574 bigdisp.bitfield.disp32s = 1;
40fb9820
L
10575 }
10576 else
e05278af
JB
10577 {
10578 if (!override)
10579 override = (i.suffix == (flag_code != CODE_16BIT
10580 ? WORD_MNEM_SUFFIX
10581 : LONG_MNEM_SUFFIX));
40fb9820
L
10582 bigdisp.bitfield.disp32 = 1;
10583 if ((flag_code == CODE_16BIT) ^ override)
10584 {
10585 bigdisp.bitfield.disp32 = 0;
10586 bigdisp.bitfield.disp16 = 1;
10587 }
e05278af 10588 }
e05278af 10589 }
c6fb90c8
L
10590 i.types[this_operand] = operand_type_or (i.types[this_operand],
10591 bigdisp);
252b5132
RH
10592
10593 exp = &disp_expressions[i.disp_operands];
520dc8e8 10594 i.op[this_operand].disps = exp;
252b5132
RH
10595 i.disp_operands++;
10596 save_input_line_pointer = input_line_pointer;
10597 input_line_pointer = disp_start;
10598 END_STRING_AND_SAVE (disp_end);
10599
10600#ifndef GCC_ASM_O_HACK
10601#define GCC_ASM_O_HACK 0
10602#endif
10603#if GCC_ASM_O_HACK
10604 END_STRING_AND_SAVE (disp_end + 1);
40fb9820 10605 if (i.types[this_operand].bitfield.baseIndex
24eab124 10606 && displacement_string_end[-1] == '+')
252b5132
RH
10607 {
10608 /* This hack is to avoid a warning when using the "o"
24eab124
AM
10609 constraint within gcc asm statements.
10610 For instance:
10611
10612 #define _set_tssldt_desc(n,addr,limit,type) \
10613 __asm__ __volatile__ ( \
10614 "movw %w2,%0\n\t" \
10615 "movw %w1,2+%0\n\t" \
10616 "rorl $16,%1\n\t" \
10617 "movb %b1,4+%0\n\t" \
10618 "movb %4,5+%0\n\t" \
10619 "movb $0,6+%0\n\t" \
10620 "movb %h1,7+%0\n\t" \
10621 "rorl $16,%1" \
10622 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10623
10624 This works great except that the output assembler ends
10625 up looking a bit weird if it turns out that there is
10626 no offset. You end up producing code that looks like:
10627
10628 #APP
10629 movw $235,(%eax)
10630 movw %dx,2+(%eax)
10631 rorl $16,%edx
10632 movb %dl,4+(%eax)
10633 movb $137,5+(%eax)
10634 movb $0,6+(%eax)
10635 movb %dh,7+(%eax)
10636 rorl $16,%edx
10637 #NO_APP
10638
47926f60 10639 So here we provide the missing zero. */
24eab124
AM
10640
10641 *displacement_string_end = '0';
252b5132
RH
10642 }
10643#endif
d258b828 10644 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10645 if (gotfree_input_line)
10646 input_line_pointer = gotfree_input_line;
252b5132 10647
24eab124 10648 exp_seg = expression (exp);
252b5132 10649
636c26b0
AM
10650 SKIP_WHITESPACE ();
10651 if (*input_line_pointer)
10652 as_bad (_("junk `%s' after expression"), input_line_pointer);
10653#if GCC_ASM_O_HACK
10654 RESTORE_END_STRING (disp_end + 1);
10655#endif
636c26b0 10656 input_line_pointer = save_input_line_pointer;
636c26b0 10657 if (gotfree_input_line)
ee86248c
JB
10658 {
10659 free (gotfree_input_line);
10660
10661 if (exp->X_op == O_constant || exp->X_op == O_register)
10662 exp->X_op = O_illegal;
10663 }
10664
10665 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10666
10667 RESTORE_END_STRING (disp_end);
10668
10669 return ret;
10670}
10671
10672static int
10673i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10674 i386_operand_type types, const char *disp_start)
10675{
10676 i386_operand_type bigdisp;
10677 int ret = 1;
636c26b0 10678
24eab124
AM
10679 /* We do this to make sure that the section symbol is in
10680 the symbol table. We will ultimately change the relocation
47926f60 10681 to be relative to the beginning of the section. */
1ae12ab7 10682 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
d6ab8113
JB
10683 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10684 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
24eab124 10685 {
636c26b0 10686 if (exp->X_op != O_symbol)
3992d3b7 10687 goto inv_disp;
636c26b0 10688
e5cb08ac 10689 if (S_IS_LOCAL (exp->X_add_symbol)
c64efb4b
L
10690 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10691 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
24eab124 10692 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
24eab124
AM
10693 exp->X_op = O_subtract;
10694 exp->X_op_symbol = GOT_symbol;
1ae12ab7 10695 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
29b0f896 10696 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
d6ab8113
JB
10697 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10698 i.reloc[this_operand] = BFD_RELOC_64;
23df1078 10699 else
29b0f896 10700 i.reloc[this_operand] = BFD_RELOC_32;
24eab124 10701 }
252b5132 10702
3992d3b7
AM
10703 else if (exp->X_op == O_absent
10704 || exp->X_op == O_illegal
ee86248c 10705 || exp->X_op == O_big)
2daf4fd8 10706 {
3992d3b7
AM
10707 inv_disp:
10708 as_bad (_("missing or invalid displacement expression `%s'"),
2daf4fd8 10709 disp_start);
3992d3b7 10710 ret = 0;
2daf4fd8
AM
10711 }
10712
0e1147d9
L
10713 else if (flag_code == CODE_64BIT
10714 && !i.prefix[ADDR_PREFIX]
10715 && exp->X_op == O_constant)
10716 {
10717 /* Since displacement is signed extended to 64bit, don't allow
10718 disp32 and turn off disp32s if they are out of range. */
10719 i.types[this_operand].bitfield.disp32 = 0;
10720 if (!fits_in_signed_long (exp->X_add_number))
10721 {
10722 i.types[this_operand].bitfield.disp32s = 0;
10723 if (i.types[this_operand].bitfield.baseindex)
10724 {
10725 as_bad (_("0x%lx out range of signed 32bit displacement"),
10726 (long) exp->X_add_number);
10727 ret = 0;
10728 }
10729 }
10730 }
10731
4c63da97 10732#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
3992d3b7
AM
10733 else if (exp->X_op != O_constant
10734 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10735 && exp_seg != absolute_section
10736 && exp_seg != text_section
10737 && exp_seg != data_section
10738 && exp_seg != bss_section
10739 && exp_seg != undefined_section
10740 && !bfd_is_com_section (exp_seg))
24eab124 10741 {
d0b47220 10742 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
3992d3b7 10743 ret = 0;
24eab124 10744 }
252b5132 10745#endif
3956db08 10746
48bcea9f
JB
10747 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10748 /* Constants get taken care of by optimize_disp(). */
10749 && exp->X_op != O_constant)
10750 i.types[this_operand].bitfield.disp8 = 1;
10751
40fb9820
L
10752 /* Check if this is a displacement only operand. */
10753 bigdisp = i.types[this_operand];
10754 bigdisp.bitfield.disp8 = 0;
10755 bigdisp.bitfield.disp16 = 0;
10756 bigdisp.bitfield.disp32 = 0;
10757 bigdisp.bitfield.disp32s = 0;
10758 bigdisp.bitfield.disp64 = 0;
0dfbf9d7 10759 if (operand_type_all_zero (&bigdisp))
c6fb90c8
L
10760 i.types[this_operand] = operand_type_and (i.types[this_operand],
10761 types);
3956db08 10762
3992d3b7 10763 return ret;
252b5132
RH
10764}
10765
2abc2bec
JB
10766/* Return the active addressing mode, taking address override and
10767 registers forming the address into consideration. Update the
10768 address override prefix if necessary. */
47926f60 10769
2abc2bec
JB
10770static enum flag_code
10771i386_addressing_mode (void)
252b5132 10772{
be05d201
L
10773 enum flag_code addr_mode;
10774
10775 if (i.prefix[ADDR_PREFIX])
10776 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
a23b33b3
JB
10777 else if (flag_code == CODE_16BIT
10778 && current_templates->start->cpu_flags.bitfield.cpumpx
10779 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10780 from md_assemble() by "is not a valid base/index expression"
10781 when there is a base and/or index. */
10782 && !i.types[this_operand].bitfield.baseindex)
10783 {
10784 /* MPX insn memory operands with neither base nor index must be forced
10785 to use 32-bit addressing in 16-bit mode. */
10786 addr_mode = CODE_32BIT;
10787 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10788 ++i.prefixes;
10789 gas_assert (!i.types[this_operand].bitfield.disp16);
10790 gas_assert (!i.types[this_operand].bitfield.disp32);
10791 }
be05d201
L
10792 else
10793 {
10794 addr_mode = flag_code;
10795
24eab124 10796#if INFER_ADDR_PREFIX
be05d201
L
10797 if (i.mem_operands == 0)
10798 {
10799 /* Infer address prefix from the first memory operand. */
10800 const reg_entry *addr_reg = i.base_reg;
10801
10802 if (addr_reg == NULL)
10803 addr_reg = i.index_reg;
eecb386c 10804
be05d201
L
10805 if (addr_reg)
10806 {
e968fc9b 10807 if (addr_reg->reg_type.bitfield.dword)
be05d201
L
10808 addr_mode = CODE_32BIT;
10809 else if (flag_code != CODE_64BIT
dc821c5f 10810 && addr_reg->reg_type.bitfield.word)
be05d201
L
10811 addr_mode = CODE_16BIT;
10812
10813 if (addr_mode != flag_code)
10814 {
10815 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10816 i.prefixes += 1;
10817 /* Change the size of any displacement too. At most one
10818 of Disp16 or Disp32 is set.
10819 FIXME. There doesn't seem to be any real need for
10820 separate Disp16 and Disp32 flags. The same goes for
10821 Imm16 and Imm32. Removing them would probably clean
10822 up the code quite a lot. */
10823 if (flag_code != CODE_64BIT
10824 && (i.types[this_operand].bitfield.disp16
10825 || i.types[this_operand].bitfield.disp32))
10826 i.types[this_operand]
10827 = operand_type_xor (i.types[this_operand], disp16_32);
10828 }
10829 }
10830 }
24eab124 10831#endif
be05d201
L
10832 }
10833
2abc2bec
JB
10834 return addr_mode;
10835}
10836
10837/* Make sure the memory operand we've been dealt is valid.
10838 Return 1 on success, 0 on a failure. */
10839
10840static int
10841i386_index_check (const char *operand_string)
10842{
10843 const char *kind = "base/index";
10844 enum flag_code addr_mode = i386_addressing_mode ();
10845
fc0763e6 10846 if (current_templates->start->opcode_modifier.isstring
c3949f43 10847 && !current_templates->start->cpu_flags.bitfield.cpupadlock
fc0763e6
JB
10848 && (current_templates->end[-1].opcode_modifier.isstring
10849 || i.mem_operands))
10850 {
10851 /* Memory operands of string insns are special in that they only allow
10852 a single register (rDI, rSI, or rBX) as their memory address. */
be05d201
L
10853 const reg_entry *expected_reg;
10854 static const char *di_si[][2] =
10855 {
10856 { "esi", "edi" },
10857 { "si", "di" },
10858 { "rsi", "rdi" }
10859 };
10860 static const char *bx[] = { "ebx", "bx", "rbx" };
fc0763e6
JB
10861
10862 kind = "string address";
10863
8325cc63 10864 if (current_templates->start->opcode_modifier.repprefixok)
fc0763e6 10865 {
51c8edf6
JB
10866 int es_op = current_templates->end[-1].opcode_modifier.isstring
10867 - IS_STRING_ES_OP0;
10868 int op = 0;
fc0763e6 10869
51c8edf6 10870 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
fc0763e6
JB
10871 || ((!i.mem_operands != !intel_syntax)
10872 && current_templates->end[-1].operand_types[1]
10873 .bitfield.baseindex))
51c8edf6
JB
10874 op = 1;
10875 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
fc0763e6
JB
10876 }
10877 else
be05d201 10878 expected_reg = hash_find (reg_hash, bx[addr_mode]);
fc0763e6 10879
be05d201
L
10880 if (i.base_reg != expected_reg
10881 || i.index_reg
fc0763e6 10882 || operand_type_check (i.types[this_operand], disp))
fc0763e6 10883 {
be05d201
L
10884 /* The second memory operand must have the same size as
10885 the first one. */
10886 if (i.mem_operands
10887 && i.base_reg
10888 && !((addr_mode == CODE_64BIT
dc821c5f 10889 && i.base_reg->reg_type.bitfield.qword)
be05d201 10890 || (addr_mode == CODE_32BIT
dc821c5f
JB
10891 ? i.base_reg->reg_type.bitfield.dword
10892 : i.base_reg->reg_type.bitfield.word)))
be05d201
L
10893 goto bad_address;
10894
fc0763e6
JB
10895 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10896 operand_string,
10897 intel_syntax ? '[' : '(',
10898 register_prefix,
be05d201 10899 expected_reg->reg_name,
fc0763e6 10900 intel_syntax ? ']' : ')');
be05d201 10901 return 1;
fc0763e6 10902 }
be05d201
L
10903 else
10904 return 1;
10905
dc1e8a47 10906 bad_address:
be05d201
L
10907 as_bad (_("`%s' is not a valid %s expression"),
10908 operand_string, kind);
10909 return 0;
3e73aa7c
JH
10910 }
10911 else
10912 {
be05d201
L
10913 if (addr_mode != CODE_16BIT)
10914 {
10915 /* 32-bit/64-bit checks. */
10916 if ((i.base_reg
e968fc9b
JB
10917 && ((addr_mode == CODE_64BIT
10918 ? !i.base_reg->reg_type.bitfield.qword
10919 : !i.base_reg->reg_type.bitfield.dword)
10920 || (i.index_reg && i.base_reg->reg_num == RegIP)
10921 || i.base_reg->reg_num == RegIZ))
be05d201 10922 || (i.index_reg
1b54b8d7
JB
10923 && !i.index_reg->reg_type.bitfield.xmmword
10924 && !i.index_reg->reg_type.bitfield.ymmword
10925 && !i.index_reg->reg_type.bitfield.zmmword
be05d201 10926 && ((addr_mode == CODE_64BIT
e968fc9b
JB
10927 ? !i.index_reg->reg_type.bitfield.qword
10928 : !i.index_reg->reg_type.bitfield.dword)
be05d201
L
10929 || !i.index_reg->reg_type.bitfield.baseindex)))
10930 goto bad_address;
8178be5b
JB
10931
10932 /* bndmk, bndldx, and bndstx have special restrictions. */
10933 if (current_templates->start->base_opcode == 0xf30f1b
10934 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10935 {
10936 /* They cannot use RIP-relative addressing. */
e968fc9b 10937 if (i.base_reg && i.base_reg->reg_num == RegIP)
8178be5b
JB
10938 {
10939 as_bad (_("`%s' cannot be used here"), operand_string);
10940 return 0;
10941 }
10942
10943 /* bndldx and bndstx ignore their scale factor. */
10944 if (current_templates->start->base_opcode != 0xf30f1b
10945 && i.log2_scale_factor)
10946 as_warn (_("register scaling is being ignored here"));
10947 }
be05d201
L
10948 }
10949 else
3e73aa7c 10950 {
be05d201 10951 /* 16-bit checks. */
3e73aa7c 10952 if ((i.base_reg
dc821c5f 10953 && (!i.base_reg->reg_type.bitfield.word
40fb9820 10954 || !i.base_reg->reg_type.bitfield.baseindex))
3e73aa7c 10955 || (i.index_reg
dc821c5f 10956 && (!i.index_reg->reg_type.bitfield.word
40fb9820 10957 || !i.index_reg->reg_type.bitfield.baseindex
29b0f896
AM
10958 || !(i.base_reg
10959 && i.base_reg->reg_num < 6
10960 && i.index_reg->reg_num >= 6
10961 && i.log2_scale_factor == 0))))
be05d201 10962 goto bad_address;
3e73aa7c
JH
10963 }
10964 }
be05d201 10965 return 1;
24eab124 10966}
252b5132 10967
43234a1e
L
10968/* Handle vector immediates. */
10969
10970static int
10971RC_SAE_immediate (const char *imm_start)
10972{
10973 unsigned int match_found, j;
10974 const char *pstr = imm_start;
10975 expressionS *exp;
10976
10977 if (*pstr != '{')
10978 return 0;
10979
10980 pstr++;
10981 match_found = 0;
10982 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10983 {
10984 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10985 {
10986 if (!i.rounding)
10987 {
10988 rc_op.type = RC_NamesTable[j].type;
10989 rc_op.operand = this_operand;
10990 i.rounding = &rc_op;
10991 }
10992 else
10993 {
10994 as_bad (_("duplicated `%s'"), imm_start);
10995 return 0;
10996 }
10997 pstr += RC_NamesTable[j].len;
10998 match_found = 1;
10999 break;
11000 }
11001 }
11002 if (!match_found)
11003 return 0;
11004
11005 if (*pstr++ != '}')
11006 {
11007 as_bad (_("Missing '}': '%s'"), imm_start);
11008 return 0;
11009 }
11010 /* RC/SAE immediate string should contain nothing more. */;
11011 if (*pstr != 0)
11012 {
11013 as_bad (_("Junk after '}': '%s'"), imm_start);
11014 return 0;
11015 }
11016
11017 exp = &im_expressions[i.imm_operands++];
11018 i.op[this_operand].imms = exp;
11019
11020 exp->X_op = O_constant;
11021 exp->X_add_number = 0;
11022 exp->X_add_symbol = (symbolS *) 0;
11023 exp->X_op_symbol = (symbolS *) 0;
11024
11025 i.types[this_operand].bitfield.imm8 = 1;
11026 return 1;
11027}
11028
8325cc63
JB
11029/* Only string instructions can have a second memory operand, so
11030 reduce current_templates to just those if it contains any. */
11031static int
11032maybe_adjust_templates (void)
11033{
11034 const insn_template *t;
11035
11036 gas_assert (i.mem_operands == 1);
11037
11038 for (t = current_templates->start; t < current_templates->end; ++t)
11039 if (t->opcode_modifier.isstring)
11040 break;
11041
11042 if (t < current_templates->end)
11043 {
11044 static templates aux_templates;
11045 bfd_boolean recheck;
11046
11047 aux_templates.start = t;
11048 for (; t < current_templates->end; ++t)
11049 if (!t->opcode_modifier.isstring)
11050 break;
11051 aux_templates.end = t;
11052
11053 /* Determine whether to re-check the first memory operand. */
11054 recheck = (aux_templates.start != current_templates->start
11055 || t != current_templates->end);
11056
11057 current_templates = &aux_templates;
11058
11059 if (recheck)
11060 {
11061 i.mem_operands = 0;
11062 if (i.memop1_string != NULL
11063 && i386_index_check (i.memop1_string) == 0)
11064 return 0;
11065 i.mem_operands = 1;
11066 }
11067 }
11068
11069 return 1;
11070}
11071
fc0763e6 11072/* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
47926f60 11073 on error. */
252b5132 11074
252b5132 11075static int
a7619375 11076i386_att_operand (char *operand_string)
252b5132 11077{
af6bdddf
AM
11078 const reg_entry *r;
11079 char *end_op;
24eab124 11080 char *op_string = operand_string;
252b5132 11081
24eab124 11082 if (is_space_char (*op_string))
252b5132
RH
11083 ++op_string;
11084
24eab124 11085 /* We check for an absolute prefix (differentiating,
47926f60 11086 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
24eab124
AM
11087 if (*op_string == ABSOLUTE_PREFIX)
11088 {
11089 ++op_string;
11090 if (is_space_char (*op_string))
11091 ++op_string;
6f2f06be 11092 i.jumpabsolute = TRUE;
24eab124 11093 }
252b5132 11094
47926f60 11095 /* Check if operand is a register. */
4d1bb795 11096 if ((r = parse_register (op_string, &end_op)) != NULL)
24eab124 11097 {
40fb9820
L
11098 i386_operand_type temp;
11099
8a6fb3f9
JB
11100 if (r == &bad_reg)
11101 return 0;
11102
24eab124
AM
11103 /* Check for a segment override by searching for ':' after a
11104 segment register. */
11105 op_string = end_op;
11106 if (is_space_char (*op_string))
11107 ++op_string;
00cee14f 11108 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
24eab124
AM
11109 {
11110 switch (r->reg_num)
11111 {
11112 case 0:
11113 i.seg[i.mem_operands] = &es;
11114 break;
11115 case 1:
11116 i.seg[i.mem_operands] = &cs;
11117 break;
11118 case 2:
11119 i.seg[i.mem_operands] = &ss;
11120 break;
11121 case 3:
11122 i.seg[i.mem_operands] = &ds;
11123 break;
11124 case 4:
11125 i.seg[i.mem_operands] = &fs;
11126 break;
11127 case 5:
11128 i.seg[i.mem_operands] = &gs;
11129 break;
11130 }
252b5132 11131
24eab124 11132 /* Skip the ':' and whitespace. */
252b5132
RH
11133 ++op_string;
11134 if (is_space_char (*op_string))
24eab124 11135 ++op_string;
252b5132 11136
24eab124
AM
11137 if (!is_digit_char (*op_string)
11138 && !is_identifier_char (*op_string)
11139 && *op_string != '('
11140 && *op_string != ABSOLUTE_PREFIX)
11141 {
11142 as_bad (_("bad memory operand `%s'"), op_string);
11143 return 0;
11144 }
47926f60 11145 /* Handle case of %es:*foo. */
24eab124
AM
11146 if (*op_string == ABSOLUTE_PREFIX)
11147 {
11148 ++op_string;
11149 if (is_space_char (*op_string))
11150 ++op_string;
6f2f06be 11151 i.jumpabsolute = TRUE;
24eab124
AM
11152 }
11153 goto do_memory_reference;
11154 }
43234a1e
L
11155
11156 /* Handle vector operations. */
11157 if (*op_string == '{')
11158 {
11159 op_string = check_VecOperations (op_string, NULL);
11160 if (op_string == NULL)
11161 return 0;
11162 }
11163
24eab124
AM
11164 if (*op_string)
11165 {
d0b47220 11166 as_bad (_("junk `%s' after register"), op_string);
24eab124
AM
11167 return 0;
11168 }
40fb9820
L
11169 temp = r->reg_type;
11170 temp.bitfield.baseindex = 0;
c6fb90c8
L
11171 i.types[this_operand] = operand_type_or (i.types[this_operand],
11172 temp);
7d5e4556 11173 i.types[this_operand].bitfield.unspecified = 0;
520dc8e8 11174 i.op[this_operand].regs = r;
24eab124
AM
11175 i.reg_operands++;
11176 }
af6bdddf
AM
11177 else if (*op_string == REGISTER_PREFIX)
11178 {
11179 as_bad (_("bad register name `%s'"), op_string);
11180 return 0;
11181 }
24eab124 11182 else if (*op_string == IMMEDIATE_PREFIX)
ce8a8b2f 11183 {
24eab124 11184 ++op_string;
6f2f06be 11185 if (i.jumpabsolute)
24eab124 11186 {
d0b47220 11187 as_bad (_("immediate operand illegal with absolute jump"));
24eab124
AM
11188 return 0;
11189 }
11190 if (!i386_immediate (op_string))
11191 return 0;
11192 }
43234a1e
L
11193 else if (RC_SAE_immediate (operand_string))
11194 {
11195 /* If it is a RC or SAE immediate, do nothing. */
11196 ;
11197 }
24eab124
AM
11198 else if (is_digit_char (*op_string)
11199 || is_identifier_char (*op_string)
d02603dc 11200 || *op_string == '"'
e5cb08ac 11201 || *op_string == '(')
24eab124 11202 {
47926f60 11203 /* This is a memory reference of some sort. */
af6bdddf 11204 char *base_string;
252b5132 11205
47926f60 11206 /* Start and end of displacement string expression (if found). */
eecb386c
AM
11207 char *displacement_string_start;
11208 char *displacement_string_end;
43234a1e 11209 char *vop_start;
252b5132 11210
24eab124 11211 do_memory_reference:
8325cc63
JB
11212 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11213 return 0;
24eab124 11214 if ((i.mem_operands == 1
40fb9820 11215 && !current_templates->start->opcode_modifier.isstring)
24eab124
AM
11216 || i.mem_operands == 2)
11217 {
11218 as_bad (_("too many memory references for `%s'"),
11219 current_templates->start->name);
11220 return 0;
11221 }
252b5132 11222
24eab124
AM
11223 /* Check for base index form. We detect the base index form by
11224 looking for an ')' at the end of the operand, searching
11225 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11226 after the '('. */
af6bdddf 11227 base_string = op_string + strlen (op_string);
c3332e24 11228
43234a1e
L
11229 /* Handle vector operations. */
11230 vop_start = strchr (op_string, '{');
11231 if (vop_start && vop_start < base_string)
11232 {
11233 if (check_VecOperations (vop_start, base_string) == NULL)
11234 return 0;
11235 base_string = vop_start;
11236 }
11237
af6bdddf
AM
11238 --base_string;
11239 if (is_space_char (*base_string))
11240 --base_string;
252b5132 11241
47926f60 11242 /* If we only have a displacement, set-up for it to be parsed later. */
af6bdddf
AM
11243 displacement_string_start = op_string;
11244 displacement_string_end = base_string + 1;
252b5132 11245
24eab124
AM
11246 if (*base_string == ')')
11247 {
af6bdddf 11248 char *temp_string;
24eab124
AM
11249 unsigned int parens_balanced = 1;
11250 /* We've already checked that the number of left & right ()'s are
47926f60 11251 equal, so this loop will not be infinite. */
24eab124
AM
11252 do
11253 {
11254 base_string--;
11255 if (*base_string == ')')
11256 parens_balanced++;
11257 if (*base_string == '(')
11258 parens_balanced--;
11259 }
11260 while (parens_balanced);
c3332e24 11261
af6bdddf 11262 temp_string = base_string;
c3332e24 11263
24eab124 11264 /* Skip past '(' and whitespace. */
252b5132
RH
11265 ++base_string;
11266 if (is_space_char (*base_string))
24eab124 11267 ++base_string;
252b5132 11268
af6bdddf 11269 if (*base_string == ','
4eed87de
AM
11270 || ((i.base_reg = parse_register (base_string, &end_op))
11271 != NULL))
252b5132 11272 {
af6bdddf 11273 displacement_string_end = temp_string;
252b5132 11274
40fb9820 11275 i.types[this_operand].bitfield.baseindex = 1;
252b5132 11276
af6bdddf 11277 if (i.base_reg)
24eab124 11278 {
8a6fb3f9
JB
11279 if (i.base_reg == &bad_reg)
11280 return 0;
24eab124
AM
11281 base_string = end_op;
11282 if (is_space_char (*base_string))
11283 ++base_string;
af6bdddf
AM
11284 }
11285
11286 /* There may be an index reg or scale factor here. */
11287 if (*base_string == ',')
11288 {
11289 ++base_string;
11290 if (is_space_char (*base_string))
11291 ++base_string;
11292
4eed87de
AM
11293 if ((i.index_reg = parse_register (base_string, &end_op))
11294 != NULL)
24eab124 11295 {
8a6fb3f9
JB
11296 if (i.index_reg == &bad_reg)
11297 return 0;
af6bdddf 11298 base_string = end_op;
24eab124
AM
11299 if (is_space_char (*base_string))
11300 ++base_string;
af6bdddf
AM
11301 if (*base_string == ',')
11302 {
11303 ++base_string;
11304 if (is_space_char (*base_string))
11305 ++base_string;
11306 }
e5cb08ac 11307 else if (*base_string != ')')
af6bdddf 11308 {
4eed87de
AM
11309 as_bad (_("expecting `,' or `)' "
11310 "after index register in `%s'"),
af6bdddf
AM
11311 operand_string);
11312 return 0;
11313 }
24eab124 11314 }
af6bdddf 11315 else if (*base_string == REGISTER_PREFIX)
24eab124 11316 {
f76bf5e0
L
11317 end_op = strchr (base_string, ',');
11318 if (end_op)
11319 *end_op = '\0';
af6bdddf 11320 as_bad (_("bad register name `%s'"), base_string);
24eab124
AM
11321 return 0;
11322 }
252b5132 11323
47926f60 11324 /* Check for scale factor. */
551c1ca1 11325 if (*base_string != ')')
af6bdddf 11326 {
551c1ca1
AM
11327 char *end_scale = i386_scale (base_string);
11328
11329 if (!end_scale)
af6bdddf 11330 return 0;
24eab124 11331
551c1ca1 11332 base_string = end_scale;
af6bdddf
AM
11333 if (is_space_char (*base_string))
11334 ++base_string;
11335 if (*base_string != ')')
11336 {
4eed87de
AM
11337 as_bad (_("expecting `)' "
11338 "after scale factor in `%s'"),
af6bdddf
AM
11339 operand_string);
11340 return 0;
11341 }
11342 }
11343 else if (!i.index_reg)
24eab124 11344 {
4eed87de
AM
11345 as_bad (_("expecting index register or scale factor "
11346 "after `,'; got '%c'"),
af6bdddf 11347 *base_string);
24eab124
AM
11348 return 0;
11349 }
11350 }
af6bdddf 11351 else if (*base_string != ')')
24eab124 11352 {
4eed87de
AM
11353 as_bad (_("expecting `,' or `)' "
11354 "after base register in `%s'"),
af6bdddf 11355 operand_string);
24eab124
AM
11356 return 0;
11357 }
c3332e24 11358 }
af6bdddf 11359 else if (*base_string == REGISTER_PREFIX)
c3332e24 11360 {
f76bf5e0
L
11361 end_op = strchr (base_string, ',');
11362 if (end_op)
11363 *end_op = '\0';
af6bdddf 11364 as_bad (_("bad register name `%s'"), base_string);
24eab124 11365 return 0;
c3332e24 11366 }
24eab124
AM
11367 }
11368
11369 /* If there's an expression beginning the operand, parse it,
11370 assuming displacement_string_start and
11371 displacement_string_end are meaningful. */
11372 if (displacement_string_start != displacement_string_end)
11373 {
11374 if (!i386_displacement (displacement_string_start,
11375 displacement_string_end))
11376 return 0;
11377 }
11378
11379 /* Special case for (%dx) while doing input/output op. */
11380 if (i.base_reg
75e5731b
JB
11381 && i.base_reg->reg_type.bitfield.instance == RegD
11382 && i.base_reg->reg_type.bitfield.word
24eab124
AM
11383 && i.index_reg == 0
11384 && i.log2_scale_factor == 0
11385 && i.seg[i.mem_operands] == 0
40fb9820 11386 && !operand_type_check (i.types[this_operand], disp))
24eab124 11387 {
2fb5be8d 11388 i.types[this_operand] = i.base_reg->reg_type;
24eab124
AM
11389 return 1;
11390 }
11391
eecb386c
AM
11392 if (i386_index_check (operand_string) == 0)
11393 return 0;
c48dadc9 11394 i.flags[this_operand] |= Operand_Mem;
8325cc63
JB
11395 if (i.mem_operands == 0)
11396 i.memop1_string = xstrdup (operand_string);
24eab124
AM
11397 i.mem_operands++;
11398 }
11399 else
ce8a8b2f
AM
11400 {
11401 /* It's not a memory operand; argh! */
24eab124
AM
11402 as_bad (_("invalid char %s beginning operand %d `%s'"),
11403 output_invalid (*op_string),
11404 this_operand + 1,
11405 op_string);
11406 return 0;
11407 }
47926f60 11408 return 1; /* Normal return. */
252b5132
RH
11409}
11410\f
fa94de6b
RM
11411/* Calculate the maximum variable size (i.e., excluding fr_fix)
11412 that an rs_machine_dependent frag may reach. */
11413
11414unsigned int
11415i386_frag_max_var (fragS *frag)
11416{
11417 /* The only relaxable frags are for jumps.
11418 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11419 gas_assert (frag->fr_type == rs_machine_dependent);
11420 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11421}
11422
b084df0b
L
11423#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11424static int
8dcea932 11425elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
b084df0b
L
11426{
11427 /* STT_GNU_IFUNC symbol must go through PLT. */
11428 if ((symbol_get_bfdsym (fr_symbol)->flags
11429 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11430 return 0;
11431
11432 if (!S_IS_EXTERNAL (fr_symbol))
11433 /* Symbol may be weak or local. */
11434 return !S_IS_WEAK (fr_symbol);
11435
8dcea932
L
11436 /* Global symbols with non-default visibility can't be preempted. */
11437 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11438 return 1;
11439
11440 if (fr_var != NO_RELOC)
11441 switch ((enum bfd_reloc_code_real) fr_var)
11442 {
11443 case BFD_RELOC_386_PLT32:
11444 case BFD_RELOC_X86_64_PLT32:
33eaf5de 11445 /* Symbol with PLT relocation may be preempted. */
8dcea932
L
11446 return 0;
11447 default:
11448 abort ();
11449 }
11450
b084df0b
L
11451 /* Global symbols with default visibility in a shared library may be
11452 preempted by another definition. */
8dcea932 11453 return !shared;
b084df0b
L
11454}
11455#endif
11456
79d72f45
HL
11457/* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11458 Note also work for Skylake and Cascadelake.
11459---------------------------------------------------------------------
11460| JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11461| ------ | ----------- | ------- | -------- |
11462| Jo | N | N | Y |
11463| Jno | N | N | Y |
11464| Jc/Jb | Y | N | Y |
11465| Jae/Jnb | Y | N | Y |
11466| Je/Jz | Y | Y | Y |
11467| Jne/Jnz | Y | Y | Y |
11468| Jna/Jbe | Y | N | Y |
11469| Ja/Jnbe | Y | N | Y |
11470| Js | N | N | Y |
11471| Jns | N | N | Y |
11472| Jp/Jpe | N | N | Y |
11473| Jnp/Jpo | N | N | Y |
11474| Jl/Jnge | Y | Y | Y |
11475| Jge/Jnl | Y | Y | Y |
11476| Jle/Jng | Y | Y | Y |
11477| Jg/Jnle | Y | Y | Y |
11478--------------------------------------------------------------------- */
11479static int
11480i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11481{
11482 if (mf_cmp == mf_cmp_alu_cmp)
11483 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11484 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11485 if (mf_cmp == mf_cmp_incdec)
11486 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11487 || mf_jcc == mf_jcc_jle);
11488 if (mf_cmp == mf_cmp_test_and)
11489 return 1;
11490 return 0;
11491}
11492
e379e5f3
L
11493/* Return the next non-empty frag. */
11494
11495static fragS *
11496i386_next_non_empty_frag (fragS *fragP)
11497{
11498 /* There may be a frag with a ".fill 0" when there is no room in
11499 the current frag for frag_grow in output_insn. */
11500 for (fragP = fragP->fr_next;
11501 (fragP != NULL
11502 && fragP->fr_type == rs_fill
11503 && fragP->fr_fix == 0);
11504 fragP = fragP->fr_next)
11505 ;
11506 return fragP;
11507}
11508
11509/* Return the next jcc frag after BRANCH_PADDING. */
11510
11511static fragS *
79d72f45 11512i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
e379e5f3 11513{
79d72f45
HL
11514 fragS *branch_fragP;
11515 if (!pad_fragP)
e379e5f3
L
11516 return NULL;
11517
79d72f45
HL
11518 if (pad_fragP->fr_type == rs_machine_dependent
11519 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
e379e5f3
L
11520 == BRANCH_PADDING))
11521 {
79d72f45
HL
11522 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11523 if (branch_fragP->fr_type != rs_machine_dependent)
e379e5f3 11524 return NULL;
79d72f45
HL
11525 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11526 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11527 pad_fragP->tc_frag_data.mf_type))
11528 return branch_fragP;
e379e5f3
L
11529 }
11530
11531 return NULL;
11532}
11533
11534/* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11535
11536static void
11537i386_classify_machine_dependent_frag (fragS *fragP)
11538{
11539 fragS *cmp_fragP;
11540 fragS *pad_fragP;
11541 fragS *branch_fragP;
11542 fragS *next_fragP;
11543 unsigned int max_prefix_length;
11544
11545 if (fragP->tc_frag_data.classified)
11546 return;
11547
11548 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11549 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11550 for (next_fragP = fragP;
11551 next_fragP != NULL;
11552 next_fragP = next_fragP->fr_next)
11553 {
11554 next_fragP->tc_frag_data.classified = 1;
11555 if (next_fragP->fr_type == rs_machine_dependent)
11556 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11557 {
11558 case BRANCH_PADDING:
11559 /* The BRANCH_PADDING frag must be followed by a branch
11560 frag. */
11561 branch_fragP = i386_next_non_empty_frag (next_fragP);
11562 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11563 break;
11564 case FUSED_JCC_PADDING:
11565 /* Check if this is a fused jcc:
11566 FUSED_JCC_PADDING
11567 CMP like instruction
11568 BRANCH_PADDING
11569 COND_JUMP
11570 */
11571 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11572 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
79d72f45 11573 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
e379e5f3
L
11574 if (branch_fragP)
11575 {
11576 /* The BRANCH_PADDING frag is merged with the
11577 FUSED_JCC_PADDING frag. */
11578 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11579 /* CMP like instruction size. */
11580 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11581 frag_wane (pad_fragP);
11582 /* Skip to branch_fragP. */
11583 next_fragP = branch_fragP;
11584 }
11585 else if (next_fragP->tc_frag_data.max_prefix_length)
11586 {
11587 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11588 a fused jcc. */
11589 next_fragP->fr_subtype
11590 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11591 next_fragP->tc_frag_data.max_bytes
11592 = next_fragP->tc_frag_data.max_prefix_length;
11593 /* This will be updated in the BRANCH_PREFIX scan. */
11594 next_fragP->tc_frag_data.max_prefix_length = 0;
11595 }
11596 else
11597 frag_wane (next_fragP);
11598 break;
11599 }
11600 }
11601
11602 /* Stop if there is no BRANCH_PREFIX. */
11603 if (!align_branch_prefix_size)
11604 return;
11605
11606 /* Scan for BRANCH_PREFIX. */
11607 for (; fragP != NULL; fragP = fragP->fr_next)
11608 {
11609 if (fragP->fr_type != rs_machine_dependent
11610 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11611 != BRANCH_PREFIX))
11612 continue;
11613
11614 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11615 COND_JUMP_PREFIX. */
11616 max_prefix_length = 0;
11617 for (next_fragP = fragP;
11618 next_fragP != NULL;
11619 next_fragP = next_fragP->fr_next)
11620 {
11621 if (next_fragP->fr_type == rs_fill)
11622 /* Skip rs_fill frags. */
11623 continue;
11624 else if (next_fragP->fr_type != rs_machine_dependent)
11625 /* Stop for all other frags. */
11626 break;
11627
11628 /* rs_machine_dependent frags. */
11629 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11630 == BRANCH_PREFIX)
11631 {
11632 /* Count BRANCH_PREFIX frags. */
11633 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11634 {
11635 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11636 frag_wane (next_fragP);
11637 }
11638 else
11639 max_prefix_length
11640 += next_fragP->tc_frag_data.max_bytes;
11641 }
11642 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11643 == BRANCH_PADDING)
11644 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11645 == FUSED_JCC_PADDING))
11646 {
11647 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11648 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11649 break;
11650 }
11651 else
11652 /* Stop for other rs_machine_dependent frags. */
11653 break;
11654 }
11655
11656 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11657
11658 /* Skip to the next frag. */
11659 fragP = next_fragP;
11660 }
11661}
11662
11663/* Compute padding size for
11664
11665 FUSED_JCC_PADDING
11666 CMP like instruction
11667 BRANCH_PADDING
11668 COND_JUMP/UNCOND_JUMP
11669
11670 or
11671
11672 BRANCH_PADDING
11673 COND_JUMP/UNCOND_JUMP
11674 */
11675
11676static int
11677i386_branch_padding_size (fragS *fragP, offsetT address)
11678{
11679 unsigned int offset, size, padding_size;
11680 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11681
11682 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11683 if (!address)
11684 address = fragP->fr_address;
11685 address += fragP->fr_fix;
11686
11687 /* CMP like instrunction size. */
11688 size = fragP->tc_frag_data.cmp_size;
11689
11690 /* The base size of the branch frag. */
11691 size += branch_fragP->fr_fix;
11692
11693 /* Add opcode and displacement bytes for the rs_machine_dependent
11694 branch frag. */
11695 if (branch_fragP->fr_type == rs_machine_dependent)
11696 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11697
11698 /* Check if branch is within boundary and doesn't end at the last
11699 byte. */
11700 offset = address & ((1U << align_branch_power) - 1);
11701 if ((offset + size) >= (1U << align_branch_power))
11702 /* Padding needed to avoid crossing boundary. */
11703 padding_size = (1U << align_branch_power) - offset;
11704 else
11705 /* No padding needed. */
11706 padding_size = 0;
11707
11708 /* The return value may be saved in tc_frag_data.length which is
11709 unsigned byte. */
11710 if (!fits_in_unsigned_byte (padding_size))
11711 abort ();
11712
11713 return padding_size;
11714}
11715
11716/* i386_generic_table_relax_frag()
11717
11718 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11719 grow/shrink padding to align branch frags. Hand others to
11720 relax_frag(). */
11721
11722long
11723i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11724{
11725 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11726 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11727 {
11728 long padding_size = i386_branch_padding_size (fragP, 0);
11729 long grow = padding_size - fragP->tc_frag_data.length;
11730
11731 /* When the BRANCH_PREFIX frag is used, the computed address
11732 must match the actual address and there should be no padding. */
11733 if (fragP->tc_frag_data.padding_address
11734 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11735 || padding_size))
11736 abort ();
11737
11738 /* Update the padding size. */
11739 if (grow)
11740 fragP->tc_frag_data.length = padding_size;
11741
11742 return grow;
11743 }
11744 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11745 {
11746 fragS *padding_fragP, *next_fragP;
11747 long padding_size, left_size, last_size;
11748
11749 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11750 if (!padding_fragP)
11751 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11752 return (fragP->tc_frag_data.length
11753 - fragP->tc_frag_data.last_length);
11754
11755 /* Compute the relative address of the padding frag in the very
11756 first time where the BRANCH_PREFIX frag sizes are zero. */
11757 if (!fragP->tc_frag_data.padding_address)
11758 fragP->tc_frag_data.padding_address
11759 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11760
11761 /* First update the last length from the previous interation. */
11762 left_size = fragP->tc_frag_data.prefix_length;
11763 for (next_fragP = fragP;
11764 next_fragP != padding_fragP;
11765 next_fragP = next_fragP->fr_next)
11766 if (next_fragP->fr_type == rs_machine_dependent
11767 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11768 == BRANCH_PREFIX))
11769 {
11770 if (left_size)
11771 {
11772 int max = next_fragP->tc_frag_data.max_bytes;
11773 if (max)
11774 {
11775 int size;
11776 if (max > left_size)
11777 size = left_size;
11778 else
11779 size = max;
11780 left_size -= size;
11781 next_fragP->tc_frag_data.last_length = size;
11782 }
11783 }
11784 else
11785 next_fragP->tc_frag_data.last_length = 0;
11786 }
11787
11788 /* Check the padding size for the padding frag. */
11789 padding_size = i386_branch_padding_size
11790 (padding_fragP, (fragP->fr_address
11791 + fragP->tc_frag_data.padding_address));
11792
11793 last_size = fragP->tc_frag_data.prefix_length;
11794 /* Check if there is change from the last interation. */
11795 if (padding_size == last_size)
11796 {
11797 /* Update the expected address of the padding frag. */
11798 padding_fragP->tc_frag_data.padding_address
11799 = (fragP->fr_address + padding_size
11800 + fragP->tc_frag_data.padding_address);
11801 return 0;
11802 }
11803
11804 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11805 {
11806 /* No padding if there is no sufficient room. Clear the
11807 expected address of the padding frag. */
11808 padding_fragP->tc_frag_data.padding_address = 0;
11809 padding_size = 0;
11810 }
11811 else
11812 /* Store the expected address of the padding frag. */
11813 padding_fragP->tc_frag_data.padding_address
11814 = (fragP->fr_address + padding_size
11815 + fragP->tc_frag_data.padding_address);
11816
11817 fragP->tc_frag_data.prefix_length = padding_size;
11818
11819 /* Update the length for the current interation. */
11820 left_size = padding_size;
11821 for (next_fragP = fragP;
11822 next_fragP != padding_fragP;
11823 next_fragP = next_fragP->fr_next)
11824 if (next_fragP->fr_type == rs_machine_dependent
11825 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11826 == BRANCH_PREFIX))
11827 {
11828 if (left_size)
11829 {
11830 int max = next_fragP->tc_frag_data.max_bytes;
11831 if (max)
11832 {
11833 int size;
11834 if (max > left_size)
11835 size = left_size;
11836 else
11837 size = max;
11838 left_size -= size;
11839 next_fragP->tc_frag_data.length = size;
11840 }
11841 }
11842 else
11843 next_fragP->tc_frag_data.length = 0;
11844 }
11845
11846 return (fragP->tc_frag_data.length
11847 - fragP->tc_frag_data.last_length);
11848 }
11849 return relax_frag (segment, fragP, stretch);
11850}
11851
ee7fcc42
AM
11852/* md_estimate_size_before_relax()
11853
11854 Called just before relax() for rs_machine_dependent frags. The x86
11855 assembler uses these frags to handle variable size jump
11856 instructions.
11857
11858 Any symbol that is now undefined will not become defined.
11859 Return the correct fr_subtype in the frag.
11860 Return the initial "guess for variable size of frag" to caller.
11861 The guess is actually the growth beyond the fixed part. Whatever
11862 we do to grow the fixed or variable part contributes to our
11863 returned value. */
11864
252b5132 11865int
7016a5d5 11866md_estimate_size_before_relax (fragS *fragP, segT segment)
252b5132 11867{
e379e5f3
L
11868 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11869 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11870 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11871 {
11872 i386_classify_machine_dependent_frag (fragP);
11873 return fragP->tc_frag_data.length;
11874 }
11875
252b5132 11876 /* We've already got fragP->fr_subtype right; all we have to do is
b98ef147
AM
11877 check for un-relaxable symbols. On an ELF system, we can't relax
11878 an externally visible symbol, because it may be overridden by a
11879 shared library. */
11880 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
6d249963 11881#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 11882 || (IS_ELF
8dcea932
L
11883 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11884 fragP->fr_var))
fbeb56a4
DK
11885#endif
11886#if defined (OBJ_COFF) && defined (TE_PE)
7ab9ffdd 11887 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
fbeb56a4 11888 && S_IS_WEAK (fragP->fr_symbol))
b98ef147
AM
11889#endif
11890 )
252b5132 11891 {
b98ef147
AM
11892 /* Symbol is undefined in this segment, or we need to keep a
11893 reloc so that weak symbols can be overridden. */
11894 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
f86103b7 11895 enum bfd_reloc_code_real reloc_type;
ee7fcc42
AM
11896 unsigned char *opcode;
11897 int old_fr_fix;
f6af82bd 11898
ee7fcc42 11899 if (fragP->fr_var != NO_RELOC)
1e9cc1c2 11900 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
b98ef147 11901 else if (size == 2)
f6af82bd 11902 reloc_type = BFD_RELOC_16_PCREL;
bd7ab16b
L
11903#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11904 else if (need_plt32_p (fragP->fr_symbol))
11905 reloc_type = BFD_RELOC_X86_64_PLT32;
11906#endif
f6af82bd
AM
11907 else
11908 reloc_type = BFD_RELOC_32_PCREL;
252b5132 11909
ee7fcc42
AM
11910 old_fr_fix = fragP->fr_fix;
11911 opcode = (unsigned char *) fragP->fr_opcode;
11912
fddf5b5b 11913 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
252b5132 11914 {
fddf5b5b
AM
11915 case UNCOND_JUMP:
11916 /* Make jmp (0xeb) a (d)word displacement jump. */
47926f60 11917 opcode[0] = 0xe9;
252b5132 11918 fragP->fr_fix += size;
062cd5e7
AS
11919 fix_new (fragP, old_fr_fix, size,
11920 fragP->fr_symbol,
11921 fragP->fr_offset, 1,
11922 reloc_type);
252b5132
RH
11923 break;
11924
fddf5b5b 11925 case COND_JUMP86:
412167cb
AM
11926 if (size == 2
11927 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
fddf5b5b
AM
11928 {
11929 /* Negate the condition, and branch past an
11930 unconditional jump. */
11931 opcode[0] ^= 1;
11932 opcode[1] = 3;
11933 /* Insert an unconditional jump. */
11934 opcode[2] = 0xe9;
11935 /* We added two extra opcode bytes, and have a two byte
11936 offset. */
11937 fragP->fr_fix += 2 + 2;
062cd5e7
AS
11938 fix_new (fragP, old_fr_fix + 2, 2,
11939 fragP->fr_symbol,
11940 fragP->fr_offset, 1,
11941 reloc_type);
fddf5b5b
AM
11942 break;
11943 }
11944 /* Fall through. */
11945
11946 case COND_JUMP:
412167cb
AM
11947 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11948 {
3e02c1cc
AM
11949 fixS *fixP;
11950
412167cb 11951 fragP->fr_fix += 1;
3e02c1cc
AM
11952 fixP = fix_new (fragP, old_fr_fix, 1,
11953 fragP->fr_symbol,
11954 fragP->fr_offset, 1,
11955 BFD_RELOC_8_PCREL);
11956 fixP->fx_signed = 1;
412167cb
AM
11957 break;
11958 }
93c2a809 11959
24eab124 11960 /* This changes the byte-displacement jump 0x7N
fddf5b5b 11961 to the (d)word-displacement jump 0x0f,0x8N. */
252b5132 11962 opcode[1] = opcode[0] + 0x10;
f6af82bd 11963 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
47926f60
KH
11964 /* We've added an opcode byte. */
11965 fragP->fr_fix += 1 + size;
062cd5e7
AS
11966 fix_new (fragP, old_fr_fix + 1, size,
11967 fragP->fr_symbol,
11968 fragP->fr_offset, 1,
11969 reloc_type);
252b5132 11970 break;
fddf5b5b
AM
11971
11972 default:
11973 BAD_CASE (fragP->fr_subtype);
11974 break;
252b5132
RH
11975 }
11976 frag_wane (fragP);
ee7fcc42 11977 return fragP->fr_fix - old_fr_fix;
252b5132 11978 }
93c2a809 11979
93c2a809
AM
11980 /* Guess size depending on current relax state. Initially the relax
11981 state will correspond to a short jump and we return 1, because
11982 the variable part of the frag (the branch offset) is one byte
11983 long. However, we can relax a section more than once and in that
11984 case we must either set fr_subtype back to the unrelaxed state,
11985 or return the value for the appropriate branch. */
11986 return md_relax_table[fragP->fr_subtype].rlx_length;
ee7fcc42
AM
11987}
11988
47926f60
KH
11989/* Called after relax() is finished.
11990
11991 In: Address of frag.
11992 fr_type == rs_machine_dependent.
11993 fr_subtype is what the address relaxed to.
11994
11995 Out: Any fixSs and constants are set up.
11996 Caller will turn frag into a ".space 0". */
11997
252b5132 11998void
7016a5d5
TG
11999md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12000 fragS *fragP)
252b5132 12001{
29b0f896 12002 unsigned char *opcode;
252b5132 12003 unsigned char *where_to_put_displacement = NULL;
847f7ad4
AM
12004 offsetT target_address;
12005 offsetT opcode_address;
252b5132 12006 unsigned int extension = 0;
847f7ad4 12007 offsetT displacement_from_opcode_start;
252b5132 12008
e379e5f3
L
12009 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12010 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12011 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12012 {
12013 /* Generate nop padding. */
12014 unsigned int size = fragP->tc_frag_data.length;
12015 if (size)
12016 {
12017 if (size > fragP->tc_frag_data.max_bytes)
12018 abort ();
12019
12020 if (flag_debug)
12021 {
12022 const char *msg;
12023 const char *branch = "branch";
12024 const char *prefix = "";
12025 fragS *padding_fragP;
12026 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12027 == BRANCH_PREFIX)
12028 {
12029 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12030 switch (fragP->tc_frag_data.default_prefix)
12031 {
12032 default:
12033 abort ();
12034 break;
12035 case CS_PREFIX_OPCODE:
12036 prefix = " cs";
12037 break;
12038 case DS_PREFIX_OPCODE:
12039 prefix = " ds";
12040 break;
12041 case ES_PREFIX_OPCODE:
12042 prefix = " es";
12043 break;
12044 case FS_PREFIX_OPCODE:
12045 prefix = " fs";
12046 break;
12047 case GS_PREFIX_OPCODE:
12048 prefix = " gs";
12049 break;
12050 case SS_PREFIX_OPCODE:
12051 prefix = " ss";
12052 break;
12053 }
12054 if (padding_fragP)
12055 msg = _("%s:%u: add %d%s at 0x%llx to align "
12056 "%s within %d-byte boundary\n");
12057 else
12058 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12059 "align %s within %d-byte boundary\n");
12060 }
12061 else
12062 {
12063 padding_fragP = fragP;
12064 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12065 "%s within %d-byte boundary\n");
12066 }
12067
12068 if (padding_fragP)
12069 switch (padding_fragP->tc_frag_data.branch_type)
12070 {
12071 case align_branch_jcc:
12072 branch = "jcc";
12073 break;
12074 case align_branch_fused:
12075 branch = "fused jcc";
12076 break;
12077 case align_branch_jmp:
12078 branch = "jmp";
12079 break;
12080 case align_branch_call:
12081 branch = "call";
12082 break;
12083 case align_branch_indirect:
12084 branch = "indiret branch";
12085 break;
12086 case align_branch_ret:
12087 branch = "ret";
12088 break;
12089 default:
12090 break;
12091 }
12092
12093 fprintf (stdout, msg,
12094 fragP->fr_file, fragP->fr_line, size, prefix,
12095 (long long) fragP->fr_address, branch,
12096 1 << align_branch_power);
12097 }
12098 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12099 memset (fragP->fr_opcode,
12100 fragP->tc_frag_data.default_prefix, size);
12101 else
12102 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12103 size, 0);
12104 fragP->fr_fix += size;
12105 }
12106 return;
12107 }
12108
252b5132
RH
12109 opcode = (unsigned char *) fragP->fr_opcode;
12110
47926f60 12111 /* Address we want to reach in file space. */
252b5132 12112 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
252b5132 12113
47926f60 12114 /* Address opcode resides at in file space. */
252b5132
RH
12115 opcode_address = fragP->fr_address + fragP->fr_fix;
12116
47926f60 12117 /* Displacement from opcode start to fill into instruction. */
252b5132
RH
12118 displacement_from_opcode_start = target_address - opcode_address;
12119
fddf5b5b 12120 if ((fragP->fr_subtype & BIG) == 0)
252b5132 12121 {
47926f60
KH
12122 /* Don't have to change opcode. */
12123 extension = 1; /* 1 opcode + 1 displacement */
252b5132 12124 where_to_put_displacement = &opcode[1];
fddf5b5b
AM
12125 }
12126 else
12127 {
12128 if (no_cond_jump_promotion
12129 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4eed87de
AM
12130 as_warn_where (fragP->fr_file, fragP->fr_line,
12131 _("long jump required"));
252b5132 12132
fddf5b5b
AM
12133 switch (fragP->fr_subtype)
12134 {
12135 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12136 extension = 4; /* 1 opcode + 4 displacement */
12137 opcode[0] = 0xe9;
12138 where_to_put_displacement = &opcode[1];
12139 break;
252b5132 12140
fddf5b5b
AM
12141 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12142 extension = 2; /* 1 opcode + 2 displacement */
12143 opcode[0] = 0xe9;
12144 where_to_put_displacement = &opcode[1];
12145 break;
252b5132 12146
fddf5b5b
AM
12147 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12148 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12149 extension = 5; /* 2 opcode + 4 displacement */
12150 opcode[1] = opcode[0] + 0x10;
12151 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12152 where_to_put_displacement = &opcode[2];
12153 break;
252b5132 12154
fddf5b5b
AM
12155 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12156 extension = 3; /* 2 opcode + 2 displacement */
12157 opcode[1] = opcode[0] + 0x10;
12158 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12159 where_to_put_displacement = &opcode[2];
12160 break;
252b5132 12161
fddf5b5b
AM
12162 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12163 extension = 4;
12164 opcode[0] ^= 1;
12165 opcode[1] = 3;
12166 opcode[2] = 0xe9;
12167 where_to_put_displacement = &opcode[3];
12168 break;
12169
12170 default:
12171 BAD_CASE (fragP->fr_subtype);
12172 break;
12173 }
252b5132 12174 }
fddf5b5b 12175
7b81dfbb
AJ
12176 /* If size if less then four we are sure that the operand fits,
12177 but if it's 4, then it could be that the displacement is larger
12178 then -/+ 2GB. */
12179 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12180 && object_64bit
12181 && ((addressT) (displacement_from_opcode_start - extension
4eed87de
AM
12182 + ((addressT) 1 << 31))
12183 > (((addressT) 2 << 31) - 1)))
7b81dfbb
AJ
12184 {
12185 as_bad_where (fragP->fr_file, fragP->fr_line,
12186 _("jump target out of range"));
12187 /* Make us emit 0. */
12188 displacement_from_opcode_start = extension;
12189 }
47926f60 12190 /* Now put displacement after opcode. */
252b5132
RH
12191 md_number_to_chars ((char *) where_to_put_displacement,
12192 (valueT) (displacement_from_opcode_start - extension),
fddf5b5b 12193 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
252b5132
RH
12194 fragP->fr_fix += extension;
12195}
12196\f
7016a5d5 12197/* Apply a fixup (fixP) to segment data, once it has been determined
252b5132
RH
12198 by our caller that we have all the info we need to fix it up.
12199
7016a5d5
TG
12200 Parameter valP is the pointer to the value of the bits.
12201
252b5132
RH
12202 On the 386, immediates, displacements, and data pointers are all in
12203 the same (little-endian) format, so we don't need to care about which
12204 we are handling. */
12205
94f592af 12206void
7016a5d5 12207md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
252b5132 12208{
94f592af 12209 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
c6682705 12210 valueT value = *valP;
252b5132 12211
f86103b7 12212#if !defined (TE_Mach)
93382f6d
AM
12213 if (fixP->fx_pcrel)
12214 {
12215 switch (fixP->fx_r_type)
12216 {
5865bb77
ILT
12217 default:
12218 break;
12219
d6ab8113
JB
12220 case BFD_RELOC_64:
12221 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12222 break;
93382f6d 12223 case BFD_RELOC_32:
ae8887b5 12224 case BFD_RELOC_X86_64_32S:
93382f6d
AM
12225 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12226 break;
12227 case BFD_RELOC_16:
12228 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12229 break;
12230 case BFD_RELOC_8:
12231 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12232 break;
12233 }
12234 }
252b5132 12235
a161fe53 12236 if (fixP->fx_addsy != NULL
31312f95 12237 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
d6ab8113 12238 || fixP->fx_r_type == BFD_RELOC_64_PCREL
31312f95 12239 || fixP->fx_r_type == BFD_RELOC_16_PCREL
d258b828 12240 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
31312f95 12241 && !use_rela_relocations)
252b5132 12242 {
31312f95
AM
12243 /* This is a hack. There should be a better way to handle this.
12244 This covers for the fact that bfd_install_relocation will
12245 subtract the current location (for partial_inplace, PC relative
12246 relocations); see more below. */
252b5132 12247#ifndef OBJ_AOUT
718ddfc0 12248 if (IS_ELF
252b5132
RH
12249#ifdef TE_PE
12250 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12251#endif
12252 )
12253 value += fixP->fx_where + fixP->fx_frag->fr_address;
12254#endif
12255#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12256 if (IS_ELF)
252b5132 12257 {
6539b54b 12258 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
2f66722d 12259
6539b54b 12260 if ((sym_seg == seg
2f66722d 12261 || (symbol_section_p (fixP->fx_addsy)
6539b54b 12262 && sym_seg != absolute_section))
af65af87 12263 && !generic_force_reloc (fixP))
2f66722d
AM
12264 {
12265 /* Yes, we add the values in twice. This is because
6539b54b
AM
12266 bfd_install_relocation subtracts them out again. I think
12267 bfd_install_relocation is broken, but I don't dare change
2f66722d
AM
12268 it. FIXME. */
12269 value += fixP->fx_where + fixP->fx_frag->fr_address;
12270 }
252b5132
RH
12271 }
12272#endif
12273#if defined (OBJ_COFF) && defined (TE_PE)
977cdf5a
NC
12274 /* For some reason, the PE format does not store a
12275 section address offset for a PC relative symbol. */
12276 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
7be1c489 12277 || S_IS_WEAK (fixP->fx_addsy))
252b5132
RH
12278 value += md_pcrel_from (fixP);
12279#endif
12280 }
fbeb56a4 12281#if defined (OBJ_COFF) && defined (TE_PE)
f01c1a09
NC
12282 if (fixP->fx_addsy != NULL
12283 && S_IS_WEAK (fixP->fx_addsy)
12284 /* PR 16858: Do not modify weak function references. */
12285 && ! fixP->fx_pcrel)
fbeb56a4 12286 {
296a8689
NC
12287#if !defined (TE_PEP)
12288 /* For x86 PE weak function symbols are neither PC-relative
12289 nor do they set S_IS_FUNCTION. So the only reliable way
12290 to detect them is to check the flags of their containing
12291 section. */
12292 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12293 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12294 ;
12295 else
12296#endif
fbeb56a4
DK
12297 value -= S_GET_VALUE (fixP->fx_addsy);
12298 }
12299#endif
252b5132
RH
12300
12301 /* Fix a few things - the dynamic linker expects certain values here,
0234cb7c 12302 and we must not disappoint it. */
252b5132 12303#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12304 if (IS_ELF && fixP->fx_addsy)
47926f60
KH
12305 switch (fixP->fx_r_type)
12306 {
12307 case BFD_RELOC_386_PLT32:
3e73aa7c 12308 case BFD_RELOC_X86_64_PLT32:
b9519cfe
L
12309 /* Make the jump instruction point to the address of the operand.
12310 At runtime we merely add the offset to the actual PLT entry.
12311 NB: Subtract the offset size only for jump instructions. */
12312 if (fixP->fx_pcrel)
12313 value = -4;
47926f60 12314 break;
31312f95 12315
13ae64f3
JJ
12316 case BFD_RELOC_386_TLS_GD:
12317 case BFD_RELOC_386_TLS_LDM:
13ae64f3 12318 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
12319 case BFD_RELOC_386_TLS_IE:
12320 case BFD_RELOC_386_TLS_GOTIE:
67a4f2b7 12321 case BFD_RELOC_386_TLS_GOTDESC:
bffbf940
JJ
12322 case BFD_RELOC_X86_64_TLSGD:
12323 case BFD_RELOC_X86_64_TLSLD:
12324 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7 12325 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
00f7efb6
JJ
12326 value = 0; /* Fully resolved at runtime. No addend. */
12327 /* Fallthrough */
12328 case BFD_RELOC_386_TLS_LE:
12329 case BFD_RELOC_386_TLS_LDO_32:
12330 case BFD_RELOC_386_TLS_LE_32:
12331 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 12332 case BFD_RELOC_X86_64_DTPOFF64:
00f7efb6 12333 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113 12334 case BFD_RELOC_X86_64_TPOFF64:
00f7efb6
JJ
12335 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12336 break;
12337
67a4f2b7
AO
12338 case BFD_RELOC_386_TLS_DESC_CALL:
12339 case BFD_RELOC_X86_64_TLSDESC_CALL:
12340 value = 0; /* Fully resolved at runtime. No addend. */
12341 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12342 fixP->fx_done = 0;
12343 return;
12344
47926f60
KH
12345 case BFD_RELOC_VTABLE_INHERIT:
12346 case BFD_RELOC_VTABLE_ENTRY:
12347 fixP->fx_done = 0;
94f592af 12348 return;
47926f60
KH
12349
12350 default:
12351 break;
12352 }
12353#endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
c6682705 12354 *valP = value;
f86103b7 12355#endif /* !defined (TE_Mach) */
3e73aa7c 12356
3e73aa7c 12357 /* Are we finished with this relocation now? */
c6682705 12358 if (fixP->fx_addsy == NULL)
3e73aa7c 12359 fixP->fx_done = 1;
fbeb56a4
DK
12360#if defined (OBJ_COFF) && defined (TE_PE)
12361 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12362 {
12363 fixP->fx_done = 0;
12364 /* Remember value for tc_gen_reloc. */
12365 fixP->fx_addnumber = value;
12366 /* Clear out the frag for now. */
12367 value = 0;
12368 }
12369#endif
3e73aa7c
JH
12370 else if (use_rela_relocations)
12371 {
12372 fixP->fx_no_overflow = 1;
062cd5e7
AS
12373 /* Remember value for tc_gen_reloc. */
12374 fixP->fx_addnumber = value;
3e73aa7c
JH
12375 value = 0;
12376 }
f86103b7 12377
94f592af 12378 md_number_to_chars (p, value, fixP->fx_size);
252b5132 12379}
252b5132 12380\f
6d4af3c2 12381const char *
499ac353 12382md_atof (int type, char *litP, int *sizeP)
252b5132 12383{
499ac353
NC
12384 /* This outputs the LITTLENUMs in REVERSE order;
12385 in accord with the bigendian 386. */
12386 return ieee_md_atof (type, litP, sizeP, FALSE);
252b5132
RH
12387}
12388\f
2d545b82 12389static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
252b5132 12390
252b5132 12391static char *
e3bb37b5 12392output_invalid (int c)
252b5132 12393{
3882b010 12394 if (ISPRINT (c))
f9f21a03
L
12395 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12396 "'%c'", c);
252b5132 12397 else
f9f21a03 12398 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
2d545b82 12399 "(0x%x)", (unsigned char) c);
252b5132
RH
12400 return output_invalid_buf;
12401}
12402
8a6fb3f9
JB
12403/* Verify that @r can be used in the current context. */
12404
12405static bfd_boolean check_register (const reg_entry *r)
12406{
12407 if (allow_pseudo_reg)
12408 return TRUE;
12409
12410 if (operand_type_all_zero (&r->reg_type))
12411 return FALSE;
12412
12413 if ((r->reg_type.bitfield.dword
12414 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12415 || r->reg_type.bitfield.class == RegCR
22e00a3f 12416 || r->reg_type.bitfield.class == RegDR)
8a6fb3f9
JB
12417 && !cpu_arch_flags.bitfield.cpui386)
12418 return FALSE;
12419
22e00a3f
JB
12420 if (r->reg_type.bitfield.class == RegTR
12421 && (flag_code == CODE_64BIT
12422 || !cpu_arch_flags.bitfield.cpui386
12423 || cpu_arch_isa_flags.bitfield.cpui586
12424 || cpu_arch_isa_flags.bitfield.cpui686))
12425 return FALSE;
12426
8a6fb3f9
JB
12427 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12428 return FALSE;
12429
12430 if (!cpu_arch_flags.bitfield.cpuavx512f)
12431 {
12432 if (r->reg_type.bitfield.zmmword
12433 || r->reg_type.bitfield.class == RegMask)
12434 return FALSE;
12435
12436 if (!cpu_arch_flags.bitfield.cpuavx)
12437 {
12438 if (r->reg_type.bitfield.ymmword)
12439 return FALSE;
12440
12441 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12442 return FALSE;
12443 }
12444 }
12445
12446 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12447 return FALSE;
12448
12449 /* Don't allow fake index register unless allow_index_reg isn't 0. */
12450 if (!allow_index_reg && r->reg_num == RegIZ)
12451 return FALSE;
12452
12453 /* Upper 16 vector registers are only available with VREX in 64bit
12454 mode, and require EVEX encoding. */
12455 if (r->reg_flags & RegVRex)
12456 {
12457 if (!cpu_arch_flags.bitfield.cpuavx512f
12458 || flag_code != CODE_64BIT)
12459 return FALSE;
12460
da4977e0
JB
12461 if (i.vec_encoding == vex_encoding_default)
12462 i.vec_encoding = vex_encoding_evex;
12463 else if (i.vec_encoding != vex_encoding_evex)
12464 i.vec_encoding = vex_encoding_error;
8a6fb3f9
JB
12465 }
12466
12467 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12468 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12469 && flag_code != CODE_64BIT)
12470 return FALSE;
12471
12472 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12473 && !intel_syntax)
12474 return FALSE;
12475
12476 return TRUE;
12477}
12478
af6bdddf 12479/* REG_STRING starts *before* REGISTER_PREFIX. */
252b5132
RH
12480
12481static const reg_entry *
4d1bb795 12482parse_real_register (char *reg_string, char **end_op)
252b5132 12483{
af6bdddf
AM
12484 char *s = reg_string;
12485 char *p;
252b5132
RH
12486 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12487 const reg_entry *r;
12488
12489 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12490 if (*s == REGISTER_PREFIX)
12491 ++s;
12492
12493 if (is_space_char (*s))
12494 ++s;
12495
12496 p = reg_name_given;
af6bdddf 12497 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
252b5132
RH
12498 {
12499 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
af6bdddf
AM
12500 return (const reg_entry *) NULL;
12501 s++;
252b5132
RH
12502 }
12503
6588847e
DN
12504 /* For naked regs, make sure that we are not dealing with an identifier.
12505 This prevents confusing an identifier like `eax_var' with register
12506 `eax'. */
12507 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12508 return (const reg_entry *) NULL;
12509
af6bdddf 12510 *end_op = s;
252b5132
RH
12511
12512 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12513
5f47d35b 12514 /* Handle floating point regs, allowing spaces in the (i) part. */
47926f60 12515 if (r == i386_regtab /* %st is first entry of table */)
5f47d35b 12516 {
0e0eea78
JB
12517 if (!cpu_arch_flags.bitfield.cpu8087
12518 && !cpu_arch_flags.bitfield.cpu287
af32b722
JB
12519 && !cpu_arch_flags.bitfield.cpu387
12520 && !allow_pseudo_reg)
0e0eea78
JB
12521 return (const reg_entry *) NULL;
12522
5f47d35b
AM
12523 if (is_space_char (*s))
12524 ++s;
12525 if (*s == '(')
12526 {
af6bdddf 12527 ++s;
5f47d35b
AM
12528 if (is_space_char (*s))
12529 ++s;
12530 if (*s >= '0' && *s <= '7')
12531 {
db557034 12532 int fpr = *s - '0';
af6bdddf 12533 ++s;
5f47d35b
AM
12534 if (is_space_char (*s))
12535 ++s;
12536 if (*s == ')')
12537 {
12538 *end_op = s + 1;
1e9cc1c2 12539 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
db557034
AM
12540 know (r);
12541 return r + fpr;
5f47d35b 12542 }
5f47d35b 12543 }
47926f60 12544 /* We have "%st(" then garbage. */
5f47d35b
AM
12545 return (const reg_entry *) NULL;
12546 }
12547 }
12548
8a6fb3f9 12549 return r && check_register (r) ? r : NULL;
252b5132 12550}
4d1bb795
JB
12551
12552/* REG_STRING starts *before* REGISTER_PREFIX. */
12553
12554static const reg_entry *
12555parse_register (char *reg_string, char **end_op)
12556{
12557 const reg_entry *r;
12558
12559 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12560 r = parse_real_register (reg_string, end_op);
12561 else
12562 r = NULL;
12563 if (!r)
12564 {
12565 char *save = input_line_pointer;
12566 char c;
12567 symbolS *symbolP;
12568
12569 input_line_pointer = reg_string;
d02603dc 12570 c = get_symbol_name (&reg_string);
4d1bb795
JB
12571 symbolP = symbol_find (reg_string);
12572 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12573 {
12574 const expressionS *e = symbol_get_value_expression (symbolP);
12575
0398aac5 12576 know (e->X_op == O_register);
4eed87de 12577 know (e->X_add_number >= 0
c3fe08fa 12578 && (valueT) e->X_add_number < i386_regtab_size);
4d1bb795 12579 r = i386_regtab + e->X_add_number;
8a6fb3f9
JB
12580 if (!check_register (r))
12581 {
12582 as_bad (_("register '%s%s' cannot be used here"),
12583 register_prefix, r->reg_name);
12584 r = &bad_reg;
12585 }
4d1bb795
JB
12586 *end_op = input_line_pointer;
12587 }
12588 *input_line_pointer = c;
12589 input_line_pointer = save;
12590 }
12591 return r;
12592}
12593
12594int
12595i386_parse_name (char *name, expressionS *e, char *nextcharP)
12596{
12597 const reg_entry *r;
12598 char *end = input_line_pointer;
12599
12600 *end = *nextcharP;
12601 r = parse_register (name, &input_line_pointer);
12602 if (r && end <= input_line_pointer)
12603 {
12604 *nextcharP = *input_line_pointer;
12605 *input_line_pointer = 0;
8a6fb3f9
JB
12606 if (r != &bad_reg)
12607 {
12608 e->X_op = O_register;
12609 e->X_add_number = r - i386_regtab;
12610 }
12611 else
12612 e->X_op = O_illegal;
4d1bb795
JB
12613 return 1;
12614 }
12615 input_line_pointer = end;
12616 *end = 0;
ee86248c 12617 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
4d1bb795
JB
12618}
12619
12620void
12621md_operand (expressionS *e)
12622{
ee86248c
JB
12623 char *end;
12624 const reg_entry *r;
4d1bb795 12625
ee86248c
JB
12626 switch (*input_line_pointer)
12627 {
12628 case REGISTER_PREFIX:
12629 r = parse_real_register (input_line_pointer, &end);
4d1bb795
JB
12630 if (r)
12631 {
12632 e->X_op = O_register;
12633 e->X_add_number = r - i386_regtab;
12634 input_line_pointer = end;
12635 }
ee86248c
JB
12636 break;
12637
12638 case '[':
9c2799c2 12639 gas_assert (intel_syntax);
ee86248c
JB
12640 end = input_line_pointer++;
12641 expression (e);
12642 if (*input_line_pointer == ']')
12643 {
12644 ++input_line_pointer;
12645 e->X_op_symbol = make_expr_symbol (e);
12646 e->X_add_symbol = NULL;
12647 e->X_add_number = 0;
12648 e->X_op = O_index;
12649 }
12650 else
12651 {
12652 e->X_op = O_absent;
12653 input_line_pointer = end;
12654 }
12655 break;
4d1bb795
JB
12656 }
12657}
12658
252b5132 12659\f
4cc782b5 12660#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
b6f8c7c4 12661const char *md_shortopts = "kVQ:sqnO::";
252b5132 12662#else
b6f8c7c4 12663const char *md_shortopts = "qnO::";
252b5132 12664#endif
6e0b89ee 12665
3e73aa7c 12666#define OPTION_32 (OPTION_MD_BASE + 0)
b3b91714
AM
12667#define OPTION_64 (OPTION_MD_BASE + 1)
12668#define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9103f4f4
L
12669#define OPTION_MARCH (OPTION_MD_BASE + 3)
12670#define OPTION_MTUNE (OPTION_MD_BASE + 4)
1efbbeb4
L
12671#define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12672#define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12673#define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12674#define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
bd5dea88 12675#define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
c0f3af97 12676#define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
daf50ae7 12677#define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
7bab8ab5
JB
12678#define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12679#define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12680#define OPTION_X32 (OPTION_MD_BASE + 14)
7e8b059b 12681#define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
43234a1e
L
12682#define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12683#define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
167ad85b 12684#define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
d1982f93 12685#define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
d3d3c6db 12686#define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
8dcea932 12687#define OPTION_MSHARED (OPTION_MD_BASE + 21)
5db04b09
L
12688#define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12689#define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
e4e00185 12690#define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
b4a3a7b4 12691#define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
03751133 12692#define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
e379e5f3
L
12693#define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12694#define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12695#define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
76cf450b 12696#define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
ae531041
L
12697#define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12698#define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12699#define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
b3b91714 12700
99ad8390
NC
12701struct option md_longopts[] =
12702{
3e73aa7c 12703 {"32", no_argument, NULL, OPTION_32},
321098a5 12704#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12705 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c 12706 {"64", no_argument, NULL, OPTION_64},
351f65ca
L
12707#endif
12708#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12709 {"x32", no_argument, NULL, OPTION_X32},
8dcea932 12710 {"mshared", no_argument, NULL, OPTION_MSHARED},
b4a3a7b4 12711 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
6e0b89ee 12712#endif
b3b91714 12713 {"divide", no_argument, NULL, OPTION_DIVIDE},
9103f4f4
L
12714 {"march", required_argument, NULL, OPTION_MARCH},
12715 {"mtune", required_argument, NULL, OPTION_MTUNE},
1efbbeb4
L
12716 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12717 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12718 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12719 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
c0f3af97 12720 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
daf50ae7 12721 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
7bab8ab5 12722 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
539f890d 12723 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
03751133 12724 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
7e8b059b 12725 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
43234a1e
L
12726 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12727 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
167ad85b
TG
12728# if defined (TE_PE) || defined (TE_PEP)
12729 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12730#endif
d1982f93 12731 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
e4e00185 12732 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
0cb4071e 12733 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
d3d3c6db 12734 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
e379e5f3
L
12735 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12736 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12737 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
76cf450b 12738 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
ae531041
L
12739 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12740 {"mlfence-before-indirect-branch", required_argument, NULL,
12741 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12742 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
5db04b09
L
12743 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12744 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
252b5132
RH
12745 {NULL, no_argument, NULL, 0}
12746};
12747size_t md_longopts_size = sizeof (md_longopts);
12748
12749int
17b9d67d 12750md_parse_option (int c, const char *arg)
252b5132 12751{
91d6fa6a 12752 unsigned int j;
e379e5f3 12753 char *arch, *next, *saved, *type;
9103f4f4 12754
252b5132
RH
12755 switch (c)
12756 {
12b55ccc
L
12757 case 'n':
12758 optimize_align_code = 0;
12759 break;
12760
a38cf1db
AM
12761 case 'q':
12762 quiet_warnings = 1;
252b5132
RH
12763 break;
12764
12765#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
a38cf1db
AM
12766 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12767 should be emitted or not. FIXME: Not implemented. */
12768 case 'Q':
d4693039
JB
12769 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12770 return 0;
252b5132
RH
12771 break;
12772
12773 /* -V: SVR4 argument to print version ID. */
12774 case 'V':
12775 print_version_id ();
12776 break;
12777
a38cf1db
AM
12778 /* -k: Ignore for FreeBSD compatibility. */
12779 case 'k':
252b5132 12780 break;
4cc782b5
ILT
12781
12782 case 's':
12783 /* -s: On i386 Solaris, this tells the native assembler to use
29b0f896 12784 .stab instead of .stab.excl. We always use .stab anyhow. */
4cc782b5 12785 break;
8dcea932
L
12786
12787 case OPTION_MSHARED:
12788 shared = 1;
12789 break;
b4a3a7b4
L
12790
12791 case OPTION_X86_USED_NOTE:
12792 if (strcasecmp (arg, "yes") == 0)
12793 x86_used_note = 1;
12794 else if (strcasecmp (arg, "no") == 0)
12795 x86_used_note = 0;
12796 else
12797 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12798 break;
12799
12800
99ad8390 12801#endif
321098a5 12802#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12803 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c
JH
12804 case OPTION_64:
12805 {
12806 const char **list, **l;
12807
3e73aa7c
JH
12808 list = bfd_target_list ();
12809 for (l = list; *l != NULL; l++)
8620418b 12810 if (CONST_STRNEQ (*l, "elf64-x86-64")
99ad8390
NC
12811 || strcmp (*l, "coff-x86-64") == 0
12812 || strcmp (*l, "pe-x86-64") == 0
d382c579
TG
12813 || strcmp (*l, "pei-x86-64") == 0
12814 || strcmp (*l, "mach-o-x86-64") == 0)
6e0b89ee
AM
12815 {
12816 default_arch = "x86_64";
12817 break;
12818 }
3e73aa7c 12819 if (*l == NULL)
2b5d6a91 12820 as_fatal (_("no compiled in support for x86_64"));
3e73aa7c
JH
12821 free (list);
12822 }
12823 break;
12824#endif
252b5132 12825
351f65ca 12826#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12827 case OPTION_X32:
351f65ca
L
12828 if (IS_ELF)
12829 {
12830 const char **list, **l;
12831
12832 list = bfd_target_list ();
12833 for (l = list; *l != NULL; l++)
12834 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12835 {
12836 default_arch = "x86_64:32";
12837 break;
12838 }
12839 if (*l == NULL)
2b5d6a91 12840 as_fatal (_("no compiled in support for 32bit x86_64"));
351f65ca
L
12841 free (list);
12842 }
12843 else
12844 as_fatal (_("32bit x86_64 is only supported for ELF"));
12845 break;
12846#endif
12847
6e0b89ee
AM
12848 case OPTION_32:
12849 default_arch = "i386";
12850 break;
12851
b3b91714
AM
12852 case OPTION_DIVIDE:
12853#ifdef SVR4_COMMENT_CHARS
12854 {
12855 char *n, *t;
12856 const char *s;
12857
add39d23 12858 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
b3b91714
AM
12859 t = n;
12860 for (s = i386_comment_chars; *s != '\0'; s++)
12861 if (*s != '/')
12862 *t++ = *s;
12863 *t = '\0';
12864 i386_comment_chars = n;
12865 }
12866#endif
12867 break;
12868
9103f4f4 12869 case OPTION_MARCH:
293f5f65
L
12870 saved = xstrdup (arg);
12871 arch = saved;
12872 /* Allow -march=+nosse. */
12873 if (*arch == '+')
12874 arch++;
6305a203 12875 do
9103f4f4 12876 {
6305a203 12877 if (*arch == '.')
2b5d6a91 12878 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
12879 next = strchr (arch, '+');
12880 if (next)
12881 *next++ = '\0';
91d6fa6a 12882 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 12883 {
91d6fa6a 12884 if (strcmp (arch, cpu_arch [j].name) == 0)
ccc9c027 12885 {
6305a203 12886 /* Processor. */
1ded5609
JB
12887 if (! cpu_arch[j].flags.bitfield.cpui386)
12888 continue;
12889
91d6fa6a 12890 cpu_arch_name = cpu_arch[j].name;
6305a203 12891 cpu_sub_arch_name = NULL;
91d6fa6a
NC
12892 cpu_arch_flags = cpu_arch[j].flags;
12893 cpu_arch_isa = cpu_arch[j].type;
12894 cpu_arch_isa_flags = cpu_arch[j].flags;
6305a203
L
12895 if (!cpu_arch_tune_set)
12896 {
12897 cpu_arch_tune = cpu_arch_isa;
12898 cpu_arch_tune_flags = cpu_arch_isa_flags;
12899 }
12900 break;
12901 }
91d6fa6a
NC
12902 else if (*cpu_arch [j].name == '.'
12903 && strcmp (arch, cpu_arch [j].name + 1) == 0)
6305a203 12904 {
33eaf5de 12905 /* ISA extension. */
6305a203 12906 i386_cpu_flags flags;
309d3373 12907
293f5f65
L
12908 flags = cpu_flags_or (cpu_arch_flags,
12909 cpu_arch[j].flags);
81486035 12910
5b64d091 12911 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
6305a203
L
12912 {
12913 if (cpu_sub_arch_name)
12914 {
12915 char *name = cpu_sub_arch_name;
12916 cpu_sub_arch_name = concat (name,
91d6fa6a 12917 cpu_arch[j].name,
1bf57e9f 12918 (const char *) NULL);
6305a203
L
12919 free (name);
12920 }
12921 else
91d6fa6a 12922 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
6305a203 12923 cpu_arch_flags = flags;
a586129e 12924 cpu_arch_isa_flags = flags;
6305a203 12925 }
0089dace
L
12926 else
12927 cpu_arch_isa_flags
12928 = cpu_flags_or (cpu_arch_isa_flags,
12929 cpu_arch[j].flags);
6305a203 12930 break;
ccc9c027 12931 }
9103f4f4 12932 }
6305a203 12933
293f5f65
L
12934 if (j >= ARRAY_SIZE (cpu_arch))
12935 {
33eaf5de 12936 /* Disable an ISA extension. */
293f5f65
L
12937 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12938 if (strcmp (arch, cpu_noarch [j].name) == 0)
12939 {
12940 i386_cpu_flags flags;
12941
12942 flags = cpu_flags_and_not (cpu_arch_flags,
12943 cpu_noarch[j].flags);
12944 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12945 {
12946 if (cpu_sub_arch_name)
12947 {
12948 char *name = cpu_sub_arch_name;
12949 cpu_sub_arch_name = concat (arch,
12950 (const char *) NULL);
12951 free (name);
12952 }
12953 else
12954 cpu_sub_arch_name = xstrdup (arch);
12955 cpu_arch_flags = flags;
12956 cpu_arch_isa_flags = flags;
12957 }
12958 break;
12959 }
12960
12961 if (j >= ARRAY_SIZE (cpu_noarch))
12962 j = ARRAY_SIZE (cpu_arch);
12963 }
12964
91d6fa6a 12965 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 12966 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
12967
12968 arch = next;
9103f4f4 12969 }
293f5f65
L
12970 while (next != NULL);
12971 free (saved);
9103f4f4
L
12972 break;
12973
12974 case OPTION_MTUNE:
12975 if (*arg == '.')
2b5d6a91 12976 as_fatal (_("invalid -mtune= option: `%s'"), arg);
91d6fa6a 12977 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 12978 {
91d6fa6a 12979 if (strcmp (arg, cpu_arch [j].name) == 0)
9103f4f4 12980 {
ccc9c027 12981 cpu_arch_tune_set = 1;
91d6fa6a
NC
12982 cpu_arch_tune = cpu_arch [j].type;
12983 cpu_arch_tune_flags = cpu_arch[j].flags;
9103f4f4
L
12984 break;
12985 }
12986 }
91d6fa6a 12987 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 12988 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9103f4f4
L
12989 break;
12990
1efbbeb4
L
12991 case OPTION_MMNEMONIC:
12992 if (strcasecmp (arg, "att") == 0)
12993 intel_mnemonic = 0;
12994 else if (strcasecmp (arg, "intel") == 0)
12995 intel_mnemonic = 1;
12996 else
2b5d6a91 12997 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
1efbbeb4
L
12998 break;
12999
13000 case OPTION_MSYNTAX:
13001 if (strcasecmp (arg, "att") == 0)
13002 intel_syntax = 0;
13003 else if (strcasecmp (arg, "intel") == 0)
13004 intel_syntax = 1;
13005 else
2b5d6a91 13006 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
1efbbeb4
L
13007 break;
13008
13009 case OPTION_MINDEX_REG:
13010 allow_index_reg = 1;
13011 break;
13012
13013 case OPTION_MNAKED_REG:
13014 allow_naked_reg = 1;
13015 break;
13016
c0f3af97
L
13017 case OPTION_MSSE2AVX:
13018 sse2avx = 1;
13019 break;
13020
daf50ae7
L
13021 case OPTION_MSSE_CHECK:
13022 if (strcasecmp (arg, "error") == 0)
7bab8ab5 13023 sse_check = check_error;
daf50ae7 13024 else if (strcasecmp (arg, "warning") == 0)
7bab8ab5 13025 sse_check = check_warning;
daf50ae7 13026 else if (strcasecmp (arg, "none") == 0)
7bab8ab5 13027 sse_check = check_none;
daf50ae7 13028 else
2b5d6a91 13029 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
daf50ae7
L
13030 break;
13031
7bab8ab5
JB
13032 case OPTION_MOPERAND_CHECK:
13033 if (strcasecmp (arg, "error") == 0)
13034 operand_check = check_error;
13035 else if (strcasecmp (arg, "warning") == 0)
13036 operand_check = check_warning;
13037 else if (strcasecmp (arg, "none") == 0)
13038 operand_check = check_none;
13039 else
13040 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13041 break;
13042
539f890d
L
13043 case OPTION_MAVXSCALAR:
13044 if (strcasecmp (arg, "128") == 0)
13045 avxscalar = vex128;
13046 else if (strcasecmp (arg, "256") == 0)
13047 avxscalar = vex256;
13048 else
2b5d6a91 13049 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
539f890d
L
13050 break;
13051
03751133
L
13052 case OPTION_MVEXWIG:
13053 if (strcmp (arg, "0") == 0)
40c9c8de 13054 vexwig = vexw0;
03751133 13055 else if (strcmp (arg, "1") == 0)
40c9c8de 13056 vexwig = vexw1;
03751133
L
13057 else
13058 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13059 break;
13060
7e8b059b
L
13061 case OPTION_MADD_BND_PREFIX:
13062 add_bnd_prefix = 1;
13063 break;
13064
43234a1e
L
13065 case OPTION_MEVEXLIG:
13066 if (strcmp (arg, "128") == 0)
13067 evexlig = evexl128;
13068 else if (strcmp (arg, "256") == 0)
13069 evexlig = evexl256;
13070 else if (strcmp (arg, "512") == 0)
13071 evexlig = evexl512;
13072 else
13073 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13074 break;
13075
d3d3c6db
IT
13076 case OPTION_MEVEXRCIG:
13077 if (strcmp (arg, "rne") == 0)
13078 evexrcig = rne;
13079 else if (strcmp (arg, "rd") == 0)
13080 evexrcig = rd;
13081 else if (strcmp (arg, "ru") == 0)
13082 evexrcig = ru;
13083 else if (strcmp (arg, "rz") == 0)
13084 evexrcig = rz;
13085 else
13086 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13087 break;
13088
43234a1e
L
13089 case OPTION_MEVEXWIG:
13090 if (strcmp (arg, "0") == 0)
13091 evexwig = evexw0;
13092 else if (strcmp (arg, "1") == 0)
13093 evexwig = evexw1;
13094 else
13095 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13096 break;
13097
167ad85b
TG
13098# if defined (TE_PE) || defined (TE_PEP)
13099 case OPTION_MBIG_OBJ:
13100 use_big_obj = 1;
13101 break;
13102#endif
13103
d1982f93 13104 case OPTION_MOMIT_LOCK_PREFIX:
d022bddd
IT
13105 if (strcasecmp (arg, "yes") == 0)
13106 omit_lock_prefix = 1;
13107 else if (strcasecmp (arg, "no") == 0)
13108 omit_lock_prefix = 0;
13109 else
13110 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13111 break;
13112
e4e00185
AS
13113 case OPTION_MFENCE_AS_LOCK_ADD:
13114 if (strcasecmp (arg, "yes") == 0)
13115 avoid_fence = 1;
13116 else if (strcasecmp (arg, "no") == 0)
13117 avoid_fence = 0;
13118 else
13119 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13120 break;
13121
ae531041
L
13122 case OPTION_MLFENCE_AFTER_LOAD:
13123 if (strcasecmp (arg, "yes") == 0)
13124 lfence_after_load = 1;
13125 else if (strcasecmp (arg, "no") == 0)
13126 lfence_after_load = 0;
13127 else
13128 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13129 break;
13130
13131 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13132 if (strcasecmp (arg, "all") == 0)
a09f656b 13133 {
13134 lfence_before_indirect_branch = lfence_branch_all;
13135 if (lfence_before_ret == lfence_before_ret_none)
13136 lfence_before_ret = lfence_before_ret_shl;
13137 }
ae531041
L
13138 else if (strcasecmp (arg, "memory") == 0)
13139 lfence_before_indirect_branch = lfence_branch_memory;
13140 else if (strcasecmp (arg, "register") == 0)
13141 lfence_before_indirect_branch = lfence_branch_register;
13142 else if (strcasecmp (arg, "none") == 0)
13143 lfence_before_indirect_branch = lfence_branch_none;
13144 else
13145 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13146 arg);
13147 break;
13148
13149 case OPTION_MLFENCE_BEFORE_RET:
13150 if (strcasecmp (arg, "or") == 0)
13151 lfence_before_ret = lfence_before_ret_or;
13152 else if (strcasecmp (arg, "not") == 0)
13153 lfence_before_ret = lfence_before_ret_not;
a09f656b 13154 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13155 lfence_before_ret = lfence_before_ret_shl;
ae531041
L
13156 else if (strcasecmp (arg, "none") == 0)
13157 lfence_before_ret = lfence_before_ret_none;
13158 else
13159 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13160 arg);
13161 break;
13162
0cb4071e
L
13163 case OPTION_MRELAX_RELOCATIONS:
13164 if (strcasecmp (arg, "yes") == 0)
13165 generate_relax_relocations = 1;
13166 else if (strcasecmp (arg, "no") == 0)
13167 generate_relax_relocations = 0;
13168 else
13169 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13170 break;
13171
e379e5f3
L
13172 case OPTION_MALIGN_BRANCH_BOUNDARY:
13173 {
13174 char *end;
13175 long int align = strtoul (arg, &end, 0);
13176 if (*end == '\0')
13177 {
13178 if (align == 0)
13179 {
13180 align_branch_power = 0;
13181 break;
13182 }
13183 else if (align >= 16)
13184 {
13185 int align_power;
13186 for (align_power = 0;
13187 (align & 1) == 0;
13188 align >>= 1, align_power++)
13189 continue;
13190 /* Limit alignment power to 31. */
13191 if (align == 1 && align_power < 32)
13192 {
13193 align_branch_power = align_power;
13194 break;
13195 }
13196 }
13197 }
13198 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13199 }
13200 break;
13201
13202 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13203 {
13204 char *end;
13205 int align = strtoul (arg, &end, 0);
13206 /* Some processors only support 5 prefixes. */
13207 if (*end == '\0' && align >= 0 && align < 6)
13208 {
13209 align_branch_prefix_size = align;
13210 break;
13211 }
13212 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13213 arg);
13214 }
13215 break;
13216
13217 case OPTION_MALIGN_BRANCH:
13218 align_branch = 0;
13219 saved = xstrdup (arg);
13220 type = saved;
13221 do
13222 {
13223 next = strchr (type, '+');
13224 if (next)
13225 *next++ = '\0';
13226 if (strcasecmp (type, "jcc") == 0)
13227 align_branch |= align_branch_jcc_bit;
13228 else if (strcasecmp (type, "fused") == 0)
13229 align_branch |= align_branch_fused_bit;
13230 else if (strcasecmp (type, "jmp") == 0)
13231 align_branch |= align_branch_jmp_bit;
13232 else if (strcasecmp (type, "call") == 0)
13233 align_branch |= align_branch_call_bit;
13234 else if (strcasecmp (type, "ret") == 0)
13235 align_branch |= align_branch_ret_bit;
13236 else if (strcasecmp (type, "indirect") == 0)
13237 align_branch |= align_branch_indirect_bit;
13238 else
13239 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13240 type = next;
13241 }
13242 while (next != NULL);
13243 free (saved);
13244 break;
13245
76cf450b
L
13246 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13247 align_branch_power = 5;
13248 align_branch_prefix_size = 5;
13249 align_branch = (align_branch_jcc_bit
13250 | align_branch_fused_bit
13251 | align_branch_jmp_bit);
13252 break;
13253
5db04b09 13254 case OPTION_MAMD64:
4b5aaf5f 13255 isa64 = amd64;
5db04b09
L
13256 break;
13257
13258 case OPTION_MINTEL64:
4b5aaf5f 13259 isa64 = intel64;
5db04b09
L
13260 break;
13261
b6f8c7c4
L
13262 case 'O':
13263 if (arg == NULL)
13264 {
13265 optimize = 1;
13266 /* Turn off -Os. */
13267 optimize_for_space = 0;
13268 }
13269 else if (*arg == 's')
13270 {
13271 optimize_for_space = 1;
13272 /* Turn on all encoding optimizations. */
41fd2579 13273 optimize = INT_MAX;
b6f8c7c4
L
13274 }
13275 else
13276 {
13277 optimize = atoi (arg);
13278 /* Turn off -Os. */
13279 optimize_for_space = 0;
13280 }
13281 break;
13282
252b5132
RH
13283 default:
13284 return 0;
13285 }
13286 return 1;
13287}
13288
8a2c8fef
L
13289#define MESSAGE_TEMPLATE \
13290" "
13291
293f5f65
L
13292static char *
13293output_message (FILE *stream, char *p, char *message, char *start,
13294 int *left_p, const char *name, int len)
13295{
13296 int size = sizeof (MESSAGE_TEMPLATE);
13297 int left = *left_p;
13298
13299 /* Reserve 2 spaces for ", " or ",\0" */
13300 left -= len + 2;
13301
13302 /* Check if there is any room. */
13303 if (left >= 0)
13304 {
13305 if (p != start)
13306 {
13307 *p++ = ',';
13308 *p++ = ' ';
13309 }
13310 p = mempcpy (p, name, len);
13311 }
13312 else
13313 {
13314 /* Output the current message now and start a new one. */
13315 *p++ = ',';
13316 *p = '\0';
13317 fprintf (stream, "%s\n", message);
13318 p = start;
13319 left = size - (start - message) - len - 2;
13320
13321 gas_assert (left >= 0);
13322
13323 p = mempcpy (p, name, len);
13324 }
13325
13326 *left_p = left;
13327 return p;
13328}
13329
8a2c8fef 13330static void
1ded5609 13331show_arch (FILE *stream, int ext, int check)
8a2c8fef
L
13332{
13333 static char message[] = MESSAGE_TEMPLATE;
13334 char *start = message + 27;
13335 char *p;
13336 int size = sizeof (MESSAGE_TEMPLATE);
13337 int left;
13338 const char *name;
13339 int len;
13340 unsigned int j;
13341
13342 p = start;
13343 left = size - (start - message);
13344 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13345 {
13346 /* Should it be skipped? */
13347 if (cpu_arch [j].skip)
13348 continue;
13349
13350 name = cpu_arch [j].name;
13351 len = cpu_arch [j].len;
13352 if (*name == '.')
13353 {
13354 /* It is an extension. Skip if we aren't asked to show it. */
13355 if (ext)
13356 {
13357 name++;
13358 len--;
13359 }
13360 else
13361 continue;
13362 }
13363 else if (ext)
13364 {
13365 /* It is an processor. Skip if we show only extension. */
13366 continue;
13367 }
1ded5609
JB
13368 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13369 {
13370 /* It is an impossible processor - skip. */
13371 continue;
13372 }
8a2c8fef 13373
293f5f65 13374 p = output_message (stream, p, message, start, &left, name, len);
8a2c8fef
L
13375 }
13376
293f5f65
L
13377 /* Display disabled extensions. */
13378 if (ext)
13379 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13380 {
13381 name = cpu_noarch [j].name;
13382 len = cpu_noarch [j].len;
13383 p = output_message (stream, p, message, start, &left, name,
13384 len);
13385 }
13386
8a2c8fef
L
13387 *p = '\0';
13388 fprintf (stream, "%s\n", message);
13389}
13390
252b5132 13391void
8a2c8fef 13392md_show_usage (FILE *stream)
252b5132 13393{
4cc782b5
ILT
13394#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13395 fprintf (stream, _("\
d4693039 13396 -Qy, -Qn ignored\n\
a38cf1db 13397 -V print assembler version number\n\
b3b91714
AM
13398 -k ignored\n"));
13399#endif
13400 fprintf (stream, _("\
12b55ccc 13401 -n Do not optimize code alignment\n\
b3b91714
AM
13402 -q quieten some warnings\n"));
13403#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13404 fprintf (stream, _("\
a38cf1db 13405 -s ignored\n"));
b3b91714 13406#endif
d7f449c0
L
13407#if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13408 || defined (TE_PE) || defined (TE_PEP))
751d281c 13409 fprintf (stream, _("\
570561f7 13410 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
751d281c 13411#endif
b3b91714
AM
13412#ifdef SVR4_COMMENT_CHARS
13413 fprintf (stream, _("\
13414 --divide do not treat `/' as a comment character\n"));
a38cf1db
AM
13415#else
13416 fprintf (stream, _("\
b3b91714 13417 --divide ignored\n"));
4cc782b5 13418#endif
9103f4f4 13419 fprintf (stream, _("\
6305a203 13420 -march=CPU[,+EXTENSION...]\n\
8a2c8fef 13421 generate code for CPU and EXTENSION, CPU is one of:\n"));
1ded5609 13422 show_arch (stream, 0, 1);
8a2c8fef
L
13423 fprintf (stream, _("\
13424 EXTENSION is combination of:\n"));
1ded5609 13425 show_arch (stream, 1, 0);
6305a203 13426 fprintf (stream, _("\
8a2c8fef 13427 -mtune=CPU optimize for CPU, CPU is one of:\n"));
1ded5609 13428 show_arch (stream, 0, 0);
ba104c83 13429 fprintf (stream, _("\
c0f3af97
L
13430 -msse2avx encode SSE instructions with VEX prefix\n"));
13431 fprintf (stream, _("\
7c5c05ef 13432 -msse-check=[none|error|warning] (default: warning)\n\
daf50ae7
L
13433 check SSE instructions\n"));
13434 fprintf (stream, _("\
7c5c05ef 13435 -moperand-check=[none|error|warning] (default: warning)\n\
7bab8ab5
JB
13436 check operand combinations for validity\n"));
13437 fprintf (stream, _("\
7c5c05ef
L
13438 -mavxscalar=[128|256] (default: 128)\n\
13439 encode scalar AVX instructions with specific vector\n\
539f890d
L
13440 length\n"));
13441 fprintf (stream, _("\
03751133
L
13442 -mvexwig=[0|1] (default: 0)\n\
13443 encode VEX instructions with specific VEX.W value\n\
13444 for VEX.W bit ignored instructions\n"));
13445 fprintf (stream, _("\
7c5c05ef
L
13446 -mevexlig=[128|256|512] (default: 128)\n\
13447 encode scalar EVEX instructions with specific vector\n\
43234a1e
L
13448 length\n"));
13449 fprintf (stream, _("\
7c5c05ef
L
13450 -mevexwig=[0|1] (default: 0)\n\
13451 encode EVEX instructions with specific EVEX.W value\n\
43234a1e
L
13452 for EVEX.W bit ignored instructions\n"));
13453 fprintf (stream, _("\
7c5c05ef 13454 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
d3d3c6db
IT
13455 encode EVEX instructions with specific EVEX.RC value\n\
13456 for SAE-only ignored instructions\n"));
13457 fprintf (stream, _("\
7c5c05ef
L
13458 -mmnemonic=[att|intel] "));
13459 if (SYSV386_COMPAT)
13460 fprintf (stream, _("(default: att)\n"));
13461 else
13462 fprintf (stream, _("(default: intel)\n"));
13463 fprintf (stream, _("\
13464 use AT&T/Intel mnemonic\n"));
ba104c83 13465 fprintf (stream, _("\
7c5c05ef
L
13466 -msyntax=[att|intel] (default: att)\n\
13467 use AT&T/Intel syntax\n"));
ba104c83
L
13468 fprintf (stream, _("\
13469 -mindex-reg support pseudo index registers\n"));
13470 fprintf (stream, _("\
13471 -mnaked-reg don't require `%%' prefix for registers\n"));
13472 fprintf (stream, _("\
7e8b059b 13473 -madd-bnd-prefix add BND prefix for all valid branches\n"));
b4a3a7b4 13474#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8dcea932
L
13475 fprintf (stream, _("\
13476 -mshared disable branch optimization for shared code\n"));
b4a3a7b4
L
13477 fprintf (stream, _("\
13478 -mx86-used-note=[no|yes] "));
13479 if (DEFAULT_X86_USED_NOTE)
13480 fprintf (stream, _("(default: yes)\n"));
13481 else
13482 fprintf (stream, _("(default: no)\n"));
13483 fprintf (stream, _("\
13484 generate x86 used ISA and feature properties\n"));
13485#endif
13486#if defined (TE_PE) || defined (TE_PEP)
167ad85b
TG
13487 fprintf (stream, _("\
13488 -mbig-obj generate big object files\n"));
13489#endif
d022bddd 13490 fprintf (stream, _("\
7c5c05ef 13491 -momit-lock-prefix=[no|yes] (default: no)\n\
d022bddd 13492 strip all lock prefixes\n"));
5db04b09 13493 fprintf (stream, _("\
7c5c05ef 13494 -mfence-as-lock-add=[no|yes] (default: no)\n\
e4e00185
AS
13495 encode lfence, mfence and sfence as\n\
13496 lock addl $0x0, (%%{re}sp)\n"));
13497 fprintf (stream, _("\
7c5c05ef
L
13498 -mrelax-relocations=[no|yes] "));
13499 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13500 fprintf (stream, _("(default: yes)\n"));
13501 else
13502 fprintf (stream, _("(default: no)\n"));
13503 fprintf (stream, _("\
0cb4071e
L
13504 generate relax relocations\n"));
13505 fprintf (stream, _("\
e379e5f3
L
13506 -malign-branch-boundary=NUM (default: 0)\n\
13507 align branches within NUM byte boundary\n"));
13508 fprintf (stream, _("\
13509 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13510 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13511 indirect\n\
13512 specify types of branches to align\n"));
13513 fprintf (stream, _("\
13514 -malign-branch-prefix-size=NUM (default: 5)\n\
13515 align branches with NUM prefixes per instruction\n"));
13516 fprintf (stream, _("\
76cf450b
L
13517 -mbranches-within-32B-boundaries\n\
13518 align branches within 32 byte boundary\n"));
13519 fprintf (stream, _("\
ae531041
L
13520 -mlfence-after-load=[no|yes] (default: no)\n\
13521 generate lfence after load\n"));
13522 fprintf (stream, _("\
13523 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13524 generate lfence before indirect near branch\n"));
13525 fprintf (stream, _("\
a09f656b 13526 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
ae531041
L
13527 generate lfence before ret\n"));
13528 fprintf (stream, _("\
7c5c05ef 13529 -mamd64 accept only AMD64 ISA [default]\n"));
5db04b09
L
13530 fprintf (stream, _("\
13531 -mintel64 accept only Intel64 ISA\n"));
252b5132
RH
13532}
13533
3e73aa7c 13534#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
321098a5 13535 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
e57f8c65 13536 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
252b5132
RH
13537
13538/* Pick the target format to use. */
13539
47926f60 13540const char *
e3bb37b5 13541i386_target_format (void)
252b5132 13542{
351f65ca
L
13543 if (!strncmp (default_arch, "x86_64", 6))
13544 {
13545 update_code_flag (CODE_64BIT, 1);
13546 if (default_arch[6] == '\0')
7f56bc95 13547 x86_elf_abi = X86_64_ABI;
351f65ca 13548 else
7f56bc95 13549 x86_elf_abi = X86_64_X32_ABI;
351f65ca 13550 }
3e73aa7c 13551 else if (!strcmp (default_arch, "i386"))
78f12dd3 13552 update_code_flag (CODE_32BIT, 1);
5197d474
L
13553 else if (!strcmp (default_arch, "iamcu"))
13554 {
13555 update_code_flag (CODE_32BIT, 1);
13556 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13557 {
13558 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13559 cpu_arch_name = "iamcu";
13560 cpu_sub_arch_name = NULL;
13561 cpu_arch_flags = iamcu_flags;
13562 cpu_arch_isa = PROCESSOR_IAMCU;
13563 cpu_arch_isa_flags = iamcu_flags;
13564 if (!cpu_arch_tune_set)
13565 {
13566 cpu_arch_tune = cpu_arch_isa;
13567 cpu_arch_tune_flags = cpu_arch_isa_flags;
13568 }
13569 }
8d471ec1 13570 else if (cpu_arch_isa != PROCESSOR_IAMCU)
5197d474
L
13571 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13572 cpu_arch_name);
13573 }
3e73aa7c 13574 else
2b5d6a91 13575 as_fatal (_("unknown architecture"));
89507696
JB
13576
13577 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13578 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13579 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13580 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13581
252b5132
RH
13582 switch (OUTPUT_FLAVOR)
13583 {
9384f2ff 13584#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
4c63da97 13585 case bfd_target_aout_flavour:
47926f60 13586 return AOUT_TARGET_FORMAT;
4c63da97 13587#endif
9384f2ff
AM
13588#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13589# if defined (TE_PE) || defined (TE_PEP)
13590 case bfd_target_coff_flavour:
167ad85b
TG
13591 if (flag_code == CODE_64BIT)
13592 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13593 else
251dae91 13594 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
9384f2ff 13595# elif defined (TE_GO32)
0561d57c
JK
13596 case bfd_target_coff_flavour:
13597 return "coff-go32";
9384f2ff 13598# else
252b5132
RH
13599 case bfd_target_coff_flavour:
13600 return "coff-i386";
9384f2ff 13601# endif
4c63da97 13602#endif
3e73aa7c 13603#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
252b5132 13604 case bfd_target_elf_flavour:
3e73aa7c 13605 {
351f65ca
L
13606 const char *format;
13607
13608 switch (x86_elf_abi)
4fa24527 13609 {
351f65ca
L
13610 default:
13611 format = ELF_TARGET_FORMAT;
e379e5f3
L
13612#ifndef TE_SOLARIS
13613 tls_get_addr = "___tls_get_addr";
13614#endif
351f65ca 13615 break;
7f56bc95 13616 case X86_64_ABI:
351f65ca 13617 use_rela_relocations = 1;
4fa24527 13618 object_64bit = 1;
e379e5f3
L
13619#ifndef TE_SOLARIS
13620 tls_get_addr = "__tls_get_addr";
13621#endif
351f65ca
L
13622 format = ELF_TARGET_FORMAT64;
13623 break;
7f56bc95 13624 case X86_64_X32_ABI:
4fa24527 13625 use_rela_relocations = 1;
351f65ca 13626 object_64bit = 1;
e379e5f3
L
13627#ifndef TE_SOLARIS
13628 tls_get_addr = "__tls_get_addr";
13629#endif
862be3fb 13630 disallow_64bit_reloc = 1;
351f65ca
L
13631 format = ELF_TARGET_FORMAT32;
13632 break;
4fa24527 13633 }
3632d14b 13634 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 13635 {
7f56bc95 13636 if (x86_elf_abi != X86_64_ABI)
8a9036a4
L
13637 as_fatal (_("Intel L1OM is 64bit only"));
13638 return ELF_TARGET_L1OM_FORMAT;
13639 }
b49f93f6 13640 else if (cpu_arch_isa == PROCESSOR_K1OM)
7a9068fe
L
13641 {
13642 if (x86_elf_abi != X86_64_ABI)
13643 as_fatal (_("Intel K1OM is 64bit only"));
13644 return ELF_TARGET_K1OM_FORMAT;
13645 }
81486035
L
13646 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13647 {
13648 if (x86_elf_abi != I386_ABI)
13649 as_fatal (_("Intel MCU is 32bit only"));
13650 return ELF_TARGET_IAMCU_FORMAT;
13651 }
8a9036a4 13652 else
351f65ca 13653 return format;
3e73aa7c 13654 }
e57f8c65
TG
13655#endif
13656#if defined (OBJ_MACH_O)
13657 case bfd_target_mach_o_flavour:
d382c579
TG
13658 if (flag_code == CODE_64BIT)
13659 {
13660 use_rela_relocations = 1;
13661 object_64bit = 1;
13662 return "mach-o-x86-64";
13663 }
13664 else
13665 return "mach-o-i386";
4c63da97 13666#endif
252b5132
RH
13667 default:
13668 abort ();
13669 return NULL;
13670 }
13671}
13672
47926f60 13673#endif /* OBJ_MAYBE_ more than one */
252b5132 13674\f
252b5132 13675symbolS *
7016a5d5 13676md_undefined_symbol (char *name)
252b5132 13677{
18dc2407
ILT
13678 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13679 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13680 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13681 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
24eab124
AM
13682 {
13683 if (!GOT_symbol)
13684 {
13685 if (symbol_find (name))
13686 as_bad (_("GOT already in symbol table"));
13687 GOT_symbol = symbol_new (name, undefined_section,
13688 (valueT) 0, &zero_address_frag);
13689 };
13690 return GOT_symbol;
13691 }
252b5132
RH
13692 return 0;
13693}
13694
13695/* Round up a section size to the appropriate boundary. */
47926f60 13696
252b5132 13697valueT
7016a5d5 13698md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
252b5132 13699{
4c63da97
AM
13700#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13701 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13702 {
13703 /* For a.out, force the section size to be aligned. If we don't do
13704 this, BFD will align it for us, but it will not write out the
13705 final bytes of the section. This may be a bug in BFD, but it is
13706 easier to fix it here since that is how the other a.out targets
13707 work. */
13708 int align;
13709
fd361982 13710 align = bfd_section_alignment (segment);
8d3842cd 13711 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
4c63da97 13712 }
252b5132
RH
13713#endif
13714
13715 return size;
13716}
13717
13718/* On the i386, PC-relative offsets are relative to the start of the
13719 next instruction. That is, the address of the offset, plus its
13720 size, since the offset is always the last part of the insn. */
13721
13722long
e3bb37b5 13723md_pcrel_from (fixS *fixP)
252b5132
RH
13724{
13725 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13726}
13727
13728#ifndef I386COFF
13729
13730static void
e3bb37b5 13731s_bss (int ignore ATTRIBUTE_UNUSED)
252b5132 13732{
29b0f896 13733 int temp;
252b5132 13734
8a75718c
JB
13735#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13736 if (IS_ELF)
13737 obj_elf_section_change_hook ();
13738#endif
252b5132
RH
13739 temp = get_absolute_expression ();
13740 subseg_set (bss_section, (subsegT) temp);
13741 demand_empty_rest_of_line ();
13742}
13743
13744#endif
13745
e379e5f3
L
13746/* Remember constant directive. */
13747
13748void
13749i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13750{
13751 if (last_insn.kind != last_insn_directive
13752 && (bfd_section_flags (now_seg) & SEC_CODE))
13753 {
13754 last_insn.seg = now_seg;
13755 last_insn.kind = last_insn_directive;
13756 last_insn.name = "constant directive";
13757 last_insn.file = as_where (&last_insn.line);
ae531041
L
13758 if (lfence_before_ret != lfence_before_ret_none)
13759 {
13760 if (lfence_before_indirect_branch != lfence_branch_none)
13761 as_warn (_("constant directive skips -mlfence-before-ret "
13762 "and -mlfence-before-indirect-branch"));
13763 else
13764 as_warn (_("constant directive skips -mlfence-before-ret"));
13765 }
13766 else if (lfence_before_indirect_branch != lfence_branch_none)
13767 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
e379e5f3
L
13768 }
13769}
13770
252b5132 13771void
e3bb37b5 13772i386_validate_fix (fixS *fixp)
252b5132 13773{
02a86693 13774 if (fixp->fx_subsy)
252b5132 13775 {
02a86693 13776 if (fixp->fx_subsy == GOT_symbol)
23df1078 13777 {
02a86693
L
13778 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13779 {
13780 if (!object_64bit)
13781 abort ();
13782#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13783 if (fixp->fx_tcbit2)
56ceb5b5
L
13784 fixp->fx_r_type = (fixp->fx_tcbit
13785 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13786 : BFD_RELOC_X86_64_GOTPCRELX);
02a86693
L
13787 else
13788#endif
13789 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13790 }
d6ab8113 13791 else
02a86693
L
13792 {
13793 if (!object_64bit)
13794 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13795 else
13796 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13797 }
13798 fixp->fx_subsy = 0;
23df1078 13799 }
252b5132 13800 }
02a86693
L
13801#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13802 else if (!object_64bit)
13803 {
13804 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13805 && fixp->fx_tcbit2)
13806 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13807 }
13808#endif
252b5132
RH
13809}
13810
252b5132 13811arelent *
7016a5d5 13812tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
252b5132
RH
13813{
13814 arelent *rel;
13815 bfd_reloc_code_real_type code;
13816
13817 switch (fixp->fx_r_type)
13818 {
8ce3d284 13819#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
13820 case BFD_RELOC_SIZE32:
13821 case BFD_RELOC_SIZE64:
13822 if (S_IS_DEFINED (fixp->fx_addsy)
13823 && !S_IS_EXTERNAL (fixp->fx_addsy))
13824 {
13825 /* Resolve size relocation against local symbol to size of
13826 the symbol plus addend. */
13827 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13828 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13829 && !fits_in_unsigned_long (value))
13830 as_bad_where (fixp->fx_file, fixp->fx_line,
13831 _("symbol size computation overflow"));
13832 fixp->fx_addsy = NULL;
13833 fixp->fx_subsy = NULL;
13834 md_apply_fix (fixp, (valueT *) &value, NULL);
13835 return NULL;
13836 }
8ce3d284 13837#endif
1a0670f3 13838 /* Fall through. */
8fd4256d 13839
3e73aa7c
JH
13840 case BFD_RELOC_X86_64_PLT32:
13841 case BFD_RELOC_X86_64_GOT32:
13842 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
13843 case BFD_RELOC_X86_64_GOTPCRELX:
13844 case BFD_RELOC_X86_64_REX_GOTPCRELX:
252b5132
RH
13845 case BFD_RELOC_386_PLT32:
13846 case BFD_RELOC_386_GOT32:
02a86693 13847 case BFD_RELOC_386_GOT32X:
252b5132
RH
13848 case BFD_RELOC_386_GOTOFF:
13849 case BFD_RELOC_386_GOTPC:
13ae64f3
JJ
13850 case BFD_RELOC_386_TLS_GD:
13851 case BFD_RELOC_386_TLS_LDM:
13852 case BFD_RELOC_386_TLS_LDO_32:
13853 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
13854 case BFD_RELOC_386_TLS_IE:
13855 case BFD_RELOC_386_TLS_GOTIE:
13ae64f3
JJ
13856 case BFD_RELOC_386_TLS_LE_32:
13857 case BFD_RELOC_386_TLS_LE:
67a4f2b7
AO
13858 case BFD_RELOC_386_TLS_GOTDESC:
13859 case BFD_RELOC_386_TLS_DESC_CALL:
bffbf940
JJ
13860 case BFD_RELOC_X86_64_TLSGD:
13861 case BFD_RELOC_X86_64_TLSLD:
13862 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 13863 case BFD_RELOC_X86_64_DTPOFF64:
bffbf940
JJ
13864 case BFD_RELOC_X86_64_GOTTPOFF:
13865 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113
JB
13866 case BFD_RELOC_X86_64_TPOFF64:
13867 case BFD_RELOC_X86_64_GOTOFF64:
13868 case BFD_RELOC_X86_64_GOTPC32:
7b81dfbb
AJ
13869 case BFD_RELOC_X86_64_GOT64:
13870 case BFD_RELOC_X86_64_GOTPCREL64:
13871 case BFD_RELOC_X86_64_GOTPC64:
13872 case BFD_RELOC_X86_64_GOTPLT64:
13873 case BFD_RELOC_X86_64_PLTOFF64:
67a4f2b7
AO
13874 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13875 case BFD_RELOC_X86_64_TLSDESC_CALL:
252b5132
RH
13876 case BFD_RELOC_RVA:
13877 case BFD_RELOC_VTABLE_ENTRY:
13878 case BFD_RELOC_VTABLE_INHERIT:
6482c264
NC
13879#ifdef TE_PE
13880 case BFD_RELOC_32_SECREL:
13881#endif
252b5132
RH
13882 code = fixp->fx_r_type;
13883 break;
dbbaec26
L
13884 case BFD_RELOC_X86_64_32S:
13885 if (!fixp->fx_pcrel)
13886 {
13887 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13888 code = fixp->fx_r_type;
13889 break;
13890 }
1a0670f3 13891 /* Fall through. */
252b5132 13892 default:
93382f6d 13893 if (fixp->fx_pcrel)
252b5132 13894 {
93382f6d
AM
13895 switch (fixp->fx_size)
13896 {
13897 default:
b091f402
AM
13898 as_bad_where (fixp->fx_file, fixp->fx_line,
13899 _("can not do %d byte pc-relative relocation"),
13900 fixp->fx_size);
93382f6d
AM
13901 code = BFD_RELOC_32_PCREL;
13902 break;
13903 case 1: code = BFD_RELOC_8_PCREL; break;
13904 case 2: code = BFD_RELOC_16_PCREL; break;
d258b828 13905 case 4: code = BFD_RELOC_32_PCREL; break;
d6ab8113
JB
13906#ifdef BFD64
13907 case 8: code = BFD_RELOC_64_PCREL; break;
13908#endif
93382f6d
AM
13909 }
13910 }
13911 else
13912 {
13913 switch (fixp->fx_size)
13914 {
13915 default:
b091f402
AM
13916 as_bad_where (fixp->fx_file, fixp->fx_line,
13917 _("can not do %d byte relocation"),
13918 fixp->fx_size);
93382f6d
AM
13919 code = BFD_RELOC_32;
13920 break;
13921 case 1: code = BFD_RELOC_8; break;
13922 case 2: code = BFD_RELOC_16; break;
13923 case 4: code = BFD_RELOC_32; break;
937149dd 13924#ifdef BFD64
3e73aa7c 13925 case 8: code = BFD_RELOC_64; break;
937149dd 13926#endif
93382f6d 13927 }
252b5132
RH
13928 }
13929 break;
13930 }
252b5132 13931
d182319b
JB
13932 if ((code == BFD_RELOC_32
13933 || code == BFD_RELOC_32_PCREL
13934 || code == BFD_RELOC_X86_64_32S)
252b5132
RH
13935 && GOT_symbol
13936 && fixp->fx_addsy == GOT_symbol)
3e73aa7c 13937 {
4fa24527 13938 if (!object_64bit)
d6ab8113
JB
13939 code = BFD_RELOC_386_GOTPC;
13940 else
13941 code = BFD_RELOC_X86_64_GOTPC32;
3e73aa7c 13942 }
7b81dfbb
AJ
13943 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13944 && GOT_symbol
13945 && fixp->fx_addsy == GOT_symbol)
13946 {
13947 code = BFD_RELOC_X86_64_GOTPC64;
13948 }
252b5132 13949
add39d23
TS
13950 rel = XNEW (arelent);
13951 rel->sym_ptr_ptr = XNEW (asymbol *);
49309057 13952 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
252b5132
RH
13953
13954 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
c87db184 13955
3e73aa7c
JH
13956 if (!use_rela_relocations)
13957 {
13958 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13959 vtable entry to be used in the relocation's section offset. */
13960 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13961 rel->address = fixp->fx_offset;
fbeb56a4
DK
13962#if defined (OBJ_COFF) && defined (TE_PE)
13963 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13964 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13965 else
13966#endif
c6682705 13967 rel->addend = 0;
3e73aa7c
JH
13968 }
13969 /* Use the rela in 64bit mode. */
252b5132 13970 else
3e73aa7c 13971 {
862be3fb
L
13972 if (disallow_64bit_reloc)
13973 switch (code)
13974 {
862be3fb
L
13975 case BFD_RELOC_X86_64_DTPOFF64:
13976 case BFD_RELOC_X86_64_TPOFF64:
13977 case BFD_RELOC_64_PCREL:
13978 case BFD_RELOC_X86_64_GOTOFF64:
13979 case BFD_RELOC_X86_64_GOT64:
13980 case BFD_RELOC_X86_64_GOTPCREL64:
13981 case BFD_RELOC_X86_64_GOTPC64:
13982 case BFD_RELOC_X86_64_GOTPLT64:
13983 case BFD_RELOC_X86_64_PLTOFF64:
13984 as_bad_where (fixp->fx_file, fixp->fx_line,
13985 _("cannot represent relocation type %s in x32 mode"),
13986 bfd_get_reloc_code_name (code));
13987 break;
13988 default:
13989 break;
13990 }
13991
062cd5e7
AS
13992 if (!fixp->fx_pcrel)
13993 rel->addend = fixp->fx_offset;
13994 else
13995 switch (code)
13996 {
13997 case BFD_RELOC_X86_64_PLT32:
13998 case BFD_RELOC_X86_64_GOT32:
13999 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
14000 case BFD_RELOC_X86_64_GOTPCRELX:
14001 case BFD_RELOC_X86_64_REX_GOTPCRELX:
bffbf940
JJ
14002 case BFD_RELOC_X86_64_TLSGD:
14003 case BFD_RELOC_X86_64_TLSLD:
14004 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7
AO
14005 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14006 case BFD_RELOC_X86_64_TLSDESC_CALL:
062cd5e7
AS
14007 rel->addend = fixp->fx_offset - fixp->fx_size;
14008 break;
14009 default:
14010 rel->addend = (section->vma
14011 - fixp->fx_size
14012 + fixp->fx_addnumber
14013 + md_pcrel_from (fixp));
14014 break;
14015 }
3e73aa7c
JH
14016 }
14017
252b5132
RH
14018 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14019 if (rel->howto == NULL)
14020 {
14021 as_bad_where (fixp->fx_file, fixp->fx_line,
d0b47220 14022 _("cannot represent relocation type %s"),
252b5132
RH
14023 bfd_get_reloc_code_name (code));
14024 /* Set howto to a garbage value so that we can keep going. */
14025 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
9c2799c2 14026 gas_assert (rel->howto != NULL);
252b5132
RH
14027 }
14028
14029 return rel;
14030}
14031
ee86248c 14032#include "tc-i386-intel.c"
54cfded0 14033
a60de03c
JB
14034void
14035tc_x86_parse_to_dw2regnum (expressionS *exp)
54cfded0 14036{
a60de03c
JB
14037 int saved_naked_reg;
14038 char saved_register_dot;
54cfded0 14039
a60de03c
JB
14040 saved_naked_reg = allow_naked_reg;
14041 allow_naked_reg = 1;
14042 saved_register_dot = register_chars['.'];
14043 register_chars['.'] = '.';
14044 allow_pseudo_reg = 1;
14045 expression_and_evaluate (exp);
14046 allow_pseudo_reg = 0;
14047 register_chars['.'] = saved_register_dot;
14048 allow_naked_reg = saved_naked_reg;
14049
e96d56a1 14050 if (exp->X_op == O_register && exp->X_add_number >= 0)
54cfded0 14051 {
a60de03c
JB
14052 if ((addressT) exp->X_add_number < i386_regtab_size)
14053 {
14054 exp->X_op = O_constant;
14055 exp->X_add_number = i386_regtab[exp->X_add_number]
14056 .dw2_regnum[flag_code >> 1];
14057 }
14058 else
14059 exp->X_op = O_illegal;
54cfded0 14060 }
54cfded0
AM
14061}
14062
14063void
14064tc_x86_frame_initial_instructions (void)
14065{
a60de03c
JB
14066 static unsigned int sp_regno[2];
14067
14068 if (!sp_regno[flag_code >> 1])
14069 {
14070 char *saved_input = input_line_pointer;
14071 char sp[][4] = {"esp", "rsp"};
14072 expressionS exp;
a4447b93 14073
a60de03c
JB
14074 input_line_pointer = sp[flag_code >> 1];
14075 tc_x86_parse_to_dw2regnum (&exp);
9c2799c2 14076 gas_assert (exp.X_op == O_constant);
a60de03c
JB
14077 sp_regno[flag_code >> 1] = exp.X_add_number;
14078 input_line_pointer = saved_input;
14079 }
a4447b93 14080
61ff971f
L
14081 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14082 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
54cfded0 14083}
d2b2c203 14084
d7921315
L
14085int
14086x86_dwarf2_addr_size (void)
14087{
14088#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14089 if (x86_elf_abi == X86_64_X32_ABI)
14090 return 4;
14091#endif
14092 return bfd_arch_bits_per_address (stdoutput) / 8;
14093}
14094
d2b2c203
DJ
14095int
14096i386_elf_section_type (const char *str, size_t len)
14097{
14098 if (flag_code == CODE_64BIT
14099 && len == sizeof ("unwind") - 1
14100 && strncmp (str, "unwind", 6) == 0)
14101 return SHT_X86_64_UNWIND;
14102
14103 return -1;
14104}
bb41ade5 14105
ad5fec3b
EB
14106#ifdef TE_SOLARIS
14107void
14108i386_solaris_fix_up_eh_frame (segT sec)
14109{
14110 if (flag_code == CODE_64BIT)
14111 elf_section_type (sec) = SHT_X86_64_UNWIND;
14112}
14113#endif
14114
bb41ade5
AM
14115#ifdef TE_PE
14116void
14117tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14118{
91d6fa6a 14119 expressionS exp;
bb41ade5 14120
91d6fa6a
NC
14121 exp.X_op = O_secrel;
14122 exp.X_add_symbol = symbol;
14123 exp.X_add_number = 0;
14124 emit_expr (&exp, size);
bb41ade5
AM
14125}
14126#endif
3b22753a
L
14127
14128#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14129/* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14130
01e1a5bc 14131bfd_vma
6d4af3c2 14132x86_64_section_letter (int letter, const char **ptr_msg)
3b22753a
L
14133{
14134 if (flag_code == CODE_64BIT)
14135 {
14136 if (letter == 'l')
14137 return SHF_X86_64_LARGE;
14138
8f3bae45 14139 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
64e74474 14140 }
3b22753a 14141 else
8f3bae45 14142 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
3b22753a
L
14143 return -1;
14144}
14145
01e1a5bc 14146bfd_vma
3b22753a
L
14147x86_64_section_word (char *str, size_t len)
14148{
8620418b 14149 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
3b22753a
L
14150 return SHF_X86_64_LARGE;
14151
14152 return -1;
14153}
14154
14155static void
14156handle_large_common (int small ATTRIBUTE_UNUSED)
14157{
14158 if (flag_code != CODE_64BIT)
14159 {
14160 s_comm_internal (0, elf_common_parse);
14161 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14162 }
14163 else
14164 {
14165 static segT lbss_section;
14166 asection *saved_com_section_ptr = elf_com_section_ptr;
14167 asection *saved_bss_section = bss_section;
14168
14169 if (lbss_section == NULL)
14170 {
14171 flagword applicable;
14172 segT seg = now_seg;
14173 subsegT subseg = now_subseg;
14174
14175 /* The .lbss section is for local .largecomm symbols. */
14176 lbss_section = subseg_new (".lbss", 0);
14177 applicable = bfd_applicable_section_flags (stdoutput);
fd361982 14178 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
3b22753a
L
14179 seg_info (lbss_section)->bss = 1;
14180
14181 subseg_set (seg, subseg);
14182 }
14183
14184 elf_com_section_ptr = &_bfd_elf_large_com_section;
14185 bss_section = lbss_section;
14186
14187 s_comm_internal (0, elf_common_parse);
14188
14189 elf_com_section_ptr = saved_com_section_ptr;
14190 bss_section = saved_bss_section;
14191 }
14192}
14193#endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 2.375282 seconds and 4 git commands to generate.